# HG changeset patch # User bgruening # Date 1713996603 0 # Node ID 2706ea308f941d88016cd075459a0e23b3b67b5a planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/whisper commit 65bc65452f0cb44220555d6295106ea525038c70 diff -r 000000000000 -r 2706ea308f94 test-data/english.wav Binary file test-data/english.wav has changed diff -r 000000000000 -r 2706ea308f94 test-data/german.wav Binary file test-data/german.wav has changed diff -r 000000000000 -r 2706ea308f94 test-data/german_english.mp3 Binary file test-data/german_english.mp3 has changed diff -r 000000000000 -r 2706ea308f94 test-data/persian.wav Binary file test-data/persian.wav has changed diff -r 000000000000 -r 2706ea308f94 test-data/transcribe.txt --- /dev/null Thu Jan 01 00:00:00 1970 +0000 +++ b/test-data/transcribe.txt Wed Apr 24 22:10:03 2024 +0000 @@ -0,0 +1,2 @@ +21-year-old Jesus joined Manchester City last year in January 2017 from Brazilian club Paul Marius +for a reported fee of £27 million. diff -r 000000000000 -r 2706ea308f94 test-data/transcribe_english.json --- /dev/null Thu Jan 01 00:00:00 1970 +0000 +++ b/test-data/transcribe_english.json Wed Apr 24 22:10:03 2024 +0000 @@ -0,0 +1,1 @@ +{"text": " 21-year-old Jesus joined Manchester City last year in January 2017 from Brazilian club Paul Marius for a reported fee of \u00a327 million.", "segments": [{"id": 0, "seek": 0, "start": 0.0, "end": 9.8, "text": " 21-year-old Jesus joined Manchester City last year in January 2017 from Brazilian club Paul Marius", "tokens": [50364, 5080, 12, 5294, 12, 2641, 2705, 6869, 27180, 4392, 1036, 1064, 294, 7061, 6591, 490, 23435, 6482, 4552, 2039, 4872, 50854], "temperature": 0.0, "avg_logprob": -0.44505851409014535, "compression_ratio": 1.1166666666666667, "no_speech_prob": 0.045594051480293274}, {"id": 1, "seek": 0, "start": 9.8, "end": 12.4, "text": " for a reported fee of \u00a327 million.", "tokens": [50854, 337, 257, 7055, 12054, 295, 14378, 10076, 2459, 13, 50984], "temperature": 0.0, "avg_logprob": -0.44505851409014535, "compression_ratio": 1.1166666666666667, "no_speech_prob": 0.045594051480293274}], "language": "English"} \ No newline at end of file diff -r 000000000000 -r 2706ea308f94 test-data/transcribe_english.srt --- /dev/null Thu Jan 01 00:00:00 1970 +0000 +++ b/test-data/transcribe_english.srt Wed Apr 24 22:10:03 2024 +0000 @@ -0,0 +1,8 @@ +1 +00:00:00,000 --> 00:00:09,800 +21-year-old Jesus joined Manchester City last year in January 2017 from Brazilian club Paul Marius + +2 +00:00:09,800 --> 00:00:12,400 +for a reported fee of £27 million. + diff -r 000000000000 -r 2706ea308f94 test-data/transcribe_english.tsv --- /dev/null Thu Jan 01 00:00:00 1970 +0000 +++ b/test-data/transcribe_english.tsv Wed Apr 24 22:10:03 2024 +0000 @@ -0,0 +1,3 @@ +start end text +0 9800 21-year-old Jesus joined Manchester City last year in January 2017 from Brazilian club Paul Marius +9800 12400 for a reported fee of £27 million. diff -r 000000000000 -r 2706ea308f94 test-data/transcribe_german.txt --- /dev/null Thu Jan 01 00:00:00 1970 +0000 +++ b/test-data/transcribe_german.txt Wed Apr 24 22:10:03 2024 +0000 @@ -0,0 +1,2 @@ +Reitschafte es New Zealand's A1 GP Auto Black Beauty sieben Mal mit Geschwindigkeiten von +über 160 kmh über die Brücke zu fahren. diff -r 000000000000 -r 2706ea308f94 test-data/transcribe_german_english.txt --- /dev/null Thu Jan 01 00:00:00 1970 +0000 +++ b/test-data/transcribe_german_english.txt Wed Apr 24 22:10:03 2024 +0000 @@ -0,0 +1,6 @@ +Der gewünschte Gesprächspartner ist zurzeit nicht erreichbar, +wird aber per SMS über Ihren Anruf informiert. +Vielen Dank. +The person you have called is currently not available. +However, he will be informed about your call attempt via SMS. +Thank you for calling. diff -r 000000000000 -r 2706ea308f94 test-data/transcribe_persian.json --- /dev/null Thu Jan 01 00:00:00 1970 +0000 +++ b/test-data/transcribe_persian.json Wed Apr 24 22:10:03 2024 +0000 @@ -0,0 +1,1 @@ +{"text": " \u0628\u0631\u062e\u06cc \u0627\u0632 \u0627\u06cc\u0646 \u0633\u0646\u06af \u0647\u0627 \u06a9\u0647 \u062f\u0631 \u06a9\u0648\u0631\u06cc \u0632\u0645\u06cc\u0646 \u062e\u06cc\u0644\u06cc \u0646\u0627\u062f\u0631 \u0647\u0633\u062a\u0646\u062f \u0628\u0627 \u0642\u06cc\u0645\u062a\u06cc \u0627\u0632 \u06cc\u0627\u0632\u062f\u0647 \u0647\u0632\u0627\u0631 \u062f\u0648\u0644\u0627\u0631 \u062a\u0627 \u0628\u06cc\u0633\u062a\u0648 \u062f\u0648 \u0647\u0632\u0627\u0631 \u0648 \u067e\u0646\u0633\u062a\u062f \u062f\u0648\u0644\u0627\u0631 \u062f\u0631 \u0647\u0631 \u0627\u0648\u0646\u0633 \u0641\u0631\u0648\u062e\u062a \u0645\u06cc \u0634\u0628\u0646\u062f \u06a9\u0647 \u0686\u06cc\u0632 \u062d\u062f\u0648\u062f \u062f\u0647 \u0628\u0631\u0627\u0628\u0631 \u0642\u06cc\u0645\u062a \u062a\u0644\u0627\u0633\u062a.", "segments": [{"id": 0, "seek": 0, "start": 0.0, "end": 13.42, "text": " \u0628\u0631\u062e\u06cc \u0627\u0632 \u0627\u06cc\u0646 \u0633\u0646\u06af \u0647\u0627 \u06a9\u0647 \u062f\u0631 \u06a9\u0648\u0631\u06cc \u0632\u0645\u06cc\u0646 \u062e\u06cc\u0644\u06cc \u0646\u0627\u062f\u0631 \u0647\u0633\u062a\u0646\u062f \u0628\u0627 \u0642\u06cc\u0645\u062a\u06cc \u0627\u0632 \u06cc\u0627\u0632\u062f\u0647 \u0647\u0632\u0627\u0631 \u062f\u0648\u0644\u0627\u0631 \u062a\u0627 \u0628\u06cc\u0633\u062a\u0648 \u062f\u0648 \u0647\u0632\u0627\u0631 \u0648 \u067e\u0646\u0633\u062a\u062f \u062f\u0648\u0644\u0627\u0631 \u062f\u0631 \u0647\u0631 \u0627\u0648\u0646\u0633 \u0641\u0631\u0648\u062e\u062a \u0645\u06cc \u0634\u0628\u0646\u062f \u06a9\u0647 \u0686\u06cc\u0632 \u062d\u062f\u0648\u062f \u062f\u0647 \u0628\u0631\u0627\u0628\u0631 \u0642\u06cc\u0645\u062a \u062a\u0644\u0627\u0633\u062a.", "tokens": [50364, 4724, 2288, 9778, 4135, 1975, 11622, 1975, 32151, 8608, 1863, 16761, 8032, 995, 7565, 3224, 11778, 2288, 7565, 13063, 4135, 30767, 2304, 32151, 16490, 4135, 1211, 4135, 8717, 18513, 2288, 8032, 14851, 41260, 4724, 995, 12174, 4135, 2304, 2655, 4135, 1975, 11622, 25429, 31377, 3215, 3224, 8032, 11622, 9640, 11778, 12610, 9640, 6055, 995, 4724, 4135, 14851, 2407, 11778, 2407, 8032, 11622, 9640, 4032, 21453, 1863, 14851, 3215, 11778, 12610, 9640, 11778, 2288, 8032, 2288, 1975, 11536, 3794, 6156, 32887, 46456, 48478, 13412, 3555, 41260, 7565, 3224, 34766, 4135, 11622, 11331, 3215, 23328, 11778, 3224, 4724, 2288, 16758, 2288, 12174, 4135, 2304, 2655, 6055, 15040, 14851, 13, 51064], "temperature": 0.0, "avg_logprob": -0.19529172723943536, "compression_ratio": 1.7426900584795322, "no_speech_prob": 0.08913763612508774, "words": [{"word": " \u0628\u0631\u062e\u06cc", "start": 0.0, "end": 1.42, "probability": 0.9033132642507553}, {"word": " \u0627\u0632", "start": 1.42, "end": 1.62, "probability": 0.9889343976974487}, {"word": " \u0627\u06cc\u0646", "start": 1.62, "end": 1.74, "probability": 0.9703238010406494}, {"word": " \u0633\u0646\u06af", "start": 1.74, "end": 2.12, "probability": 0.9526320497194926}, {"word": " \u0647\u0627", "start": 2.12, "end": 2.3, "probability": 0.7875397503376007}, {"word": " \u06a9\u0647", "start": 2.3, "end": 2.42, "probability": 0.9241614937782288}, {"word": " \u062f\u0631", "start": 2.42, "end": 2.64, "probability": 0.9900502860546112}, {"word": " \u06a9\u0648\u0631\u06cc", "start": 2.64, "end": 2.9, "probability": 0.6278652548789978}, {"word": " \u0632\u0645\u06cc\u0646", "start": 2.9, "end": 3.28, "probability": 0.9571676055590311}, {"word": " \u062e\u06cc\u0644\u06cc", "start": 3.28, "end": 3.66, "probability": 0.9876178354024887}, {"word": " \u0646\u0627\u062f\u0631", "start": 3.66, "end": 4.02, "probability": 0.9114052851994833}, {"word": " \u0647\u0633\u062a\u0646\u062f", "start": 4.02, "end": 4.5, "probability": 0.7521352767944336}, {"word": " \u0628\u0627", "start": 4.5, "end": 4.74, "probability": 0.7534557282924652}, {"word": " \u0642\u06cc\u0645\u062a\u06cc", "start": 4.74, "end": 5.26, "probability": 0.8726431250572204}, {"word": " \u0627\u0632", "start": 5.26, "end": 5.42, "probability": 0.984766036272049}, {"word": " \u06cc\u0627\u0632\u062f\u0647", "start": 5.42, "end": 5.92, "probability": 0.7151797562837601}, {"word": " \u0647\u0632\u0627\u0631", "start": 5.92, "end": 6.3, "probability": 0.9623414278030396}, {"word": " \u062f\u0648\u0644\u0627\u0631", "start": 6.3, "end": 6.9, "probability": 0.9146908124287924}, {"word": " \u062a\u0627", "start": 6.9, "end": 7.2, "probability": 0.9085398316383362}, {"word": " \u0628\u06cc\u0633\u062a\u0648", "start": 7.2, "end": 7.6, "probability": 0.8677552342414856}, {"word": " \u062f\u0648", "start": 7.6, "end": 7.7, "probability": 0.9638055264949799}, {"word": " \u0647\u0632\u0627\u0631", "start": 7.7, "end": 7.98, "probability": 0.9253919919331869}, {"word": " \u0648", "start": 7.98, "end": 8.12, "probability": 0.7168136835098267}, {"word": " \u067e\u0646\u0633\u062a\u062f", "start": 8.12, "end": 8.54, "probability": 0.7954745143651962}, {"word": " \u062f\u0648\u0644\u0627\u0631", "start": 8.54, "end": 8.92, "probability": 0.9934115409851074}, {"word": " \u062f\u0631", "start": 8.92, "end": 9.2, "probability": 0.9842988848686218}, {"word": " \u0647\u0631", "start": 9.2, "end": 9.34, "probability": 0.9502557218074799}, {"word": " \u0627\u0648\u0646\u0633", "start": 9.34, "end": 9.62, "probability": 0.6762789487838745}, {"word": " \u0641\u0631\u0648\u062e\u062a", "start": 9.62, "end": 9.98, "probability": 0.9117981791496277}, {"word": " \u0645\u06cc", "start": 9.98, "end": 10.14, "probability": 0.7245240807533264}, {"word": " \u0634\u0628\u0646\u062f", "start": 10.14, "end": 10.7, "probability": 0.6922649443149567}, {"word": " \u06a9\u0647", "start": 10.7, "end": 11.04, "probability": 0.899426281452179}, {"word": " \u0686\u06cc\u0632", "start": 11.04, "end": 11.32, "probability": 0.9809092283248901}, {"word": " \u062d\u062f\u0648\u062f", "start": 11.32, "end": 11.68, "probability": 0.8215810457865397}, {"word": " \u062f\u0647", "start": 11.68, "end": 11.98, "probability": 0.889119029045105}, {"word": " \u0628\u0631\u0627\u0628\u0631", "start": 11.98, "end": 12.4, "probability": 0.9024366587400436}, {"word": " \u0642\u06cc\u0645\u062a", "start": 12.4, "end": 12.84, "probability": 0.9782368242740631}, {"word": " \u062a\u0644\u0627\u0633\u062a.", "start": 12.84, "end": 13.42, "probability": 0.6221214731534322}]}], "language": "Persian"} \ No newline at end of file diff -r 000000000000 -r 2706ea308f94 whisper.xml --- /dev/null Thu Jan 01 00:00:00 1970 +0000 +++ b/whisper.xml Wed Apr 24 22:10:03 2024 +0000 @@ -0,0 +1,358 @@ + + + Transcribe audio or video files to text using the OpenAI Whisper + + + 20231117 + 0 + + + quay.io/galaxy/whisper:20231117 + + + + + + 1 + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + +
+ + + + + + + + + + + + + + + + + + + + + + + + + + +
+
+ + + 'txt' in output_format + + + 'json' in output_format + + + 'srt' in output_format + + + 'vtt' in output_format + + + 'tsv' in output_format + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + +
+ + + + + +
+ + + + + + + + + + + + + + +
+
+ `_. + +Usage +..... + + +**Input** +Audio or video file to transcribe in one of wav, mp3, mkv, flv, mpg, ogg, wma, or mp4. + + +**Output** +Transcribed text in the selected format. The output can be in text, JSON, SubRip, WebVTT, or tab-separated values (tabular) format. + ]]> + + + + + + @misc{openai2022whisper, + title={Whisper}, + author={OpenAI}, + year={2022}, + url={https://github.com/openai/whisper} + } + + +