WYCS2

Runtime error

App Files Files Community

RASMUS committed on Dec 20, 2022

Commit

10419a8

•

1 Parent(s): db0c1c9

Update app.py

Browse files

Files changed (1) hide show

app.py +9 -8

app.py CHANGED Viewed

@@ -117,11 +117,12 @@ def speech_to_text(video_file_path, selected_source_lang, whisper_model):
     This space allows you to:
     1. Download youtube video with a given url
     2. Watch it in the first video component
-    3. Run automatic speech recognition on the video using Whisper
-    4. Translate the recognized transcriptions to Finnish, Swedish, Danish
     5. Burn the translations to the original video and watch the video in the 2nd video component
-    Speech Recognition is based on OpenAI Whisper https://github.com/openai/whisper
     """
     if(video_file_path == None):
@@ -308,14 +309,14 @@ with demo:
             ### This space allows you to:
             ##### 1. Download youtube video with a given URL
             ##### 2. Watch it in the first video component
-            ##### 3. Run automatic speech recognition on the video using Whisper (Please remember to select translation language)
-            ##### 4. Translate the recognized transcriptions to Finnish, Swedish, Danish
             ##### 5. Burn the translations to the original video and watch the video in the 2nd video component
             ''')
         with gr.Column():
             gr.Markdown('''
-            ### 1. Insert Youtube URL below (Some examples below which I suggest to use for first tests)
             ##### 1. https://www.youtube.com/watch?v=nlMuHtV82q8&ab_channel=NothingforSale24
             ##### 2. https://www.youtube.com/watch?v=JzPfMbG1vrE&ab_channel=ExplainerVideosByLauren
             ##### 3. https://www.youtube.com/watch?v=S68vvV0kod8&ab_channel=Pearl-CohnTelevision
@@ -336,7 +337,7 @@ with demo:
             with gr.Column():
                 gr.Markdown('''
                 ##### Here you can start the transcription and translation process.
-                ##### Be aware that processing will last for a while (35 second video took around 20 seconds in my testing and might fail for longer videos)
                 ''')
             selected_source_lang.render()
             selected_whisper_model.render()
@@ -357,7 +358,7 @@ with demo:
         with gr.Column():
             gr.Markdown('''
             ##### Here you will get translated transcriptions.
-            ##### Please remember to select Spoken Language and wanted translation language
             ##### ''')
             selected_translation_lang_2.render()
             translate_transcriptions_button = gr.Button("Step 3. Translate transcription")

     This space allows you to:
     1. Download youtube video with a given url
     2. Watch it in the first video component
+    3. Run automatic speech recognition on the video using fast Whisper models
+    4. Translate the recognized transcriptions to 26 languages supported by deepL
     5. Burn the translations to the original video and watch the video in the 2nd video component
+    Speech Recognition is based on models from OpenAI Whisper https://github.com/openai/whisper
+    This space is using c++ implementation by https://github.com/ggerganov/whisper.cpp
     """
     if(video_file_path == None):
             ### This space allows you to:
             ##### 1. Download youtube video with a given URL
             ##### 2. Watch it in the first video component
+            ##### 3. Run automatic speech recognition on the video using Whisper
+            ##### 4. Translate the recognized transcriptions to 26 languages supported by deepL
             ##### 5. Burn the translations to the original video and watch the video in the 2nd video component
             ''')
         with gr.Column():
             gr.Markdown('''
+            ### 1. Insert Youtube URL below. Some test videos below:
             ##### 1. https://www.youtube.com/watch?v=nlMuHtV82q8&ab_channel=NothingforSale24
             ##### 2. https://www.youtube.com/watch?v=JzPfMbG1vrE&ab_channel=ExplainerVideosByLauren
             ##### 3. https://www.youtube.com/watch?v=S68vvV0kod8&ab_channel=Pearl-CohnTelevision
             with gr.Column():
                 gr.Markdown('''
                 ##### Here you can start the transcription and translation process.
+                ##### Be aware that processing will last some time. With base model it is around 3x speed
                 ''')
             selected_source_lang.render()
             selected_whisper_model.render()
         with gr.Column():
             gr.Markdown('''
             ##### Here you will get translated transcriptions.
+            ##### Please remember to select target language
             ##### ''')
             selected_translation_lang_2.render()
             translate_transcriptions_button = gr.Button("Step 3. Translate transcription")