Spaces:

aichina
/

youtube-whisper-09

Sleeping

App Files Community

aichina committed on Feb 21, 2023

Commit

0c9ce61

•

1 Parent(s): 6e941de

v5

Browse files

Files changed (1) hide show

app.py +3 -25

app.py CHANGED Viewed

@@ -29,7 +29,7 @@ def get_audio(url):
     print('aodio over ..')
     return audio_file
-def get_transcript(url, model_size, lang, format):
     audio_file = get_audio(url)
     audio_file = 'tmp.mp4'
     files = {
@@ -43,24 +43,7 @@ def get_transcript(url, model_size, lang, format):
-def format_to_srt(segments):
-    output = ""
-    for i, segment in enumerate(segments):
-        output += f"{i + 1}\n"
-        output += f"{format_timestamp(segment['start'])} --> {format_timestamp(segment['end'])}\n"
-        output += f"{segment['text']}\n\n"
-    return output
-def format_timestamp(t):
-    hh = t//3600
-    mm = (t - hh*3600)//60
-    ss = t - hh*3600 - mm*60
-    mi = (t - int(t))*1000
-    return f"{int(hh):02d}:{int(mm):02d}:{int(ss):02d},{int(mi):03d}"
-langs = ["None"] + sorted(list(whisper.tokenizer.LANGUAGES.values()))
-model_size = list(whisper._MODELS.keys())
 with gr.Blocks() as demo:
@@ -70,12 +53,7 @@ with gr.Blocks() as demo:
             with gr.Row():
                 url = gr.Textbox(placeholder='Youtube video URL', label='URL')
-            with gr.Row():
-                model_size = gr.Dropdown(choices=model_size, value='tiny', label="Model")
-                lang = gr.Dropdown(choices=langs, value="None", label="Language (Optional)")
-                format = gr.Dropdown(choices=["None", ".srt"], value="None", label="Timestamps? (Optional)")
             with gr.Row():
                 gr.Markdown("Larger models are more accurate, but slower. For 1min video, it'll take ~30s (tiny), ~1min (base), ~3min (small), ~5min (medium), etc.")
@@ -84,6 +62,6 @@ with gr.Blocks() as demo:
         with gr.Column():
             outputs = gr.Textbox(placeholder='Transcription of the video', label='Transcription')
-    transcribe_btn.click(get_transcript, inputs=[url, model_size, lang, format], outputs=outputs)
 demo.launch(debug=True)

     print('aodio over ..')
     return audio_file
+def get_transcript(url):
     audio_file = get_audio(url)
     audio_file = 'tmp.mp4'
     files = {
 with gr.Blocks() as demo:
             with gr.Row():
                 url = gr.Textbox(placeholder='Youtube video URL', label='URL')
             with gr.Row():
                 gr.Markdown("Larger models are more accurate, but slower. For 1min video, it'll take ~30s (tiny), ~1min (base), ~3min (small), ~5min (medium), etc.")
         with gr.Column():
             outputs = gr.Textbox(placeholder='Transcription of the video', label='Transcription')
+    transcribe_btn.click(get_transcript, inputs=[url], outputs=outputs)
 demo.launch(debug=True)