# whisper_fileStream / streaming.py
# Duplicated from mskov/whisper_stream (revision c8eb530).
from transformers import pipeline
import gradio as gr
import time
# Build the speech-recognition pipeline once, at import time, so every call to
# `transcribe` reuses it. No model is named here, so the library picks its
# default checkpoint for this task.
p = pipeline(task="automatic-speech-recognition")
def transcribe(audio, state=""):
    """Transcribe one audio clip and append it to the running transcript.

    Args:
        audio: The recorded clip, handed unchanged to the module-level
            speech-recognition pipeline ``p``. ``None`` means there is no
            clip to process and leaves the transcript untouched.
        state: Transcript text accumulated by earlier calls. ``None`` is
            treated as an empty transcript.

    Returns:
        A ``(transcript, transcript)`` tuple: the updated transcript twice,
        one copy for display and one to be passed back in as ``state`` on
        the next call.
    """
    if state is None:
        state = ""
    if audio is None:
        # Nothing was recorded: skip both the delay and the model call
        # instead of letting the pipeline fail on a missing input.
        return state, state

    # Fixed one-second pause before each transcription (presumably to
    # throttle live updates -- confirm before removing).
    time.sleep(1)
    text = p(audio)["text"]
    state += text + " "
    return state, state
# Wire `transcribe` into a live Gradio interface: microphone audio (delivered
# as a file path) plus the carried-over "state" go in; a textbox and the
# updated "state" come out.
_microphone = gr.inputs.Audio(source="microphone", type="filepath")
_app = gr.Interface(
    fn=transcribe,
    inputs=[_microphone, "state"],
    outputs=["textbox", "state"],
    live=True,
)
_app.launch()