FarhadMadadzade's picture
weird
d14f075
raw
history blame
509 Bytes
from transformers import pipeline
import gradio as gr
import time
# Speech-recognition pipeline, built once when the module loads and reused by
# every transcription call.
pipe = pipeline(
    task="automatic-speech-recognition",
    model="Artanis1551/whisper_romanian3",
)
def transcribe(audio, state=""):
    """Transcribe one audio chunk and append it to the running transcript.

    Args:
        audio: Audio input handed to the speech-recognition pipeline (the
            interface is configured to pass a file path). ``None`` means no
            audio was supplied for this call.
        state: Transcript accumulated by earlier calls. ``None`` is treated
            as an empty transcript.

    Returns:
        A ``(transcript, transcript)`` tuple holding the same updated string
        twice: one value for the textbox output and one for the state output.
    """
    # Normalise a missing state so the concatenation below cannot fail.
    state = state or ""

    # With no audio there is nothing to transcribe; return the transcript
    # unchanged instead of calling the pipeline with None.
    if audio is None:
        return state, state

    text = pipe(audio)["text"]
    print(text)  # echo each recognised chunk to stdout
    state += text + " "
    return state, state
# Wire the transcription function into a live, streaming interface: microphone
# audio and the session transcript go in; the updated transcript is shown in a
# textbox and stored back into the state.
demo = gr.Interface(
    fn=transcribe,
    title="Romanian Speech Transcription",
    inputs=[
        gr.Audio(source="microphone", type="filepath", streaming=True),
        "state",
    ],
    outputs=["textbox", "state"],
    live=True,
)
demo.launch()