import os
import subprocess
import sys

import gradio as gr
import transformers
from transformers import pipeline

# Best-effort install of the extra packages at start-up, before they are
# imported below. Running pip as ``sys.executable -m pip`` installs into the
# interpreter that is executing this script (a bare ``pip`` on PATH may belong
# to a different environment), and passing an argument list avoids the shell.
# ``check=False`` keeps the original behaviour of not aborting on a failed
# install; a missing package then surfaces as an ImportError just below.
for _package in ("evaluate", "datasets"):
    subprocess.run(
        [sys.executable, "-m", "pip", "install", _package],
        check=False,
    )

# These imports must stay after the install step above.
from evaluate import evaluator  # noqa: E402
from datasets import load_dataset  # noqa: E402


# Build the speech-recognition pipeline once at import time so that every
# call to the transcription callback reuses the same loaded model. No model
# name is given, so the library's default for this task is used.
p = pipeline("automatic-speech-recognition")


def transcribe(audio, state=""):
    """Transcribe one audio chunk and append it to the running transcript.

    Args:
        audio: The audio chunk handed over by the interface (a file path,
            since the audio input is declared with ``type="filepath"``), or
            ``None`` when there is nothing to transcribe.
        state: Transcript accumulated by previous calls. ``None`` is treated
            as an empty transcript.

    Returns:
        A ``(transcript, transcript)`` tuple. The callback is wired to two
        outputs, a textbox and the state slot, and both receive the same
        updated transcript.
    """
    transcript = state or ""

    if audio is None:
        # Nothing was recorded for this call: leave the transcript untouched
        # instead of passing None to the recognition pipeline.
        return transcript, transcript

    text = p(audio)["text"]
    # A trailing space separates this chunk from the next one appended.
    transcript += text + " "
    return transcript, transcript


# Wire the transcription callback into a live interface and start serving it.
# The inputs and outputs each end with a "state" slot: the transcript that
# `transcribe` returns as its second value is handed back to it as `state` on
# the next call, which is how text accumulates across audio chunks.
# NOTE(review): `source="microphone"` is the Gradio 3.x keyword; newer
# releases spell it `sources=[...]` - confirm against the pinned version.
demo = gr.Interface(
    fn=transcribe,
    inputs=[
        gr.Audio(source="microphone", type="filepath", streaming=True),
        "state",
    ],
    outputs=[
        "textbox",
        "state",
    ],
    live=True,
)
demo.launch()