File size: 996 Bytes
28a9108
 
 
 
 
 
 
 
 
 
 
 
 
3a4433a
 
 
28a9108
 
 
 
 
 
 
 
 
 
 
 
 
 
 
3a4433a
28a9108
 
 
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
# pip install ffmpeg ffprobe
import os
import gradio as gr
from transformers import pipeline
from transformers import WhisperProcessor
pipe = pipeline(task="automatic-speech-recognition", model="openai/whisper-tiny")
processor = WhisperProcessor.from_pretrained("openai/whisper-tiny")
pipe.model.config.forced_decoder_ids = processor.get_decoder_prompt_ids(language="english", task="transcribe")




def recognize(input_audio):
    # print('?????????-------------')
    # print(type(input_audio))
    # print(input_audio)
    output_text = pipe(input_audio)['text']
    return output_text





with gr.Blocks() as demo:
    gr.Markdown("""
                """)
    # 录音功能
    input_audio = gr.Audio(source="microphone", type="filepath", label='Audio')

    audio_button = gr.Button(value="Recognize!")
    text = gr.Textbox(lines=2, label='你要不要看看你说了啥???')
    audio_button.click(recognize, inputs=[input_audio], outputs=[text],api_name='predict')


demo.launch()