Spaces:

Siddhant
/

Voice_Assistant

Sleeping

Siddhant committed on Sep 8

Commit

ef3e243

•

1 Parent(s): 4ba2ab9

Update app.py

Files changed (1) hide show

app.py CHANGED Viewed

@@ -48,7 +48,7 @@ user_role = "user"
 tts_model = TTS(language="EN_NEWEST", device="auto")
 speaker_id = tts_model.hps.data.spk2id["EN-Newest"]
 blocksize = 512
-transcriber = pipeline("automatic-speech-recognition", model="distil-whisper/distil-large-v3")
 def int2float(sound):
     """
     Taken from https://github.com/snakers4/silero-vad
@@ -71,7 +71,7 @@ max_speech_ms=float("inf")
 #     "distil-whisper/distil-large-v3",
 #     torch_dtype="float16",
 # ).to("cpu")
-LM_tokenizer = AutoTokenizer.from_pretrained("HuggingFaceTB/SmolLM-360M-Instruct")
 LM_model = AutoModelForCausalLM.from_pretrained(
     "HuggingFaceTB/SmolLM-360M-Instruct", torch_dtype="float16", trust_remote_code=True
 ).to("cpu")

 tts_model = TTS(language="EN_NEWEST", device="auto")
 speaker_id = tts_model.hps.data.spk2id["EN-Newest"]
 blocksize = 512
+transcriber = pipeline("automatic-speech-recognition", model="openai/whisper-tiny.en")
 def int2float(sound):
     """
     Taken from https://github.com/snakers4/silero-vad
 #     "distil-whisper/distil-large-v3",
 #     torch_dtype="float16",
 # ).to("cpu")
+LM_tokenizer = AutoTokenizer.from_pretrained("HuggingFaceTB/SmolLM-135M-Instruct")
 LM_model = AutoModelForCausalLM.from_pretrained(
     "HuggingFaceTB/SmolLM-360M-Instruct", torch_dtype="float16", trust_remote_code=True
 ).to("cpu")