Spaces:
Sleeping
Sleeping
Added the Vosk "big" model, but decided not to use it as it's a little slow.
Browse files
- charles_actor.py +7 -4
- models/vosk/big/README +3 -0
- models/vosk/big/am/final.mdl +3 -0
- models/vosk/big/am/tree +3 -0
- models/vosk/big/conf/mfcc.conf +3 -0
- models/vosk/big/conf/model.conf +3 -0
- models/vosk/big/graph/HCLG.fst +3 -0
- models/vosk/big/graph/disambig_tid.int +3 -0
- models/vosk/big/graph/num_pdfs +3 -0
- models/vosk/big/graph/phones.txt +3 -0
- models/vosk/big/graph/phones/align_lexicon.int +3 -0
- models/vosk/big/graph/phones/align_lexicon.txt +3 -0
- models/vosk/big/graph/phones/disambig.int +3 -0
- models/vosk/big/graph/phones/disambig.txt +3 -0
- models/vosk/big/graph/phones/optional_silence.csl +3 -0
- models/vosk/big/graph/phones/optional_silence.int +3 -0
- models/vosk/big/graph/phones/optional_silence.txt +3 -0
- models/vosk/big/graph/phones/silence.csl +3 -0
- models/vosk/big/graph/phones/word_boundary.int +3 -0
- models/vosk/big/graph/phones/word_boundary.txt +3 -0
- models/vosk/big/graph/words.txt +3 -0
- models/vosk/big/ivector/final.dubm +3 -0
- models/vosk/big/ivector/final.ie +3 -0
- models/vosk/big/ivector/final.mat +3 -0
- models/vosk/big/ivector/global_cmvn.stats +3 -0
- models/vosk/big/ivector/online_cmvn.conf +0 -0
- models/vosk/big/ivector/splice.conf +3 -0
- models/vosk/big/rescore/G.carpa +3 -0
- models/vosk/big/rescore/G.fst +3 -0
- models/vosk/big/rnnlm/feat_embedding.final.mat +3 -0
- models/vosk/big/rnnlm/final.raw +3 -0
- models/vosk/big/rnnlm/special_symbol_opts.conf +3 -0
- models/vosk/big/rnnlm/special_symbol_opts.txt +3 -0
- models/vosk/big/rnnlm/word_feats.txt +3 -0
charles_actor.py
CHANGED
@@ -32,7 +32,8 @@ class CharlesActor:
|
|
32 |
|
33 |
print("002 - create SpeechToTextVoskActor")
|
34 |
from speech_to_text_vosk_actor import SpeechToTextVoskActor
|
35 |
-
self._speech_to_text_actor = SpeechToTextVoskActor.remote()
|
|
|
36 |
|
37 |
self._debug_queue = [
|
38 |
# "hello, how are you today?",
|
@@ -81,11 +82,13 @@ class CharlesActor:
|
|
81 |
prompt, speaker_finished, raw_json = await process_speech_to_text_future[0]
|
82 |
del process_speech_to_text_future[0]
|
83 |
|
84 |
-
|
|
|
|
|
85 |
print(f"Prompt: {prompt}")
|
86 |
-
system_one_audio_history.append("... " + str(raw_json))
|
87 |
system_one_audio_history.append(prompt)
|
88 |
-
|
89 |
system_one_audio_history = system_one_audio_history[-10:]
|
90 |
table_content = "| System 1 Audio History |\n| --- |\n"
|
91 |
table_content += "\n".join([f"| {item} |" for item in reversed(system_one_audio_history)])
|
|
|
32 |
|
33 |
print("002 - create SpeechToTextVoskActor")
|
34 |
from speech_to_text_vosk_actor import SpeechToTextVoskActor
|
35 |
+
self._speech_to_text_actor = SpeechToTextVoskActor.remote("small")
|
36 |
+
# self._speech_to_text_actor = SpeechToTextVoskActor.remote("big")
|
37 |
|
38 |
self._debug_queue = [
|
39 |
# "hello, how are you today?",
|
|
|
82 |
prompt, speaker_finished, raw_json = await process_speech_to_text_future[0]
|
83 |
del process_speech_to_text_future[0]
|
84 |
|
85 |
+
prompts_to_ignore = ["um", "uh", "ah", "huh", "hmm", "the", "but", "by", "just", "i'm"]
|
86 |
+
|
87 |
+
if speaker_finished and len(prompt) > 0 and prompt not in prompts_to_ignore:
|
88 |
print(f"Prompt: {prompt}")
|
89 |
+
# system_one_audio_history.append("... " + str(raw_json))
|
90 |
system_one_audio_history.append(prompt)
|
91 |
+
while len(system_one_audio_history) > 10:
|
92 |
system_one_audio_history = system_one_audio_history[-10:]
|
93 |
table_content = "| System 1 Audio History |\n| --- |\n"
|
94 |
table_content += "\n".join([f"| {item} |" for item in reversed(system_one_audio_history)])
|
models/vosk/big/README
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:cf64d215f247162ff03c8398e71c5ed6333bfd609d80c31f993f0154c7b13490
|
3 |
+
size 97
|
models/vosk/big/am/final.mdl
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:589df479aa42a890fa59802d314e05a059723335fa9067ff7f7fdfe388458270
|
3 |
+
size 67711789
|
models/vosk/big/am/tree
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:1eb0457adc4c8eb3edd7e4ea91e0a3b8f2663303c50b2fecb516e27f93e79b16
|
3 |
+
size 294384
|
models/vosk/big/conf/mfcc.conf
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:31dab8bb1dea9b33e039988ac079dfe5d50ebaa4a94826b9f9adc8fe84b147c6
|
3 |
+
size 128
|
models/vosk/big/conf/model.conf
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:5be64db91cc7895d29a61dafc88e61d7de9c2ffba9d2f7bffc0f16df02ece6aa
|
3 |
+
size 289
|
models/vosk/big/graph/HCLG.fst
ADDED
Git LFS Details
|
models/vosk/big/graph/disambig_tid.int
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:f3454708d21cb8fd5c99e13fed35591048307993d4b260a33809c54aa46902d0
|
3 |
+
size 114
|
models/vosk/big/graph/num_pdfs
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:a7926835a022549ce162c75b07cc0c791bb5e1692b5909c7b3ada025a6f10746
|
3 |
+
size 5
|
models/vosk/big/graph/phones.txt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:8bd58351c4b0b70a73a325e19d81c887075501e6c90989f8b5bdb8aa9bb96e7f
|
3 |
+
size 1478
|
models/vosk/big/graph/phones/align_lexicon.int
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:c14886c64116cb89442c6e272a260daffd299c769315076b1578a4054f35a09e
|
3 |
+
size 9056865
|
models/vosk/big/graph/phones/align_lexicon.txt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:17d4dfc455eba7793c9141c2206ab37ce79d4121893772173f4bdb5853f4b85f
|
3 |
+
size 12031033
|
models/vosk/big/graph/phones/disambig.int
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:9a3acf4669658d7b72feefa7d84cd3a9951250a6cbc52b68f50307d4fe6c930b
|
3 |
+
size 76
|
models/vosk/big/graph/phones/disambig.txt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:72ea456cc53191f83b7ba5fce5a0445490bbaee1ee6d47c30a21b6617be9d7e3
|
3 |
+
size 66
|
models/vosk/big/graph/phones/optional_silence.csl
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:4355a46b19d348dc2f57c046f8ef63d4538ebb936000f3c9ee954a27460dd865
|
3 |
+
size 2
|
models/vosk/big/graph/phones/optional_silence.int
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:4355a46b19d348dc2f57c046f8ef63d4538ebb936000f3c9ee954a27460dd865
|
3 |
+
size 2
|
models/vosk/big/graph/phones/optional_silence.txt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:ebe5d1c9a1dc955e8b0e9d16062b2d6fede3ba741afdb9a6aec65810009bee11
|
3 |
+
size 4
|
models/vosk/big/graph/phones/silence.csl
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:8d99bf63ef15987b60950cfd42d9484d3a4b16e679cd355ac98b439bb8f16147
|
3 |
+
size 21
|
models/vosk/big/graph/phones/word_boundary.int
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:da199d9c991e0e84681ddbb34627b915b26302d50a8fdaa23c51e2bc3a50b5c3
|
3 |
+
size 1761
|
models/vosk/big/graph/phones/word_boundary.txt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:a0e3a4a5e937b03cee32cd44b44ba3b73a08582ddbae0e4a877e4a214d0b8862
|
3 |
+
size 1977
|
models/vosk/big/graph/words.txt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:7bb92521362612633df1fb42ff903aff9b6211fc889f43eb27eb9d6117433321
|
3 |
+
size 3544135
|
models/vosk/big/ivector/final.dubm
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:8c5d7dd69d2122313baaf19f61f35dd3fa18b70c62ac0687e311e1c46e6daca7
|
3 |
+
size 168048
|
models/vosk/big/ivector/final.ie
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:2940ab0a05b52495d651ff85723f1990479e962b77a9dc12071ba81e47930efd
|
3 |
+
size 9927287
|
models/vosk/big/ivector/final.mat
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:ddd83586dc5f928cda8738b922c85ffe38fc789cb5f9151a712ca12f37265382
|
3 |
+
size 44975
|
models/vosk/big/ivector/global_cmvn.stats
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:33be09afcc80059847a275c3d043b51f1ab954c7c2438ddbbf4745e8ba144ff9
|
3 |
+
size 1080
|
models/vosk/big/ivector/online_cmvn.conf
ADDED
File without changes
|
models/vosk/big/ivector/splice.conf
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:9f0c5f7c82d18eaf25d8bce470efa9f7741f88411fe428774bc0a9bb69a24756
|
3 |
+
size 35
|
models/vosk/big/rescore/G.carpa
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:6af71f6138f2573f488bb45fb7927f2926412fd2aa4941e9d18ce60fd2cd57c0
|
3 |
+
size 1911931864
|
models/vosk/big/rescore/G.fst
ADDED
Git LFS Details
|
models/vosk/big/rnnlm/feat_embedding.final.mat
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:66a1e6e59b7cede5f7c5775111bc44b4a6f3f95545bb82bd04ca63dd657a3a94
|
3 |
+
size 45152271
|
models/vosk/big/rnnlm/final.raw
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:caafd73da01cfa73325db23c4b4e0f7784f2145f7ee3af48329f6b8aa94591da
|
3 |
+
size 135566398
|
models/vosk/big/rnnlm/special_symbol_opts.conf
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:811293d8bab4fcbb2f126b0084bc9c6b12e8bbcefa16ffee2633465894565cfe
|
3 |
+
size 61
|
models/vosk/big/rnnlm/special_symbol_opts.txt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:845f515e4e049f069ef9977a072bf3c55522b8cae500f25e85b487a8af5892a4
|
3 |
+
size 61
|
models/vosk/big/rnnlm/word_feats.txt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:70b7f13d68f11a32c0813caf63c49a64101005cf7544ecbac381bed86e36c7e4
|
3 |
+
size 43960911
|