sohojoe committed on
Commit
5ea3bc3
1 Parent(s): 6616951

added vosk big but decided not to use it, as it's a little slow

Browse files
Files changed (34) hide show
  1. charles_actor.py +7 -4
  2. models/vosk/big/README +3 -0
  3. models/vosk/big/am/final.mdl +3 -0
  4. models/vosk/big/am/tree +3 -0
  5. models/vosk/big/conf/mfcc.conf +3 -0
  6. models/vosk/big/conf/model.conf +3 -0
  7. models/vosk/big/graph/HCLG.fst +3 -0
  8. models/vosk/big/graph/disambig_tid.int +3 -0
  9. models/vosk/big/graph/num_pdfs +3 -0
  10. models/vosk/big/graph/phones.txt +3 -0
  11. models/vosk/big/graph/phones/align_lexicon.int +3 -0
  12. models/vosk/big/graph/phones/align_lexicon.txt +3 -0
  13. models/vosk/big/graph/phones/disambig.int +3 -0
  14. models/vosk/big/graph/phones/disambig.txt +3 -0
  15. models/vosk/big/graph/phones/optional_silence.csl +3 -0
  16. models/vosk/big/graph/phones/optional_silence.int +3 -0
  17. models/vosk/big/graph/phones/optional_silence.txt +3 -0
  18. models/vosk/big/graph/phones/silence.csl +3 -0
  19. models/vosk/big/graph/phones/word_boundary.int +3 -0
  20. models/vosk/big/graph/phones/word_boundary.txt +3 -0
  21. models/vosk/big/graph/words.txt +3 -0
  22. models/vosk/big/ivector/final.dubm +3 -0
  23. models/vosk/big/ivector/final.ie +3 -0
  24. models/vosk/big/ivector/final.mat +3 -0
  25. models/vosk/big/ivector/global_cmvn.stats +3 -0
  26. models/vosk/big/ivector/online_cmvn.conf +0 -0
  27. models/vosk/big/ivector/splice.conf +3 -0
  28. models/vosk/big/rescore/G.carpa +3 -0
  29. models/vosk/big/rescore/G.fst +3 -0
  30. models/vosk/big/rnnlm/feat_embedding.final.mat +3 -0
  31. models/vosk/big/rnnlm/final.raw +3 -0
  32. models/vosk/big/rnnlm/special_symbol_opts.conf +3 -0
  33. models/vosk/big/rnnlm/special_symbol_opts.txt +3 -0
  34. models/vosk/big/rnnlm/word_feats.txt +3 -0
charles_actor.py CHANGED
@@ -32,7 +32,8 @@ class CharlesActor:
32
 
33
  print("002 - create SpeechToTextVoskActor")
34
  from speech_to_text_vosk_actor import SpeechToTextVoskActor
35
- self._speech_to_text_actor = SpeechToTextVoskActor.remote()
 
36
 
37
  self._debug_queue = [
38
  # "hello, how are you today?",
@@ -81,11 +82,13 @@ class CharlesActor:
81
  prompt, speaker_finished, raw_json = await process_speech_to_text_future[0]
82
  del process_speech_to_text_future[0]
83
 
84
- if speaker_finished and len(prompt) > 0:
 
 
85
  print(f"Prompt: {prompt}")
86
- system_one_audio_history.append("... " + str(raw_json))
87
  system_one_audio_history.append(prompt)
88
- if len(system_one_audio_history) > 10:
89
  system_one_audio_history = system_one_audio_history[-10:]
90
  table_content = "| System 1 Audio History |\n| --- |\n"
91
  table_content += "\n".join([f"| {item} |" for item in reversed(system_one_audio_history)])
 
32
 
33
  print("002 - create SpeechToTextVoskActor")
34
  from speech_to_text_vosk_actor import SpeechToTextVoskActor
35
+ self._speech_to_text_actor = SpeechToTextVoskActor.remote("small")
36
+ # self._speech_to_text_actor = SpeechToTextVoskActor.remote("big")
37
 
38
  self._debug_queue = [
39
  # "hello, how are you today?",
 
82
  prompt, speaker_finished, raw_json = await process_speech_to_text_future[0]
83
  del process_speech_to_text_future[0]
84
 
85
+ prompts_to_ignore = ["um", "uh", "ah", "huh", "hmm", "the", "but", "by", "just", "i'm"]
86
+
87
+ if speaker_finished and len(prompt) > 0 and prompt not in prompts_to_ignore:
88
  print(f"Prompt: {prompt}")
89
+ # system_one_audio_history.append("... " + str(raw_json))
90
  system_one_audio_history.append(prompt)
91
+ while len(system_one_audio_history) > 10:
92
  system_one_audio_history = system_one_audio_history[-10:]
93
  table_content = "| System 1 Audio History |\n| --- |\n"
94
  table_content += "\n".join([f"| {item} |" for item in reversed(system_one_audio_history)])
models/vosk/big/README ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:cf64d215f247162ff03c8398e71c5ed6333bfd609d80c31f993f0154c7b13490
3
+ size 97
models/vosk/big/am/final.mdl ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:589df479aa42a890fa59802d314e05a059723335fa9067ff7f7fdfe388458270
3
+ size 67711789
models/vosk/big/am/tree ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:1eb0457adc4c8eb3edd7e4ea91e0a3b8f2663303c50b2fecb516e27f93e79b16
3
+ size 294384
models/vosk/big/conf/mfcc.conf ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:31dab8bb1dea9b33e039988ac079dfe5d50ebaa4a94826b9f9adc8fe84b147c6
3
+ size 128
models/vosk/big/conf/model.conf ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:5be64db91cc7895d29a61dafc88e61d7de9c2ffba9d2f7bffc0f16df02ece6aa
3
+ size 289
models/vosk/big/graph/HCLG.fst ADDED

Git LFS Details

  • SHA256: 8403ad8c0160fb676ad6107b861f1af2cfdd1e4ee7074afec382a988bec713c0
  • Pointer size: 134 Bytes
  • Size of remote file: 174 MB
models/vosk/big/graph/disambig_tid.int ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:f3454708d21cb8fd5c99e13fed35591048307993d4b260a33809c54aa46902d0
3
+ size 114
models/vosk/big/graph/num_pdfs ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:a7926835a022549ce162c75b07cc0c791bb5e1692b5909c7b3ada025a6f10746
3
+ size 5
models/vosk/big/graph/phones.txt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:8bd58351c4b0b70a73a325e19d81c887075501e6c90989f8b5bdb8aa9bb96e7f
3
+ size 1478
models/vosk/big/graph/phones/align_lexicon.int ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:c14886c64116cb89442c6e272a260daffd299c769315076b1578a4054f35a09e
3
+ size 9056865
models/vosk/big/graph/phones/align_lexicon.txt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:17d4dfc455eba7793c9141c2206ab37ce79d4121893772173f4bdb5853f4b85f
3
+ size 12031033
models/vosk/big/graph/phones/disambig.int ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:9a3acf4669658d7b72feefa7d84cd3a9951250a6cbc52b68f50307d4fe6c930b
3
+ size 76
models/vosk/big/graph/phones/disambig.txt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:72ea456cc53191f83b7ba5fce5a0445490bbaee1ee6d47c30a21b6617be9d7e3
3
+ size 66
models/vosk/big/graph/phones/optional_silence.csl ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:4355a46b19d348dc2f57c046f8ef63d4538ebb936000f3c9ee954a27460dd865
3
+ size 2
models/vosk/big/graph/phones/optional_silence.int ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:4355a46b19d348dc2f57c046f8ef63d4538ebb936000f3c9ee954a27460dd865
3
+ size 2
models/vosk/big/graph/phones/optional_silence.txt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:ebe5d1c9a1dc955e8b0e9d16062b2d6fede3ba741afdb9a6aec65810009bee11
3
+ size 4
models/vosk/big/graph/phones/silence.csl ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:8d99bf63ef15987b60950cfd42d9484d3a4b16e679cd355ac98b439bb8f16147
3
+ size 21
models/vosk/big/graph/phones/word_boundary.int ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:da199d9c991e0e84681ddbb34627b915b26302d50a8fdaa23c51e2bc3a50b5c3
3
+ size 1761
models/vosk/big/graph/phones/word_boundary.txt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:a0e3a4a5e937b03cee32cd44b44ba3b73a08582ddbae0e4a877e4a214d0b8862
3
+ size 1977
models/vosk/big/graph/words.txt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:7bb92521362612633df1fb42ff903aff9b6211fc889f43eb27eb9d6117433321
3
+ size 3544135
models/vosk/big/ivector/final.dubm ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:8c5d7dd69d2122313baaf19f61f35dd3fa18b70c62ac0687e311e1c46e6daca7
3
+ size 168048
models/vosk/big/ivector/final.ie ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:2940ab0a05b52495d651ff85723f1990479e962b77a9dc12071ba81e47930efd
3
+ size 9927287
models/vosk/big/ivector/final.mat ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:ddd83586dc5f928cda8738b922c85ffe38fc789cb5f9151a712ca12f37265382
3
+ size 44975
models/vosk/big/ivector/global_cmvn.stats ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:33be09afcc80059847a275c3d043b51f1ab954c7c2438ddbbf4745e8ba144ff9
3
+ size 1080
models/vosk/big/ivector/online_cmvn.conf ADDED
File without changes
models/vosk/big/ivector/splice.conf ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:9f0c5f7c82d18eaf25d8bce470efa9f7741f88411fe428774bc0a9bb69a24756
3
+ size 35
models/vosk/big/rescore/G.carpa ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:6af71f6138f2573f488bb45fb7927f2926412fd2aa4941e9d18ce60fd2cd57c0
3
+ size 1911931864
models/vosk/big/rescore/G.fst ADDED

Git LFS Details

  • SHA256: 671ee718bf7666c8450483c0fbb78eeef111d487e2d7182c9214fdb2a4c96c46
  • Pointer size: 133 Bytes
  • Size of remote file: 37 MB
models/vosk/big/rnnlm/feat_embedding.final.mat ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:66a1e6e59b7cede5f7c5775111bc44b4a6f3f95545bb82bd04ca63dd657a3a94
3
+ size 45152271
models/vosk/big/rnnlm/final.raw ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:caafd73da01cfa73325db23c4b4e0f7784f2145f7ee3af48329f6b8aa94591da
3
+ size 135566398
models/vosk/big/rnnlm/special_symbol_opts.conf ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:811293d8bab4fcbb2f126b0084bc9c6b12e8bbcefa16ffee2633465894565cfe
3
+ size 61
models/vosk/big/rnnlm/special_symbol_opts.txt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:845f515e4e049f069ef9977a072bf3c55522b8cae500f25e85b487a8af5892a4
3
+ size 61
models/vosk/big/rnnlm/word_feats.txt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:70b7f13d68f11a32c0813caf63c49a64101005cf7544ecbac381bed86e36c7e4
3
+ size 43960911