README.md CHANGED
@@ -1,55 +1,11 @@
1
  ---
2
  license: cc-by-nc-4.0
3
- library_name: chat_tts
4
- pipeline_tag: text-to-audio
5
  ---
6
 
 
7
 
8
- **We are also training larger-scale models and need computational power and data support. If you can provide assistance, please contact [email protected]. Thank you very much.**
9
 
10
- ## Clone the Repository
11
- First, clone the Git repository:
12
- ```bash
13
- git clone https://github.com/2noise/ChatTTS.git
14
- ```
15
 
16
- ## Model Inference
17
-
18
-
19
- ```python
20
- # Import necessary libraries and configure settings
21
- import torch
22
- import torchaudio
23
- torch._dynamo.config.cache_size_limit = 64
24
- torch._dynamo.config.suppress_errors = True
25
- torch.set_float32_matmul_precision('high')
26
-
27
- import ChatTTS
28
- from IPython.display import Audio
29
-
30
- # Initialize and load the model:
31
- chat = ChatTTS.Chat()
32
- chat.load_models(compile=False) # Set to True for better performance
33
-
34
- # Define the text input for inference (supports batching)
35
- texts = [
36
- "So we found being competitive and collaborative was a huge way of staying motivated towards our goals, so one person to call when you fall off, one person who gets you back on then one person to actually do the activity with.",
37
- ]
38
-
39
- # Perform inference and play the generated audio
40
- wavs = chat.infer(texts)
41
- Audio(wavs[0], rate=24_000, autoplay=True)
42
-
43
- # Save the generated audio
44
- torchaudio.save("output.wav", torch.from_numpy(wavs[0]), 24000)
45
- ```
46
- **For more usage examples, please refer to the [example notebook](https://github.com/2noise/ChatTTS/blob/main/example.ipynb), which includes parameters for finer control over the generated speech, such as specifying the speaker, adjusting speech speed, and adding laughter.**
47
-
48
-
49
-
50
-
51
-
52
-
53
- ### Disclaimer: For Academic Purposes Only
54
-
55
- The information provided in this document is for academic purposes only. It is intended for educational and research use, and should not be used for any commercial or legal purposes. The authors do not guarantee the accuracy, completeness, or reliability of the information.
 
1
  ---
2
  license: cc-by-nc-4.0
 
 
3
  ---
4
 
5
+ Disclaimer: For Academic Purposes Only
6
 
7
+ The information provided in this document is for academic purposes only. It is intended for educational and research use, and should not be used for any commercial or legal purposes. The authors do not guarantee the accuracy, completeness, or reliability of the information.
8
 
9
+ 免责声明:仅供学术交流
 
 
 
 
10
 
11
+ 本文件中的信息仅供学术交流使用。其目的是用于教育和研究,不得用于任何商业或法律目的。作者不保证信息的准确性、完整性或可靠性。
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
asset/DVAE.safetensors DELETED
@@ -1,3 +0,0 @@
1
- version https://git-lfs.github.com/spec/v1
2
- oid sha256:1d0b044a8368c0513100a2eca98456b289e6be6a18b7a63be1bcaa315ea874d9
3
- size 60359112
 
 
 
 
asset/DVAE_full.pt DELETED
@@ -1,3 +0,0 @@
1
- version https://git-lfs.github.com/spec/v1
2
- oid sha256:553eb75763511e23f3e5f86303e2163c5ca775489d637fb635d979c8ae58bbe5
3
- size 60402442
 
 
 
 
asset/Decoder.safetensors DELETED
@@ -1,3 +0,0 @@
1
- version https://git-lfs.github.com/spec/v1
2
- oid sha256:77aa55e0a977949c4733df3c6f876fa85860d3298cba63295a7bc6901729d4e0
3
- size 103694920
 
 
 
 
asset/Embed.safetensors DELETED
@@ -1,3 +0,0 @@
1
- version https://git-lfs.github.com/spec/v1
2
- oid sha256:2ff0be7134934155741b643b74e32fb6bf3eec41257984459b2ed60cdb4c48b0
3
- size 145598536
 
 
 
 
asset/Vocos.safetensors DELETED
@@ -1,3 +0,0 @@
1
- version https://git-lfs.github.com/spec/v1
2
- oid sha256:07e5561491cce41f7f90cfdb94b2ff263ff5742c3d89339db99b17ad82cc3f44
3
- size 54348240
 
 
 
 
asset/gpt/config.json DELETED
@@ -1,33 +0,0 @@
1
- {
2
- "architectures": [
3
- "LlamaModel"
4
- ],
5
- "attention_bias": false,
6
- "attention_dropout": 0.0,
7
- "bos_token_id": 1,
8
- "eos_token_id": 2,
9
- "hidden_act": "silu",
10
- "hidden_size": 768,
11
- "initializer_range": 0.02,
12
- "intermediate_size": 3072,
13
- "max_position_embeddings": 4096,
14
- "mlp_bias": false,
15
- "model_type": "llama",
16
- "num_attention_heads": 12,
17
- "num_audio_tokens": 626,
18
- "num_hidden_layers": 20,
19
- "num_key_value_heads": 12,
20
- "num_text_tokens": 21178,
21
- "num_vq": 4,
22
- "pretraining_tp": 1,
23
- "rms_norm_eps": 1e-06,
24
- "rope_scaling": null,
25
- "rope_theta": 10000.0,
26
- "spk_KL": false,
27
- "spk_emb_dim": 192,
28
- "tie_word_embeddings": false,
29
- "torch_dtype": "float32",
30
- "transformers_version": "4.41.2",
31
- "use_cache": false,
32
- "vocab_size": 32000
33
- }
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
asset/gpt/model.safetensors DELETED
@@ -1,3 +0,0 @@
1
- version https://git-lfs.github.com/spec/v1
2
- oid sha256:cd0806fd971f52f6a22c923ec64982b305e817bcc41ca83417fcf9141b984a0f
3
- size 853423872
 
 
 
 
asset/tokenizer/special_tokens_map.json DELETED
@@ -1,389 +0,0 @@
1
- {
2
- "additional_special_tokens": [
3
- {
4
- "content": "[Sasr]",
5
- "lstrip": false,
6
- "normalized": false,
7
- "rstrip": false,
8
- "single_word": false
9
- },
10
- {
11
- "content": "[Pasr]",
12
- "lstrip": false,
13
- "normalized": false,
14
- "rstrip": false,
15
- "single_word": false
16
- },
17
- {
18
- "content": "[Easr]",
19
- "lstrip": false,
20
- "normalized": false,
21
- "rstrip": false,
22
- "single_word": false
23
- },
24
- {
25
- "content": "[Stts]",
26
- "lstrip": false,
27
- "normalized": false,
28
- "rstrip": false,
29
- "single_word": false
30
- },
31
- {
32
- "content": "[Ptts]",
33
- "lstrip": false,
34
- "normalized": false,
35
- "rstrip": false,
36
- "single_word": false
37
- },
38
- {
39
- "content": "[Etts]",
40
- "lstrip": false,
41
- "normalized": false,
42
- "rstrip": false,
43
- "single_word": false
44
- },
45
- {
46
- "content": "[Sbreak]",
47
- "lstrip": false,
48
- "normalized": false,
49
- "rstrip": false,
50
- "single_word": false
51
- },
52
- {
53
- "content": "[Pbreak]",
54
- "lstrip": false,
55
- "normalized": false,
56
- "rstrip": false,
57
- "single_word": false
58
- },
59
- {
60
- "content": "[Ebreak]",
61
- "lstrip": false,
62
- "normalized": false,
63
- "rstrip": false,
64
- "single_word": false
65
- },
66
- {
67
- "content": "[uv_break]",
68
- "lstrip": false,
69
- "normalized": false,
70
- "rstrip": false,
71
- "single_word": false
72
- },
73
- {
74
- "content": "[v_break]",
75
- "lstrip": false,
76
- "normalized": false,
77
- "rstrip": false,
78
- "single_word": false
79
- },
80
- {
81
- "content": "[lbreak]",
82
- "lstrip": false,
83
- "normalized": false,
84
- "rstrip": false,
85
- "single_word": false
86
- },
87
- {
88
- "content": "[llbreak]",
89
- "lstrip": false,
90
- "normalized": false,
91
- "rstrip": false,
92
- "single_word": false
93
- },
94
- {
95
- "content": "[undefine]",
96
- "lstrip": false,
97
- "normalized": false,
98
- "rstrip": false,
99
- "single_word": false
100
- },
101
- {
102
- "content": "[laugh]",
103
- "lstrip": false,
104
- "normalized": false,
105
- "rstrip": false,
106
- "single_word": false
107
- },
108
- {
109
- "content": "[spk_emb]",
110
- "lstrip": false,
111
- "normalized": false,
112
- "rstrip": false,
113
- "single_word": false
114
- },
115
- {
116
- "content": "[empty_spk]",
117
- "lstrip": false,
118
- "normalized": false,
119
- "rstrip": false,
120
- "single_word": false
121
- },
122
- {
123
- "content": "[music]",
124
- "lstrip": false,
125
- "normalized": false,
126
- "rstrip": false,
127
- "single_word": false
128
- },
129
- {
130
- "content": "[pure]",
131
- "lstrip": false,
132
- "normalized": false,
133
- "rstrip": false,
134
- "single_word": false
135
- },
136
- {
137
- "content": "[break_0]",
138
- "lstrip": false,
139
- "normalized": false,
140
- "rstrip": false,
141
- "single_word": false
142
- },
143
- {
144
- "content": "[break_1]",
145
- "lstrip": false,
146
- "normalized": false,
147
- "rstrip": false,
148
- "single_word": false
149
- },
150
- {
151
- "content": "[break_2]",
152
- "lstrip": false,
153
- "normalized": false,
154
- "rstrip": false,
155
- "single_word": false
156
- },
157
- {
158
- "content": "[break_3]",
159
- "lstrip": false,
160
- "normalized": false,
161
- "rstrip": false,
162
- "single_word": false
163
- },
164
- {
165
- "content": "[break_4]",
166
- "lstrip": false,
167
- "normalized": false,
168
- "rstrip": false,
169
- "single_word": false
170
- },
171
- {
172
- "content": "[break_5]",
173
- "lstrip": false,
174
- "normalized": false,
175
- "rstrip": false,
176
- "single_word": false
177
- },
178
- {
179
- "content": "[break_6]",
180
- "lstrip": false,
181
- "normalized": false,
182
- "rstrip": false,
183
- "single_word": false
184
- },
185
- {
186
- "content": "[break_7]",
187
- "lstrip": false,
188
- "normalized": false,
189
- "rstrip": false,
190
- "single_word": false
191
- },
192
- {
193
- "content": "[laugh_0]",
194
- "lstrip": false,
195
- "normalized": false,
196
- "rstrip": false,
197
- "single_word": false
198
- },
199
- {
200
- "content": "[laugh_1]",
201
- "lstrip": false,
202
- "normalized": false,
203
- "rstrip": false,
204
- "single_word": false
205
- },
206
- {
207
- "content": "[laugh_2]",
208
- "lstrip": false,
209
- "normalized": false,
210
- "rstrip": false,
211
- "single_word": false
212
- },
213
- {
214
- "content": "[oral_0]",
215
- "lstrip": false,
216
- "normalized": false,
217
- "rstrip": false,
218
- "single_word": false
219
- },
220
- {
221
- "content": "[oral_1]",
222
- "lstrip": false,
223
- "normalized": false,
224
- "rstrip": false,
225
- "single_word": false
226
- },
227
- {
228
- "content": "[oral_2]",
229
- "lstrip": false,
230
- "normalized": false,
231
- "rstrip": false,
232
- "single_word": false
233
- },
234
- {
235
- "content": "[oral_3]",
236
- "lstrip": false,
237
- "normalized": false,
238
- "rstrip": false,
239
- "single_word": false
240
- },
241
- {
242
- "content": "[oral_4]",
243
- "lstrip": false,
244
- "normalized": false,
245
- "rstrip": false,
246
- "single_word": false
247
- },
248
- {
249
- "content": "[oral_5]",
250
- "lstrip": false,
251
- "normalized": false,
252
- "rstrip": false,
253
- "single_word": false
254
- },
255
- {
256
- "content": "[oral_6]",
257
- "lstrip": false,
258
- "normalized": false,
259
- "rstrip": false,
260
- "single_word": false
261
- },
262
- {
263
- "content": "[oral_7]",
264
- "lstrip": false,
265
- "normalized": false,
266
- "rstrip": false,
267
- "single_word": false
268
- },
269
- {
270
- "content": "[oral_8]",
271
- "lstrip": false,
272
- "normalized": false,
273
- "rstrip": false,
274
- "single_word": false
275
- },
276
- {
277
- "content": "[oral_9]",
278
- "lstrip": false,
279
- "normalized": false,
280
- "rstrip": false,
281
- "single_word": false
282
- },
283
- {
284
- "content": "[speed_0]",
285
- "lstrip": false,
286
- "normalized": false,
287
- "rstrip": false,
288
- "single_word": false
289
- },
290
- {
291
- "content": "[speed_1]",
292
- "lstrip": false,
293
- "normalized": false,
294
- "rstrip": false,
295
- "single_word": false
296
- },
297
- {
298
- "content": "[speed_2]",
299
- "lstrip": false,
300
- "normalized": false,
301
- "rstrip": false,
302
- "single_word": false
303
- },
304
- {
305
- "content": "[speed_3]",
306
- "lstrip": false,
307
- "normalized": false,
308
- "rstrip": false,
309
- "single_word": false
310
- },
311
- {
312
- "content": "[speed_4]",
313
- "lstrip": false,
314
- "normalized": false,
315
- "rstrip": false,
316
- "single_word": false
317
- },
318
- {
319
- "content": "[speed_5]",
320
- "lstrip": false,
321
- "normalized": false,
322
- "rstrip": false,
323
- "single_word": false
324
- },
325
- {
326
- "content": "[speed_6]",
327
- "lstrip": false,
328
- "normalized": false,
329
- "rstrip": false,
330
- "single_word": false
331
- },
332
- {
333
- "content": "[speed_7]",
334
- "lstrip": false,
335
- "normalized": false,
336
- "rstrip": false,
337
- "single_word": false
338
- },
339
- {
340
- "content": "[speed_8]",
341
- "lstrip": false,
342
- "normalized": false,
343
- "rstrip": false,
344
- "single_word": false
345
- },
346
- {
347
- "content": "[speed_9]",
348
- "lstrip": false,
349
- "normalized": false,
350
- "rstrip": false,
351
- "single_word": false
352
- }
353
- ],
354
- "cls_token": {
355
- "content": "[CLS]",
356
- "lstrip": false,
357
- "normalized": false,
358
- "rstrip": false,
359
- "single_word": false
360
- },
361
- "mask_token": {
362
- "content": "[MASK]",
363
- "lstrip": false,
364
- "normalized": false,
365
- "rstrip": false,
366
- "single_word": false
367
- },
368
- "pad_token": {
369
- "content": "[PAD]",
370
- "lstrip": false,
371
- "normalized": false,
372
- "rstrip": false,
373
- "single_word": false
374
- },
375
- "sep_token": {
376
- "content": "[SEP]",
377
- "lstrip": false,
378
- "normalized": false,
379
- "rstrip": false,
380
- "single_word": false
381
- },
382
- "unk_token": {
383
- "content": "[UNK]",
384
- "lstrip": false,
385
- "normalized": false,
386
- "rstrip": false,
387
- "single_word": false
388
- }
389
- }
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
asset/tokenizer/tokenizer.json DELETED
The diff for this file is too large to render. See raw diff
 
asset/tokenizer/tokenizer_config.json DELETED
@@ -1,516 +0,0 @@
1
- {
2
- "added_tokens_decoder": {
3
- "0": {
4
- "content": "[PAD]",
5
- "lstrip": false,
6
- "normalized": false,
7
- "rstrip": false,
8
- "single_word": false,
9
- "special": true
10
- },
11
- "100": {
12
- "content": "[UNK]",
13
- "lstrip": false,
14
- "normalized": false,
15
- "rstrip": false,
16
- "single_word": false,
17
- "special": true
18
- },
19
- "101": {
20
- "content": "[CLS]",
21
- "lstrip": false,
22
- "normalized": false,
23
- "rstrip": false,
24
- "single_word": false,
25
- "special": true
26
- },
27
- "102": {
28
- "content": "[SEP]",
29
- "lstrip": false,
30
- "normalized": false,
31
- "rstrip": false,
32
- "single_word": false,
33
- "special": true
34
- },
35
- "103": {
36
- "content": "[MASK]",
37
- "lstrip": false,
38
- "normalized": false,
39
- "rstrip": false,
40
- "single_word": false,
41
- "special": true
42
- },
43
- "21128": {
44
- "content": "[Sasr]",
45
- "lstrip": false,
46
- "normalized": false,
47
- "rstrip": false,
48
- "single_word": false,
49
- "special": true
50
- },
51
- "21129": {
52
- "content": "[Pasr]",
53
- "lstrip": false,
54
- "normalized": false,
55
- "rstrip": false,
56
- "single_word": false,
57
- "special": true
58
- },
59
- "21130": {
60
- "content": "[Easr]",
61
- "lstrip": false,
62
- "normalized": false,
63
- "rstrip": false,
64
- "single_word": false,
65
- "special": true
66
- },
67
- "21131": {
68
- "content": "[Stts]",
69
- "lstrip": false,
70
- "normalized": false,
71
- "rstrip": false,
72
- "single_word": false,
73
- "special": true
74
- },
75
- "21132": {
76
- "content": "[Ptts]",
77
- "lstrip": false,
78
- "normalized": false,
79
- "rstrip": false,
80
- "single_word": false,
81
- "special": true
82
- },
83
- "21133": {
84
- "content": "[Etts]",
85
- "lstrip": false,
86
- "normalized": false,
87
- "rstrip": false,
88
- "single_word": false,
89
- "special": true
90
- },
91
- "21134": {
92
- "content": "[Sbreak]",
93
- "lstrip": false,
94
- "normalized": false,
95
- "rstrip": false,
96
- "single_word": false,
97
- "special": true
98
- },
99
- "21135": {
100
- "content": "[Pbreak]",
101
- "lstrip": false,
102
- "normalized": false,
103
- "rstrip": false,
104
- "single_word": false,
105
- "special": true
106
- },
107
- "21136": {
108
- "content": "[Ebreak]",
109
- "lstrip": false,
110
- "normalized": false,
111
- "rstrip": false,
112
- "single_word": false,
113
- "special": true
114
- },
115
- "21137": {
116
- "content": "[uv_break]",
117
- "lstrip": false,
118
- "normalized": false,
119
- "rstrip": false,
120
- "single_word": false,
121
- "special": true
122
- },
123
- "21138": {
124
- "content": "[v_break]",
125
- "lstrip": false,
126
- "normalized": false,
127
- "rstrip": false,
128
- "single_word": false,
129
- "special": true
130
- },
131
- "21139": {
132
- "content": "[lbreak]",
133
- "lstrip": false,
134
- "normalized": false,
135
- "rstrip": false,
136
- "single_word": false,
137
- "special": true
138
- },
139
- "21140": {
140
- "content": "[llbreak]",
141
- "lstrip": false,
142
- "normalized": false,
143
- "rstrip": false,
144
- "single_word": false,
145
- "special": true
146
- },
147
- "21141": {
148
- "content": "[undefine]",
149
- "lstrip": false,
150
- "normalized": false,
151
- "rstrip": false,
152
- "single_word": false,
153
- "special": true
154
- },
155
- "21142": {
156
- "content": "[laugh]",
157
- "lstrip": false,
158
- "normalized": false,
159
- "rstrip": false,
160
- "single_word": false,
161
- "special": true
162
- },
163
- "21143": {
164
- "content": "[spk_emb]",
165
- "lstrip": false,
166
- "normalized": false,
167
- "rstrip": false,
168
- "single_word": false,
169
- "special": true
170
- },
171
- "21144": {
172
- "content": "[empty_spk]",
173
- "lstrip": false,
174
- "normalized": false,
175
- "rstrip": false,
176
- "single_word": false,
177
- "special": true
178
- },
179
- "21145": {
180
- "content": "[music]",
181
- "lstrip": false,
182
- "normalized": false,
183
- "rstrip": false,
184
- "single_word": false,
185
- "special": true
186
- },
187
- "21146": {
188
- "content": "[pure]",
189
- "lstrip": false,
190
- "normalized": false,
191
- "rstrip": false,
192
- "single_word": false,
193
- "special": true
194
- },
195
- "21147": {
196
- "content": "[break_0]",
197
- "lstrip": false,
198
- "normalized": false,
199
- "rstrip": false,
200
- "single_word": false,
201
- "special": true
202
- },
203
- "21148": {
204
- "content": "[break_1]",
205
- "lstrip": false,
206
- "normalized": false,
207
- "rstrip": false,
208
- "single_word": false,
209
- "special": true
210
- },
211
- "21149": {
212
- "content": "[break_2]",
213
- "lstrip": false,
214
- "normalized": false,
215
- "rstrip": false,
216
- "single_word": false,
217
- "special": true
218
- },
219
- "21150": {
220
- "content": "[break_3]",
221
- "lstrip": false,
222
- "normalized": false,
223
- "rstrip": false,
224
- "single_word": false,
225
- "special": true
226
- },
227
- "21151": {
228
- "content": "[break_4]",
229
- "lstrip": false,
230
- "normalized": false,
231
- "rstrip": false,
232
- "single_word": false,
233
- "special": true
234
- },
235
- "21152": {
236
- "content": "[break_5]",
237
- "lstrip": false,
238
- "normalized": false,
239
- "rstrip": false,
240
- "single_word": false,
241
- "special": true
242
- },
243
- "21153": {
244
- "content": "[break_6]",
245
- "lstrip": false,
246
- "normalized": false,
247
- "rstrip": false,
248
- "single_word": false,
249
- "special": true
250
- },
251
- "21154": {
252
- "content": "[break_7]",
253
- "lstrip": false,
254
- "normalized": false,
255
- "rstrip": false,
256
- "single_word": false,
257
- "special": true
258
- },
259
- "21155": {
260
- "content": "[laugh_0]",
261
- "lstrip": false,
262
- "normalized": false,
263
- "rstrip": false,
264
- "single_word": false,
265
- "special": true
266
- },
267
- "21156": {
268
- "content": "[laugh_1]",
269
- "lstrip": false,
270
- "normalized": false,
271
- "rstrip": false,
272
- "single_word": false,
273
- "special": true
274
- },
275
- "21157": {
276
- "content": "[laugh_2]",
277
- "lstrip": false,
278
- "normalized": false,
279
- "rstrip": false,
280
- "single_word": false,
281
- "special": true
282
- },
283
- "21158": {
284
- "content": "[oral_0]",
285
- "lstrip": false,
286
- "normalized": false,
287
- "rstrip": false,
288
- "single_word": false,
289
- "special": true
290
- },
291
- "21159": {
292
- "content": "[oral_1]",
293
- "lstrip": false,
294
- "normalized": false,
295
- "rstrip": false,
296
- "single_word": false,
297
- "special": true
298
- },
299
- "21160": {
300
- "content": "[oral_2]",
301
- "lstrip": false,
302
- "normalized": false,
303
- "rstrip": false,
304
- "single_word": false,
305
- "special": true
306
- },
307
- "21161": {
308
- "content": "[oral_3]",
309
- "lstrip": false,
310
- "normalized": false,
311
- "rstrip": false,
312
- "single_word": false,
313
- "special": true
314
- },
315
- "21162": {
316
- "content": "[oral_4]",
317
- "lstrip": false,
318
- "normalized": false,
319
- "rstrip": false,
320
- "single_word": false,
321
- "special": true
322
- },
323
- "21163": {
324
- "content": "[oral_5]",
325
- "lstrip": false,
326
- "normalized": false,
327
- "rstrip": false,
328
- "single_word": false,
329
- "special": true
330
- },
331
- "21164": {
332
- "content": "[oral_6]",
333
- "lstrip": false,
334
- "normalized": false,
335
- "rstrip": false,
336
- "single_word": false,
337
- "special": true
338
- },
339
- "21165": {
340
- "content": "[oral_7]",
341
- "lstrip": false,
342
- "normalized": false,
343
- "rstrip": false,
344
- "single_word": false,
345
- "special": true
346
- },
347
- "21166": {
348
- "content": "[oral_8]",
349
- "lstrip": false,
350
- "normalized": false,
351
- "rstrip": false,
352
- "single_word": false,
353
- "special": true
354
- },
355
- "21167": {
356
- "content": "[oral_9]",
357
- "lstrip": false,
358
- "normalized": false,
359
- "rstrip": false,
360
- "single_word": false,
361
- "special": true
362
- },
363
- "21168": {
364
- "content": "[speed_0]",
365
- "lstrip": false,
366
- "normalized": false,
367
- "rstrip": false,
368
- "single_word": false,
369
- "special": true
370
- },
371
- "21169": {
372
- "content": "[speed_1]",
373
- "lstrip": false,
374
- "normalized": false,
375
- "rstrip": false,
376
- "single_word": false,
377
- "special": true
378
- },
379
- "21170": {
380
- "content": "[speed_2]",
381
- "lstrip": false,
382
- "normalized": false,
383
- "rstrip": false,
384
- "single_word": false,
385
- "special": true
386
- },
387
- "21171": {
388
- "content": "[speed_3]",
389
- "lstrip": false,
390
- "normalized": false,
391
- "rstrip": false,
392
- "single_word": false,
393
- "special": true
394
- },
395
- "21172": {
396
- "content": "[speed_4]",
397
- "lstrip": false,
398
- "normalized": false,
399
- "rstrip": false,
400
- "single_word": false,
401
- "special": true
402
- },
403
- "21173": {
404
- "content": "[speed_5]",
405
- "lstrip": false,
406
- "normalized": false,
407
- "rstrip": false,
408
- "single_word": false,
409
- "special": true
410
- },
411
- "21174": {
412
- "content": "[speed_6]",
413
- "lstrip": false,
414
- "normalized": false,
415
- "rstrip": false,
416
- "single_word": false,
417
- "special": true
418
- },
419
- "21175": {
420
- "content": "[speed_7]",
421
- "lstrip": false,
422
- "normalized": false,
423
- "rstrip": false,
424
- "single_word": false,
425
- "special": true
426
- },
427
- "21176": {
428
- "content": "[speed_8]",
429
- "lstrip": false,
430
- "normalized": false,
431
- "rstrip": false,
432
- "single_word": false,
433
- "special": true
434
- },
435
- "21177": {
436
- "content": "[speed_9]",
437
- "lstrip": false,
438
- "normalized": false,
439
- "rstrip": false,
440
- "single_word": false,
441
- "special": true
442
- }
443
- },
444
- "additional_special_tokens": [
445
- "[Sasr]",
446
- "[Pasr]",
447
- "[Easr]",
448
- "[Stts]",
449
- "[Ptts]",
450
- "[Etts]",
451
- "[Sbreak]",
452
- "[Pbreak]",
453
- "[Ebreak]",
454
- "[uv_break]",
455
- "[v_break]",
456
- "[lbreak]",
457
- "[llbreak]",
458
- "[undefine]",
459
- "[laugh]",
460
- "[spk_emb]",
461
- "[empty_spk]",
462
- "[music]",
463
- "[pure]",
464
- "[break_0]",
465
- "[break_1]",
466
- "[break_2]",
467
- "[break_3]",
468
- "[break_4]",
469
- "[break_5]",
470
- "[break_6]",
471
- "[break_7]",
472
- "[laugh_0]",
473
- "[laugh_1]",
474
- "[laugh_2]",
475
- "[oral_0]",
476
- "[oral_1]",
477
- "[oral_2]",
478
- "[oral_3]",
479
- "[oral_4]",
480
- "[oral_5]",
481
- "[oral_6]",
482
- "[oral_7]",
483
- "[oral_8]",
484
- "[oral_9]",
485
- "[speed_0]",
486
- "[speed_1]",
487
- "[speed_2]",
488
- "[speed_3]",
489
- "[speed_4]",
490
- "[speed_5]",
491
- "[speed_6]",
492
- "[speed_7]",
493
- "[speed_8]",
494
- "[speed_9]"
495
- ],
496
- "clean_up_tokenization_spaces": true,
497
- "cls_token": "[CLS]",
498
- "do_basic_tokenize": true,
499
- "do_lower_case": true,
500
- "mask_token": "[MASK]",
501
- "max_length": 256,
502
- "model_max_length": 1000000000000000019884624838656,
503
- "never_split": null,
504
- "pad_to_multiple_of": null,
505
- "pad_token": "[PAD]",
506
- "pad_token_type_id": 0,
507
- "padding_side": "right",
508
- "sep_token": "[SEP]",
509
- "stride": 0,
510
- "strip_accents": null,
511
- "tokenize_chinese_chars": true,
512
- "tokenizer_class": "BertTokenizer",
513
- "truncation_side": "right",
514
- "truncation_strategy": "longest_first",
515
- "unk_token": "[UNK]"
516
- }