Mahadev Ratheesh
committed on
Commit
•
feaf1a9
1
Parent(s):
9ea8a98
Upload tokenizer
Browse files
- tokenizer_config.json +0 -1
- vocab.json +1 -1
tokenizer_config.json
CHANGED
@@ -39,7 +39,6 @@
|
|
39 |
"eos_token": "</s>",
|
40 |
"model_max_length": 1000000000000000019884624838656,
|
41 |
"pad_token": "[PAD]",
|
42 |
-
"processor_class": "Wav2Vec2BertProcessor",
|
43 |
"replace_word_delimiter_char": " ",
|
44 |
"target_lang": null,
|
45 |
"tokenizer_class": "Wav2Vec2CTCTokenizer",
|
|
|
39 |
"eos_token": "</s>",
|
40 |
"model_max_length": 1000000000000000019884624838656,
|
41 |
"pad_token": "[PAD]",
|
|
|
42 |
"replace_word_delimiter_char": " ",
|
43 |
"target_lang": null,
|
44 |
"tokenizer_class": "Wav2Vec2CTCTokenizer",
|
vocab.json
CHANGED
@@ -1,7 +1,7 @@
|
|
1 |
{
|
2 |
-
" ": 0,
|
3 |
"[PAD]": 70,
|
4 |
"[UNK]": 69,
|
|
|
5 |
"ം": 1,
|
6 |
"ഃ": 2,
|
7 |
"അ": 3,
|
|
|
1 |
{
|
|
|
2 |
"[PAD]": 70,
|
3 |
"[UNK]": 69,
|
4 |
+
"|": 0,
|
5 |
"ം": 1,
|
6 |
"ഃ": 2,
|
7 |
"അ": 3,
|