Mahadev Ratheesh committed on
Commit
feaf1a9
1 Parent(s): 9ea8a98

Upload tokenizer

Browse files
Files changed (2) hide show
  1. tokenizer_config.json +0 -1
  2. vocab.json +1 -1
tokenizer_config.json CHANGED
@@ -39,7 +39,6 @@
39
  "eos_token": "</s>",
40
  "model_max_length": 1000000000000000019884624838656,
41
  "pad_token": "[PAD]",
42
- "processor_class": "Wav2Vec2BertProcessor",
43
  "replace_word_delimiter_char": " ",
44
  "target_lang": null,
45
  "tokenizer_class": "Wav2Vec2CTCTokenizer",
 
39
  "eos_token": "</s>",
40
  "model_max_length": 1000000000000000019884624838656,
41
  "pad_token": "[PAD]",
 
42
  "replace_word_delimiter_char": " ",
43
  "target_lang": null,
44
  "tokenizer_class": "Wav2Vec2CTCTokenizer",
vocab.json CHANGED
@@ -1,7 +1,7 @@
1
  {
2
- " ": 0,
3
  "[PAD]": 70,
4
  "[UNK]": 69,
 
5
  "ം": 1,
6
  "ഃ": 2,
7
  "അ": 3,
 
1
  {
 
2
  "[PAD]": 70,
3
  "[UNK]": 69,
4
+ "|": 0,
5
  "ം": 1,
6
  "ഃ": 2,
7
  "അ": 3,