f77777 committed on
Commit
e63d13d
1 Parent(s): 946f19d

Upload tokenizer

Browse files
Files changed (2) hide show
  1. README.md +1 -1
  2. vocab.json +60 -60
README.md CHANGED
@@ -1,8 +1,8 @@
1
  ---
2
  license: apache-2.0
3
- base_model: facebook/wav2vec2-large-xlsr-53
4
  tags:
5
  - generated_from_trainer
 
6
  datasets:
7
  - common_voice_13_0
8
  model-index:
 
1
  ---
2
  license: apache-2.0
 
3
  tags:
4
  - generated_from_trainer
5
+ base_model: facebook/wav2vec2-large-xlsr-53
6
  datasets:
7
  - common_voice_13_0
8
  model-index:
vocab.json CHANGED
@@ -1,64 +1,64 @@
1
  {
2
  "[PAD]": 61,
3
  "[UNK]": 60,
4
- "|": 20,
5
- "ँ": 47,
6
- "ं": 34,
7
- "ः": 31,
8
- "अ": 9,
9
- "आ": 49,
10
- "इ": 50,
11
- "ई": 24,
12
- "उ": 58,
13
- "ऊ": 48,
14
- "ए": 17,
15
- "ओ": 38,
16
- "औ": 1,
17
- "क": 28,
18
- "ख": 26,
19
- "ग": 41,
20
- "घ": 51,
21
- "ङ": 15,
22
- "च": 35,
23
- "छ": 42,
24
- "ज": 25,
25
- "झ": 55,
26
- "ञ": 57,
27
- "ट": 8,
28
- "ठ": 11,
29
- "ड": 10,
30
- "ढ": 7,
31
- "ण": 16,
32
- "त": 21,
33
- "थ": 2,
34
- "द": 36,
35
- "ध": 39,
36
- "न": 30,
37
- "प": 56,
38
- "फ": 44,
39
- "ब": 13,
40
- "भ": 43,
41
- "म": 22,
42
- "य": 14,
43
- "र": 12,
44
- "ल": 6,
45
- "व": 46,
46
- "श": 40,
47
- "ष": 18,
48
- "स": 54,
49
- "ह": 4,
50
- "ा": 27,
51
- "ि": 29,
52
- "ी": 32,
53
- "ु": 59,
54
- "ू": 19,
55
- "ृ": 53,
56
- "े": 0,
57
- "ै": 37,
58
- "ो": 3,
59
- "ौ": 23,
60
- "्": 52,
61
- "।": 33,
62
- "–": 45,
63
- "’": 5
64
  }
 
1
  {
2
  "[PAD]": 61,
3
  "[UNK]": 60,
4
+ "|": 27,
5
+ "ँ": 11,
6
+ "ं": 22,
7
+ "ः": 29,
8
+ "अ": 6,
9
+ "आ": 44,
10
+ "इ": 26,
11
+ "ई": 34,
12
+ "उ": 23,
13
+ "ऊ": 19,
14
+ "ए": 4,
15
+ "ओ": 21,
16
+ "औ": 43,
17
+ "क": 58,
18
+ "ख": 17,
19
+ "ग": 12,
20
+ "घ": 52,
21
+ "ङ": 57,
22
+ "च": 32,
23
+ "छ": 33,
24
+ "ज": 59,
25
+ "झ": 2,
26
+ "ञ": 31,
27
+ "ट": 7,
28
+ "ठ": 1,
29
+ "ड": 30,
30
+ "ढ": 36,
31
+ "ण": 41,
32
+ "त": 37,
33
+ "थ": 47,
34
+ "द": 10,
35
+ "ध": 56,
36
+ "न": 46,
37
+ "प": 54,
38
+ "फ": 28,
39
+ "ब": 9,
40
+ "भ": 35,
41
+ "म": 48,
42
+ "य": 49,
43
+ "र": 3,
44
+ "ल": 8,
45
+ "व": 53,
46
+ "श": 51,
47
+ "ष": 0,
48
+ "स": 38,
49
+ "ह": 16,
50
+ "ा": 15,
51
+ "ि": 50,
52
+ "ी": 45,
53
+ "ु": 39,
54
+ "ू": 25,
55
+ "ृ": 20,
56
+ "े": 42,
57
+ "ै": 40,
58
+ "ो": 18,
59
+ "ौ": 5,
60
+ "्": 14,
61
+ "।": 13,
62
+ "–": 55,
63
+ "’": 24
64
  }