FrankTCH committed on
Commit
2f3ebda
1 Parent(s): 7772f28

Upload tokenizer

Browse files
Files changed (2) hide show
  1. added_tokens.json +2 -2
  2. vocab.json +17 -20
added_tokens.json CHANGED
@@ -1,4 +1,4 @@
1
  {
2
- "</s>": 38,
3
- "<s>": 37
4
  }
 
1
  {
2
+ "</s>": 35,
3
+ "<s>": 34
4
  }
vocab.json CHANGED
@@ -1,7 +1,7 @@
1
  {
2
  "tur": {
3
- "[PAD]": 36,
4
- "[UNK]": 35,
5
  "a": 1,
6
  "b": 2,
7
  "c": 3,
@@ -18,24 +18,21 @@
18
  "n": 14,
19
  "o": 15,
20
  "p": 16,
21
- "q": 17,
22
- "r": 18,
23
- "s": 19,
24
- "t": 20,
25
- "u": 21,
26
- "v": 22,
27
- "w": 23,
28
- "x": 24,
29
- "y": 25,
30
- "z": 26,
31
  "|": 0,
32
- "ç": 27,
33
- "ë": 28,
34
- "ö": 29,
35
- "ü": 30,
36
- "ğ": 31,
37
- "ı": 32,
38
- "ş": 33,
39
- "̇": 34
40
  }
41
  }
 
1
  {
2
  "tur": {
3
+ "[PAD]": 33,
4
+ "[UNK]": 32,
5
  "a": 1,
6
  "b": 2,
7
  "c": 3,
 
18
  "n": 14,
19
  "o": 15,
20
  "p": 16,
21
+ "r": 17,
22
+ "s": 18,
23
+ "t": 19,
24
+ "u": 20,
25
+ "v": 21,
26
+ "w": 22,
27
+ "y": 23,
28
+ "z": 24,
 
 
29
  "|": 0,
30
+ "ç": 25,
31
+ "ö": 26,
32
+ "ü": 27,
33
+ "ğ": 28,
34
+ "ı": 29,
35
+ "ş": 30,
36
+ "̇": 31
 
37
  }
38
  }