rossevine committed on
Commit
62394b1
1 Parent(s): 40d6322

Upload tokenizer

Browse files
Files changed (3) hide show
  1. added_tokens.json +2 -3
  2. special_tokens_map.json +0 -7
  3. vocab.json +2 -0
added_tokens.json CHANGED
@@ -1,5 +1,4 @@
1
  {
2
- "</s>": 28,
3
- "<s>": 27,
4
- "[PAD]": 29
5
  }
 
1
  {
2
+ "</s>": 30,
3
+ "<s>": 29
 
4
  }
special_tokens_map.json CHANGED
@@ -13,13 +13,6 @@
13
  "normalized": true,
14
  "rstrip": false,
15
  "single_word": false
16
- },
17
- {
18
- "content": "[PAD]",
19
- "lstrip": false,
20
- "normalized": true,
21
- "rstrip": false,
22
- "single_word": false
23
  }
24
  ],
25
  "bos_token": "<s>",
 
13
  "normalized": true,
14
  "rstrip": false,
15
  "single_word": false
 
 
 
 
 
 
 
16
  }
17
  ],
18
  "bos_token": "<s>",
vocab.json CHANGED
@@ -1,4 +1,6 @@
1
  {
 
 
2
  "a": 1,
3
  "b": 2,
4
  "c": 3,
 
1
  {
2
+ "[PAD]": 28,
3
+ "[UNK]": 27,
4
  "a": 1,
5
  "b": 2,
6
  "c": 3,