mandelakori committed on
Commit
1293aba
1 Parent(s): 1b9753b

Update tokenizer_config.json

Browse files
Files changed (1) hide show
  1. tokenizer_config.json +3 -13
tokenizer_config.json CHANGED
@@ -1,6 +1,4 @@
1
  {
2
- "add_bos_token": true,
3
- "add_eos_token": false,
4
  "added_tokens_decoder": {
5
  "0": {
6
  "content": "<unk>",
@@ -25,24 +23,15 @@
25
  "rstrip": false,
26
  "single_word": false,
27
  "special": true
28
- },
29
- "3": { // Add entry for the instruction token
30
- "content": "<instruction>",
31
- "lstrip": false,
32
- "normalized": false,
33
- "rstrip": false,
34
- "single_word": false,
35
- "special": true
36
  }
37
  },
38
  "additional_special_tokens": [
39
  "<unk>",
40
  "<s>",
41
- "</s>",
42
- "<instruction>" // Add the instruction token here
43
  ],
44
  "bos_token": "<s>",
45
- "chat_template": "{% for message in messages %}\n{% if message['role'] == 'user' %}\n{{ '\n' + message['content'] + eos_token }}\n{% elif message['role'] == 'system' %}\n{{ '\n' + message['content'] + eos_token }}\n{% elif message['role'] == 'assistant' %}\n{{ '\n' + message['content'] + eos_token }}\n{% endif %}\n{% if loop.last and add_generation_prompt %}\n{{ '' }}\n{% endif %}\n{% endfor %}",
46
  "clean_up_tokenization_spaces": false,
47
  "eos_token": "</s>",
48
  "legacy": true,
@@ -55,3 +44,4 @@
55
  "unk_token": "<unk>",
56
  "use_default_system_prompt": true
57
  }
 
 
1
  {
 
 
2
  "added_tokens_decoder": {
3
  "0": {
4
  "content": "<unk>",
 
23
  "rstrip": false,
24
  "single_word": false,
25
  "special": true
 
 
 
 
 
 
 
 
26
  }
27
  },
28
  "additional_special_tokens": [
29
  "<unk>",
30
  "<s>",
31
+ "</s>"
 
32
  ],
33
  "bos_token": "<s>",
34
+ "chat_template": "{% for message in messages %}\n{% if message['role'] == 'user' %}\n{{ '<|user|>\n' + message['content'] + eos_token }}\n{% elif message['role'] == 'system' %}\n{{ '<|system|>\n' + message['content'] + eos_token }}\n{% elif message['role'] == 'assistant' %}\n{{ '<|assistant|>\n' + message['content'] + eos_token }}\n{% endif %}\n{% if loop.last and add_generation_prompt %}\n{{ '<|assistant|>' }}\n{% endif %}\n{% endfor %}",
35
  "clean_up_tokenization_spaces": false,
36
  "eos_token": "</s>",
37
  "legacy": true,
 
44
  "unk_token": "<unk>",
45
  "use_default_system_prompt": true
46
  }
47
+