mlabonne
/

TwinLlama-3.1-8B-DPO

Text Generation

text-generation-inference

Inference Endpoints

Model card Files and versions Community

mlabonne committed on Oct 6

Commit

adc761e

•

1 Parent(s): d7cd5a8

Upload tokenizer

Files changed (3) hide show

special_tokens_map.json +1 -1
tokenizer.json +1 -1
tokenizer_config.json +7 -5

special_tokens_map.json CHANGED Viewed

@@ -7,7 +7,7 @@
     "single_word": false
   },
   "eos_token": {
-    "content": "<|im_end|>",
     "lstrip": false,
     "normalized": false,
     "rstrip": false,

     "single_word": false
   },
   "eos_token": {
+    "content": "<|end_of_text|>",
     "lstrip": false,
     "normalized": false,
     "rstrip": false,

tokenizer.json CHANGED Viewed

@@ -14,7 +14,7 @@
     },
     {
       "id": 128001,
-      "content": "<|im_end|>",
       "single_word": false,
       "lstrip": false,
       "rstrip": false,

     },
     {
       "id": 128001,
+      "content": "<|end_of_text|>",
       "single_word": false,
       "lstrip": false,
       "rstrip": false,

tokenizer_config.json CHANGED Viewed

@@ -9,7 +9,7 @@
       "special": true
     },
     "128001": {
-      "content": "<|im_end|>",
       "lstrip": false,
       "normalized": false,
       "rstrip": false,
@@ -2050,12 +2050,14 @@
     }
   },
   "bos_token": "<|begin_of_text|>",
-  "chat_template": "{% for message in messages %}{% if message['role'] == 'user' %}{{'<|im_start|>user\n' + message['content'] + '<|im_end|>\n'}}{% elif message['role'] == 'assistant' %}{{'<|im_start|>assistant\n' + message['content'] + '<|im_end|>\n' }}{% else %}{{ '<|im_start|>system\n' + message['content'] + '<|im_end|>\n' }}{% endif %}{% endfor %}{% if add_generation_prompt %}{{ '<|im_start|>assistant\n' }}{% endif %}",
   "clean_up_tokenization_spaces": true,
-  "eos_token": "<|im_end|>",
   "model_max_length": 131072,
   "pad_token": "<|finetune_right_pad_id|>",
   "padding_side": "left",
-  "tokenizer_class": "PreTrainedTokenizerFast",
-  "unk_token": null
 }

       "special": true
     },
     "128001": {
+      "content": "<|end_of_text|>",
       "lstrip": false,
       "normalized": false,
       "rstrip": false,
     }
   },
   "bos_token": "<|begin_of_text|>",
   "clean_up_tokenization_spaces": true,
+  "eos_token": "<|end_of_text|>",
+  "model_input_names": [
+    "input_ids",
+    "attention_mask"
+  ],
   "model_max_length": 131072,
   "pad_token": "<|finetune_right_pad_id|>",
   "padding_side": "left",
+  "tokenizer_class": "PreTrainedTokenizerFast"
 }