phi3-spin-phi3-data / tokenizer_config.json
AmberYifan's picture
Training in progress, step 100
9990e81 verified
raw
history blame
743 Bytes
{
"_commit_hash": "69caae1f2acea34b26f535fecb1f2abb9a304695",
"_from_auto": true,
"added_tokens_decoder": {},
"auto_map": {
"AutoTokenizer": [
"tokenization_phi3_small.Phi3SmallTokenizer",
"tokenization_phi3_small.Phi3SmallTokenizer"
]
},
"bos_token": "<|endoftext|>",
"chat_template": "{{ bos_token }}{% for message in messages %}{{'<|' + message['role'] + '|>' + '\n' + message['content'] + '<|end|>\n' }}{% endfor %}{% if add_generation_prompt %}{{ '<|assistant|>\n' }}{% else %}{{ eos_token }}{% endif %}",
"clean_up_tokenization_spaces": true,
"eos_token": "<|endoftext|>",
"model_max_length": 8192,
"pad_token": "<|endoftext|>",
"revision": "main",
"tokenizer_class": "Phi3SmallTokenizer"
}