internlm2_5-7b-chat / tokenizer_config.json
ArthurZ's picture
ArthurZ HF Staff
Add converted tokenizer (no trust_remote_code needed)
f9afffb verified
Raw
History Blame
677 Bytes
{
  "auto_map": {
    "AutoTokenizer": [
      "tokenization_internlm2.InternLM2Tokenizer",
      "tokenization_internlm2_fast.InternLM2TokenizerFast"
    ]
  },
  "backend": "tokenizers",
  "bos_token": "<s>",
  "clean_up_tokenization_spaces": false,
  "decode_with_prefix_space": false,
  "eos_token": "</s>",
  "extra_special_tokens": [
    "<|im_start|>",
    "<|im_end|>",
    "<|action_start|>",
    "<|action_end|>",
    "<|interpreter|>",
    "<|plugin|>"
  ],
  "is_local": false,
  "model_max_length": 1000000000000000019884624838656,
  "pad_token": "</s>",
  "sp_model_kwargs": null,
  "tokenizer_class": "TokenizersBackend",
  "unk_id": 0,
  "unk_token": "<unk>"
}