yuchenxie
/

ArlowGPT-Tokenizer

Model card Files Files and versions

ArlowGPT-Tokenizer / tokenizer_config.json

yuchenxie's picture

Upload ArlowGPT-Tokenizer

71ccf1e verified over 1 year ago

history blame contribute delete

1.06 kB

	{
	"tokenizer_class": "PreTrainedTokenizerFast",
	"name_or_path": "tokenizer.json",
	"model_max_length": 131072,
	"errors": "replace",
	"add_bos_token": false,
	"add_prefix_space": false,
	"clean_up_tokenization_spaces": false,
	"additional_special_tokens": [
	"<\|mask\|>"
	],
	"bos_token": "<\|startoftext\|>",
	"eos_token": "<\|endoftext\|>",
	"unk_token": "<\|unk\|>",
	"pad_token": "<\|pad\|>",
	"chat_template": "{%- if messages[0]['role'] == 'system' %}\n<\|im_start\|>system\nYou are ArlowGPT made by Yuchen Xie. You are a helpful assistant in which you respond to users query without neglecting.\n<\|im_end\|>\n{%- else %}\n<\|im_start\|>system\nYou are ArlowGPT made by Yuchen Xie. You are a helpful assistant in which you respond to users query without neglecting.\n<\|im_end\|>\n{%- endif %}\n\n{%- for message in messages %}\n {%- if message.role == 'user' %}\n<\|im_start\|>user\n{{ message.content }}\n<\|im_end\|>\n {%- elif message.role == 'assistant' %}\n<\|im_start\|>assistant\n{{ message.content }}\n<\|im_end\|>\n {%- endif %}\n{%- endfor %}"
	}