AksaraLLM-20B / tokenizer_config.json
Ezekiel999's picture
Publish architecture config + tokenizer + roadmap (weights pending v5p-128 pretrain)
88202f1 verified
raw
history blame contribute delete
534 Bytes
{
  "add_bos_token": false,
  "add_eos_token": false,
  "added_tokens_decoder": {},
  "bos_token": "<|bos|>",
  "clean_up_tokenization_spaces": false,
  "eos_token": "<|eos|>",
  "model_max_length": 131072,
  "pad_token": "<|pad|>",
  "tokenizer_class": "PreTrainedTokenizerFast",
  "unk_token": "<|unk|>",
  "chat_template": "{% for message in messages %}{{ '<|im_start|>' + message['role'] + '\\n' + message['content'] + '<|im_end|>' + '\\n' }}{% endfor %}{% if add_generation_prompt %}{{ '<|im_start|>assistant\\n' }}{% endif %}"
}