Publish architecture config + tokenizer + roadmap (weights pending v5p-128 pretrain)
88202f1 verified | { | |
| "add_bos_token": false, | |
| "add_eos_token": false, | |
| "added_tokens_decoder": {}, | |
| "bos_token": "<|bos|>", | |
| "clean_up_tokenization_spaces": false, | |
| "eos_token": "<|eos|>", | |
| "model_max_length": 131072, | |
| "pad_token": "<|pad|>", | |
| "tokenizer_class": "PreTrainedTokenizerFast", | |
| "unk_token": "<|unk|>", | |
| "chat_template": "{% for message in messages %}{{ '<|im_start|>' + message['role'] + '\\n' + message['content'] + '<|im_end|>' + '\\n' }}{% endfor %}{% if add_generation_prompt %}{{ '<|im_start|>assistant\\n' }}{% endif %}" | |
| } |