multistral-tokenizer / tokenizer_config.json
damfle
mod: improve compression and remove garbage
a2385fe unverified
raw
history blame contribute delete
432 Bytes
{
"backend": "tokenizers",
"bos_token": "<|begin|>",
"eos_token": "<|return|>",
"extra_special_tokens": [
"<|start|>",
"<|channel|>",
"<|end|>",
"<|message|>",
"<|image|>",
"<|video|>",
"<|audio|>",
"<|call|>",
"<|constrain|>"
],
"model_max_length": 1000000000000000019884624838656,
"pad_token": "<|pad|>",
"tokenizer_class": "MultistralTokenizer",
"unk_token": "<|unknown|>"
}