| { |
| "added_tokens_decoder": { |
| "2": { |
| "content": "tʰ", |
| "lstrip": true, |
| "normalized": false, |
| "rstrip": true, |
| "single_word": false, |
| "special": false |
| }, |
| "3": { |
| "content": "tɕ", |
| "lstrip": true, |
| "normalized": false, |
| "rstrip": true, |
| "single_word": false, |
| "special": false |
| }, |
| "4": { |
| "content": "tɕ*", |
| "lstrip": true, |
| "normalized": false, |
| "rstrip": true, |
| "single_word": false, |
| "special": false |
| }, |
| "5": { |
| "content": "tɕʰ", |
| "lstrip": true, |
| "normalized": false, |
| "rstrip": true, |
| "single_word": false, |
| "special": false |
| }, |
| "8": { |
| "content": "k*", |
| "lstrip": true, |
| "normalized": false, |
| "rstrip": true, |
| "single_word": false, |
| "special": false |
| }, |
| "9": { |
| "content": "kʰ", |
| "lstrip": true, |
| "normalized": false, |
| "rstrip": true, |
| "single_word": false, |
| "special": false |
| }, |
| "14": { |
| "content": "t*", |
| "lstrip": true, |
| "normalized": false, |
| "rstrip": true, |
| "single_word": false, |
| "special": false |
| }, |
| "15": { |
| "content": "p*", |
| "lstrip": true, |
| "normalized": false, |
| "rstrip": true, |
| "single_word": false, |
| "special": false |
| }, |
| "16": { |
| "content": "pʰ", |
| "lstrip": true, |
| "normalized": false, |
| "rstrip": true, |
| "single_word": false, |
| "special": false |
| }, |
| "18": { |
| "content": "s*", |
| "lstrip": true, |
| "normalized": false, |
| "rstrip": true, |
| "single_word": false, |
| "special": false |
| }, |
| "23": { |
| "content": "wɛ", |
| "lstrip": true, |
| "normalized": false, |
| "rstrip": true, |
| "single_word": false, |
| "special": false |
| }, |
| "27": { |
| "content": "ɰi", |
| "lstrip": true, |
| "normalized": false, |
| "rstrip": true, |
| "single_word": false, |
| "special": false |
| }, |
| "28": { |
| "content": "jo", |
| "lstrip": true, |
| "normalized": false, |
| "rstrip": true, |
| "single_word": false, |
| "special": false |
| }, |
| "29": { |
| "content": "ju", |
| "lstrip": true, |
| "normalized": false, |
| "rstrip": true, |
| "single_word": false, |
| "special": false |
| }, |
| "30": { |
| "content": "ja", |
| "lstrip": true, |
| "normalized": false, |
| "rstrip": true, |
| "single_word": false, |
| "special": false |
| }, |
| "31": { |
| "content": "jʌ", |
| "lstrip": true, |
| "normalized": false, |
| "rstrip": true, |
| "single_word": false, |
| "special": false |
| }, |
| "32": { |
| "content": "jɛ", |
| "lstrip": true, |
| "normalized": false, |
| "rstrip": true, |
| "single_word": false, |
| "special": false |
| }, |
| "33": { |
| "content": "wa", |
| "lstrip": true, |
| "normalized": false, |
| "rstrip": true, |
| "single_word": false, |
| "special": false |
| }, |
| "34": { |
| "content": "wʌ", |
| "lstrip": true, |
| "normalized": false, |
| "rstrip": true, |
| "single_word": false, |
| "special": false |
| }, |
| "35": { |
| "content": "wi", |
| "lstrip": true, |
| "normalized": false, |
| "rstrip": true, |
| "single_word": false, |
| "special": false |
| }, |
| "37": { |
| "content": "[UNK]", |
| "lstrip": true, |
| "normalized": false, |
| "rstrip": true, |
| "single_word": false, |
| "special": false |
| }, |
| "38": { |
| "content": "[PAD]", |
| "lstrip": true, |
| "normalized": false, |
| "rstrip": true, |
| "single_word": false, |
| "special": false |
| }, |
| "39": { |
| "content": "<s>", |
| "lstrip": false, |
| "normalized": false, |
| "rstrip": false, |
| "single_word": false, |
| "special": true |
| }, |
| "40": { |
| "content": "</s>", |
| "lstrip": false, |
| "normalized": false, |
| "rstrip": false, |
| "single_word": false, |
| "special": true |
| } |
| }, |
| "bos_token": "<s>", |
| "clean_up_tokenization_spaces": true, |
| "do_lower_case": false, |
| "do_normalize": true, |
| "eos_token": "</s>", |
| "model_max_length": 1000000000000000019884624838656, |
| "pad_token": "[PAD]", |
| "replace_word_delimiter_char": " ", |
| "return_attention_mask": false, |
| "target_lang": null, |
| "tokenizer_class": "Wav2Vec2CTCTokenizer", |
| "unk_token": "[UNK]", |
| "word_delimiter_token": "|" |
| } |
|
|