mega-asr-onnx / examples_mels /manifest.json
Reza2kn's picture
Update manifest: add forced-language prompts (default: English)
1566056 verified
{
"examples": {
"noise": {
"T_mel": 868
},
"far_field": {
"T_mel": 592
},
"obstructed": {
"T_mel": 880
},
"distortion": {
"T_mel": 736
},
"recording": {
"T_mel": 500
},
"echo": {
"T_mel": 748
},
"dropout": {
"T_mel": 668
},
"mixed": {
"T_mel": 508
}
},
"prompt_ids": [
151644,
8948,
198,
151645,
198,
151644,
872,
198,
151669,
151676,
151670,
151645,
198,
151644,
77091,
198,
11528,
6364,
151704
],
"prompt_text": "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|audio_start|><|audio_pad|><|audio_end|><|im_end|>\n<|im_start|>assistant\nlanguage English<asr_text>",
"audio_pad_id": 151676,
"eos_token_id": 151645,
"prompts": {
"auto": {
"text": "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|audio_start|><|audio_pad|><|audio_end|><|im_end|>\n<|im_start|>assistant\n",
"ids": [
151644,
8948,
198,
151645,
198,
151644,
872,
198,
151669,
151676,
151670,
151645,
198,
151644,
77091,
198
]
},
"english": {
"text": "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|audio_start|><|audio_pad|><|audio_end|><|im_end|>\n<|im_start|>assistant\nlanguage English<asr_text>",
"ids": [
151644,
8948,
198,
151645,
198,
151644,
872,
198,
151669,
151676,
151670,
151645,
198,
151644,
77091,
198,
11528,
6364,
151704
]
},
"chinese": {
"text": "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|audio_start|><|audio_pad|><|audio_end|><|im_end|>\n<|im_start|>assistant\nlanguage Chinese<asr_text>",
"ids": [
151644,
8948,
198,
151645,
198,
151644,
872,
198,
151669,
151676,
151670,
151645,
198,
151644,
77091,
198,
11528,
8453,
151704
]
},
"japanese": {
"text": "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|audio_start|><|audio_pad|><|audio_end|><|im_end|>\n<|im_start|>assistant\nlanguage Japanese<asr_text>",
"ids": [
151644,
8948,
198,
151645,
198,
151644,
872,
198,
151669,
151676,
151670,
151645,
198,
151644,
77091,
198,
11528,
10769,
151704
]
},
"korean": {
"text": "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|audio_start|><|audio_pad|><|audio_end|><|im_end|>\n<|im_start|>assistant\nlanguage Korean<asr_text>",
"ids": [
151644,
8948,
198,
151645,
198,
151644,
872,
198,
151669,
151676,
151670,
151645,
198,
151644,
77091,
198,
11528,
16134,
151704
]
}
}
}