Automatic Speech Recognition
ONNX
Transformers.js
onnxruntime
qwen3_asr
text-generation
onnxruntime-web
asr
speech-recognition
robust-asr
quantized
int4
int8
matmulnbits
gptq
on-device
browser
web
qwen3
qwen3-asr
mega-asr
Instructions to use Reza2kn/mega-asr-onnx with libraries, inference providers, notebooks, and local apps. Follow these links to get started.
- Libraries
- Transformers.js
How to use Reza2kn/mega-asr-onnx with Transformers.js:
```js
// npm i @huggingface/transformers
import { pipeline } from '@huggingface/transformers';

// Allocate pipeline
const pipe = await pipeline('automatic-speech-recognition', 'Reza2kn/mega-asr-onnx');
```
| { | |
| "examples": { | |
| "noise": { | |
| "T_mel": 868 | |
| }, | |
| "far_field": { | |
| "T_mel": 592 | |
| }, | |
| "obstructed": { | |
| "T_mel": 880 | |
| }, | |
| "distortion": { | |
| "T_mel": 736 | |
| }, | |
| "recording": { | |
| "T_mel": 500 | |
| }, | |
| "echo": { | |
| "T_mel": 748 | |
| }, | |
| "dropout": { | |
| "T_mel": 668 | |
| }, | |
| "mixed": { | |
| "T_mel": 508 | |
| } | |
| }, | |
| "prompt_ids": [ | |
| 151644, | |
| 8948, | |
| 198, | |
| 151645, | |
| 198, | |
| 151644, | |
| 872, | |
| 198, | |
| 151669, | |
| 151676, | |
| 151670, | |
| 151645, | |
| 198, | |
| 151644, | |
| 77091, | |
| 198, | |
| 11528, | |
| 6364, | |
| 151704 | |
| ], | |
| "prompt_text": "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|audio_start|><|audio_pad|><|audio_end|><|im_end|>\n<|im_start|>assistant\nlanguage English<asr_text>", | |
| "audio_pad_id": 151676, | |
| "eos_token_id": 151645, | |
| "prompts": { | |
| "auto": { | |
| "text": "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|audio_start|><|audio_pad|><|audio_end|><|im_end|>\n<|im_start|>assistant\n", | |
| "ids": [ | |
| 151644, | |
| 8948, | |
| 198, | |
| 151645, | |
| 198, | |
| 151644, | |
| 872, | |
| 198, | |
| 151669, | |
| 151676, | |
| 151670, | |
| 151645, | |
| 198, | |
| 151644, | |
| 77091, | |
| 198 | |
| ] | |
| }, | |
| "english": { | |
| "text": "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|audio_start|><|audio_pad|><|audio_end|><|im_end|>\n<|im_start|>assistant\nlanguage English<asr_text>", | |
| "ids": [ | |
| 151644, | |
| 8948, | |
| 198, | |
| 151645, | |
| 198, | |
| 151644, | |
| 872, | |
| 198, | |
| 151669, | |
| 151676, | |
| 151670, | |
| 151645, | |
| 198, | |
| 151644, | |
| 77091, | |
| 198, | |
| 11528, | |
| 6364, | |
| 151704 | |
| ] | |
| }, | |
| "chinese": { | |
| "text": "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|audio_start|><|audio_pad|><|audio_end|><|im_end|>\n<|im_start|>assistant\nlanguage Chinese<asr_text>", | |
| "ids": [ | |
| 151644, | |
| 8948, | |
| 198, | |
| 151645, | |
| 198, | |
| 151644, | |
| 872, | |
| 198, | |
| 151669, | |
| 151676, | |
| 151670, | |
| 151645, | |
| 198, | |
| 151644, | |
| 77091, | |
| 198, | |
| 11528, | |
| 8453, | |
| 151704 | |
| ] | |
| }, | |
| "japanese": { | |
| "text": "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|audio_start|><|audio_pad|><|audio_end|><|im_end|>\n<|im_start|>assistant\nlanguage Japanese<asr_text>", | |
| "ids": [ | |
| 151644, | |
| 8948, | |
| 198, | |
| 151645, | |
| 198, | |
| 151644, | |
| 872, | |
| 198, | |
| 151669, | |
| 151676, | |
| 151670, | |
| 151645, | |
| 198, | |
| 151644, | |
| 77091, | |
| 198, | |
| 11528, | |
| 10769, | |
| 151704 | |
| ] | |
| }, | |
| "korean": { | |
| "text": "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|audio_start|><|audio_pad|><|audio_end|><|im_end|>\n<|im_start|>assistant\nlanguage Korean<asr_text>", | |
| "ids": [ | |
| 151644, | |
| 8948, | |
| 198, | |
| 151645, | |
| 198, | |
| 151644, | |
| 872, | |
| 198, | |
| 151669, | |
| 151676, | |
| 151670, | |
| 151645, | |
| 198, | |
| 151644, | |
| 77091, | |
| 198, | |
| 11528, | |
| 16134, | |
| 151704 | |
| ] | |
| } | |
| } | |
| } |