TaurenMountain
/

FormalASR-1.7B

Safetensors

qwen3_asr

Model card · Files and versions

xet

Community

Wendy9805 committed 2 days ago

Commit

6f0d3ac

verified ·

1 Parent(s): 041de5d

Upload README.md with huggingface_hub

Browse files

Files changed (1) hide show

README.md +27 -35

README.md CHANGED Viewed

@@ -37,33 +37,31 @@ FormalASR-1.7B is a fine-tuned ASR (Automatic Speech Recognition) model based on
 ## Usage
 ### HuggingFace
 ```python
 import torch
-from transformers import AutoProcessor, AutoModelForSpeechSeq2Seq
-model_id = "TaurenMountain/FormalASR-1.7B"
-processor = AutoProcessor.from_pretrained(model_id)
-model = AutoModelForSpeechSeq2Seq.from_pretrained(
-    model_id,
-    torch_dtype=torch.bfloat16,
-    device_map="auto"
 )
-# Load audio (16kHz, mono)
-import librosa
-audio, sr = librosa.load("your_audio.wav", sr=16000)
-inputs = processor(audio, sampling_rate=16000, return_tensors="pt")
-inputs = {k: v.to(model.device) for k, v in inputs.items()}
-with torch.no_grad():
-    generated_ids = model.generate(**inputs)
-transcription = processor.batch_decode(generated_ids, skip_special_tokens=True)[0]
-print(transcription)
 ```
 ### 魔搭社区（ModelScope）
@@ -71,30 +69,24 @@ print(transcription)
 ```python
 import torch
 from modelscope import snapshot_download
-from transformers import AutoProcessor, AutoModelForSpeechSeq2Seq
 # 下载模型到本地（首次运行自动下载）
 model_dir = snapshot_download("TaurenMountain/FormalASR-1.7B")
-processor = AutoProcessor.from_pretrained(model_dir)
-model = AutoModelForSpeechSeq2Seq.from_pretrained(
     model_dir,
-    torch_dtype=torch.bfloat16,
-    device_map="auto"
 )
-# Load audio (16kHz, mono)
-import librosa
-audio, sr = librosa.load("your_audio.wav", sr=16000)
-inputs = processor(audio, sampling_rate=16000, return_tensors="pt")
-inputs = {k: v.to(model.device) for k, v in inputs.items()}
-with torch.no_grad():
-    generated_ids = model.generate(**inputs)
-transcription = processor.batch_decode(generated_ids, skip_special_tokens=True)[0]
-print(transcription)
 ```
 ## Training Details

 ## Usage
+### Installation
+```bash
+pip install -U qwen-asr
+```
 ### HuggingFace
 ```python
 import torch
+from qwen_asr import Qwen3ASRModel
+model = Qwen3ASRModel.from_pretrained(
+    "TaurenMountain/FormalASR-1.7B",
+    dtype=torch.bfloat16,
+    device_map="cuda:0",
+    max_new_tokens=512,
 )
+results = model.transcribe(
+    audio="your_audio.wav",
+    language="Chinese",
+)
+print(results[0].text)
 ```
 ### 魔搭社区（ModelScope）
 ```python
 import torch
 from modelscope import snapshot_download
+from qwen_asr import Qwen3ASRModel
 # 下载模型到本地（首次运行自动下载）
 model_dir = snapshot_download("TaurenMountain/FormalASR-1.7B")
+model = Qwen3ASRModel.from_pretrained(
     model_dir,
+    dtype=torch.bfloat16,
+    device_map="cuda:0",
+    max_new_tokens=512,
 )
+results = model.transcribe(
+    audio="your_audio.wav",
+    language="Chinese",
+)
+print(results[0].text)
 ```
 ## Training Details