nextgencodex1 committed on
Commit
6112e2e
·
verified ·
1 Parent(s): 7b8d63a

Initial upload of kinyarwanda-ASR model

Browse files
.gitattributes CHANGED
@@ -33,3 +33,4 @@ saved_model/**/* filter=lfs diff=lfs merge=lfs -text
33
  *.zip filter=lfs diff=lfs merge=lfs -text
34
  *.zst filter=lfs diff=lfs merge=lfs -text
35
  *tfevents* filter=lfs diff=lfs merge=lfs -text
 
 
33
  *.zip filter=lfs diff=lfs merge=lfs -text
34
  *.zst filter=lfs diff=lfs merge=lfs -text
35
  *tfevents* filter=lfs diff=lfs merge=lfs -text
36
+ Mbaza-ASR-Afrivoice-660h/Mbaza-ASR-Afrivoice-660h.nemo filter=lfs diff=lfs merge=lfs -text
Mbaza-ASR-Afrivoice-660h/.gitattributes ADDED
@@ -0,0 +1,38 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ *.7z filter=lfs diff=lfs merge=lfs -text
2
+ *.arrow filter=lfs diff=lfs merge=lfs -text
3
+ *.bin filter=lfs diff=lfs merge=lfs -text
4
+ *.bz2 filter=lfs diff=lfs merge=lfs -text
5
+ *.ckpt filter=lfs diff=lfs merge=lfs -text
6
+ *.ftz filter=lfs diff=lfs merge=lfs -text
7
+ *.gz filter=lfs diff=lfs merge=lfs -text
8
+ *.h5 filter=lfs diff=lfs merge=lfs -text
9
+ *.joblib filter=lfs diff=lfs merge=lfs -text
10
+ *.lfs.* filter=lfs diff=lfs merge=lfs -text
11
+ *.mlmodel filter=lfs diff=lfs merge=lfs -text
12
+ *.model filter=lfs diff=lfs merge=lfs -text
13
+ *.msgpack filter=lfs diff=lfs merge=lfs -text
14
+ *.npy filter=lfs diff=lfs merge=lfs -text
15
+ *.npz filter=lfs diff=lfs merge=lfs -text
16
+ *.onnx filter=lfs diff=lfs merge=lfs -text
17
+ *.ot filter=lfs diff=lfs merge=lfs -text
18
+ *.parquet filter=lfs diff=lfs merge=lfs -text
19
+ *.pb filter=lfs diff=lfs merge=lfs -text
20
+ *.pickle filter=lfs diff=lfs merge=lfs -text
21
+ *.pkl filter=lfs diff=lfs merge=lfs -text
22
+ *.pt filter=lfs diff=lfs merge=lfs -text
23
+ *.pth filter=lfs diff=lfs merge=lfs -text
24
+ *.rar filter=lfs diff=lfs merge=lfs -text
25
+ *.safetensors filter=lfs diff=lfs merge=lfs -text
26
+ saved_model/**/* filter=lfs diff=lfs merge=lfs -text
27
+ *.tar.* filter=lfs diff=lfs merge=lfs -text
28
+ *.tar filter=lfs diff=lfs merge=lfs -text
29
+ *.tflite filter=lfs diff=lfs merge=lfs -text
30
+ *.tgz filter=lfs diff=lfs merge=lfs -text
31
+ *.wasm filter=lfs diff=lfs merge=lfs -text
32
+ *.xz filter=lfs diff=lfs merge=lfs -text
33
+ *.zip filter=lfs diff=lfs merge=lfs -text
34
+ *.zst filter=lfs diff=lfs merge=lfs -text
35
+ *tfevents* filter=lfs diff=lfs merge=lfs -text
36
+ Speech_To_Text_Finetuning.nemo filter=lfs diff=lfs merge=lfs -text
37
+ nemo_kin_pretrained_800h_retrained_tokenizer.nemo filter=lfs diff=lfs merge=lfs -text
38
+ Mbaza-ASR-Afrivoice-660h.nemo filter=lfs diff=lfs merge=lfs -text
Mbaza-ASR-Afrivoice-660h/Mbaza-ASR-Afrivoice-660h.nemo ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:fe4de5a3988e138d4b939bfa3a7cdacb511f2adec21821d78ff4886a22a68d95
3
+ size 486707200
Mbaza-ASR-Afrivoice-660h/README.md ADDED
@@ -0,0 +1,62 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ ---
2
+ language:
3
+ - rw
4
+ license: cc-by-4.0
5
+ library_name: nemo
6
+ datasets:
7
+ - DigitalUmuganda/Afrivoice_Kinyarwanda
8
+ thumbnail: null
9
+ tags:
10
+ - automatic-speech-recognition
11
+ - speech
12
+ - audio
13
+ - CTC
14
+ - Conformer
15
+ - NeMo
16
+ - pytorch
17
+
18
+ ---
19
+
20
+
21
+ ## Model Overview
22
+
23
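+ Mbaza-ASR-Afrivoice-660h is a Conformer-CTC automatic speech recognition (ASR) model, built with NVIDIA NeMo, that transcribes Kinyarwanda speech audio into text.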
24
+
25
+ ## Dependencies
26
+
27
+ To train, fine-tune or play with the model you will need to install [NVIDIA NeMo](https://github.com/NVIDIA/NeMo).
28
+
29
+ For inference just run:
30
+ ```
31
+ pip install "nemo_toolkit[all]"
32
+ ```
33
+
34
+ ## How to Use this Model
35
+
36
+ The model is available for use in the NeMo toolkit, and can be used as a pre-trained checkpoint for inference or for fine-tuning on another dataset.
37
+
38
+ ### Load the model weights
39
+
40
+ ```python
41
+ import nemo.collections.asr as nemo_asr
42
+ asr_model = nemo_asr.models.ASRModel.from_pretrained("DigitalUmuganda/Mbaza-ASR-Afrivoice-660h")
43
+ ```
44
+
45
+ ### Transcribing using Python
46
+
47
+ ```python
48
+ asr_model.transcribe(['<audio_sample>'])
49
+ ```
50
+
51
+ ### Transcribing many audio files
52
+
53
+ ```shell
54
+ python [NEMO_GIT_FOLDER]/examples/asr/transcribe_speech.py pretrained_name="DigitalUmuganda/Mbaza-ASR-Afrivoice-660h" audio_dir="<DIRECTORY CONTAINING AUDIO FILES>"
55
+ ```
56
+
57
+ ### Input
58
+
59
+ This model accepts 16 kHz (16000 Hz) mono-channel audio (WAV files) as input.
60
+
61
+
62
+