niobures committed on
Commit
37d6450
·
verified ·
1 Parent(s): 91b64dd

VoiceFixer (code, dataset, models, paper)

Browse files
.gitattributes CHANGED
@@ -33,3 +33,6 @@ saved_model/**/* filter=lfs diff=lfs merge=lfs -text
33
  *.zip filter=lfs diff=lfs merge=lfs -text
34
  *.zst filter=lfs diff=lfs merge=lfs -text
35
  *tfevents* filter=lfs diff=lfs merge=lfs -text
 
 
 
 
33
  *.zip filter=lfs diff=lfs merge=lfs -text
34
  *.zst filter=lfs diff=lfs merge=lfs -text
35
  *tfevents* filter=lfs diff=lfs merge=lfs -text
36
+ code/VoxFilter-Downloads/releases/desktop-v1.1.6/VoxFilter-1.1.6-Windows.exe filter=lfs diff=lfs merge=lfs -text
37
+ code/VoxFilter-Downloads/releases/desktop-v1.1.6/VoxFilter-1.1.6-Windows.exe.blockmap filter=lfs diff=lfs merge=lfs -text
38
+ VoiceFixer.[[:space:]]Toward[[:space:]]General[[:space:]]Speech[[:space:]]Restoration[[:space:]]with[[:space:]]Neural[[:space:]]Vocoder.pdf filter=lfs diff=lfs merge=lfs -text
VoiceFixer. Toward General Speech Restoration with Neural Vocoder.pdf ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:891ea3d1dbe08ab404a100646e80ad45acb9752df6e013354ca0179ab855b43f
3
+ size 17557957
code/VoxFilter-Downloads/releases/desktop-v1.1.6/VoxFilter-1.1.6-Windows.exe ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:9ba3cf1afaeff5df2db0f21ac3031978774cea7b16168454f85bcf260e8aa797
3
+ size 125924856
code/VoxFilter-Downloads/releases/desktop-v1.1.6/VoxFilter-1.1.6-Windows.exe.blockmap ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:2d03292ebb4a67beee03578d742b2402a774a7f102e507de10c059b0d2b7edf0
3
+ size 130971
code/VoxFilter-Downloads/releases/desktop-v1.1.6/VoxFilter-Downloads-desktop-v1.1.6.zip ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:1d36ddeb45c5e892ad041f8757e37949a75b50e1446d03dd3a983bb7fca630c2
3
+ size 408
code/VoxFilter-Downloads/source.txt ADDED
@@ -0,0 +1 @@
 
 
1
+ https://github.com/herrychokshi-ops/VoxFilter-Downloads
code/voicefixer-add_cuda_option.zip ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:d6c507ee44e933ad32a4ba05046cd9e21026a8c8cb41418af73ceb10752d6407
3
+ size 2045035
code/voicefixer-command-line.zip ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:087c228dd1573808dcf4c9048f40a8568ed29753057a242c417d5b7995933f79
3
+ size 2044645
code/voicefixer-dev.zip ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:afc5abddb42a9d99b5b0161057a5e39bf7be1d70f094ef6064bc108dfe34e09e
3
+ size 2040498
code/voicefixer-haoheliu-patch-1.zip ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:7c2be04960148b21a3ebf6e721317728516ea1972b9c08a42848ad8b560614b4
3
+ size 2292045
code/voicefixer-windows_compability.zip ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:4c953415c9f5568f770e5511d858424b5d9bd43f532371670c08dbdcfb1b87af
3
+ size 2289639
code/voicefixer.zip ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:2c559c260f027d9525054e52853189a5adafb6e01c0c2362b573434f51c9ef5d
3
+ size 6363472
code/voicefixer_main.zip ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:99650597c8a5abe93bf07932f7e3944572c59b5822ce40849427c2b1dcb78c50
3
+ size 27366758
dataset/GSR_and_SSR_testsets.zip ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:2de0ff5b3349bc86e5e42a359921fb8cb5a0589675cd45e36059026eb0f13dea
3
+ size 2340507365
dataset/Train_and_test_set_RIR.zip ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:199c6588e6bce13d65be78cc3984d85882a4ce2516ef9f07a1bdef3d844a0494
3
+ size 2944848262
dataset/Train_set_noise.tar ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:4c13c93ac40a3ae0e48ff9e7dc9f4a3e290f4ff6010699ca195c19f74df4e802
3
+ size 3223799729
dataset/Train_set_speech.zip ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:58455f57382f221937cf2a3865f95995c1e88066770ef9518366f04bc4d2aeb9
3
+ size 5565208399
dataset/source.txt ADDED
@@ -0,0 +1 @@
 
 
1
+ https://zenodo.org/records/5546723
models/VoiceFixer/.gitattributes ADDED
@@ -0,0 +1,31 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ *.7z filter=lfs diff=lfs merge=lfs -text
2
+ *.arrow filter=lfs diff=lfs merge=lfs -text
3
+ *.bin filter=lfs diff=lfs merge=lfs -text
4
+ *.bz2 filter=lfs diff=lfs merge=lfs -text
5
+ *.ftz filter=lfs diff=lfs merge=lfs -text
6
+ *.gz filter=lfs diff=lfs merge=lfs -text
7
+ *.h5 filter=lfs diff=lfs merge=lfs -text
8
+ *.joblib filter=lfs diff=lfs merge=lfs -text
9
+ *.lfs.* filter=lfs diff=lfs merge=lfs -text
10
+ *.model filter=lfs diff=lfs merge=lfs -text
11
+ *.msgpack filter=lfs diff=lfs merge=lfs -text
12
+ *.npy filter=lfs diff=lfs merge=lfs -text
13
+ *.npz filter=lfs diff=lfs merge=lfs -text
14
+ *.onnx filter=lfs diff=lfs merge=lfs -text
15
+ *.ot filter=lfs diff=lfs merge=lfs -text
16
+ *.parquet filter=lfs diff=lfs merge=lfs -text
17
+ *.pb filter=lfs diff=lfs merge=lfs -text
18
+ *.pickle filter=lfs diff=lfs merge=lfs -text
19
+ *.pkl filter=lfs diff=lfs merge=lfs -text
20
+ *.pt filter=lfs diff=lfs merge=lfs -text
21
+ *.pth filter=lfs diff=lfs merge=lfs -text
22
+ *.rar filter=lfs diff=lfs merge=lfs -text
23
+ saved_model/**/* filter=lfs diff=lfs merge=lfs -text
24
+ *.tar.* filter=lfs diff=lfs merge=lfs -text
25
+ *.tflite filter=lfs diff=lfs merge=lfs -text
26
+ *.tgz filter=lfs diff=lfs merge=lfs -text
27
+ *.wasm filter=lfs diff=lfs merge=lfs -text
28
+ *.xz filter=lfs diff=lfs merge=lfs -text
29
+ *.zip filter=lfs diff=lfs merge=lfs -text
30
+ *.zst filter=lfs diff=lfs merge=lfs -text
31
+ *tfevents* filter=lfs diff=lfs merge=lfs -text
models/VoiceFixer/model.pth ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:748411b70089cadf34a6c11054f95f3a454e614af562c23b13a82f6cb413109f
3
+ size 489307071
models/VoiceFixer/source.txt ADDED
@@ -0,0 +1 @@
 
 
1
+ https://huggingface.co/huseinzol05/VoiceFixer
models/voicefixer-models/.gitattributes ADDED
@@ -0,0 +1,35 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ *.7z filter=lfs diff=lfs merge=lfs -text
2
+ *.arrow filter=lfs diff=lfs merge=lfs -text
3
+ *.bin filter=lfs diff=lfs merge=lfs -text
4
+ *.bz2 filter=lfs diff=lfs merge=lfs -text
5
+ *.ckpt filter=lfs diff=lfs merge=lfs -text
6
+ *.ftz filter=lfs diff=lfs merge=lfs -text
7
+ *.gz filter=lfs diff=lfs merge=lfs -text
8
+ *.h5 filter=lfs diff=lfs merge=lfs -text
9
+ *.joblib filter=lfs diff=lfs merge=lfs -text
10
+ *.lfs.* filter=lfs diff=lfs merge=lfs -text
11
+ *.mlmodel filter=lfs diff=lfs merge=lfs -text
12
+ *.model filter=lfs diff=lfs merge=lfs -text
13
+ *.msgpack filter=lfs diff=lfs merge=lfs -text
14
+ *.npy filter=lfs diff=lfs merge=lfs -text
15
+ *.npz filter=lfs diff=lfs merge=lfs -text
16
+ *.onnx filter=lfs diff=lfs merge=lfs -text
17
+ *.ot filter=lfs diff=lfs merge=lfs -text
18
+ *.parquet filter=lfs diff=lfs merge=lfs -text
19
+ *.pb filter=lfs diff=lfs merge=lfs -text
20
+ *.pickle filter=lfs diff=lfs merge=lfs -text
21
+ *.pkl filter=lfs diff=lfs merge=lfs -text
22
+ *.pt filter=lfs diff=lfs merge=lfs -text
23
+ *.pth filter=lfs diff=lfs merge=lfs -text
24
+ *.rar filter=lfs diff=lfs merge=lfs -text
25
+ *.safetensors filter=lfs diff=lfs merge=lfs -text
26
+ saved_model/**/* filter=lfs diff=lfs merge=lfs -text
27
+ *.tar.* filter=lfs diff=lfs merge=lfs -text
28
+ *.tar filter=lfs diff=lfs merge=lfs -text
29
+ *.tflite filter=lfs diff=lfs merge=lfs -text
30
+ *.tgz filter=lfs diff=lfs merge=lfs -text
31
+ *.wasm filter=lfs diff=lfs merge=lfs -text
32
+ *.xz filter=lfs diff=lfs merge=lfs -text
33
+ *.zip filter=lfs diff=lfs merge=lfs -text
34
+ *.zst filter=lfs diff=lfs merge=lfs -text
35
+ *tfevents* filter=lfs diff=lfs merge=lfs -text
models/voicefixer-models/README.md ADDED
@@ -0,0 +1,38 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ # VoiceFixer Models
2
+
3
+ Official VoiceFixer model checkpoints for speech restoration, mirrored for faster
4
+ downloads.
5
+
6
+ ## Why This Repository?
7
+
8
+ The official VoiceFixer models are hosted on Zenodo, which can have slow download
9
+ speeds. This repository mirrors the same official models on HuggingFace for:
10
+ - Faster downloads via HuggingFace CDN
11
+ - Better integration with HuggingFace-based projects
12
+ - Improved reliability and availability
13
+
14
+ ## Models Included
15
+
16
+ - `vf.ckpt` (466.6 MiB) - Analysis module for speech restoration
17
+ - `model.ckpt-1490000_trimed.pt` (129.3 MiB) - Vocoder module (44.1kHz)
18
+
19
+ ## Usage
20
+
21
+ These models are used by [TTS Audio Suite](https://github.com/diodiogod/TTS-Audio-Suite) for ComfyUI
22
+ audio restoration.
23
+
24
+ ## Attribution
25
+
26
+ Original models by Haohe Liu et al.
27
+
28
+ - **Paper**: [VoiceFixer: Toward General Speech
29
+ Restoration with Neural Vocoder](https://arxiv.org/abs/2109.13731)
30
+ - **GitHub**: https://github.com/haoheliu/voicefixer
31
+ - **Original Zenodo Release**: https://zenodo.org/record/5600188
32
+
33
+ ## License
34
+
35
+ CC-BY-4.0 (same as original release)
36
+
37
+ These models are identical to the official Zenodo release, mirrored here for
38
+ convenience.
models/voicefixer-models/model.ckpt-1490000_trimed.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:9410d0b528c10a251ae947bd299d1939b0b3247df680c81c4164e94f5d87dc45
3
+ size 135613039
models/voicefixer-models/source.txt ADDED
@@ -0,0 +1 @@
 
 
1
+ https://huggingface.co/Diogodiogod/voicefixer-models
models/voicefixer-models/vf.ckpt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:748411b70089cadf34a6c11054f95f3a454e614af562c23b13a82f6cb413109f
3
+ size 489307071