Upload 4 files

Files changed (4) hide show

README.md CHANGED Viewed

@@ -1,3 +1,25 @@
----
-license: apache-2.0
----

+---
+license: apache-2.0
+language:
+  - zh
+tags:
+  - speaker-verification
+  - speaker-recognition
+  - speaker-embedding
+  - speech
+  - audio
+  - campplus
+pipeline_tag: audio-classification
+---
+# CAMPPlus Speaker Encoder
+This directory contains a local copy of the CAMPPlus speaker verification model, originally released through ModelScope / 3D-Speaker. The model is used to extract speaker embeddings from speech, while the original model architecture, weights, authorship, and license remain attributed to the original authors.
+The upstream 3D-Speaker project is released under the `Apache-2.0` license. When using, redistributing, or citing these files, please keep the original author information, model link, and license notice.
+Original links:
+- ModelScope: https://www.modelscope.cn/models/iic/speech_campplus_sv_zh-cn_16k-common
+- 3D-Speaker: https://github.com/modelscope/3D-Speaker
+- License: https://www.apache.org/licenses/LICENSE-2.0

campplus_cn_common.pt ADDED Viewed

+version https://git-lfs.github.com/spec/v1
+oid sha256:55ffb1a55d04bac4a9b7ed80497cb731909985c9b55d120fce04b851a697886c
+size 14173135

config.yaml ADDED Viewed

+# Example configuration showing how the model is set up.
+# Adjust the values below to suit your own requirements.
+# To print the register table:
+#     from funasr.register import tables
+#     tables.print()
+# network architecture
+model: CAMPPlus
+model_conf:
+    feat_dim: 80
+    embedding_size: 192
+    growth_rate: 32
+    bn_size: 4
+    init_channels: 128
+    config_str: 'batchnorm-relu'
+    memory_efficient: True
+    output_level: 'segment'
+# frontend related
+frontend: WavFrontend
+frontend_conf:
+    fs: 16000

configuration.json ADDED Viewed

+{
+    "framework": "pytorch",
+    "task": "speaker-verification",
+    "model_config": "config.yaml",
+    "model_file": "campplus_cn_common.pt",
+    "model": {
+        "type": "cam++-sv",
+        "model_config": {
+            "sample_rate": 16000,
+            "fbank_dim": 80,
+            "emb_size": 192
+        },
+        "pretrained_model": "campplus_cn_common.pt",
+        "yesOrno_thr": 0.31
+    },
+    "pipeline": {
+        "type": "speaker-verification"
+    },
+    "file_path_metas": {
+        "init_param":"campplus_cn_common.pt",
+        "config":"config.yaml"
+    }
+}