Duplicate from schismaudio/scnet-base
Browse files
Co-authored-by: Zak Keown <zkeown@users.noreply.huggingface.co>
- .gitattributes +35 -0
- README.md +34 -0
- v1.0.0/SCNet_Base.mlmodelc/analytics/coremldata.bin +3 -0
- v1.0.0/SCNet_Base.mlmodelc/coremldata.bin +3 -0
- v1.0.0/SCNet_Base.mlmodelc/metadata.json +84 -0
- v1.0.0/SCNet_Base.mlmodelc/model.mil +0 -0
- v1.0.0/SCNet_Base.mlmodelc/weights/weight.bin +3 -0
- v1.0.0/SCNet_Base_metadata.json +24 -0
- v1.0.0/metadata.json +24 -0
.gitattributes
ADDED
|
@@ -0,0 +1,35 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
*.7z filter=lfs diff=lfs merge=lfs -text
|
| 2 |
+
*.arrow filter=lfs diff=lfs merge=lfs -text
|
| 3 |
+
*.bin filter=lfs diff=lfs merge=lfs -text
|
| 4 |
+
*.bz2 filter=lfs diff=lfs merge=lfs -text
|
| 5 |
+
*.ckpt filter=lfs diff=lfs merge=lfs -text
|
| 6 |
+
*.ftz filter=lfs diff=lfs merge=lfs -text
|
| 7 |
+
*.gz filter=lfs diff=lfs merge=lfs -text
|
| 8 |
+
*.h5 filter=lfs diff=lfs merge=lfs -text
|
| 9 |
+
*.joblib filter=lfs diff=lfs merge=lfs -text
|
| 10 |
+
*.lfs.* filter=lfs diff=lfs merge=lfs -text
|
| 11 |
+
*.mlmodel filter=lfs diff=lfs merge=lfs -text
|
| 12 |
+
*.model filter=lfs diff=lfs merge=lfs -text
|
| 13 |
+
*.msgpack filter=lfs diff=lfs merge=lfs -text
|
| 14 |
+
*.npy filter=lfs diff=lfs merge=lfs -text
|
| 15 |
+
*.npz filter=lfs diff=lfs merge=lfs -text
|
| 16 |
+
*.onnx filter=lfs diff=lfs merge=lfs -text
|
| 17 |
+
*.ot filter=lfs diff=lfs merge=lfs -text
|
| 18 |
+
*.parquet filter=lfs diff=lfs merge=lfs -text
|
| 19 |
+
*.pb filter=lfs diff=lfs merge=lfs -text
|
| 20 |
+
*.pickle filter=lfs diff=lfs merge=lfs -text
|
| 21 |
+
*.pkl filter=lfs diff=lfs merge=lfs -text
|
| 22 |
+
*.pt filter=lfs diff=lfs merge=lfs -text
|
| 23 |
+
*.pth filter=lfs diff=lfs merge=lfs -text
|
| 24 |
+
*.rar filter=lfs diff=lfs merge=lfs -text
|
| 25 |
+
*.safetensors filter=lfs diff=lfs merge=lfs -text
|
| 26 |
+
saved_model/**/* filter=lfs diff=lfs merge=lfs -text
|
| 27 |
+
*.tar.* filter=lfs diff=lfs merge=lfs -text
|
| 28 |
+
*.tar filter=lfs diff=lfs merge=lfs -text
|
| 29 |
+
*.tflite filter=lfs diff=lfs merge=lfs -text
|
| 30 |
+
*.tgz filter=lfs diff=lfs merge=lfs -text
|
| 31 |
+
*.wasm filter=lfs diff=lfs merge=lfs -text
|
| 32 |
+
*.xz filter=lfs diff=lfs merge=lfs -text
|
| 33 |
+
*.zip filter=lfs diff=lfs merge=lfs -text
|
| 34 |
+
*.zst filter=lfs diff=lfs merge=lfs -text
|
| 35 |
+
*tfevents* filter=lfs diff=lfs merge=lfs -text
|
README.md
ADDED
|
@@ -0,0 +1,34 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
---
|
| 2 |
+
tags:
|
| 3 |
+
- coreml
|
| 4 |
+
- audio
|
| 5 |
+
- music-source-separation
|
| 6 |
+
- schism
|
| 7 |
+
license: mit
|
| 8 |
+
---
|
| 9 |
+
|
| 10 |
+
# SCNet Base
|
| 11 |
+
|
| 12 |
+
CoreML model for the [Schism](https://github.com/zakkeown/Schism) audio separation framework.
|
| 13 |
+
|
| 14 |
+
SCNet Base (~10M parameters) for 4-stem separation (drums, bass, other, vocals).
|
| 15 |
+
|
| 16 |
+
## Details
|
| 17 |
+
|
| 18 |
+
| Property | Value |
|
| 19 |
+
|----------|-------|
|
| 20 |
+
| Expert IDs | scnet-base |
|
| 21 |
+
| Tasks | stemSeparation, vocalSeparation |
|
| 22 |
+
| Quality | medium |
|
| 23 |
+
| Est. RTF | 0.6 |
|
| 24 |
+
| Peak Memory | 1024 MB |
|
| 25 |
+
|
| 26 |
+
## Usage
|
| 27 |
+
|
| 28 |
+
Install to your local Schism model store:
|
| 29 |
+
|
| 30 |
+
```bash
|
| 31 |
+
schism models install scnet-base
|
| 32 |
+
```
|
| 33 |
+
|
| 34 |
+
Or manually place the model files in `~/.schism/models/scnet-base/v1.0.0/`.
|
v1.0.0/SCNet_Base.mlmodelc/analytics/coremldata.bin
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:b92a92964af1166f1d0f0e4178faa870bf40f71ee863b35df3f7ba9837497428
|
| 3 |
+
size 243
|
v1.0.0/SCNet_Base.mlmodelc/coremldata.bin
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:968b4fed2a6c1b045ed5139b19f77b63de99ce66cc14722180bbed8a30ac6641
|
| 3 |
+
size 385
|
v1.0.0/SCNet_Base.mlmodelc/metadata.json
ADDED
|
@@ -0,0 +1,84 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
[
|
| 2 |
+
{
|
| 3 |
+
"metadataOutputVersion" : "3.0",
|
| 4 |
+
"storagePrecision" : "Float32",
|
| 5 |
+
"outputSchema" : [
|
| 6 |
+
{
|
| 7 |
+
"hasShapeFlexibility" : "0",
|
| 8 |
+
"isOptional" : "0",
|
| 9 |
+
"dataType" : "Float32",
|
| 10 |
+
"formattedType" : "MultiArray (Float32 1 × 16 × 2049 × 476)",
|
| 11 |
+
"shortDescription" : "",
|
| 12 |
+
"shape" : "[1, 16, 2049, 476]",
|
| 13 |
+
"name" : "separated",
|
| 14 |
+
"type" : "MultiArray"
|
| 15 |
+
}
|
| 16 |
+
],
|
| 17 |
+
"modelParameters" : [
|
| 18 |
+
|
| 19 |
+
],
|
| 20 |
+
"specificationVersion" : 8,
|
| 21 |
+
"mlProgramOperationTypeHistogram" : {
|
| 22 |
+
"Ios17.square" : 48,
|
| 23 |
+
"Ios17.reshape" : 156,
|
| 24 |
+
"Ios16.reduceMean" : 96,
|
| 25 |
+
"Ios17.matmul" : 12,
|
| 26 |
+
"Ios17.transpose" : 84,
|
| 27 |
+
"Split" : 21,
|
| 28 |
+
"Ios17.convTranspose" : 9,
|
| 29 |
+
"Ios17.add" : 117,
|
| 30 |
+
"Ios16.sigmoid" : 21,
|
| 31 |
+
"Ios17.sliceByIndex" : 32,
|
| 32 |
+
"Tile" : 3,
|
| 33 |
+
"Pad" : 8,
|
| 34 |
+
"Ios17.gather" : 12,
|
| 35 |
+
"Ios17.batchNorm" : 12,
|
| 36 |
+
"Ios16.silu" : 18,
|
| 37 |
+
"Ios17.sqrt" : 48,
|
| 38 |
+
"Ios17.sub" : 51,
|
| 39 |
+
"Ios17.conv" : 69,
|
| 40 |
+
"Ios17.realDiv" : 48,
|
| 41 |
+
"Ios17.linear" : 12,
|
| 42 |
+
"Ios17.concat" : 15,
|
| 43 |
+
"Ios16.gelu" : 9,
|
| 44 |
+
"Ios17.lstm" : 12,
|
| 45 |
+
"Ios17.mul" : 72
|
| 46 |
+
},
|
| 47 |
+
"computePrecision" : "Mixed (Float32, Int32)",
|
| 48 |
+
"isUpdatable" : "0",
|
| 49 |
+
"stateSchema" : [
|
| 50 |
+
|
| 51 |
+
],
|
| 52 |
+
"availability" : {
|
| 53 |
+
"macOS" : "14.0",
|
| 54 |
+
"tvOS" : "17.0",
|
| 55 |
+
"visionOS" : "1.0",
|
| 56 |
+
"watchOS" : "10.0",
|
| 57 |
+
"iOS" : "17.0",
|
| 58 |
+
"macCatalyst" : "17.0"
|
| 59 |
+
},
|
| 60 |
+
"modelType" : {
|
| 61 |
+
"name" : "MLModelType_mlProgram"
|
| 62 |
+
},
|
| 63 |
+
"userDefinedMetadata" : {
|
| 64 |
+
"com.github.apple.coremltools.conversion_date" : "2026-02-05",
|
| 65 |
+
"com.github.apple.coremltools.source" : "torch==2.7.0",
|
| 66 |
+
"com.github.apple.coremltools.version" : "9.0",
|
| 67 |
+
"com.github.apple.coremltools.source_dialect" : "TorchScript"
|
| 68 |
+
},
|
| 69 |
+
"inputSchema" : [
|
| 70 |
+
{
|
| 71 |
+
"hasShapeFlexibility" : "0",
|
| 72 |
+
"isOptional" : "0",
|
| 73 |
+
"dataType" : "Float32",
|
| 74 |
+
"formattedType" : "MultiArray (Float32 1 × 4 × 2049 × 476)",
|
| 75 |
+
"shortDescription" : "",
|
| 76 |
+
"shape" : "[1, 4, 2049, 476]",
|
| 77 |
+
"name" : "spectrogram",
|
| 78 |
+
"type" : "MultiArray"
|
| 79 |
+
}
|
| 80 |
+
],
|
| 81 |
+
"generatedClassName" : "SCNet_Base",
|
| 82 |
+
"method" : "predict"
|
| 83 |
+
}
|
| 84 |
+
]
|
v1.0.0/SCNet_Base.mlmodelc/model.mil
ADDED
|
The diff for this file is too large to render.
See raw diff
|
|
|
v1.0.0/SCNet_Base.mlmodelc/weights/weight.bin
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:0d008b13e384c589ae7720924c9fb47802fdddeef23d4946e40f010ee0f11ef3
|
| 3 |
+
size 45230464
|
v1.0.0/SCNet_Base_metadata.json
ADDED
|
@@ -0,0 +1,24 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
{
|
| 2 |
+
"variant": "base",
|
| 3 |
+
"precision": "float32",
|
| 4 |
+
"n_sources": 4,
|
| 5 |
+
"sources": [
|
| 6 |
+
"drums",
|
| 7 |
+
"bass",
|
| 8 |
+
"other",
|
| 9 |
+
"vocals"
|
| 10 |
+
],
|
| 11 |
+
"frequency_bins": 2049,
|
| 12 |
+
"time_frames": 476,
|
| 13 |
+
"stft": {
|
| 14 |
+
"n_fft": 4096,
|
| 15 |
+
"hop_length": 1024,
|
| 16 |
+
"win_length": 4096,
|
| 17 |
+
"center": true,
|
| 18 |
+
"normalized": true
|
| 19 |
+
},
|
| 20 |
+
"input_channels": 4,
|
| 21 |
+
"output_channels": 16,
|
| 22 |
+
"chunk_samples": 485100,
|
| 23 |
+
"sample_rate": 44100
|
| 24 |
+
}
|
v1.0.0/metadata.json
ADDED
|
@@ -0,0 +1,24 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
{
|
| 2 |
+
"expertId": "scnet-base",
|
| 3 |
+
"name": "SCNet Base",
|
| 4 |
+
"version": "1.0.0",
|
| 5 |
+
"tasks": [
|
| 6 |
+
"stemSeparation",
|
| 7 |
+
"vocalSeparation"
|
| 8 |
+
],
|
| 9 |
+
"qualityTier": "medium",
|
| 10 |
+
"estimatedRTF": 0.6,
|
| 11 |
+
"peakMemoryMB": 1024,
|
| 12 |
+
"inputKind": "mix",
|
| 13 |
+
"outputKind": "stems",
|
| 14 |
+
"sourceRepo": "schismaudio/scnet-base",
|
| 15 |
+
"outputStems": [
|
| 16 |
+
"drums",
|
| 17 |
+
"bass",
|
| 18 |
+
"other",
|
| 19 |
+
"vocals"
|
| 20 |
+
],
|
| 21 |
+
"expertIds": [
|
| 22 |
+
"scnet-base"
|
| 23 |
+
]
|
| 24 |
+
}
|