Upload 2 files
Browse files
RSB_VE_05231038/config.yml
ADDED
|
@@ -0,0 +1,44 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
audio_length: 16000
|
| 2 |
+
batch_size: 16
|
| 3 |
+
bridge_type: VE
|
| 4 |
+
checkpoints_total_limit: 3
|
| 5 |
+
dataset: voicebank
|
| 6 |
+
datasets:
|
| 7 |
+
voicebank: /root/Voicebank+Demand
|
| 8 |
+
dummy: false
|
| 9 |
+
ema_rate: 0.999
|
| 10 |
+
evaluate_batch_size: 16
|
| 11 |
+
generative_backbone: ncsnpp_base
|
| 12 |
+
hop_length: 128
|
| 13 |
+
learning_rate: 0.0001
|
| 14 |
+
load_posterior_mean: true
|
| 15 |
+
log_steps: 10
|
| 16 |
+
log_with: wandb
|
| 17 |
+
loss_weight_type: constant
|
| 18 |
+
n_fft: 510
|
| 19 |
+
normalize_audio: true
|
| 20 |
+
num_epoch: 1000
|
| 21 |
+
num_frames: 256
|
| 22 |
+
num_steps: 163592
|
| 23 |
+
optimizer: Adam
|
| 24 |
+
output_path: /root/runs/RSB_VE_05231038
|
| 25 |
+
patience: 50
|
| 26 |
+
predictive_backbone: ncsnpp_base
|
| 27 |
+
reduction: sum
|
| 28 |
+
regulization_type: quadratic
|
| 29 |
+
resume: false
|
| 30 |
+
run_dir: /root/runs
|
| 31 |
+
run_id: rsb0523103830
|
| 32 |
+
run_name: RSB_VE_05231038
|
| 33 |
+
sample_rate: 16000
|
| 34 |
+
save_state_steps: 1000
|
| 35 |
+
seed: 10
|
| 36 |
+
spatial_channels: 1
|
| 37 |
+
spec_abs_exponent: 0.5
|
| 38 |
+
spec_factor: 0.33
|
| 39 |
+
t_max: 1
|
| 40 |
+
t_min: 0.0001
|
| 41 |
+
time_loss_weight: 0.001
|
| 42 |
+
training_method: regulization
|
| 43 |
+
training_target: data
|
| 44 |
+
window: sqrthann
|
RSB_VE_05231038/model.safetensors
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:3ec32096f76dd0f828bc22f4d3163f5b921eaf7d5b8d3b04073908328959dce4
|
| 3 |
+
size 111054536
|