| |
|
|
| |
| |
| |
# NOTE(review): this view of the file has lost its indentation, so the
# parent/child relationship between keys is not visible here. Comments below
# that mention nesting are assumptions — TODO confirm against the real file.
#
# Composition list: three other configs are pulled in and `_self_` is listed
# last. Assuming this is a Hydra defaults list, that ordering means the values
# set in this file take precedence over the composed ones.
| defaults: |
| - musicgen/default |
| - /model: lm/musicgen_lm |
| - override /dset: audio/default |
| - _self_ |
|
|
# Names of the language-model variant and of the solver to use.
| lm_model: transformer_lm_magnet |
| solver: magnet |
|
|
# Autocast is enabled with float16 as the autocast dtype.
| autocast: true |
| autocast_dtype: float16 |
|
|
| |
| |
| |
| |
# Checkpoint reference for the compression model. How the `//pretrained/`
# prefix is resolved is not shown in this file.
# NOTE(review): `card` and `compression_model_framerate` further down
# presumably have to agree with this model — confirm.
| compression_model_checkpoint: //pretrained/facebook/encodec_32khz |
|
|
# Attention backend selected by name.
| efficient_attention_backend: xformers |
|
|
# Audio format: one channel at 32000 (presumably Hz — confirm).
| channels: 1 |
| sample_rate: 32000 |
|
|
# Enables the `deadlock` feature; what it does is defined outside this file.
| deadlock: |
| use: true |
|
|
# Data loading: batch size 192, with both weight-based and duration-based
# sampling switched off.
| dataset: |
| batch_size: 192 |
| sample_on_weight: false |
| sample_on_duration: false |
|
|
# Optimisation settings: 500 epochs, optimizer `dadam`, lr 1.
# NOTE(review): lr of 1 looks intentional for a D-Adaptation style optimizer,
# where lr acts as a multiplier — confirm.
# NOTE(review): `use`, `updates` and `device` presumably all belong to `ema` —
# TODO confirm nesting.
| optim: |
| epochs: 500 |
| optimizer: dadam |
| lr: 1 |
| ema: |
| use: true |
| updates: 10 |
| device: cuda |
|
|
# TensorBoard logging is turned on.
| logging: |
| log_tensorboard: true |
|
|
# Learning-rate schedule: `cosine`, with its parameters listed under the
# `cosine` key (warmup 4000, minimum ratio 0.0, cycle length 1.0).
# NOTE(review): the unit of `warmup` (steps vs. epochs) is not stated here.
| schedule: |
| lr_scheduler: cosine |
| cosine: |
| warmup: 4000 |
| lr_min_ratio: 0.0 |
| cycle_length: 1.0 |
|
|
# Codebook pattern: `parallel` modeling, with `empty_initial` set to -1 for it.
| codebooks_pattern: |
| modeling: parallel |
| parallel: |
| empty_initial: -1 |
| |
# Language-model settings. `causal` is false.
# NOTE(review): `span_len` appears here (-1) and again under `masking` (3);
# presumably they are separate keys under different parents — confirm which
# one the model actually reads.
| transformer_lm: |
| card: 2048 |
| causal: false |
| subcodes_context: 5 |
| compression_model_framerate: 50 |
| segment_duration: 0 |
| span_len: -1 |
|
|
# Masking settings: span length 3.
| masking: |
| span_len: 3 |
|
|
# Generation settings. Sampling is enabled with temp 3.0, top_k 0 and
# top_p 0.9; the cfg coefficient bounds are 1.0 and 10.0.
# NOTE(review): `decoding_steps` has four entries — presumably one per
# codebook; confirm against the compression model.
# NOTE(review): `samples` presumably sits beside `lm` under `generate`, with
# `prompted`/`unprompted` as its children — TODO confirm nesting.
| generate: |
| lm: |
| max_prompt_len: null |
| max_gen_len: null |
| remove_prompts: false |
| use_sampling: true |
| temp: 3.0 |
| top_k: 0 |
| top_p: 0.9 |
| max_cfg_coef: 10.0 |
| min_cfg_coef: 1.0 |
| decoding_steps: [60, 10, 10, 10] |
| anneal_temp: true |
| span_scoring: 'max' |
| span_arrangement: 'nonoverlap' |
| prompted_samples: false |
| samples: |
| prompted: false |
| unprompted: true |
|
|