| { |
| "model_type": "echo_tts", |
| "sample_rate": 44100, |
| "max_text_length": 768, |
| "max_speaker_latent_length": 6400, |
| "audio_downsample_factor": 2048, |
| "normalize_text": true, |
| "delete_blockwise_modules": false, |
| "pca_filename": "pca_state.safetensors", |
| "fish_codec_repo": "jordand/fish-s1-dac-min", |
| "model_path": "mlx_echo_tts_base", |
| "dit": { |
| "latent_size": 80, |
| "model_size": 2048, |
| "num_layers": 24, |
| "num_heads": 16, |
| "intermediate_size": 5888, |
| "norm_eps": 1e-05, |
| "text_vocab_size": 256, |
| "text_model_size": 1280, |
| "text_num_layers": 14, |
| "text_num_heads": 10, |
| "text_intermediate_size": 3328, |
| "speaker_patch_size": 4, |
| "speaker_model_size": 1280, |
| "speaker_num_layers": 14, |
| "speaker_num_heads": 10, |
| "speaker_intermediate_size": 3328, |
| "timestep_embed_size": 512, |
| "adaln_rank": 256 |
| }, |
| "sampler": { |
| "num_steps": 40, |
| "cfg_scale_text": 3.0, |
| "cfg_scale_speaker": 8.0, |
| "cfg_min_t": 0.5, |
| "cfg_max_t": 1.0, |
| "truncation_factor": null, |
| "rescale_k": null, |
| "rescale_sigma": null, |
| "speaker_kv_scale": null, |
| "speaker_kv_max_layers": null, |
| "speaker_kv_min_t": null, |
| "sequence_length": 640 |
| } |
| } |