| { |
| "_class_name": "AutoencoderKLWan", |
| "_diffusers_version": "0.35.0.dev0", |
| "attn_scales": [], |
| "base_dim": 160, |
| "clip_output": false, |
| "decoder_base_dim": 256, |
| "dim_mult": [ |
| 1, |
| 2, |
| 4, |
| 4 |
| ], |
| "dropout": 0.0, |
| "in_channels": 12, |
| "is_residual": true, |
| "latents_mean": [ |
| -0.2289, |
| -0.0052, |
| -0.1323, |
| -0.2339, |
| -0.2799, |
| 0.0174, |
| 0.1838, |
| 0.1557, |
| -0.1382, |
| 0.0542, |
| 0.2813, |
| 0.0891, |
| 0.157, |
| -0.0098, |
| 0.0375, |
| -0.1825, |
| -0.2246, |
| -0.1207, |
| -0.0698, |
| 0.5109, |
| 0.2665, |
| -0.2108, |
| -0.2158, |
| 0.2502, |
| -0.2055, |
| -0.0322, |
| 0.1109, |
| 0.1567, |
| -0.0729, |
| 0.0899, |
| -0.2799, |
| -0.123, |
| -0.0313, |
| -0.1649, |
| 0.0117, |
| 0.0723, |
| -0.2839, |
| -0.2083, |
| -0.052, |
| 0.3748, |
| 0.0152, |
| 0.1957, |
| 0.1433, |
| -0.2944, |
| 0.3573, |
| -0.0548, |
| -0.1681, |
| -0.0667 |
| ], |
| "latents_std": [ |
| 0.4765, |
| 1.0364, |
| 0.4514, |
| 1.1677, |
| 0.5313, |
| 0.499, |
| 0.4818, |
| 0.5013, |
| 0.8158, |
| 1.0344, |
| 0.5894, |
| 1.0901, |
| 0.6885, |
| 0.6165, |
| 0.8454, |
| 0.4978, |
| 0.5759, |
| 0.3523, |
| 0.7135, |
| 0.6804, |
| 0.5833, |
| 1.4146, |
| 0.8986, |
| 0.5659, |
| 0.7069, |
| 0.5338, |
| 0.4889, |
| 0.4917, |
| 0.4069, |
| 0.4999, |
| 0.6866, |
| 0.4093, |
| 0.5709, |
| 0.6065, |
| 0.6415, |
| 0.4944, |
| 0.5726, |
| 1.2042, |
| 0.5458, |
| 1.6887, |
| 0.3971, |
| 1.06, |
| 0.3943, |
| 0.5537, |
| 0.5444, |
| 0.4089, |
| 0.7468, |
| 0.7744 |
| ], |
| "num_res_blocks": 2, |
| "out_channels": 12, |
| "patch_size": 2, |
| "scale_factor_spatial": 16, |
| "scale_factor_temporal": 4, |
| "temperal_downsample": [ |
| false, |
| true, |
| true |
| ], |
| "z_dim": 48 |
| } |
|
|