| { |
| "_class_name": "CVVAEModel", |
| "_diffusers_version": "0.26.3", |
| "attn_resolutions": [], |
| "causal_decoder": false, |
| "causal_encoder": true, |
| "ch": 128, |
| "ch_mult": [ |
| 1, |
| 2, |
| 4, |
| 4 |
| ], |
| "decoder_attn_type": "spatial-temporal-xformer", |
| "double_z": true, |
| "dropout": 0.0, |
| "en_de_n_frames_a_time": 16, |
| "encoder_attn_type": "vanilla-xformers", |
| "half_3d": true, |
| "in_channels": 3, |
| "num_res_blocks": 2, |
| "num_video_frames": null, |
| "out_ch": 3, |
| "scaling_factor": 0.18215, |
| "force_upcast": true, |
| "reshape_x_dim_to_4": false, |
| "reshape_z_dim_to_4": false, |
| "spatial_n_compress": 8, |
| "tile_overlap_ratio": 0.2222, |
| "tile_spatial_size": 576, |
| "time_n_compress": 4, |
| "use_3d_conv": true, |
| "z_channels": 4 |
| } |
|
|