# Model hyperparameter configuration: a single flat mapping of scalar
# settings plus two short lists (`patch`, `scheduler_sigmas`).
# NOTE(review): the notes below are inferred from key names and values only;
# confirm each against the code that consumes this file.

channels: 16
n_layers: 22
n_heads: 40
# NOTE(review): exactly half of n_heads; presumably key/value heads are
# shared between pairs of query heads. Confirm.
n_kv_heads: 20
d_model: 2560
mlp_ratio: 5
mlp_gradient_checkpointing: true
causal: true
n_buttons: 256

# NOTE(review): 256 == height * width (16 * 16). Confirm whether `patch`
# is applied before or after this token count is derived.
tokens_per_frame: 256
height: 16
width: 16
patch:
  - 2
  - 2
base_fps: 60

# Attention windowing and layout options.
local_window: 16
global_window: 128
global_pinned_dilation: 8
global_attn_period: 4
global_attn_offset: 0
value_residual: false
n_frames: 800
rope_impl: ortho
gated_attn: true

# Conditioning options. Both dropout values are 0.0 and both conditioning
# periods are 3 in this configuration.
noise_conditioning: wan
ctrl_conditioning: mlp_fusion
ctrl_cond_dropout: 0.0
ctrl_conditioning_period: 3
prompt_conditioning: cross_attention
prompt_cond_dropout: 0.0
prompt_embedding_dim: 2048
prompt_conditioning_period: 3
block_gradient_checkpointing: true

# Five sigma values in strictly decreasing order, from 1.0 down to 0.0.
scheduler_sigmas:
  - 1.0
  - 0.8609585762023926
  - 0.729332447052002
  - 0.3205108940601349
  - 0.0

# Quoted so the identifier is always read as a string.
# NOTE(review): looks like an "<organization>/<repository>" style
# identifier for an autoencoder; confirm how the loader resolves it.
ae_uri: "OpenWorldLabs/owl_vae_f16_c16_distill_v0_nogan"