Text-to-Video
Diffusers
Safetensors
English
efficient
mobile video generation
dit
pyramidal diffusion
File size: 1,026 Bytes
2eb1cd8
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
{
  "_class_name": "AsymmetricCausalVideoVAE",
  "_diffusers_version": "0.34.0.dev0",
  "decoder_num_features": [
    256,
    128,
    64,
    64
  ],
  "decoder_space_upscale": [
    true,
    true,
    true
  ],
  "decoder_time_upscale": [
    true,
    true,
    true
  ],
  "encoder_act_fn": "silu",
  "encoder_block_dropout": [
    0.0,
    0.0,
    0.0,
    0.0
  ],
  "encoder_block_out_channels": [
    128,
    256,
    512,
    512
  ],
  "encoder_down_block_types": [
    "DownEncoderBlockCausal3D",
    "DownEncoderBlockCausal3D",
    "DownEncoderBlockCausal3D",
    "DownEncoderBlockCausal3D"
  ],
  "encoder_in_channels": 3,
  "encoder_layers_per_block": [
    2,
    2,
    2,
    2
  ],
  "encoder_norm_num_groups": 32,
  "encoder_out_channels": 16,
  "encoder_spatial_down_sample": [
    true,
    true,
    true,
    false
  ],
  "encoder_temporal_down_sample": [
    true,
    true,
    true,
    false
  ],
  "sample_size": 256,
  "spatial_downsample_scale": 8,
  "temporal_downsample_scale": 8
}