Text-to-Video
Diffusers
Safetensors
English
efficient
mobile video generation
dit
pyramidal diffusion
karnewar committed on
Commit
2eb1cd8
·
verified ·
1 Parent(s): 3816384

causal-video-vae component added

Browse files
causal_video_vae/config.json ADDED
@@ -0,0 +1,63 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "_class_name": "AsymmetricCausalVideoVAE",
3
+ "_diffusers_version": "0.34.0.dev0",
4
+ "decoder_num_features": [
5
+ 256,
6
+ 128,
7
+ 64,
8
+ 64
9
+ ],
10
+ "decoder_space_upscale": [
11
+ true,
12
+ true,
13
+ true
14
+ ],
15
+ "decoder_time_upscale": [
16
+ true,
17
+ true,
18
+ true
19
+ ],
20
+ "encoder_act_fn": "silu",
21
+ "encoder_block_dropout": [
22
+ 0.0,
23
+ 0.0,
24
+ 0.0,
25
+ 0.0
26
+ ],
27
+ "encoder_block_out_channels": [
28
+ 128,
29
+ 256,
30
+ 512,
31
+ 512
32
+ ],
33
+ "encoder_down_block_types": [
34
+ "DownEncoderBlockCausal3D",
35
+ "DownEncoderBlockCausal3D",
36
+ "DownEncoderBlockCausal3D",
37
+ "DownEncoderBlockCausal3D"
38
+ ],
39
+ "encoder_in_channels": 3,
40
+ "encoder_layers_per_block": [
41
+ 2,
42
+ 2,
43
+ 2,
44
+ 2
45
+ ],
46
+ "encoder_norm_num_groups": 32,
47
+ "encoder_out_channels": 16,
48
+ "encoder_spatial_down_sample": [
49
+ true,
50
+ true,
51
+ true,
52
+ false
53
+ ],
54
+ "encoder_temporal_down_sample": [
55
+ true,
56
+ true,
57
+ true,
58
+ false
59
+ ],
60
+ "sample_size": 256,
61
+ "spatial_downsample_scale": 8,
62
+ "temporal_downsample_scale": 8
63
+ }
causal_video_vae/diffusion_pytorch_model.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:413f1e98fe0611bf78853acad28ca653ce2768577cfe9822420f4eafd3cb1cf1
3
+ size 239107038