drbaph committed on
Commit
20305c0
·
verified ·
1 Parent(s): d3614d9

Upload 12 files

Browse files
TextConditionerA/config.yaml ADDED
@@ -0,0 +1,22 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ exclude_from_checkpoint: false
2
+ trainable: false
3
+ sentence_config:
4
+ frozen: false
5
+ model: roberta-large
6
+ max_sentence_tokens: 77
7
+ adopt_n_layers: 0
8
+ adopt_layer_size: 2048
9
+ pool_type: eos
10
+ add_pooling_layer: true
11
+ hidden_dropout_prob: 0.1
12
+ attention_probs_dropout_prob: 0.1
13
+ finetune_n_layers: -1
14
+ last_hidden_state: true
15
+ use_shared_space: false
16
+ normalize_shared_space: true
17
+ freeze_clap: true
18
+ lhs_index: -2
19
+ remove_special_tokens: false
20
+ eval_mode: true
21
+ text_preprocessing: no_op
22
+ shared_representation_size: 1024
TextConditionerA/weights.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:9f66e1877efd49e3198068ffac74d00a84df18e53189643373e2e777224856bb
3
+ size 1425689504
TextConditionerV/config.yaml ADDED
@@ -0,0 +1,22 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ exclude_from_checkpoint: false
2
+ trainable: false
3
+ sentence_config:
4
+ frozen: false
5
+ model: roberta-large
6
+ max_sentence_tokens: 77
7
+ adopt_n_layers: 0
8
+ adopt_layer_size: 2048
9
+ pool_type: eos
10
+ add_pooling_layer: true
11
+ hidden_dropout_prob: 0.1
12
+ attention_probs_dropout_prob: 0.1
13
+ finetune_n_layers: -1
14
+ last_hidden_state: true
15
+ use_shared_space: false
16
+ normalize_shared_space: true
17
+ freeze_clap: true
18
+ lhs_index: -2
19
+ remove_special_tokens: false
20
+ eval_mode: true
21
+ text_preprocessing: no_op
22
+ shared_representation_size: 1024
TextConditionerV/weights.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:b0dd912c322582cb95531de69cf1472c90752e468087a3b0fc461dea49975e80
3
+ size 1425689504
Woosh-DFlow/config.yaml ADDED
@@ -0,0 +1,51 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ exclude_from_checkpoint: false
2
+ trainable: true
3
+ ldm:
4
+ exclude_from_checkpoint: false
5
+ trainable: true
6
+ model_type: LatentDiffusionModel
7
+ dit:
8
+ model_type: mmmssflux
9
+ rope_len_multiplier: 2
10
+ max_description_length: 77
11
+ max_seq_len: 501
12
+ dim: 1024
13
+ inter_dim: 4096
14
+ fixed_timestep_features: false
15
+ timestep_features_dim: 256
16
+ n_layers: 12
17
+ n_heads: 8
18
+ n_multimodal_layers: 6
19
+ qk_nope_head_dim: 16
20
+ qk_rope_head_dim: 112
21
+ qkv_head_dim: 128
22
+ n_memory_tokens_rope: 1
23
+ n_memory_tokens_description: 0
24
+ original_seq_len: 501
25
+ rope_theta: 10000.0
26
+ rope_factor: 40.0
27
+ beta_fast: 32
28
+ beta_slow: 1
29
+ io_channels: 128
30
+ cond_token_dim: 1024
31
+ adaln_last_layer: true
32
+ adaln_last_layer_nomod: false
33
+ non_checkpoint_layers: 14
34
+ mask_out_before: -1
35
+ estimate_logvar: true
36
+ no_description_mask: true
37
+ symmetric_attention_init: false
38
+ patch_size: 1
39
+ num_sinks: 0
40
+ mlp_act: gelu
41
+ conditioners:
42
+ text:
43
+ exclude_from_checkpoint: true
44
+ trainable: false
45
+ path: checkpoints/TextConditionerA
46
+ autoencoder:
47
+ exclude_from_checkpoint: true
48
+ trainable: false
49
+ path: checkpoints/Woosh-AE
50
+ sigma_data: 1.0
51
+ pred_type: v_pred
Woosh-DFlow/weights.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:c9fc4a2220fa4ba54e01611afe58e061854a58ad559eb56de2cca39112f7c8ef
3
+ size 1378890620
Woosh-DVFlow-8s/config.yaml ADDED
@@ -0,0 +1,64 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ exclude_from_checkpoint: false
2
+ trainable: true
3
+ pretrained_model_type: videokontext
4
+ ldm:
5
+ exclude_from_checkpoint: false
6
+ trainable: true
7
+ model_type: VideoKontextLDM
8
+ ldm:
9
+ exclude_from_checkpoint: false
10
+ trainable: true
11
+ dit:
12
+ model_type: mmmssflux
13
+ max_description_length: 77
14
+ max_seq_len: 501
15
+ rope_len_multiplier: 2
16
+ dim: 1024
17
+ inter_dim: 4096
18
+ fixed_timestep_features: false
19
+ timestep_features_dim: 256
20
+ n_layers: 12
21
+ n_heads: 8
22
+ n_multimodal_layers: 6
23
+ qk_nope_head_dim: 16
24
+ qk_rope_head_dim: 112
25
+ qkv_head_dim: 128
26
+ n_memory_tokens_rope: 1
27
+ n_memory_tokens_description: 0
28
+ original_seq_len: 501
29
+ rope_theta: 10000.0
30
+ rope_factor: 40.0
31
+ beta_fast: 32
32
+ beta_slow: 1
33
+ io_channels: 128
34
+ cond_token_dim: 1024
35
+ adaln_last_layer: true
36
+ adaln_last_layer_nomod: false
37
+ non_checkpoint_layers: 14
38
+ mask_out_before: -1
39
+ estimate_logvar: true
40
+ no_description_mask: true
41
+ symmetric_attention_init: false
42
+ patch_size: 1
43
+ num_sinks: 0
44
+ mlp_act: gelu
45
+ conditioners:
46
+ text:
47
+ exclude_from_checkpoint: true
48
+ trainable: false
49
+ path: checkpoints/TextConditionerV
50
+ autoencoder:
51
+ exclude_from_checkpoint: true
52
+ trainable: false
53
+ path: checkpoints/Woosh-AE
54
+ sigma_data: 1.0
55
+ pred_type: v_pred
56
+ audio_fps: 100
57
+ video_fps: 24
58
+ embed_dim: 768
59
+ embed_key: synch_out
60
+ pts_seconds_key: synch_pts_seconds
61
+ non_checkpoint_layers: 14
62
+ n_layers_encoder: 0
63
+ trainable_no_cond: false
64
+ use_batch_mask: true
Woosh-DVFlow-8s/weights.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:c87b796798fd96a4a3b1deeb70ccd05c6dc782fe546b622ce1368a05e441cd30
3
+ size 1684261500
Woosh-Flow/config.yaml ADDED
@@ -0,0 +1,48 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ exclude_from_checkpoint: false
2
+ trainable: true
3
+ model_type: LatentDiffusionModel
4
+ dit:
5
+ model_type: mmmssflux
6
+ rope_len_multiplier: 2
7
+ max_description_length: 77
8
+ max_seq_len: 501
9
+ dim: 1024
10
+ inter_dim: 4096
11
+ fixed_timestep_features: false
12
+ timestep_features_dim: 256
13
+ n_layers: 12
14
+ n_heads: 8
15
+ n_multimodal_layers: 6
16
+ qk_nope_head_dim: 16
17
+ qk_rope_head_dim: 112
18
+ qkv_head_dim: 128
19
+ n_memory_tokens_rope: 1
20
+ n_memory_tokens_description: 0
21
+ original_seq_len: 501
22
+ rope_theta: 10000.0
23
+ rope_factor: 40.0
24
+ beta_fast: 32
25
+ beta_slow: 1
26
+ io_channels: 128
27
+ cond_token_dim: 1024
28
+ adaln_last_layer: true
29
+ adaln_last_layer_nomod: false
30
+ non_checkpoint_layers: 14
31
+ mask_out_before: -1
32
+ estimate_logvar: true
33
+ no_description_mask: true
34
+ symmetric_attention_init: false
35
+ patch_size: 1
36
+ num_sinks: 0
37
+ mlp_act: gelu
38
+ conditioners:
39
+ text:
40
+ exclude_from_checkpoint: true
41
+ trainable: false
42
+ path: checkpoints/TextConditionerA
43
+ autoencoder:
44
+ exclude_from_checkpoint: true
45
+ trainable: false
46
+ path: checkpoints/Woosh-AE
47
+ sigma_data: 1.0
48
+ pred_type: v_pred
Woosh-Flow/weights.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:4e2eafa2f9063934859888a2edd25ad4485f82dca4caaa7720f98d832f7ca39b
3
+ size 1348979404
Woosh-VFlow-8s/config.yaml ADDED
@@ -0,0 +1,60 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ exclude_from_checkpoint: false
2
+ trainable: true
3
+ model_type: VideoKontextLDM
4
+ ldm:
5
+ exclude_from_checkpoint: false
6
+ trainable: true
7
+ dit:
8
+ model_type: mmmssflux
9
+ max_description_length: 77
10
+ max_seq_len: 501
11
+ rope_len_multiplier: 2
12
+ dim: 1024
13
+ inter_dim: 4096
14
+ fixed_timestep_features: false
15
+ timestep_features_dim: 256
16
+ n_layers: 12
17
+ n_heads: 8
18
+ n_multimodal_layers: 6
19
+ qk_nope_head_dim: 16
20
+ qk_rope_head_dim: 112
21
+ qkv_head_dim: 128
22
+ n_memory_tokens_rope: 1
23
+ n_memory_tokens_description: 0
24
+ original_seq_len: 501
25
+ rope_theta: 10000.0
26
+ rope_factor: 40.0
27
+ beta_fast: 32
28
+ beta_slow: 1
29
+ io_channels: 128
30
+ cond_token_dim: 1024
31
+ adaln_last_layer: true
32
+ adaln_last_layer_nomod: false
33
+ non_checkpoint_layers: 14
34
+ mask_out_before: -1
35
+ estimate_logvar: true
36
+ no_description_mask: true
37
+ symmetric_attention_init: false
38
+ patch_size: 1
39
+ num_sinks: 0
40
+ mlp_act: gelu
41
+ conditioners:
42
+ text:
43
+ exclude_from_checkpoint: true
44
+ trainable: false
45
+ path: checkpoints/TextConditionerV
46
+ autoencoder:
47
+ exclude_from_checkpoint: true
48
+ trainable: false
49
+ path: checkpoints/Woosh-AE
50
+ sigma_data: 1.0
51
+ pred_type: v_pred
52
+ audio_fps: 100
53
+ video_fps: 24
54
+ embed_dim: 768
55
+ embed_key: synch_out
56
+ pts_seconds_key: synch_pts_seconds
57
+ non_checkpoint_layers: 14
58
+ n_layers_encoder: 0
59
+ trainable_no_cond: false
60
+ use_batch_mask: true
Woosh-VFlow-8s/weights.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:ed2e7639e830060e532c955d4b4dc23869c8574605267846fa326c28730fcc7d
3
+ size 1654350276