Upload 12 files
Browse files
- TextConditionerA/config.yaml +22 -0
- TextConditionerA/weights.safetensors +3 -0
- TextConditionerV/config.yaml +22 -0
- TextConditionerV/weights.safetensors +3 -0
- Woosh-DFlow/config.yaml +51 -0
- Woosh-DFlow/weights.safetensors +3 -0
- Woosh-DVFlow-8s/config.yaml +64 -0
- Woosh-DVFlow-8s/weights.safetensors +3 -0
- Woosh-Flow/config.yaml +48 -0
- Woosh-Flow/weights.safetensors +3 -0
- Woosh-VFlow-8s/config.yaml +60 -0
- Woosh-VFlow-8s/weights.safetensors +3 -0
TextConditionerA/config.yaml
ADDED
|
@@ -0,0 +1,22 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
exclude_from_checkpoint: false
|
| 2 |
+
trainable: false
|
| 3 |
+
sentence_config:
|
| 4 |
+
frozen: false
|
| 5 |
+
model: roberta-large
|
| 6 |
+
max_sentence_tokens: 77
|
| 7 |
+
adopt_n_layers: 0
|
| 8 |
+
adopt_layer_size: 2048
|
| 9 |
+
pool_type: eos
|
| 10 |
+
add_pooling_layer: true
|
| 11 |
+
hidden_dropout_prob: 0.1
|
| 12 |
+
attention_probs_dropout_prob: 0.1
|
| 13 |
+
finetune_n_layers: -1
|
| 14 |
+
last_hidden_state: true
|
| 15 |
+
use_shared_space: false
|
| 16 |
+
normalize_shared_space: true
|
| 17 |
+
freeze_clap: true
|
| 18 |
+
lhs_index: -2
|
| 19 |
+
remove_special_tokens: false
|
| 20 |
+
eval_mode: true
|
| 21 |
+
text_preprocessing: no_op
|
| 22 |
+
shared_representation_size: 1024
|
TextConditionerA/weights.safetensors
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:9f66e1877efd49e3198068ffac74d00a84df18e53189643373e2e777224856bb
|
| 3 |
+
size 1425689504
|
TextConditionerV/config.yaml
ADDED
|
@@ -0,0 +1,22 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
exclude_from_checkpoint: false
|
| 2 |
+
trainable: false
|
| 3 |
+
sentence_config:
|
| 4 |
+
frozen: false
|
| 5 |
+
model: roberta-large
|
| 6 |
+
max_sentence_tokens: 77
|
| 7 |
+
adopt_n_layers: 0
|
| 8 |
+
adopt_layer_size: 2048
|
| 9 |
+
pool_type: eos
|
| 10 |
+
add_pooling_layer: true
|
| 11 |
+
hidden_dropout_prob: 0.1
|
| 12 |
+
attention_probs_dropout_prob: 0.1
|
| 13 |
+
finetune_n_layers: -1
|
| 14 |
+
last_hidden_state: true
|
| 15 |
+
use_shared_space: false
|
| 16 |
+
normalize_shared_space: true
|
| 17 |
+
freeze_clap: true
|
| 18 |
+
lhs_index: -2
|
| 19 |
+
remove_special_tokens: false
|
| 20 |
+
eval_mode: true
|
| 21 |
+
text_preprocessing: no_op
|
| 22 |
+
shared_representation_size: 1024
|
TextConditionerV/weights.safetensors
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:b0dd912c322582cb95531de69cf1472c90752e468087a3b0fc461dea49975e80
|
| 3 |
+
size 1425689504
|
Woosh-DFlow/config.yaml
ADDED
|
@@ -0,0 +1,51 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
exclude_from_checkpoint: false
|
| 2 |
+
trainable: true
|
| 3 |
+
ldm:
|
| 4 |
+
exclude_from_checkpoint: false
|
| 5 |
+
trainable: true
|
| 6 |
+
model_type: LatentDiffusionModel
|
| 7 |
+
dit:
|
| 8 |
+
model_type: mmmssflux
|
| 9 |
+
rope_len_multiplier: 2
|
| 10 |
+
max_description_length: 77
|
| 11 |
+
max_seq_len: 501
|
| 12 |
+
dim: 1024
|
| 13 |
+
inter_dim: 4096
|
| 14 |
+
fixed_timestep_features: false
|
| 15 |
+
timestep_features_dim: 256
|
| 16 |
+
n_layers: 12
|
| 17 |
+
n_heads: 8
|
| 18 |
+
n_multimodal_layers: 6
|
| 19 |
+
qk_nope_head_dim: 16
|
| 20 |
+
qk_rope_head_dim: 112
|
| 21 |
+
qkv_head_dim: 128
|
| 22 |
+
n_memory_tokens_rope: 1
|
| 23 |
+
n_memory_tokens_description: 0
|
| 24 |
+
original_seq_len: 501
|
| 25 |
+
rope_theta: 10000.0
|
| 26 |
+
rope_factor: 40.0
|
| 27 |
+
beta_fast: 32
|
| 28 |
+
beta_slow: 1
|
| 29 |
+
io_channels: 128
|
| 30 |
+
cond_token_dim: 1024
|
| 31 |
+
adaln_last_layer: true
|
| 32 |
+
adaln_last_layer_nomod: false
|
| 33 |
+
non_checkpoint_layers: 14
|
| 34 |
+
mask_out_before: -1
|
| 35 |
+
estimate_logvar: true
|
| 36 |
+
no_description_mask: true
|
| 37 |
+
symmetric_attention_init: false
|
| 38 |
+
patch_size: 1
|
| 39 |
+
num_sinks: 0
|
| 40 |
+
mlp_act: gelu
|
| 41 |
+
conditioners:
|
| 42 |
+
text:
|
| 43 |
+
exclude_from_checkpoint: true
|
| 44 |
+
trainable: false
|
| 45 |
+
path: D:/ComfyUI_windows_portable_nvidia/ComfyUI_windows_portable_nvidia_cu128/ComfyUI_windows_portable/ComfyUI/models/woosh/TextConditionerA
|
| 46 |
+
autoencoder:
|
| 47 |
+
exclude_from_checkpoint: true
|
| 48 |
+
trainable: false
|
| 49 |
+
path: D:/ComfyUI_windows_portable_nvidia/ComfyUI_windows_portable_nvidia_cu128/ComfyUI_windows_portable/ComfyUI/models/woosh/Woosh-AE
|
| 50 |
+
sigma_data: 1.0
|
| 51 |
+
pred_type: v_pred
|
Woosh-DFlow/weights.safetensors
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:c9fc4a2220fa4ba54e01611afe58e061854a58ad559eb56de2cca39112f7c8ef
|
| 3 |
+
size 1378890620
|
Woosh-DVFlow-8s/config.yaml
ADDED
|
@@ -0,0 +1,64 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
exclude_from_checkpoint: false
|
| 2 |
+
trainable: true
|
| 3 |
+
pretrained_model_type: videokontext
|
| 4 |
+
ldm:
|
| 5 |
+
exclude_from_checkpoint: false
|
| 6 |
+
trainable: true
|
| 7 |
+
model_type: VideoKontextLDM
|
| 8 |
+
ldm:
|
| 9 |
+
exclude_from_checkpoint: false
|
| 10 |
+
trainable: true
|
| 11 |
+
dit:
|
| 12 |
+
model_type: mmmssflux
|
| 13 |
+
max_description_length: 77
|
| 14 |
+
max_seq_len: 501
|
| 15 |
+
rope_len_multiplier: 2
|
| 16 |
+
dim: 1024
|
| 17 |
+
inter_dim: 4096
|
| 18 |
+
fixed_timestep_features: false
|
| 19 |
+
timestep_features_dim: 256
|
| 20 |
+
n_layers: 12
|
| 21 |
+
n_heads: 8
|
| 22 |
+
n_multimodal_layers: 6
|
| 23 |
+
qk_nope_head_dim: 16
|
| 24 |
+
qk_rope_head_dim: 112
|
| 25 |
+
qkv_head_dim: 128
|
| 26 |
+
n_memory_tokens_rope: 1
|
| 27 |
+
n_memory_tokens_description: 0
|
| 28 |
+
original_seq_len: 501
|
| 29 |
+
rope_theta: 10000.0
|
| 30 |
+
rope_factor: 40.0
|
| 31 |
+
beta_fast: 32
|
| 32 |
+
beta_slow: 1
|
| 33 |
+
io_channels: 128
|
| 34 |
+
cond_token_dim: 1024
|
| 35 |
+
adaln_last_layer: true
|
| 36 |
+
adaln_last_layer_nomod: false
|
| 37 |
+
non_checkpoint_layers: 14
|
| 38 |
+
mask_out_before: -1
|
| 39 |
+
estimate_logvar: true
|
| 40 |
+
no_description_mask: true
|
| 41 |
+
symmetric_attention_init: false
|
| 42 |
+
patch_size: 1
|
| 43 |
+
num_sinks: 0
|
| 44 |
+
mlp_act: gelu
|
| 45 |
+
conditioners:
|
| 46 |
+
text:
|
| 47 |
+
exclude_from_checkpoint: true
|
| 48 |
+
trainable: false
|
| 49 |
+
path: checkpoints/TextConditionerV
|
| 50 |
+
autoencoder:
|
| 51 |
+
exclude_from_checkpoint: true
|
| 52 |
+
trainable: false
|
| 53 |
+
path: checkpoints/Woosh-AE
|
| 54 |
+
sigma_data: 1.0
|
| 55 |
+
pred_type: v_pred
|
| 56 |
+
audio_fps: 100
|
| 57 |
+
video_fps: 24
|
| 58 |
+
embed_dim: 768
|
| 59 |
+
embed_key: synch_out
|
| 60 |
+
pts_seconds_key: synch_pts_seconds
|
| 61 |
+
non_checkpoint_layers: 14
|
| 62 |
+
n_layers_encoder: 0
|
| 63 |
+
trainable_no_cond: false
|
| 64 |
+
use_batch_mask: true
|
Woosh-DVFlow-8s/weights.safetensors
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:c87b796798fd96a4a3b1deeb70ccd05c6dc782fe546b622ce1368a05e441cd30
|
| 3 |
+
size 1684261500
|
Woosh-Flow/config.yaml
ADDED
|
@@ -0,0 +1,48 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
exclude_from_checkpoint: false
|
| 2 |
+
trainable: true
|
| 3 |
+
model_type: LatentDiffusionModel
|
| 4 |
+
dit:
|
| 5 |
+
model_type: mmmssflux
|
| 6 |
+
rope_len_multiplier: 2
|
| 7 |
+
max_description_length: 77
|
| 8 |
+
max_seq_len: 501
|
| 9 |
+
dim: 1024
|
| 10 |
+
inter_dim: 4096
|
| 11 |
+
fixed_timestep_features: false
|
| 12 |
+
timestep_features_dim: 256
|
| 13 |
+
n_layers: 12
|
| 14 |
+
n_heads: 8
|
| 15 |
+
n_multimodal_layers: 6
|
| 16 |
+
qk_nope_head_dim: 16
|
| 17 |
+
qk_rope_head_dim: 112
|
| 18 |
+
qkv_head_dim: 128
|
| 19 |
+
n_memory_tokens_rope: 1
|
| 20 |
+
n_memory_tokens_description: 0
|
| 21 |
+
original_seq_len: 501
|
| 22 |
+
rope_theta: 10000.0
|
| 23 |
+
rope_factor: 40.0
|
| 24 |
+
beta_fast: 32
|
| 25 |
+
beta_slow: 1
|
| 26 |
+
io_channels: 128
|
| 27 |
+
cond_token_dim: 1024
|
| 28 |
+
adaln_last_layer: true
|
| 29 |
+
adaln_last_layer_nomod: false
|
| 30 |
+
non_checkpoint_layers: 14
|
| 31 |
+
mask_out_before: -1
|
| 32 |
+
estimate_logvar: true
|
| 33 |
+
no_description_mask: true
|
| 34 |
+
symmetric_attention_init: false
|
| 35 |
+
patch_size: 1
|
| 36 |
+
num_sinks: 0
|
| 37 |
+
mlp_act: gelu
|
| 38 |
+
conditioners:
|
| 39 |
+
text:
|
| 40 |
+
exclude_from_checkpoint: true
|
| 41 |
+
trainable: false
|
| 42 |
+
path: D:/ComfyUI_windows_portable_nvidia/ComfyUI_windows_portable_nvidia_cu128/ComfyUI_windows_portable/ComfyUI/models/woosh/TextConditionerA
|
| 43 |
+
autoencoder:
|
| 44 |
+
exclude_from_checkpoint: true
|
| 45 |
+
trainable: false
|
| 46 |
+
path: D:/ComfyUI_windows_portable_nvidia/ComfyUI_windows_portable_nvidia_cu128/ComfyUI_windows_portable/ComfyUI/models/woosh/Woosh-AE
|
| 47 |
+
sigma_data: 1.0
|
| 48 |
+
pred_type: v_pred
|
Woosh-Flow/weights.safetensors
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:4e2eafa2f9063934859888a2edd25ad4485f82dca4caaa7720f98d832f7ca39b
|
| 3 |
+
size 1348979404
|
Woosh-VFlow-8s/config.yaml
ADDED
|
@@ -0,0 +1,60 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
exclude_from_checkpoint: false
|
| 2 |
+
trainable: true
|
| 3 |
+
model_type: VideoKontextLDM
|
| 4 |
+
ldm:
|
| 5 |
+
exclude_from_checkpoint: false
|
| 6 |
+
trainable: true
|
| 7 |
+
dit:
|
| 8 |
+
model_type: mmmssflux
|
| 9 |
+
max_description_length: 77
|
| 10 |
+
max_seq_len: 501
|
| 11 |
+
rope_len_multiplier: 2
|
| 12 |
+
dim: 1024
|
| 13 |
+
inter_dim: 4096
|
| 14 |
+
fixed_timestep_features: false
|
| 15 |
+
timestep_features_dim: 256
|
| 16 |
+
n_layers: 12
|
| 17 |
+
n_heads: 8
|
| 18 |
+
n_multimodal_layers: 6
|
| 19 |
+
qk_nope_head_dim: 16
|
| 20 |
+
qk_rope_head_dim: 112
|
| 21 |
+
qkv_head_dim: 128
|
| 22 |
+
n_memory_tokens_rope: 1
|
| 23 |
+
n_memory_tokens_description: 0
|
| 24 |
+
original_seq_len: 501
|
| 25 |
+
rope_theta: 10000.0
|
| 26 |
+
rope_factor: 40.0
|
| 27 |
+
beta_fast: 32
|
| 28 |
+
beta_slow: 1
|
| 29 |
+
io_channels: 128
|
| 30 |
+
cond_token_dim: 1024
|
| 31 |
+
adaln_last_layer: true
|
| 32 |
+
adaln_last_layer_nomod: false
|
| 33 |
+
non_checkpoint_layers: 14
|
| 34 |
+
mask_out_before: -1
|
| 35 |
+
estimate_logvar: true
|
| 36 |
+
no_description_mask: true
|
| 37 |
+
symmetric_attention_init: false
|
| 38 |
+
patch_size: 1
|
| 39 |
+
num_sinks: 0
|
| 40 |
+
mlp_act: gelu
|
| 41 |
+
conditioners:
|
| 42 |
+
text:
|
| 43 |
+
exclude_from_checkpoint: true
|
| 44 |
+
trainable: false
|
| 45 |
+
path: D:/ComfyUI_windows_portable_nvidia/ComfyUI_windows_portable_nvidia_cu128/ComfyUI_windows_portable/ComfyUI/models/woosh/TextConditionerV
|
| 46 |
+
autoencoder:
|
| 47 |
+
exclude_from_checkpoint: true
|
| 48 |
+
trainable: false
|
| 49 |
+
path: D:/ComfyUI_windows_portable_nvidia/ComfyUI_windows_portable_nvidia_cu128/ComfyUI_windows_portable/ComfyUI/models/woosh/Woosh-AE
|
| 50 |
+
sigma_data: 1.0
|
| 51 |
+
pred_type: v_pred
|
| 52 |
+
audio_fps: 100
|
| 53 |
+
video_fps: 24
|
| 54 |
+
embed_dim: 768
|
| 55 |
+
embed_key: synch_out
|
| 56 |
+
pts_seconds_key: synch_pts_seconds
|
| 57 |
+
non_checkpoint_layers: 14
|
| 58 |
+
n_layers_encoder: 0
|
| 59 |
+
trainable_no_cond: false
|
| 60 |
+
use_batch_mask: true
|
Woosh-VFlow-8s/weights.safetensors
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:ed2e7639e830060e532c955d4b4dc23869c8574605267846fa326c28730fcc7d
|
| 3 |
+
size 1654350276
|