Upload folder using huggingface_hub
Browse files- exp_hcai/latent_diffusion/imagenet_256/dc_ae_f32c32_in_1.0_256px/dit_xl_1/SiTSampler_ODE_heun2_30/nvfp4_e2m1_plus_cs/checkpoint.pt +3 -0
- exp_hcai/latent_diffusion/imagenet_256/dc_ae_f32c32_in_1.0_256px/dit_xl_1/SiTSampler_ODE_heun2_30/nvfp4_e2m1_plus_cs/checkpoint_.pt +3 -0
- exp_hcai/latent_diffusion/imagenet_256/dc_ae_f32c32_in_1.0_256px/dit_xl_1/SiTSampler_ODE_heun2_30/nvfp4_e2m1_plus_cs/config.yaml +271 -0
- exp_hcai/latent_diffusion/imagenet_256/dc_ae_f32c32_in_1.0_256px/dit_xl_1/SiTSampler_ODE_heun2_30/nvfp4_e2m1_plus_cs/eval_results.csv +66 -0
- exp_hcai/latent_diffusion/imagenet_256/dc_ae_f32c32_in_1.0_256px/dit_xl_1/SiTSampler_ODE_heun2_30/nvfp4_e2m1_plus_cs/log.txt +0 -0
- exp_hcai/latent_diffusion/imagenet_256/dc_ae_f32c32_in_1.0_256px/dit_xl_1/SiTSampler_ODE_heun2_30/nvfp4_e2m1_plus_cs/model.txt +56 -0
- exp_hcai/latent_diffusion/imagenet_256/dc_ae_f32c32_in_1.0_256px/dit_xl_1/SiTSampler_ODE_heun2_30/nvfp4_e2m1_plus_cs/slurm.sh +22 -0
- exp_hcai/latent_diffusion/imagenet_256/dc_ae_f32c32_in_1.0_256px/dit_xl_1/SiTSampler_ODE_heun2_30/nvfp4_e2m1_plus_cs/step_10000.pt +3 -0
- exp_hcai/latent_diffusion/imagenet_256/dc_ae_f32c32_in_1.0_256px/dit_xl_1/SiTSampler_ODE_heun2_30/nvfp4_e2m1_plus_cs/step_100000.pt +3 -0
- exp_hcai/latent_diffusion/imagenet_256/dc_ae_f32c32_in_1.0_256px/dit_xl_1/SiTSampler_ODE_heun2_30/nvfp4_e2m1_plus_cs/step_110000.pt +3 -0
- exp_hcai/latent_diffusion/imagenet_256/dc_ae_f32c32_in_1.0_256px/dit_xl_1/SiTSampler_ODE_heun2_30/nvfp4_e2m1_plus_cs/step_120000.pt +3 -0
- exp_hcai/latent_diffusion/imagenet_256/dc_ae_f32c32_in_1.0_256px/dit_xl_1/SiTSampler_ODE_heun2_30/nvfp4_e2m1_plus_cs/step_130000.pt +3 -0
- exp_hcai/latent_diffusion/imagenet_256/dc_ae_f32c32_in_1.0_256px/dit_xl_1/SiTSampler_ODE_heun2_30/nvfp4_e2m1_plus_cs/step_140000.pt +3 -0
- exp_hcai/latent_diffusion/imagenet_256/dc_ae_f32c32_in_1.0_256px/dit_xl_1/SiTSampler_ODE_heun2_30/nvfp4_e2m1_plus_cs/step_150000.pt +3 -0
- exp_hcai/latent_diffusion/imagenet_256/dc_ae_f32c32_in_1.0_256px/dit_xl_1/SiTSampler_ODE_heun2_30/nvfp4_e2m1_plus_cs/step_160000.pt +3 -0
- exp_hcai/latent_diffusion/imagenet_256/dc_ae_f32c32_in_1.0_256px/dit_xl_1/SiTSampler_ODE_heun2_30/nvfp4_e2m1_plus_cs/step_170000.pt +3 -0
- exp_hcai/latent_diffusion/imagenet_256/dc_ae_f32c32_in_1.0_256px/dit_xl_1/SiTSampler_ODE_heun2_30/nvfp4_e2m1_plus_cs/step_180000.pt +3 -0
- exp_hcai/latent_diffusion/imagenet_256/dc_ae_f32c32_in_1.0_256px/dit_xl_1/SiTSampler_ODE_heun2_30/nvfp4_e2m1_plus_cs/step_190000.pt +3 -0
- exp_hcai/latent_diffusion/imagenet_256/dc_ae_f32c32_in_1.0_256px/dit_xl_1/SiTSampler_ODE_heun2_30/nvfp4_e2m1_plus_cs/step_20000.pt +3 -0
- exp_hcai/latent_diffusion/imagenet_256/dc_ae_f32c32_in_1.0_256px/dit_xl_1/SiTSampler_ODE_heun2_30/nvfp4_e2m1_plus_cs/step_200000.pt +3 -0
- exp_hcai/latent_diffusion/imagenet_256/dc_ae_f32c32_in_1.0_256px/dit_xl_1/SiTSampler_ODE_heun2_30/nvfp4_e2m1_plus_cs/step_210000.pt +3 -0
- exp_hcai/latent_diffusion/imagenet_256/dc_ae_f32c32_in_1.0_256px/dit_xl_1/SiTSampler_ODE_heun2_30/nvfp4_e2m1_plus_cs/step_220000.pt +3 -0
- exp_hcai/latent_diffusion/imagenet_256/dc_ae_f32c32_in_1.0_256px/dit_xl_1/SiTSampler_ODE_heun2_30/nvfp4_e2m1_plus_cs/step_230000.pt +3 -0
- exp_hcai/latent_diffusion/imagenet_256/dc_ae_f32c32_in_1.0_256px/dit_xl_1/SiTSampler_ODE_heun2_30/nvfp4_e2m1_plus_cs/step_240000.pt +3 -0
- exp_hcai/latent_diffusion/imagenet_256/dc_ae_f32c32_in_1.0_256px/dit_xl_1/SiTSampler_ODE_heun2_30/nvfp4_e2m1_plus_cs/step_250000.pt +3 -0
- exp_hcai/latent_diffusion/imagenet_256/dc_ae_f32c32_in_1.0_256px/dit_xl_1/SiTSampler_ODE_heun2_30/nvfp4_e2m1_plus_cs/step_260000.pt +3 -0
- exp_hcai/latent_diffusion/imagenet_256/dc_ae_f32c32_in_1.0_256px/dit_xl_1/SiTSampler_ODE_heun2_30/nvfp4_e2m1_plus_cs/step_270000.pt +3 -0
- exp_hcai/latent_diffusion/imagenet_256/dc_ae_f32c32_in_1.0_256px/dit_xl_1/SiTSampler_ODE_heun2_30/nvfp4_e2m1_plus_cs/step_280000.pt +3 -0
- exp_hcai/latent_diffusion/imagenet_256/dc_ae_f32c32_in_1.0_256px/dit_xl_1/SiTSampler_ODE_heun2_30/nvfp4_e2m1_plus_cs/step_290000.pt +3 -0
- exp_hcai/latent_diffusion/imagenet_256/dc_ae_f32c32_in_1.0_256px/dit_xl_1/SiTSampler_ODE_heun2_30/nvfp4_e2m1_plus_cs/step_30000.pt +3 -0
- exp_hcai/latent_diffusion/imagenet_256/dc_ae_f32c32_in_1.0_256px/dit_xl_1/SiTSampler_ODE_heun2_30/nvfp4_e2m1_plus_cs/step_300000.pt +3 -0
- exp_hcai/latent_diffusion/imagenet_256/dc_ae_f32c32_in_1.0_256px/dit_xl_1/SiTSampler_ODE_heun2_30/nvfp4_e2m1_plus_cs/step_310000.pt +3 -0
- exp_hcai/latent_diffusion/imagenet_256/dc_ae_f32c32_in_1.0_256px/dit_xl_1/SiTSampler_ODE_heun2_30/nvfp4_e2m1_plus_cs/step_320000.pt +3 -0
- exp_hcai/latent_diffusion/imagenet_256/dc_ae_f32c32_in_1.0_256px/dit_xl_1/SiTSampler_ODE_heun2_30/nvfp4_e2m1_plus_cs/step_40000.pt +3 -0
- exp_hcai/latent_diffusion/imagenet_256/dc_ae_f32c32_in_1.0_256px/dit_xl_1/SiTSampler_ODE_heun2_30/nvfp4_e2m1_plus_cs/step_50000.pt +3 -0
- exp_hcai/latent_diffusion/imagenet_256/dc_ae_f32c32_in_1.0_256px/dit_xl_1/SiTSampler_ODE_heun2_30/nvfp4_e2m1_plus_cs/step_60000.pt +3 -0
- exp_hcai/latent_diffusion/imagenet_256/dc_ae_f32c32_in_1.0_256px/dit_xl_1/SiTSampler_ODE_heun2_30/nvfp4_e2m1_plus_cs/step_70000.pt +3 -0
- exp_hcai/latent_diffusion/imagenet_256/dc_ae_f32c32_in_1.0_256px/dit_xl_1/SiTSampler_ODE_heun2_30/nvfp4_e2m1_plus_cs/step_80000.pt +3 -0
- exp_hcai/latent_diffusion/imagenet_256/dc_ae_f32c32_in_1.0_256px/dit_xl_1/SiTSampler_ODE_heun2_30/nvfp4_e2m1_plus_cs/step_90000.pt +3 -0
exp_hcai/latent_diffusion/imagenet_256/dc_ae_f32c32_in_1.0_256px/dit_xl_1/SiTSampler_ODE_heun2_30/nvfp4_e2m1_plus_cs/checkpoint.pt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:1eeb3becf23eef7cf10ba771a341c1eaebf8ead9e71719398c6d2bccbad629fc
|
| 3 |
+
size 10798884178
|
exp_hcai/latent_diffusion/imagenet_256/dc_ae_f32c32_in_1.0_256px/dit_xl_1/SiTSampler_ODE_heun2_30/nvfp4_e2m1_plus_cs/checkpoint_.pt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:1eeb3becf23eef7cf10ba771a341c1eaebf8ead9e71719398c6d2bccbad629fc
|
| 3 |
+
size 10798884178
|
exp_hcai/latent_diffusion/imagenet_256/dc_ae_f32c32_in_1.0_256px/dit_xl_1/SiTSampler_ODE_heun2_30/nvfp4_e2m1_plus_cs/config.yaml
ADDED
|
@@ -0,0 +1,271 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
run_dir: exp_hcai/latent_diffusion/imagenet_256/dc_ae_f32c32_in_1.0_256px/dit_xl_1/SiTSampler_ODE_heun2_30/nvfp4_e2m1_plus_cs
|
| 2 |
+
seed: 0
|
| 3 |
+
allow_tf32: true
|
| 4 |
+
timeout: null
|
| 5 |
+
resolution: 256
|
| 6 |
+
amp: bf16
|
| 7 |
+
cfg_scale: 1.0
|
| 8 |
+
evaluate_split: test
|
| 9 |
+
eval_dir_name: null
|
| 10 |
+
num_save_images: 64
|
| 11 |
+
save_all_images: false
|
| 12 |
+
save_image_format: jpg
|
| 13 |
+
save_images_at_all_procs: false
|
| 14 |
+
save_latent_samples: false
|
| 15 |
+
latent_samples_dir: null
|
| 16 |
+
evaluate_dataset: sample_class
|
| 17 |
+
sample_class:
|
| 18 |
+
name: SampleClass
|
| 19 |
+
batch_size: 128
|
| 20 |
+
n_worker: 8
|
| 21 |
+
drop_last: false
|
| 22 |
+
seed: 0
|
| 23 |
+
shuffle: false
|
| 24 |
+
num_classes: 1000
|
| 25 |
+
num_samples: 50000
|
| 26 |
+
autoencoder:
|
| 27 |
+
num_settings: 1
|
| 28 |
+
name: dc-ae-f32c32-in-1.0-256px
|
| 29 |
+
scaling_factor: 0.3285
|
| 30 |
+
latent_channels: null
|
| 31 |
+
autoencoder_dtype: fp32
|
| 32 |
+
eval_autoencoder_setting_list: null
|
| 33 |
+
model: fp8coat_dit
|
| 34 |
+
dit:
|
| 35 |
+
name: DiT
|
| 36 |
+
in_channels: 32
|
| 37 |
+
input_size: 8
|
| 38 |
+
cfg_channels: null
|
| 39 |
+
pretrained_path: null
|
| 40 |
+
pretrained_source: dc-ae
|
| 41 |
+
train_scheduler: SiTSampler
|
| 42 |
+
eval_scheduler: ODE_heun2
|
| 43 |
+
num_inference_steps: 30
|
| 44 |
+
flow_shift: 3.0
|
| 45 |
+
reverse_time: false
|
| 46 |
+
use_cads: false
|
| 47 |
+
cads_noise_scale: 0.1
|
| 48 |
+
cads_mixing_factor: 1.0
|
| 49 |
+
cads_tau_min: 0.2
|
| 50 |
+
cads_tau_max: 0.9
|
| 51 |
+
use_guidance_interval: false
|
| 52 |
+
guidance_t_min: 0.2
|
| 53 |
+
guidance_t_max: 0.8
|
| 54 |
+
count_nfe: false
|
| 55 |
+
patch_size: 1
|
| 56 |
+
hidden_size: 1152
|
| 57 |
+
depth: 28
|
| 58 |
+
num_heads: 16
|
| 59 |
+
mlp_ratio: 4.0
|
| 60 |
+
post_norm: false
|
| 61 |
+
class_dropout_prob: 0.1
|
| 62 |
+
num_classes: 1000
|
| 63 |
+
learn_sigma: false
|
| 64 |
+
unconditional: false
|
| 65 |
+
use_checkpoint: true
|
| 66 |
+
adaptive_channel: false
|
| 67 |
+
adaptive_channel_share_weights: true
|
| 68 |
+
only_load_backbone: false
|
| 69 |
+
freeze_backbone: false
|
| 70 |
+
uvit:
|
| 71 |
+
name: UViT
|
| 72 |
+
in_channels: 4
|
| 73 |
+
input_size: 32
|
| 74 |
+
cfg_channels: null
|
| 75 |
+
pretrained_path: null
|
| 76 |
+
pretrained_source: dc-ae
|
| 77 |
+
train_scheduler: DPM_Solver
|
| 78 |
+
eval_scheduler: DPM_Solver
|
| 79 |
+
num_inference_steps: 30
|
| 80 |
+
flow_shift: 3.0
|
| 81 |
+
reverse_time: false
|
| 82 |
+
use_cads: false
|
| 83 |
+
cads_noise_scale: 0.1
|
| 84 |
+
cads_mixing_factor: 1.0
|
| 85 |
+
cads_tau_min: 0.2
|
| 86 |
+
cads_tau_max: 0.9
|
| 87 |
+
use_guidance_interval: false
|
| 88 |
+
guidance_t_min: 0.2
|
| 89 |
+
guidance_t_max: 0.8
|
| 90 |
+
count_nfe: false
|
| 91 |
+
patch_size: 2
|
| 92 |
+
hidden_size: 1152
|
| 93 |
+
depth: 28
|
| 94 |
+
num_heads: 16
|
| 95 |
+
mlp_ratio: 4.0
|
| 96 |
+
mlp_time_embed: false
|
| 97 |
+
qkv_bias: false
|
| 98 |
+
act_layer: gelu
|
| 99 |
+
use_checkpoint: true
|
| 100 |
+
class_dropout_prob: 0.1
|
| 101 |
+
num_classes: 1000
|
| 102 |
+
attn_mode: null
|
| 103 |
+
sana_cls:
|
| 104 |
+
name: SanaCls
|
| 105 |
+
in_channels: 4
|
| 106 |
+
input_size: 32
|
| 107 |
+
cfg_channels: null
|
| 108 |
+
pretrained_path: null
|
| 109 |
+
pretrained_source: dc-ae
|
| 110 |
+
train_scheduler: SanaScheduler
|
| 111 |
+
eval_scheduler: SanaScheduler
|
| 112 |
+
num_inference_steps: 250
|
| 113 |
+
flow_shift: 3.0
|
| 114 |
+
reverse_time: false
|
| 115 |
+
use_cads: false
|
| 116 |
+
cads_noise_scale: 0.1
|
| 117 |
+
cads_mixing_factor: 1.0
|
| 118 |
+
cads_tau_min: 0.2
|
| 119 |
+
cads_tau_max: 0.9
|
| 120 |
+
use_guidance_interval: false
|
| 121 |
+
guidance_t_min: 0.2
|
| 122 |
+
guidance_t_max: 0.8
|
| 123 |
+
count_nfe: false
|
| 124 |
+
patch_size: 2
|
| 125 |
+
hidden_size: 1152
|
| 126 |
+
depth: 28
|
| 127 |
+
num_heads: 16
|
| 128 |
+
mlp_ratio: 4.0
|
| 129 |
+
post_norm: false
|
| 130 |
+
class_dropout_prob: 0.1
|
| 131 |
+
num_classes: 1000
|
| 132 |
+
unconditional: false
|
| 133 |
+
use_checkpoint: true
|
| 134 |
+
only_load_backbone: false
|
| 135 |
+
freeze_backbone: false
|
| 136 |
+
learn_sigma: false
|
| 137 |
+
usana_cls:
|
| 138 |
+
name: USanaCls
|
| 139 |
+
in_channels: 4
|
| 140 |
+
input_size: 32
|
| 141 |
+
cfg_channels: null
|
| 142 |
+
pretrained_path: null
|
| 143 |
+
pretrained_source: dc-ae
|
| 144 |
+
train_scheduler: DPM_Solver
|
| 145 |
+
eval_scheduler: DPM_Solver
|
| 146 |
+
num_inference_steps: 30
|
| 147 |
+
flow_shift: 3.0
|
| 148 |
+
reverse_time: false
|
| 149 |
+
use_cads: false
|
| 150 |
+
cads_noise_scale: 0.1
|
| 151 |
+
cads_mixing_factor: 1.0
|
| 152 |
+
cads_tau_min: 0.2
|
| 153 |
+
cads_tau_max: 0.9
|
| 154 |
+
use_guidance_interval: false
|
| 155 |
+
guidance_t_min: 0.2
|
| 156 |
+
guidance_t_max: 0.8
|
| 157 |
+
count_nfe: false
|
| 158 |
+
patch_size: 2
|
| 159 |
+
hidden_size: 1152
|
| 160 |
+
depth: 28
|
| 161 |
+
num_heads: 16
|
| 162 |
+
mlp_ratio: 4.0
|
| 163 |
+
mlp_time_embed: false
|
| 164 |
+
qkv_bias: false
|
| 165 |
+
act_layer: gelu
|
| 166 |
+
use_checkpoint: true
|
| 167 |
+
class_dropout_prob: 0.1
|
| 168 |
+
num_classes: 1000
|
| 169 |
+
num_training_steps: 1000
|
| 170 |
+
fp8:
|
| 171 |
+
name: FP8DiT
|
| 172 |
+
fp8coat:
|
| 173 |
+
name: FP8COATDiT
|
| 174 |
+
qchoice: linear
|
| 175 |
+
symm: true
|
| 176 |
+
row_blocksize: -1
|
| 177 |
+
col_blocksize: -1
|
| 178 |
+
linear_row_blocksize: 1
|
| 179 |
+
linear_col_blocksize: 16
|
| 180 |
+
min_blockunit_row: -1
|
| 181 |
+
min_blockunit_col: -1
|
| 182 |
+
fabit: NVE2M1_plus
|
| 183 |
+
fwbit: NVE2M1_plus
|
| 184 |
+
babit: NVE2M1_plus
|
| 185 |
+
bwbit: NVE2M1_plus
|
| 186 |
+
bobit: NVE2M1_plus
|
| 187 |
+
epsilon: 1.0e-08
|
| 188 |
+
compute_fid: true
|
| 189 |
+
fid:
|
| 190 |
+
save_path: null
|
| 191 |
+
ref_path: assets/data/fid/imagenet_train_256.npz
|
| 192 |
+
precision_recall_ref_path: assets/data/precision_recall/VIRTUAL_imagenet256.npy
|
| 193 |
+
compute_inception_score: true
|
| 194 |
+
inception_score: {}
|
| 195 |
+
compute_cmmd: true
|
| 196 |
+
cmmd:
|
| 197 |
+
save_path: null
|
| 198 |
+
ref_path: assets/data/cmmd/VIRTUAL_imagenet256.npy
|
| 199 |
+
verbose: false
|
| 200 |
+
train_dataset: latent_imagenet
|
| 201 |
+
latent_imagenet:
|
| 202 |
+
name: LatentImageNet
|
| 203 |
+
batch_size: 128
|
| 204 |
+
n_worker: 8
|
| 205 |
+
drop_last: true
|
| 206 |
+
seed: 0
|
| 207 |
+
shuffle: true
|
| 208 |
+
data_dir: assets/data/latent/dc_ae_f32c32_in_1.0_256px/imagenet_256
|
| 209 |
+
latent_mjhq:
|
| 210 |
+
name: LatentMJHQ
|
| 211 |
+
batch_size: 32
|
| 212 |
+
n_worker: 8
|
| 213 |
+
drop_last: true
|
| 214 |
+
seed: 0
|
| 215 |
+
shuffle: true
|
| 216 |
+
data_dir: assets/data/latent/dc_ae_f32c32/mjhq_1024
|
| 217 |
+
latent_ffhq:
|
| 218 |
+
name: LatentFFHQ
|
| 219 |
+
batch_size: 32
|
| 220 |
+
n_worker: 8
|
| 221 |
+
drop_last: true
|
| 222 |
+
seed: 0
|
| 223 |
+
shuffle: true
|
| 224 |
+
data_dir: assets/data/latent/dc_ae_f32c32/ffhq_1024
|
| 225 |
+
latent_mapillary_vistas:
|
| 226 |
+
name: LatentMapillaryVistas
|
| 227 |
+
batch_size: 32
|
| 228 |
+
n_worker: 8
|
| 229 |
+
drop_last: true
|
| 230 |
+
seed: 0
|
| 231 |
+
shuffle: true
|
| 232 |
+
data_dir: assets/data/latent/dc_ae_f32c32/mapillary_vistas_2048
|
| 233 |
+
latent_multiple_channel_imagenet:
|
| 234 |
+
name: LatentMultipleChannelImageNet
|
| 235 |
+
batch_size: 32
|
| 236 |
+
n_worker: 8
|
| 237 |
+
drop_last: true
|
| 238 |
+
seed: 0
|
| 239 |
+
shuffle: true
|
| 240 |
+
dataset_sample_ratio: null
|
| 241 |
+
num_channels_list: null
|
| 242 |
+
data_dirs:
|
| 243 |
+
- assets/data/latent/dc_ae_f32c32/imagenet_512
|
| 244 |
+
resume: true
|
| 245 |
+
resume_path: null
|
| 246 |
+
resume_schedule: true
|
| 247 |
+
num_epochs: null
|
| 248 |
+
max_steps: 500000
|
| 249 |
+
clip_grad: null
|
| 250 |
+
num_store_images: 64
|
| 251 |
+
save_checkpoint_steps: 1000
|
| 252 |
+
eval_steps: 5000
|
| 253 |
+
save_eval_checkpoint_steps: 5000
|
| 254 |
+
optimizer:
|
| 255 |
+
name: adamw
|
| 256 |
+
lr: 0.0001
|
| 257 |
+
warmup_lr: 0.0
|
| 258 |
+
weight_decay: 0.0
|
| 259 |
+
no_wd_keys: []
|
| 260 |
+
betas:
|
| 261 |
+
- 0.9
|
| 262 |
+
- 0.999
|
| 263 |
+
lr_scheduler:
|
| 264 |
+
name: constant
|
| 265 |
+
warmup_steps: 1000
|
| 266 |
+
log: true
|
| 267 |
+
wandb_entity: han2024
|
| 268 |
+
wandb_project: dc_ae_diffusion
|
| 269 |
+
ema_decay: 0.9999
|
| 270 |
+
ema_warmup_steps: 2000
|
| 271 |
+
eval_ema: true
|
exp_hcai/latent_diffusion/imagenet_256/dc_ae_f32c32_in_1.0_256px/dit_xl_1/SiTSampler_ODE_heun2_30/nvfp4_e2m1_plus_cs/eval_results.csv
ADDED
|
@@ -0,0 +1,66 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
,fid,precision,recall,inception_score_mean,inception_score_std,cmmd
|
| 2 |
+
step_100000_autoencoder_setting_0_cfg_1.0,33.510336098973255,0.5956599712371826,0.590499997138977,40.09199964690056,0.9867992039804704,0.7789134979248047
|
| 3 |
+
step_10000_autoencoder_setting_0_cfg_1.0,73.90192494885156,0.3162199854850769,0.4894999861717224,16.27740383148511,0.277950106876481,1.399517059326172
|
| 4 |
+
step_105000_autoencoder_setting_0_cfg_1.0,31.99571309674724,0.5994799733161926,0.5982999801635742,41.5446583047944,1.30438414051274,0.7535219192504883
|
| 5 |
+
step_110000_autoencoder_setting_0_cfg_1.0,31.084778234585315,0.5984399914741516,0.601099967956543,42.81673014675415,1.5925164937267593,0.742793083190918
|
| 6 |
+
step_115000_autoencoder_setting_0_cfg_1.0,30.33861512746074,0.6003199815750122,0.5972999930381775,43.67173277929832,1.539747753303912,0.7289648056030273
|
| 7 |
+
step_120000_autoencoder_setting_0_cfg_1.0,29.81009036379396,0.6003999710083008,0.5971999764442444,44.458882738338936,1.4739077247965764,0.7200241088867188
|
| 8 |
+
step_125000_autoencoder_setting_0_cfg_1.0,29.73945936977003,0.6030799746513367,0.606499969959259,44.74414435290523,1.5099839204816552,0.7243156433105469
|
| 9 |
+
step_130000_autoencoder_setting_0_cfg_1.0,29.537084774585367,0.6041199564933777,0.6071999669075012,45.32032085365301,1.39568082828115,0.7216930389404297
|
| 10 |
+
step_135000_autoencoder_setting_0_cfg_1.0,29.25035165062644,0.6070399880409241,0.6010000109672546,45.46803598120924,1.4409735875031866,0.7151365280151367
|
| 11 |
+
step_140000_autoencoder_setting_0_cfg_1.0,28.90444763476665,0.6025800108909607,0.6018999814987183,45.597290577183394,1.354427855562807,0.705718994140625
|
| 12 |
+
step_145000_autoencoder_setting_0_cfg_1.0,28.324674606056703,0.5902799963951111,0.6071999669075012,45.27874221411236,1.2957470338039971,0.6810426712036133
|
| 13 |
+
step_150000_autoencoder_setting_0_cfg_1.0,28.60110797450659,0.593459963798523,0.60589998960495,44.78194086301391,1.0435081908498076,0.6895065307617188
|
| 14 |
+
step_15000_autoencoder_setting_0_cfg_1.0,64.54487122268665,0.3500599861145019,0.5184000134468079,18.398179969907577,0.3522202054306349,1.2390613555908203
|
| 15 |
+
step_155000_autoencoder_setting_0_cfg_1.0,31.95065719292052,0.5965200066566467,0.6033999919891357,42.916075059198,1.159331511129437,0.7718801498413086
|
| 16 |
+
step_160000_autoencoder_setting_0_cfg_1.0,30.68422348806098,0.5986599922180176,0.5945999622344971,44.20955327758968,1.2711748786662864,0.7419586181640625
|
| 17 |
+
step_165000_autoencoder_setting_0_cfg_1.0,33.47219299450978,0.581279993057251,0.5963000059127808,42.17644170524565,1.007066066336716,0.8236169815063477
|
| 18 |
+
step_170000_autoencoder_setting_0_cfg_1.0,31.89318713646309,0.5908799767494202,0.5875999927520752,44.09051651132943,1.041214600139548,0.7936954498291016
|
| 19 |
+
step_175000_autoencoder_setting_0_cfg_1.0,28.059225943542003,0.6118999719619751,0.5924000144004822,47.0833547422664,1.02520082053524,0.6825923919677734
|
| 20 |
+
step_180000_autoencoder_setting_0_cfg_1.0,26.86359682215533,0.6198199987411499,0.5871999859809875,48.460707615613806,1.276621065770431,0.643610954284668
|
| 21 |
+
step_185000_autoencoder_setting_0_cfg_1.0,23.19771411477757,0.6177999973297119,0.5781999826431274,52.37679030752452,1.3017335985986096,0.5334615707397461
|
| 22 |
+
step_190000_autoencoder_setting_0_cfg_1.0,29.17611684625689,0.5356199741363525,0.5751999616622925,46.47262300749968,0.9186686723855764,0.6437301635742188
|
| 23 |
+
step_195000_autoencoder_setting_0_cfg_1.0,29.543687644147496,0.5321199893951416,0.5625999569892883,46.76187865714515,1.1099872913116335,0.6268024444580078
|
| 24 |
+
step_200000_autoencoder_setting_0_cfg_1.0,23.80048736942706,0.5858399868011475,0.5575000047683716,58.942239278429554,1.817286785028792,0.5916357040405273
|
| 25 |
+
step_20000_autoencoder_setting_0_cfg_1.0,59.71597046734888,0.3647599816322326,0.5491999983787537,19.74359432040311,0.450373075317894,1.1576414108276367
|
| 26 |
+
step_205000_autoencoder_setting_0_cfg_1.0,22.12023671548451,0.6092000007629395,0.5795999765396118,61.177534212409455,1.3219201412613395,0.5767345428466797
|
| 27 |
+
step_210000_autoencoder_setting_0_cfg_1.0,24.4272912625878,0.6003199815750122,0.5756999850273132,55.205168250673225,1.5699953835294218,0.5776882171630859
|
| 28 |
+
step_215000_autoencoder_setting_0_cfg_1.0,26.145530498882465,0.5882599949836731,0.5619999766349792,52.5792564803152,0.9331772645925596,0.583648681640625
|
| 29 |
+
step_220000_autoencoder_setting_0_cfg_1.0,33.717075840811106,0.5693599581718445,0.5706999897956848,41.55646637019326,0.7472119125007876,0.6976127624511719
|
| 30 |
+
step_225000_autoencoder_setting_0_cfg_1.0,37.75270042779056,0.5680400133132935,0.5640000104904175,37.35837407110965,0.9174423982675206,0.7526874542236328
|
| 31 |
+
step_230000_autoencoder_setting_0_cfg_1.0,41.80794911337364,0.5369600057601929,0.5568000078201294,34.946629068675506,0.7575486856087463,0.8826255798339844
|
| 32 |
+
step_235000_autoencoder_setting_0_cfg_1.0,35.97322463757547,0.5503199696540833,0.5562999844551086,40.24203779016634,1.1283857749401949,0.7938146591186523
|
| 33 |
+
step_240000_autoencoder_setting_0_cfg_1.0,35.63028665616923,0.5603799819946289,0.5485000014305115,41.24571541034057,1.0281156165647911,0.7764101028442383
|
| 34 |
+
step_245000_autoencoder_setting_0_cfg_1.0,30.2209251885713,0.5829600095748901,0.5669999718666077,47.19632009902397,1.1179175794254577,0.6849765777587891
|
| 35 |
+
step_250000_autoencoder_setting_0_cfg_1.0,28.80573283180962,0.6025999784469604,0.5428000092506409,48.640761477471074,0.8757591899906153,0.6220340728759766
|
| 36 |
+
step_25000_autoencoder_setting_0_cfg_1.0,57.00759901774785,0.3761000037193298,0.5557999610900879,20.628880517156603,0.3562785811510151,1.1113882064819336
|
| 37 |
+
step_255000_autoencoder_setting_0_cfg_1.0,31.98233728231185,0.5830399990081787,0.5428000092506409,43.99541556516653,1.0652455905332407,0.6737709045410156
|
| 38 |
+
step_260000_autoencoder_setting_0_cfg_1.0,31.68354833974729,0.5862199664115906,0.552299976348877,43.2768589576001,0.9986364453619164,0.6620883941650391
|
| 39 |
+
step_265000_autoencoder_setting_0_cfg_1.0,31.50612363132126,0.5783999562263489,0.5652999877929688,43.98134720708489,0.9954869364396132,0.681757926940918
|
| 40 |
+
step_270000_autoencoder_setting_0_cfg_1.0,31.68609210507236,0.571619987487793,0.5719999670982361,43.15291995516085,0.8036755546675325,0.6895065307617188
|
| 41 |
+
step_275000_autoencoder_setting_0_cfg_1.0,29.74582904389871,0.585860013961792,0.5733999609947205,45.70878680122093,0.9328789651107372,0.6787776947021484
|
| 42 |
+
step_280000_autoencoder_setting_0_cfg_1.0,28.08477422446685,0.5943199992179871,0.5595999956130981,47.97159710271989,0.934454655944602,0.6558895111083984
|
| 43 |
+
step_285000_autoencoder_setting_0_cfg_1.0,37.16351652347868,0.5593599677085876,0.5462999939918518,38.821064409111735,0.8984244883954947,0.7899999618530273
|
| 44 |
+
step_290000_autoencoder_setting_0_cfg_1.0,35.13686225649491,0.5741400122642517,0.5638999938964844,39.28087561670991,1.1236658537717517,0.7501840591430664
|
| 45 |
+
step_295000_autoencoder_setting_0_cfg_1.0,33.163526727613714,0.5811600089073181,0.5708000063896179,41.46022925753859,1.0585913435556151,0.7112026214599609
|
| 46 |
+
step_300000_autoencoder_setting_0_cfg_1.0,38.86992745092755,0.5604599714279175,0.5561000108718872,36.608194517420586,0.7411830008857224,0.8028745651245117
|
| 47 |
+
step_30000_autoencoder_setting_0_cfg_1.0,55.00772555796266,0.3881599903106689,0.5625,21.4777448838741,0.3303526685224319,1.0881423950195312
|
| 48 |
+
step_305000_autoencoder_setting_0_cfg_1.0,40.654731308000805,0.5505399703979492,0.5654999613761902,34.86966265090955,0.664410489582783,0.8350610733032227
|
| 49 |
+
step_310000_autoencoder_setting_0_cfg_1.0,37.667755599753264,0.5451200008392334,0.560699999332428,36.70080426804611,0.8777978541854278,0.7804632186889648
|
| 50 |
+
step_315000_autoencoder_setting_0_cfg_1.0,41.79937248106677,0.5360599756240845,0.5679999589920044,33.45560467093258,0.8521028202931553,0.8482933044433594
|
| 51 |
+
step_320000_autoencoder_setting_0_cfg_1.0,51.47804312534464,0.4896599948406219,0.5291000008583069,28.043407163850866,0.4270782284876955,1.0304450988769531
|
| 52 |
+
step_325000_autoencoder_setting_0_cfg_1.0,48.228641188953134,0.495419979095459,0.5407999753952026,28.574792479385394,0.40829275689333416,0.9474754333496094
|
| 53 |
+
step_35000_autoencoder_setting_0_cfg_1.0,53.2382308378962,0.4078599810600281,0.5694999694824219,22.289185030567616,0.3048117845165478,1.0652542114257812
|
| 54 |
+
step_40000_autoencoder_setting_0_cfg_1.0,51.75855118114072,0.4341999888420105,0.576200008392334,23.356298751607465,0.4521947034097131,1.049637794494629
|
| 55 |
+
step_45000_autoencoder_setting_0_cfg_1.0,50.30115830364991,0.4549599885940552,0.5882999897003174,24.55035109111102,0.5621372832031544,1.0350942611694336
|
| 56 |
+
step_50000_autoencoder_setting_0_cfg_1.0,48.415261502685325,0.4780399799346924,0.5922999978065491,25.98636236345556,0.6534759089226885,1.019001007080078
|
| 57 |
+
step_5000_autoencoder_setting_0_cfg_1.0,89.0873257052084,0.2642599940299988,0.4005999863147735,13.879401738049452,0.281824832227157,1.6162395477294922
|
| 58 |
+
step_55000_autoencoder_setting_0_cfg_1.0,46.70711673379924,0.5,0.5934999585151672,27.346334763245828,0.7571752924388021,0.9958744049072266
|
| 59 |
+
step_60000_autoencoder_setting_0_cfg_1.0,45.71089146050844,0.5166000127792358,0.5879999995231628,28.46846628558452,0.8322938709885304,0.982046127319336
|
| 60 |
+
step_65000_autoencoder_setting_0_cfg_1.0,45.76202067657903,0.5302199721336365,0.5907999873161316,28.90117178672436,0.7314161581733065,0.9901523590087892
|
| 61 |
+
step_70000_autoencoder_setting_0_cfg_1.0,46.257953874742896,0.5351399779319763,0.5892999768257141,29.143563631670304,0.6718447316445654,1.000165939331055
|
| 62 |
+
step_75000_autoencoder_setting_0_cfg_1.0,45.70217787873264,0.5448399782180786,0.5879999995231628,29.95001729137772,0.6204188052274286,0.9901523590087892
|
| 63 |
+
step_80000_autoencoder_setting_0_cfg_1.0,43.23189977289189,0.5568000078201294,0.5814999938011169,31.8562303396425,0.6517948737403826,0.9478330612182616
|
| 64 |
+
step_85000_autoencoder_setting_0_cfg_1.0,40.700212981158586,0.5700399875640869,0.5794000029563904,33.96066291911782,0.7829944264755757,0.9067058563232422
|
| 65 |
+
step_90000_autoencoder_setting_0_cfg_1.0,37.9045656958437,0.5823400020599365,0.5852000117301941,36.2067636052034,0.8642681408317301,0.859379768371582
|
| 66 |
+
step_95000_autoencoder_setting_0_cfg_1.0,35.42743405262286,0.5922600030899048,0.5907999873161316,38.43274352690076,0.9939473698385852,0.8138418197631836
|
exp_hcai/latent_diffusion/imagenet_256/dc_ae_f32c32_in_1.0_256px/dit_xl_1/SiTSampler_ODE_heun2_30/nvfp4_e2m1_plus_cs/log.txt
ADDED
|
The diff for this file is too large to render.
See raw diff
|
|
|
exp_hcai/latent_diffusion/imagenet_256/dc_ae_f32c32_in_1.0_256px/dit_xl_1/SiTSampler_ODE_heun2_30/nvfp4_e2m1_plus_cs/model.txt
ADDED
|
@@ -0,0 +1,56 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
FP8COATDiT(
|
| 2 |
+
(x_embedder): PatchEmbed(
|
| 3 |
+
(proj): Conv2d(32, 1152, kernel_size=(1, 1), stride=(1, 1))
|
| 4 |
+
(norm): Identity()
|
| 5 |
+
)
|
| 6 |
+
(t_embedder): TimestepEmbedder(
|
| 7 |
+
(mlp): Sequential(
|
| 8 |
+
(0): Linear(in_features=256, out_features=1152, bias=True)
|
| 9 |
+
(1): SiLU()
|
| 10 |
+
(2): Linear(in_features=1152, out_features=1152, bias=True)
|
| 11 |
+
)
|
| 12 |
+
)
|
| 13 |
+
(y_embedder): LabelEmbedder(
|
| 14 |
+
(embedding_table): Embedding(1001, 1152)
|
| 15 |
+
)
|
| 16 |
+
(blocks): ModuleList(
|
| 17 |
+
(0-27): 28 x FP8COATDiTBlock(
|
| 18 |
+
(norm1): LayerNorm((1152,), eps=1e-06, elementwise_affine=False)
|
| 19 |
+
(attn): FP8COATAttention(
|
| 20 |
+
(qkv): QAct_Linear(in_features=1152, out_features=3456, bias=True)
|
| 21 |
+
(q_norm): Identity()
|
| 22 |
+
(k_norm): Identity()
|
| 23 |
+
(attn_drop): Dropout(p=0.0, inplace=False)
|
| 24 |
+
(proj): QAct_Linear(in_features=1152, out_features=1152, bias=True)
|
| 25 |
+
(proj_drop): Dropout(p=0.0, inplace=False)
|
| 26 |
+
(qact_q_quantize): QAct_Quantize()
|
| 27 |
+
(qact_k_quantize): QAct_Quantize()
|
| 28 |
+
)
|
| 29 |
+
(norm2): LayerNorm((1152,), eps=1e-06, elementwise_affine=False)
|
| 30 |
+
(mlp): FP8COATMlp(
|
| 31 |
+
(fc1): QAct_Linear(in_features=1152, out_features=4608, bias=True)
|
| 32 |
+
(act): GELU(approximate='tanh')
|
| 33 |
+
(drop1): Dropout(p=0, inplace=False)
|
| 34 |
+
(norm): Identity()
|
| 35 |
+
(fc2): QAct_Linear(in_features=4608, out_features=1152, bias=True)
|
| 36 |
+
(drop2): Dropout(p=0, inplace=False)
|
| 37 |
+
(qact_quantize_gelu): QAct_Quantize()
|
| 38 |
+
(qact_quantize_norm): QAct_Quantize()
|
| 39 |
+
)
|
| 40 |
+
(adaLN_modulation): Sequential(
|
| 41 |
+
(0): SiLU()
|
| 42 |
+
(1): Linear(in_features=1152, out_features=6912, bias=True)
|
| 43 |
+
)
|
| 44 |
+
(qact_quantize_norm1): QAct_Quantize()
|
| 45 |
+
(qact_quantize_norm2): QAct_Quantize()
|
| 46 |
+
)
|
| 47 |
+
)
|
| 48 |
+
(final_layer): FinalLayer(
|
| 49 |
+
(norm_final): LayerNorm((1152,), eps=1e-06, elementwise_affine=False)
|
| 50 |
+
(linear): Linear(in_features=1152, out_features=32, bias=True)
|
| 51 |
+
(adaLN_modulation): Sequential(
|
| 52 |
+
(0): SiLU()
|
| 53 |
+
(1): Linear(in_features=1152, out_features=2304, bias=True)
|
| 54 |
+
)
|
| 55 |
+
)
|
| 56 |
+
)
|
exp_hcai/latent_diffusion/imagenet_256/dc_ae_f32c32_in_1.0_256px/dit_xl_1/SiTSampler_ODE_heun2_30/nvfp4_e2m1_plus_cs/slurm.sh
ADDED
|
@@ -0,0 +1,22 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
#!/bin/bash
|
| 2 |
+
#SBATCH -A nvr_elm_llm #account
|
| 3 |
+
#SBATCH -p grizzly,polar,polar3,polar4 #partition
|
| 4 |
+
#SBATCH -t 04:00:00 #wall time limit, hr:min:sec
|
| 5 |
+
#SBATCH -N 1 #number of nodes
|
| 6 |
+
#SBATCH -J train_diffusion_dit #job name
|
| 7 |
+
#SBATCH --array=1-40%1
|
| 8 |
+
#SBATCH --output=exp_hcai/latent_diffusion/imagenet_256/dc_ae_f32c32_in_1.0_256px/dit_xl_1/SiTSampler_ODE_heun2_30/nvfp4_e2m1_plus_cs/slurm_out/%A_%a.out
|
| 9 |
+
#SBATCH --gpus-per-node 8
|
| 10 |
+
#SBATCH --exclusive
|
| 11 |
+
|
| 12 |
+
export LOGLEVEL=INFO
|
| 13 |
+
export PATH="/home/hcai/workspace/anaconda3/envs/efficientvit/bin:$PATH"
|
| 14 |
+
|
| 15 |
+
cd /lustre/fs12/portfolios/nvr/users/hcai/workspace/code/fp8-dit
|
| 16 |
+
|
| 17 |
+
read -r -d '' cmd <<EOF
|
| 18 |
+
torchrun --nnodes=1 --nproc_per_node=8 \
|
| 19 |
+
-m efficientvit.diffusioncore.trainer yaml=exp_hcai/latent_diffusion/imagenet_256/dc_ae_f32c32_in_1.0_256px/dit_xl_1/SiTSampler_ODE_heun2_30/nvfp4_e2m1_plus_cs/config.yaml
|
| 20 |
+
EOF
|
| 21 |
+
|
| 22 |
+
srun bash -c "${cmd}"
|
exp_hcai/latent_diffusion/imagenet_256/dc_ae_f32c32_in_1.0_256px/dit_xl_1/SiTSampler_ODE_heun2_30/nvfp4_e2m1_plus_cs/step_10000.pt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:d5c5bb545904a239de8f521663812ac7251083e529da23038eea8f66f1d060e4
|
| 3 |
+
size 10798882714
|
exp_hcai/latent_diffusion/imagenet_256/dc_ae_f32c32_in_1.0_256px/dit_xl_1/SiTSampler_ODE_heun2_30/nvfp4_e2m1_plus_cs/step_100000.pt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:acb05c7f16b847ab2936468f9fc1f454d9d06088a085a65755e3d40d5f2ad141
|
| 3 |
+
size 10798884178
|
exp_hcai/latent_diffusion/imagenet_256/dc_ae_f32c32_in_1.0_256px/dit_xl_1/SiTSampler_ODE_heun2_30/nvfp4_e2m1_plus_cs/step_110000.pt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:d23b86d2dd89509f5d8f3bda36e2bd6a853fa1fb4dd59d3a72f55331567a410d
|
| 3 |
+
size 10798884178
|
exp_hcai/latent_diffusion/imagenet_256/dc_ae_f32c32_in_1.0_256px/dit_xl_1/SiTSampler_ODE_heun2_30/nvfp4_e2m1_plus_cs/step_120000.pt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:433a1058c76d1b4190adc95ef74a80fcc3c3d5cabcea766780ecb2129bce0eaf
|
| 3 |
+
size 10798884178
|
exp_hcai/latent_diffusion/imagenet_256/dc_ae_f32c32_in_1.0_256px/dit_xl_1/SiTSampler_ODE_heun2_30/nvfp4_e2m1_plus_cs/step_130000.pt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:01fc27c9a4a09993de336940f00835f5f968f10ce8c80a442cf97a35d24fccc4
|
| 3 |
+
size 10798884178
|
exp_hcai/latent_diffusion/imagenet_256/dc_ae_f32c32_in_1.0_256px/dit_xl_1/SiTSampler_ODE_heun2_30/nvfp4_e2m1_plus_cs/step_140000.pt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:f5c9c1a571e7d06bb7b44cbb228adc63729b64c0e52ce9fe422074adf727c2a6
|
| 3 |
+
size 10798884178
|
exp_hcai/latent_diffusion/imagenet_256/dc_ae_f32c32_in_1.0_256px/dit_xl_1/SiTSampler_ODE_heun2_30/nvfp4_e2m1_plus_cs/step_150000.pt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:906ebdbd8001cc1d936ddc96e7aa5d8728f05430fef70bd1aa8afbc3c37a4107
|
| 3 |
+
size 10798884178
|
exp_hcai/latent_diffusion/imagenet_256/dc_ae_f32c32_in_1.0_256px/dit_xl_1/SiTSampler_ODE_heun2_30/nvfp4_e2m1_plus_cs/step_160000.pt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:757b030bd3a01e91d44c06e2f74a02948b0cbe119db78abece769cda01e238c0
|
| 3 |
+
size 10798884178
|
exp_hcai/latent_diffusion/imagenet_256/dc_ae_f32c32_in_1.0_256px/dit_xl_1/SiTSampler_ODE_heun2_30/nvfp4_e2m1_plus_cs/step_170000.pt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:1ab243dbc84422cbf0e1e60ef00355bc36b4d4c66ddf7183ef5669a0ebfda31f
|
| 3 |
+
size 10798884178
|
exp_hcai/latent_diffusion/imagenet_256/dc_ae_f32c32_in_1.0_256px/dit_xl_1/SiTSampler_ODE_heun2_30/nvfp4_e2m1_plus_cs/step_180000.pt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:7b7457b65143646607cc416b1100115a2ad0c3c4ae51363782d3abb3c8a2be7a
|
| 3 |
+
size 10798884178
|
exp_hcai/latent_diffusion/imagenet_256/dc_ae_f32c32_in_1.0_256px/dit_xl_1/SiTSampler_ODE_heun2_30/nvfp4_e2m1_plus_cs/step_190000.pt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:def7cb742808cc31d7ab449b93906860e98e0809bc31839ed47bbad686e11d90
|
| 3 |
+
size 10798884178
|
exp_hcai/latent_diffusion/imagenet_256/dc_ae_f32c32_in_1.0_256px/dit_xl_1/SiTSampler_ODE_heun2_30/nvfp4_e2m1_plus_cs/step_20000.pt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:6bf02564af0398cf2c9c4cc472dc7f7330dece479b16b192b5d1a709b860d3d6
|
| 3 |
+
size 10798882714
|
exp_hcai/latent_diffusion/imagenet_256/dc_ae_f32c32_in_1.0_256px/dit_xl_1/SiTSampler_ODE_heun2_30/nvfp4_e2m1_plus_cs/step_200000.pt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:37e362264c1577d556ecf9a3dcfbeab5058ee5f2f0100e4357595197fa5028f9
|
| 3 |
+
size 10798884178
|
exp_hcai/latent_diffusion/imagenet_256/dc_ae_f32c32_in_1.0_256px/dit_xl_1/SiTSampler_ODE_heun2_30/nvfp4_e2m1_plus_cs/step_210000.pt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:d09e7a11e741b66ae60bb90d01e234acc1ac9302ab3da2932bc1eda8ed336721
|
| 3 |
+
size 10798884178
|
exp_hcai/latent_diffusion/imagenet_256/dc_ae_f32c32_in_1.0_256px/dit_xl_1/SiTSampler_ODE_heun2_30/nvfp4_e2m1_plus_cs/step_220000.pt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:0c7b7022e75604a64cc0f5479fda031a53ab0a7d572667831fce80bb76f16fbb
|
| 3 |
+
size 10798884178
|
exp_hcai/latent_diffusion/imagenet_256/dc_ae_f32c32_in_1.0_256px/dit_xl_1/SiTSampler_ODE_heun2_30/nvfp4_e2m1_plus_cs/step_230000.pt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:add18ed428ec88d55e50d8f7499c6918841d1c10145aa62c6c5b23e1bad24272
|
| 3 |
+
size 10798884178
|
exp_hcai/latent_diffusion/imagenet_256/dc_ae_f32c32_in_1.0_256px/dit_xl_1/SiTSampler_ODE_heun2_30/nvfp4_e2m1_plus_cs/step_240000.pt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:7477a0a93284aa65443d688bf0f0c81ee38938912b0d376821745018de0daa95
|
| 3 |
+
size 10798884178
|
exp_hcai/latent_diffusion/imagenet_256/dc_ae_f32c32_in_1.0_256px/dit_xl_1/SiTSampler_ODE_heun2_30/nvfp4_e2m1_plus_cs/step_250000.pt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:535a80cfd49cf5fd1989663cb56a376c1285206e1e2f640688f1fe4a5161fb0b
|
| 3 |
+
size 10798884178
|
exp_hcai/latent_diffusion/imagenet_256/dc_ae_f32c32_in_1.0_256px/dit_xl_1/SiTSampler_ODE_heun2_30/nvfp4_e2m1_plus_cs/step_260000.pt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:5274a705a81546ca85e6438521ad9730709d094c2bf8f6c9e5f0bddcd39da76b
|
| 3 |
+
size 10798884178
|
exp_hcai/latent_diffusion/imagenet_256/dc_ae_f32c32_in_1.0_256px/dit_xl_1/SiTSampler_ODE_heun2_30/nvfp4_e2m1_plus_cs/step_270000.pt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:f088038b7fb222eb7e84c6f56c760593f6dcdaa623879f48c2e831b5650528ce
|
| 3 |
+
size 10798884178
|
exp_hcai/latent_diffusion/imagenet_256/dc_ae_f32c32_in_1.0_256px/dit_xl_1/SiTSampler_ODE_heun2_30/nvfp4_e2m1_plus_cs/step_280000.pt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:8e0abeabd6df1d609033faa56c00cb68a90fcfaccbb481c057c1a3ae329a2365
|
| 3 |
+
size 10798884178
|
exp_hcai/latent_diffusion/imagenet_256/dc_ae_f32c32_in_1.0_256px/dit_xl_1/SiTSampler_ODE_heun2_30/nvfp4_e2m1_plus_cs/step_290000.pt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:66041402fd5a1f6b31a7e348a93175f02f0a6f352a7144b65c720e2531d4022a
|
| 3 |
+
size 10798884178
|
exp_hcai/latent_diffusion/imagenet_256/dc_ae_f32c32_in_1.0_256px/dit_xl_1/SiTSampler_ODE_heun2_30/nvfp4_e2m1_plus_cs/step_30000.pt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:6f183ce76386cbe85a51b2697cf9a8acdbf66125483c56f01ee05e2d478d6793
|
| 3 |
+
size 10798882714
|
exp_hcai/latent_diffusion/imagenet_256/dc_ae_f32c32_in_1.0_256px/dit_xl_1/SiTSampler_ODE_heun2_30/nvfp4_e2m1_plus_cs/step_300000.pt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:fdabf13c5caeeabbc8f69c8c72f20174eded6fc3f156efddf8bfd7f8f26f5db2
|
| 3 |
+
size 10798884178
|
exp_hcai/latent_diffusion/imagenet_256/dc_ae_f32c32_in_1.0_256px/dit_xl_1/SiTSampler_ODE_heun2_30/nvfp4_e2m1_plus_cs/step_310000.pt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:e1bd03471b5a0944df91d3372f022dd0ae50c3cb1cb6628a14b5c8491682b1d5
|
| 3 |
+
size 10798884178
|
exp_hcai/latent_diffusion/imagenet_256/dc_ae_f32c32_in_1.0_256px/dit_xl_1/SiTSampler_ODE_heun2_30/nvfp4_e2m1_plus_cs/step_320000.pt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:d55dae96f32fe096e6a7216e38459f9fb69108f0f638b7ecdb78714e14922e26
|
| 3 |
+
size 10798884178
|
exp_hcai/latent_diffusion/imagenet_256/dc_ae_f32c32_in_1.0_256px/dit_xl_1/SiTSampler_ODE_heun2_30/nvfp4_e2m1_plus_cs/step_40000.pt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:1b6b6587df87505136f72bb381730d842e38eb8e1b7d72ea7be5db01ddd43f16
|
| 3 |
+
size 10798882714
|
exp_hcai/latent_diffusion/imagenet_256/dc_ae_f32c32_in_1.0_256px/dit_xl_1/SiTSampler_ODE_heun2_30/nvfp4_e2m1_plus_cs/step_50000.pt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:f4119fce107052e095fde8fab41d3abd787eeda6a6161c837edeaa2d82a5f8ce
|
| 3 |
+
size 10798882714
|
exp_hcai/latent_diffusion/imagenet_256/dc_ae_f32c32_in_1.0_256px/dit_xl_1/SiTSampler_ODE_heun2_30/nvfp4_e2m1_plus_cs/step_60000.pt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:04e29cd1127aad857ac04f39c310ab731b72bd0dcb5c20b68d1c42b3e705aecd
|
| 3 |
+
size 10798882714
|
exp_hcai/latent_diffusion/imagenet_256/dc_ae_f32c32_in_1.0_256px/dit_xl_1/SiTSampler_ODE_heun2_30/nvfp4_e2m1_plus_cs/step_70000.pt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:6ab32060789ef30f00e65d7e6c4fd131204e020af887d3dd93af2189a04cdfea
|
| 3 |
+
size 10798882714
|
exp_hcai/latent_diffusion/imagenet_256/dc_ae_f32c32_in_1.0_256px/dit_xl_1/SiTSampler_ODE_heun2_30/nvfp4_e2m1_plus_cs/step_80000.pt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:f024a85fb8cd370d5146fddad5515f7e0233effbb6101b8fa17612fb5d9c7054
|
| 3 |
+
size 10798882714
|
exp_hcai/latent_diffusion/imagenet_256/dc_ae_f32c32_in_1.0_256px/dit_xl_1/SiTSampler_ODE_heun2_30/nvfp4_e2m1_plus_cs/step_90000.pt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:fd060761647e0ca085781bb91ab2ff6166438991cde333fba957f713e6ffd34f
|
| 3 |
+
size 10798882714
|