Upload 22 files
Browse files- .gitattributes +5 -0
- ddpm_variance_22/checkpoint_epoch_19/config.json +74 -0
- ddpm_variance_22/checkpoint_epoch_19/diffusion_pytorch_model.safetensors +3 -0
- ddpm_variance_22/checkpoint_epoch_19/label_proj.pt +3 -0
- ddpm_variance_22/checkpoint_epoch_29/config.json +74 -0
- ddpm_variance_22/checkpoint_epoch_29/diffusion_pytorch_model.safetensors +3 -0
- ddpm_variance_22/checkpoint_epoch_29/label_proj.pt +3 -0
- ddpm_variance_22/checkpoint_epoch_39/config.json +74 -0
- ddpm_variance_22/checkpoint_epoch_39/diffusion_pytorch_model.safetensors +3 -0
- ddpm_variance_22/checkpoint_epoch_39/label_proj.pt +3 -0
- ddpm_variance_22/checkpoint_epoch_49/config.json +74 -0
- ddpm_variance_22/checkpoint_epoch_49/diffusion_pytorch_model.safetensors +3 -0
- ddpm_variance_22/checkpoint_epoch_49/label_proj.pt +3 -0
- ddpm_variance_22/checkpoint_epoch_9/config.json +74 -0
- ddpm_variance_22/checkpoint_epoch_9/diffusion_pytorch_model.safetensors +3 -0
- ddpm_variance_22/checkpoint_epoch_9/label_proj.pt +3 -0
- ddpm_variance_22/loss_curve.png +0 -0
- ddpm_variance_22/sample_epoch_19.png +3 -0
- ddpm_variance_22/sample_epoch_29.png +3 -0
- ddpm_variance_22/sample_epoch_39.png +3 -0
- ddpm_variance_22/sample_epoch_49.png +3 -0
- ddpm_variance_22/sample_epoch_9.png +3 -0
- ddpm_variance_22/train_log.txt +50 -0
.gitattributes
CHANGED
|
@@ -41,3 +41,8 @@ ddpm-udder-results6/sample_epoch_029.png filter=lfs diff=lfs merge=lfs -text
|
|
| 41 |
ddpm-udder-results6/sample_epoch_059.png filter=lfs diff=lfs merge=lfs -text
|
| 42 |
ddpm-udder-results6/sample_epoch_089.png filter=lfs diff=lfs merge=lfs -text
|
| 43 |
ddpm-udder-results6/sample_epoch_119.png filter=lfs diff=lfs merge=lfs -text
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 41 |
ddpm-udder-results6/sample_epoch_059.png filter=lfs diff=lfs merge=lfs -text
|
| 42 |
ddpm-udder-results6/sample_epoch_089.png filter=lfs diff=lfs merge=lfs -text
|
| 43 |
ddpm-udder-results6/sample_epoch_119.png filter=lfs diff=lfs merge=lfs -text
|
| 44 |
+
ddpm_variance_22/sample_epoch_19.png filter=lfs diff=lfs merge=lfs -text
|
| 45 |
+
ddpm_variance_22/sample_epoch_29.png filter=lfs diff=lfs merge=lfs -text
|
| 46 |
+
ddpm_variance_22/sample_epoch_39.png filter=lfs diff=lfs merge=lfs -text
|
| 47 |
+
ddpm_variance_22/sample_epoch_49.png filter=lfs diff=lfs merge=lfs -text
|
| 48 |
+
ddpm_variance_22/sample_epoch_9.png filter=lfs diff=lfs merge=lfs -text
|
ddpm_variance_22/checkpoint_epoch_19/config.json
ADDED
|
@@ -0,0 +1,74 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
{
|
| 2 |
+
"_class_name": "UNet2DConditionModel",
|
| 3 |
+
"_diffusers_version": "0.36.0",
|
| 4 |
+
"_name_or_path": "ddpm_variance_21\\checkpoint_epoch_49",
|
| 5 |
+
"act_fn": "silu",
|
| 6 |
+
"addition_embed_type": null,
|
| 7 |
+
"addition_embed_type_num_heads": 64,
|
| 8 |
+
"addition_time_embed_dim": null,
|
| 9 |
+
"attention_head_dim": 32,
|
| 10 |
+
"attention_type": "default",
|
| 11 |
+
"block_out_channels": [
|
| 12 |
+
128,
|
| 13 |
+
128,
|
| 14 |
+
256,
|
| 15 |
+
256,
|
| 16 |
+
512,
|
| 17 |
+
512
|
| 18 |
+
],
|
| 19 |
+
"center_input_sample": false,
|
| 20 |
+
"class_embed_type": null,
|
| 21 |
+
"class_embeddings_concat": false,
|
| 22 |
+
"conv_in_kernel": 3,
|
| 23 |
+
"conv_out_kernel": 3,
|
| 24 |
+
"cross_attention_dim": 256,
|
| 25 |
+
"cross_attention_norm": null,
|
| 26 |
+
"down_block_types": [
|
| 27 |
+
"DownBlock2D",
|
| 28 |
+
"DownBlock2D",
|
| 29 |
+
"CrossAttnDownBlock2D",
|
| 30 |
+
"CrossAttnDownBlock2D",
|
| 31 |
+
"DownBlock2D",
|
| 32 |
+
"DownBlock2D"
|
| 33 |
+
],
|
| 34 |
+
"downsample_padding": 1,
|
| 35 |
+
"dropout": 0.2,
|
| 36 |
+
"dual_cross_attention": false,
|
| 37 |
+
"encoder_hid_dim": null,
|
| 38 |
+
"encoder_hid_dim_type": null,
|
| 39 |
+
"flip_sin_to_cos": true,
|
| 40 |
+
"freq_shift": 0,
|
| 41 |
+
"in_channels": 3,
|
| 42 |
+
"layers_per_block": 2,
|
| 43 |
+
"mid_block_only_cross_attention": null,
|
| 44 |
+
"mid_block_scale_factor": 1,
|
| 45 |
+
"mid_block_type": "UNetMidBlock2DCrossAttn",
|
| 46 |
+
"norm_eps": 1e-05,
|
| 47 |
+
"norm_num_groups": 32,
|
| 48 |
+
"num_attention_heads": null,
|
| 49 |
+
"num_class_embeds": null,
|
| 50 |
+
"only_cross_attention": false,
|
| 51 |
+
"out_channels": 6,
|
| 52 |
+
"projection_class_embeddings_input_dim": null,
|
| 53 |
+
"resnet_out_scale_factor": 1.0,
|
| 54 |
+
"resnet_skip_time_act": false,
|
| 55 |
+
"resnet_time_scale_shift": "default",
|
| 56 |
+
"reverse_transformer_layers_per_block": null,
|
| 57 |
+
"sample_size": 256,
|
| 58 |
+
"time_cond_proj_dim": null,
|
| 59 |
+
"time_embedding_act_fn": null,
|
| 60 |
+
"time_embedding_dim": null,
|
| 61 |
+
"time_embedding_type": "positional",
|
| 62 |
+
"timestep_post_act": null,
|
| 63 |
+
"transformer_layers_per_block": 1,
|
| 64 |
+
"up_block_types": [
|
| 65 |
+
"UpBlock2D",
|
| 66 |
+
"UpBlock2D",
|
| 67 |
+
"CrossAttnUpBlock2D",
|
| 68 |
+
"CrossAttnUpBlock2D",
|
| 69 |
+
"UpBlock2D",
|
| 70 |
+
"UpBlock2D"
|
| 71 |
+
],
|
| 72 |
+
"upcast_attention": false,
|
| 73 |
+
"use_linear_projection": false
|
| 74 |
+
}
|
ddpm_variance_22/checkpoint_epoch_19/diffusion_pytorch_model.safetensors
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:154ef01fd951d54753d0f4e79209f0fa39c338d23ee8999dd02653cb6a2dc35c
|
| 3 |
+
size 509495352
|
ddpm_variance_22/checkpoint_epoch_19/label_proj.pt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:8c5a19a487b8e046f574b44b5046595f59b72ccd5eafd9f01d4e758bbfadcac7
|
| 3 |
+
size 4745337
|
ddpm_variance_22/checkpoint_epoch_29/config.json
ADDED
|
@@ -0,0 +1,74 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
{
|
| 2 |
+
"_class_name": "UNet2DConditionModel",
|
| 3 |
+
"_diffusers_version": "0.36.0",
|
| 4 |
+
"_name_or_path": "ddpm_variance_21\\checkpoint_epoch_49",
|
| 5 |
+
"act_fn": "silu",
|
| 6 |
+
"addition_embed_type": null,
|
| 7 |
+
"addition_embed_type_num_heads": 64,
|
| 8 |
+
"addition_time_embed_dim": null,
|
| 9 |
+
"attention_head_dim": 32,
|
| 10 |
+
"attention_type": "default",
|
| 11 |
+
"block_out_channels": [
|
| 12 |
+
128,
|
| 13 |
+
128,
|
| 14 |
+
256,
|
| 15 |
+
256,
|
| 16 |
+
512,
|
| 17 |
+
512
|
| 18 |
+
],
|
| 19 |
+
"center_input_sample": false,
|
| 20 |
+
"class_embed_type": null,
|
| 21 |
+
"class_embeddings_concat": false,
|
| 22 |
+
"conv_in_kernel": 3,
|
| 23 |
+
"conv_out_kernel": 3,
|
| 24 |
+
"cross_attention_dim": 256,
|
| 25 |
+
"cross_attention_norm": null,
|
| 26 |
+
"down_block_types": [
|
| 27 |
+
"DownBlock2D",
|
| 28 |
+
"DownBlock2D",
|
| 29 |
+
"CrossAttnDownBlock2D",
|
| 30 |
+
"CrossAttnDownBlock2D",
|
| 31 |
+
"DownBlock2D",
|
| 32 |
+
"DownBlock2D"
|
| 33 |
+
],
|
| 34 |
+
"downsample_padding": 1,
|
| 35 |
+
"dropout": 0.2,
|
| 36 |
+
"dual_cross_attention": false,
|
| 37 |
+
"encoder_hid_dim": null,
|
| 38 |
+
"encoder_hid_dim_type": null,
|
| 39 |
+
"flip_sin_to_cos": true,
|
| 40 |
+
"freq_shift": 0,
|
| 41 |
+
"in_channels": 3,
|
| 42 |
+
"layers_per_block": 2,
|
| 43 |
+
"mid_block_only_cross_attention": null,
|
| 44 |
+
"mid_block_scale_factor": 1,
|
| 45 |
+
"mid_block_type": "UNetMidBlock2DCrossAttn",
|
| 46 |
+
"norm_eps": 1e-05,
|
| 47 |
+
"norm_num_groups": 32,
|
| 48 |
+
"num_attention_heads": null,
|
| 49 |
+
"num_class_embeds": null,
|
| 50 |
+
"only_cross_attention": false,
|
| 51 |
+
"out_channels": 6,
|
| 52 |
+
"projection_class_embeddings_input_dim": null,
|
| 53 |
+
"resnet_out_scale_factor": 1.0,
|
| 54 |
+
"resnet_skip_time_act": false,
|
| 55 |
+
"resnet_time_scale_shift": "default",
|
| 56 |
+
"reverse_transformer_layers_per_block": null,
|
| 57 |
+
"sample_size": 256,
|
| 58 |
+
"time_cond_proj_dim": null,
|
| 59 |
+
"time_embedding_act_fn": null,
|
| 60 |
+
"time_embedding_dim": null,
|
| 61 |
+
"time_embedding_type": "positional",
|
| 62 |
+
"timestep_post_act": null,
|
| 63 |
+
"transformer_layers_per_block": 1,
|
| 64 |
+
"up_block_types": [
|
| 65 |
+
"UpBlock2D",
|
| 66 |
+
"UpBlock2D",
|
| 67 |
+
"CrossAttnUpBlock2D",
|
| 68 |
+
"CrossAttnUpBlock2D",
|
| 69 |
+
"UpBlock2D",
|
| 70 |
+
"UpBlock2D"
|
| 71 |
+
],
|
| 72 |
+
"upcast_attention": false,
|
| 73 |
+
"use_linear_projection": false
|
| 74 |
+
}
|
ddpm_variance_22/checkpoint_epoch_29/diffusion_pytorch_model.safetensors
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:b381d506a9802e10d1bcb48e81bf78b9b3908068f431fb6870288d73f936133d
|
| 3 |
+
size 509495352
|
ddpm_variance_22/checkpoint_epoch_29/label_proj.pt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:6e32b240bf9d24b4f7d4cef0218224944ce32d8632076fcd8a36deaab3c24568
|
| 3 |
+
size 4745337
|
ddpm_variance_22/checkpoint_epoch_39/config.json
ADDED
|
@@ -0,0 +1,74 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
{
|
| 2 |
+
"_class_name": "UNet2DConditionModel",
|
| 3 |
+
"_diffusers_version": "0.36.0",
|
| 4 |
+
"_name_or_path": "ddpm_variance_21\\checkpoint_epoch_49",
|
| 5 |
+
"act_fn": "silu",
|
| 6 |
+
"addition_embed_type": null,
|
| 7 |
+
"addition_embed_type_num_heads": 64,
|
| 8 |
+
"addition_time_embed_dim": null,
|
| 9 |
+
"attention_head_dim": 32,
|
| 10 |
+
"attention_type": "default",
|
| 11 |
+
"block_out_channels": [
|
| 12 |
+
128,
|
| 13 |
+
128,
|
| 14 |
+
256,
|
| 15 |
+
256,
|
| 16 |
+
512,
|
| 17 |
+
512
|
| 18 |
+
],
|
| 19 |
+
"center_input_sample": false,
|
| 20 |
+
"class_embed_type": null,
|
| 21 |
+
"class_embeddings_concat": false,
|
| 22 |
+
"conv_in_kernel": 3,
|
| 23 |
+
"conv_out_kernel": 3,
|
| 24 |
+
"cross_attention_dim": 256,
|
| 25 |
+
"cross_attention_norm": null,
|
| 26 |
+
"down_block_types": [
|
| 27 |
+
"DownBlock2D",
|
| 28 |
+
"DownBlock2D",
|
| 29 |
+
"CrossAttnDownBlock2D",
|
| 30 |
+
"CrossAttnDownBlock2D",
|
| 31 |
+
"DownBlock2D",
|
| 32 |
+
"DownBlock2D"
|
| 33 |
+
],
|
| 34 |
+
"downsample_padding": 1,
|
| 35 |
+
"dropout": 0.2,
|
| 36 |
+
"dual_cross_attention": false,
|
| 37 |
+
"encoder_hid_dim": null,
|
| 38 |
+
"encoder_hid_dim_type": null,
|
| 39 |
+
"flip_sin_to_cos": true,
|
| 40 |
+
"freq_shift": 0,
|
| 41 |
+
"in_channels": 3,
|
| 42 |
+
"layers_per_block": 2,
|
| 43 |
+
"mid_block_only_cross_attention": null,
|
| 44 |
+
"mid_block_scale_factor": 1,
|
| 45 |
+
"mid_block_type": "UNetMidBlock2DCrossAttn",
|
| 46 |
+
"norm_eps": 1e-05,
|
| 47 |
+
"norm_num_groups": 32,
|
| 48 |
+
"num_attention_heads": null,
|
| 49 |
+
"num_class_embeds": null,
|
| 50 |
+
"only_cross_attention": false,
|
| 51 |
+
"out_channels": 6,
|
| 52 |
+
"projection_class_embeddings_input_dim": null,
|
| 53 |
+
"resnet_out_scale_factor": 1.0,
|
| 54 |
+
"resnet_skip_time_act": false,
|
| 55 |
+
"resnet_time_scale_shift": "default",
|
| 56 |
+
"reverse_transformer_layers_per_block": null,
|
| 57 |
+
"sample_size": 256,
|
| 58 |
+
"time_cond_proj_dim": null,
|
| 59 |
+
"time_embedding_act_fn": null,
|
| 60 |
+
"time_embedding_dim": null,
|
| 61 |
+
"time_embedding_type": "positional",
|
| 62 |
+
"timestep_post_act": null,
|
| 63 |
+
"transformer_layers_per_block": 1,
|
| 64 |
+
"up_block_types": [
|
| 65 |
+
"UpBlock2D",
|
| 66 |
+
"UpBlock2D",
|
| 67 |
+
"CrossAttnUpBlock2D",
|
| 68 |
+
"CrossAttnUpBlock2D",
|
| 69 |
+
"UpBlock2D",
|
| 70 |
+
"UpBlock2D"
|
| 71 |
+
],
|
| 72 |
+
"upcast_attention": false,
|
| 73 |
+
"use_linear_projection": false
|
| 74 |
+
}
|
ddpm_variance_22/checkpoint_epoch_39/diffusion_pytorch_model.safetensors
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:253dbfd0baf1a492e3d2955e2ef4da8cf150de41d079cf623dd73c2762f3a550
|
| 3 |
+
size 509495352
|
ddpm_variance_22/checkpoint_epoch_39/label_proj.pt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:c3d426fff2277ba0db3024140aedd99be838fea6f800b04c273dc9f355f5a837
|
| 3 |
+
size 4745337
|
ddpm_variance_22/checkpoint_epoch_49/config.json
ADDED
|
@@ -0,0 +1,74 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
{
|
| 2 |
+
"_class_name": "UNet2DConditionModel",
|
| 3 |
+
"_diffusers_version": "0.36.0",
|
| 4 |
+
"_name_or_path": "ddpm_variance_21\\checkpoint_epoch_49",
|
| 5 |
+
"act_fn": "silu",
|
| 6 |
+
"addition_embed_type": null,
|
| 7 |
+
"addition_embed_type_num_heads": 64,
|
| 8 |
+
"addition_time_embed_dim": null,
|
| 9 |
+
"attention_head_dim": 32,
|
| 10 |
+
"attention_type": "default",
|
| 11 |
+
"block_out_channels": [
|
| 12 |
+
128,
|
| 13 |
+
128,
|
| 14 |
+
256,
|
| 15 |
+
256,
|
| 16 |
+
512,
|
| 17 |
+
512
|
| 18 |
+
],
|
| 19 |
+
"center_input_sample": false,
|
| 20 |
+
"class_embed_type": null,
|
| 21 |
+
"class_embeddings_concat": false,
|
| 22 |
+
"conv_in_kernel": 3,
|
| 23 |
+
"conv_out_kernel": 3,
|
| 24 |
+
"cross_attention_dim": 256,
|
| 25 |
+
"cross_attention_norm": null,
|
| 26 |
+
"down_block_types": [
|
| 27 |
+
"DownBlock2D",
|
| 28 |
+
"DownBlock2D",
|
| 29 |
+
"CrossAttnDownBlock2D",
|
| 30 |
+
"CrossAttnDownBlock2D",
|
| 31 |
+
"DownBlock2D",
|
| 32 |
+
"DownBlock2D"
|
| 33 |
+
],
|
| 34 |
+
"downsample_padding": 1,
|
| 35 |
+
"dropout": 0.2,
|
| 36 |
+
"dual_cross_attention": false,
|
| 37 |
+
"encoder_hid_dim": null,
|
| 38 |
+
"encoder_hid_dim_type": null,
|
| 39 |
+
"flip_sin_to_cos": true,
|
| 40 |
+
"freq_shift": 0,
|
| 41 |
+
"in_channels": 3,
|
| 42 |
+
"layers_per_block": 2,
|
| 43 |
+
"mid_block_only_cross_attention": null,
|
| 44 |
+
"mid_block_scale_factor": 1,
|
| 45 |
+
"mid_block_type": "UNetMidBlock2DCrossAttn",
|
| 46 |
+
"norm_eps": 1e-05,
|
| 47 |
+
"norm_num_groups": 32,
|
| 48 |
+
"num_attention_heads": null,
|
| 49 |
+
"num_class_embeds": null,
|
| 50 |
+
"only_cross_attention": false,
|
| 51 |
+
"out_channels": 6,
|
| 52 |
+
"projection_class_embeddings_input_dim": null,
|
| 53 |
+
"resnet_out_scale_factor": 1.0,
|
| 54 |
+
"resnet_skip_time_act": false,
|
| 55 |
+
"resnet_time_scale_shift": "default",
|
| 56 |
+
"reverse_transformer_layers_per_block": null,
|
| 57 |
+
"sample_size": 256,
|
| 58 |
+
"time_cond_proj_dim": null,
|
| 59 |
+
"time_embedding_act_fn": null,
|
| 60 |
+
"time_embedding_dim": null,
|
| 61 |
+
"time_embedding_type": "positional",
|
| 62 |
+
"timestep_post_act": null,
|
| 63 |
+
"transformer_layers_per_block": 1,
|
| 64 |
+
"up_block_types": [
|
| 65 |
+
"UpBlock2D",
|
| 66 |
+
"UpBlock2D",
|
| 67 |
+
"CrossAttnUpBlock2D",
|
| 68 |
+
"CrossAttnUpBlock2D",
|
| 69 |
+
"UpBlock2D",
|
| 70 |
+
"UpBlock2D"
|
| 71 |
+
],
|
| 72 |
+
"upcast_attention": false,
|
| 73 |
+
"use_linear_projection": false
|
| 74 |
+
}
|
ddpm_variance_22/checkpoint_epoch_49/diffusion_pytorch_model.safetensors
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:43f0007ba6f69f479f768f2e39cebb2faf73a7343616b8b658c16fc660d582ec
|
| 3 |
+
size 509495352
|
ddpm_variance_22/checkpoint_epoch_49/label_proj.pt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:35ee5bdd6f6cf8b2a6f6c1813272af47b2cd0069f6f9a26b7a205c6d6241da00
|
| 3 |
+
size 4745337
|
ddpm_variance_22/checkpoint_epoch_9/config.json
ADDED
|
@@ -0,0 +1,74 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
{
|
| 2 |
+
"_class_name": "UNet2DConditionModel",
|
| 3 |
+
"_diffusers_version": "0.36.0",
|
| 4 |
+
"_name_or_path": "ddpm_variance_21\\checkpoint_epoch_49",
|
| 5 |
+
"act_fn": "silu",
|
| 6 |
+
"addition_embed_type": null,
|
| 7 |
+
"addition_embed_type_num_heads": 64,
|
| 8 |
+
"addition_time_embed_dim": null,
|
| 9 |
+
"attention_head_dim": 32,
|
| 10 |
+
"attention_type": "default",
|
| 11 |
+
"block_out_channels": [
|
| 12 |
+
128,
|
| 13 |
+
128,
|
| 14 |
+
256,
|
| 15 |
+
256,
|
| 16 |
+
512,
|
| 17 |
+
512
|
| 18 |
+
],
|
| 19 |
+
"center_input_sample": false,
|
| 20 |
+
"class_embed_type": null,
|
| 21 |
+
"class_embeddings_concat": false,
|
| 22 |
+
"conv_in_kernel": 3,
|
| 23 |
+
"conv_out_kernel": 3,
|
| 24 |
+
"cross_attention_dim": 256,
|
| 25 |
+
"cross_attention_norm": null,
|
| 26 |
+
"down_block_types": [
|
| 27 |
+
"DownBlock2D",
|
| 28 |
+
"DownBlock2D",
|
| 29 |
+
"CrossAttnDownBlock2D",
|
| 30 |
+
"CrossAttnDownBlock2D",
|
| 31 |
+
"DownBlock2D",
|
| 32 |
+
"DownBlock2D"
|
| 33 |
+
],
|
| 34 |
+
"downsample_padding": 1,
|
| 35 |
+
"dropout": 0.2,
|
| 36 |
+
"dual_cross_attention": false,
|
| 37 |
+
"encoder_hid_dim": null,
|
| 38 |
+
"encoder_hid_dim_type": null,
|
| 39 |
+
"flip_sin_to_cos": true,
|
| 40 |
+
"freq_shift": 0,
|
| 41 |
+
"in_channels": 3,
|
| 42 |
+
"layers_per_block": 2,
|
| 43 |
+
"mid_block_only_cross_attention": null,
|
| 44 |
+
"mid_block_scale_factor": 1,
|
| 45 |
+
"mid_block_type": "UNetMidBlock2DCrossAttn",
|
| 46 |
+
"norm_eps": 1e-05,
|
| 47 |
+
"norm_num_groups": 32,
|
| 48 |
+
"num_attention_heads": null,
|
| 49 |
+
"num_class_embeds": null,
|
| 50 |
+
"only_cross_attention": false,
|
| 51 |
+
"out_channels": 6,
|
| 52 |
+
"projection_class_embeddings_input_dim": null,
|
| 53 |
+
"resnet_out_scale_factor": 1.0,
|
| 54 |
+
"resnet_skip_time_act": false,
|
| 55 |
+
"resnet_time_scale_shift": "default",
|
| 56 |
+
"reverse_transformer_layers_per_block": null,
|
| 57 |
+
"sample_size": 256,
|
| 58 |
+
"time_cond_proj_dim": null,
|
| 59 |
+
"time_embedding_act_fn": null,
|
| 60 |
+
"time_embedding_dim": null,
|
| 61 |
+
"time_embedding_type": "positional",
|
| 62 |
+
"timestep_post_act": null,
|
| 63 |
+
"transformer_layers_per_block": 1,
|
| 64 |
+
"up_block_types": [
|
| 65 |
+
"UpBlock2D",
|
| 66 |
+
"UpBlock2D",
|
| 67 |
+
"CrossAttnUpBlock2D",
|
| 68 |
+
"CrossAttnUpBlock2D",
|
| 69 |
+
"UpBlock2D",
|
| 70 |
+
"UpBlock2D"
|
| 71 |
+
],
|
| 72 |
+
"upcast_attention": false,
|
| 73 |
+
"use_linear_projection": false
|
| 74 |
+
}
|
ddpm_variance_22/checkpoint_epoch_9/diffusion_pytorch_model.safetensors
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:c36dd1ae1dbccafadc8246d44b581bdadc5b3c36e366221f853ec5754fb5e962
|
| 3 |
+
size 509495352
|
ddpm_variance_22/checkpoint_epoch_9/label_proj.pt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:272f767c910d38864cc44ed69da94b18894e96c84b2aded6ca868f91f4f01318
|
| 3 |
+
size 4745337
|
ddpm_variance_22/loss_curve.png
ADDED
|
ddpm_variance_22/sample_epoch_19.png
ADDED
|
Git LFS Details
|
ddpm_variance_22/sample_epoch_29.png
ADDED
|
Git LFS Details
|
ddpm_variance_22/sample_epoch_39.png
ADDED
|
Git LFS Details
|
ddpm_variance_22/sample_epoch_49.png
ADDED
|
Git LFS Details
|
ddpm_variance_22/sample_epoch_9.png
ADDED
|
Git LFS Details
|
ddpm_variance_22/train_log.txt
ADDED
|
@@ -0,0 +1,50 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
Epoch 0: Avg Loss = 0.002801
|
| 2 |
+
Epoch 1: Avg Loss = 0.002913
|
| 3 |
+
Epoch 2: Avg Loss = 0.002975
|
| 4 |
+
Epoch 3: Avg Loss = 0.002920
|
| 5 |
+
Epoch 4: Avg Loss = 0.002960
|
| 6 |
+
Epoch 5: Avg Loss = 0.002998
|
| 7 |
+
Epoch 6: Avg Loss = 0.003006
|
| 8 |
+
Epoch 7: Avg Loss = 0.003139
|
| 9 |
+
Epoch 8: Avg Loss = 0.002932
|
| 10 |
+
Epoch 9: Avg Loss = 0.002993
|
| 11 |
+
Epoch 10: Avg Loss = 0.002844
|
| 12 |
+
Epoch 11: Avg Loss = 0.002919
|
| 13 |
+
Epoch 12: Avg Loss = 0.002828
|
| 14 |
+
Epoch 13: Avg Loss = 0.002726
|
| 15 |
+
Epoch 14: Avg Loss = 0.003037
|
| 16 |
+
Epoch 15: Avg Loss = 0.002925
|
| 17 |
+
Epoch 16: Avg Loss = 0.002997
|
| 18 |
+
Epoch 17: Avg Loss = 0.002893
|
| 19 |
+
Epoch 18: Avg Loss = 0.002877
|
| 20 |
+
Epoch 19: Avg Loss = 0.002762
|
| 21 |
+
Epoch 20: Avg Loss = 0.002785
|
| 22 |
+
Epoch 21: Avg Loss = 0.002974
|
| 23 |
+
Epoch 22: Avg Loss = 0.002737
|
| 24 |
+
Epoch 23: Avg Loss = 0.002930
|
| 25 |
+
Epoch 24: Avg Loss = 0.002861
|
| 26 |
+
Epoch 25: Avg Loss = 0.002713
|
| 27 |
+
Epoch 26: Avg Loss = 0.002752
|
| 28 |
+
Epoch 27: Avg Loss = 0.002806
|
| 29 |
+
Epoch 28: Avg Loss = 0.002667
|
| 30 |
+
Epoch 29: Avg Loss = 0.002830
|
| 31 |
+
Epoch 30: Avg Loss = 0.002617
|
| 32 |
+
Epoch 31: Avg Loss = 0.002775
|
| 33 |
+
Epoch 32: Avg Loss = 0.002752
|
| 34 |
+
Epoch 33: Avg Loss = 0.002571
|
| 35 |
+
Epoch 34: Avg Loss = 0.002799
|
| 36 |
+
Epoch 35: Avg Loss = 0.002668
|
| 37 |
+
Epoch 36: Avg Loss = 0.002780
|
| 38 |
+
Epoch 37: Avg Loss = 0.003050
|
| 39 |
+
Epoch 38: Avg Loss = 0.002495
|
| 40 |
+
Epoch 39: Avg Loss = 0.002875
|
| 41 |
+
Epoch 40: Avg Loss = 0.002622
|
| 42 |
+
Epoch 41: Avg Loss = 0.002495
|
| 43 |
+
Epoch 42: Avg Loss = 0.002506
|
| 44 |
+
Epoch 43: Avg Loss = 0.002664
|
| 45 |
+
Epoch 44: Avg Loss = 0.002622
|
| 46 |
+
Epoch 45: Avg Loss = 0.002644
|
| 47 |
+
Epoch 46: Avg Loss = 0.002844
|
| 48 |
+
Epoch 47: Avg Loss = 0.002589
|
| 49 |
+
Epoch 48: Avg Loss = 0.002789
|
| 50 |
+
Epoch 49: Avg Loss = 0.002641
|