SsharvienKumar committed 13 days ago

Commit

5e081ca

verified ·

1 Parent(s): 1bce491

Upload 28 files

Browse files

Files changed (28) hide show

checkpoints/Cataract-1K/controlnet_img_graph_vid/checkpoint/controlnet/config.json +77 -0
checkpoints/Cataract-1K/controlnet_img_graph_vid/checkpoint/controlnet/diffusion_pytorch_model.safetensors +3 -0
checkpoints/Cataract-1K/controlnet_img_graph_vid/checkpoint/optimizer.bin +3 -0
checkpoints/Cataract-1K/controlnet_img_graph_vid/checkpoint/random_states_0.pkl +3 -0
checkpoints/Cataract-1K/controlnet_img_graph_vid/checkpoint/scheduler.bin +3 -0
checkpoints/Cataract-1K/controlnet_ximg_graph_vid/checkpoint/controlnet/config.json +76 -0
checkpoints/Cataract-1K/controlnet_ximg_graph_vid/checkpoint/controlnet/diffusion_pytorch_model.safetensors +3 -0
checkpoints/Cataract-1K/controlnet_ximg_graph_vid/checkpoint/optimizer.bin +3 -0
checkpoints/Cataract-1K/controlnet_ximg_graph_vid/checkpoint/random_states_0.pkl +3 -0
checkpoints/Cataract-1K/controlnet_ximg_graph_vid/checkpoint/scheduler.bin +3 -0
checkpoints/Cataract-1K/diffusion_img_graph_xvid/checkpoint/optimizer.bin +3 -0
checkpoints/Cataract-1K/diffusion_img_graph_xvid/checkpoint/random_states_0.pkl +3 -0
checkpoints/Cataract-1K/diffusion_img_graph_xvid/checkpoint/scheduler.bin +3 -0
checkpoints/Cataract-1K/diffusion_img_graph_xvid/checkpoint/unet/config.json +79 -0
checkpoints/Cataract-1K/diffusion_img_graph_xvid/checkpoint/unet/diffusion_pytorch_model.safetensors +3 -0
checkpoints/Cataract-1K/diffusion_ximg_graph_xvid/checkpoint/optimizer.bin +3 -0
checkpoints/Cataract-1K/diffusion_ximg_graph_xvid/checkpoint/random_states_0.pkl +3 -0
checkpoints/Cataract-1K/diffusion_ximg_graph_xvid/checkpoint/scheduler.bin +3 -0
checkpoints/Cataract-1K/diffusion_ximg_graph_xvid/checkpoint/unet/config.json +79 -0
checkpoints/Cataract-1K/diffusion_ximg_graph_xvid/checkpoint/unet/diffusion_pytorch_model.safetensors +3 -0
checkpoints/Cataract-1K/graphencoder_masked/best_val_loss.pth +3 -0
checkpoints/Cataract-1K/graphencoder_segclip/best_val_loss.pth +3 -0
checkpoints/Cataract-1K/vae_vid_diffusion/vae/config.json +37 -0
checkpoints/Cataract-1K/vae_vid_diffusion/vae/diffusion_pytorch_model.safetensors +3 -0
checkpoints/Cataract-1K/vqgan_image/checkpoint.ckpt +3 -0
checkpoints/Cataract-1K/vqgan_image/config.yaml +57 -0
checkpoints/Cataract-1K/vqgan_segmentation/checkpoint.ckpt +3 -0
checkpoints/Cataract-1K/vqgan_segmentation/config.yaml +52 -0

checkpoints/Cataract-1K/controlnet_img_graph_vid/checkpoint/controlnet/config.json ADDED Viewed

	@@ -0,0 +1,77 @@

+{
+  "_class_name": "ControlNetModel",
+  "_diffusers_version": "0.21.2",
+  "_name_or_path": "./checkpoints/Cataract-1k/video_diffusion/surgsimbridge_training_img_graph_vid_cataract1k-2026-04-15T07-35-15/checkpoints/checkpoint-145000",
+  "act_fn": "silu",
+  "addition_embed_type": null,
+  "addition_embed_type_num_heads": 64,
+  "addition_time_embed_dim": null,
+  "attention_head_dim": [
+    5,
+    10,
+    20,
+    20
+  ],
+  "attention_type": "default",
+  "augment_temporal_attention": true,
+  "block_out_channels": [
+    320,
+    640,
+    1280,
+    1280
+  ],
+  "class_embed_type": "identity",
+  "class_embeddings_concat": true,
+  "conditioning_channels": 3,
+  "conditioning_embedding_out_channels": [
+    16,
+    32,
+    96,
+    256
+  ],
+  "conv_in_kernel": 3,
+  "cross_attention_dim": 1024,
+  "cross_attention_norm": null,
+  "down_block_types": [
+    "CrossAttnDownBlock2D",
+    "CrossAttnDownBlock2D",
+    "CrossAttnDownBlock2D",
+    "DownBlock2D"
+  ],
+  "downsample_padding": 1,
+  "dropout": 0.0,
+  "dual_cross_attention": false,
+  "encoder_hid_dim": null,
+  "encoder_hid_dim_type": null,
+  "first_frame_condition_mode": "concat",
+  "flip_sin_to_cos": true,
+  "freq_shift": 0,
+  "global_pool_conditions": false,
+  "in_channels": 4,
+  "layers_per_block": 2,
+  "mid_block_only_cross_attention": null,
+  "mid_block_scale_factor": 1,
+  "mid_block_type": "UNetMidBlock2DCrossAttn",
+  "n_frames": 16,
+  "n_temp_heads": 8,
+  "norm_eps": 1e-05,
+  "norm_num_groups": 32,
+  "num_attention_heads": null,
+  "num_class_embeds": null,
+  "only_cross_attention": false,
+  "projection_class_embeddings_input_dim": null,
+  "resnet_out_scale_factor": 1.0,
+  "resnet_skip_time_act": false,
+  "resnet_time_scale_shift": "default",
+  "temp_pos_embedding": "rotary",
+  "time_cond_proj_dim": null,
+  "time_embedding_act_fn": null,
+  "time_embedding_dim": 512,
+  "time_embedding_type": "positional",
+  "timestep_post_act": null,
+  "transformer_layers_per_block": 1,
+  "upcast_attention": false,
+  "use_frame_stride_condition": false,
+  "use_linear_projection": true,
+  "use_temporal": true
+}

checkpoints/Cataract-1K/controlnet_img_graph_vid/checkpoint/controlnet/diffusion_pytorch_model.safetensors ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:820df30af2eb1f58e7482527ba44e6f032b207aa8158d2316bcd556c976ddc28
+size 2102262840

checkpoints/Cataract-1K/controlnet_img_graph_vid/checkpoint/optimizer.bin ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:8354bc5f78800d0550eb25175805b996820198d470e8dd8d94b1f66af130d61b
+size 4165435906

checkpoints/Cataract-1K/controlnet_img_graph_vid/checkpoint/random_states_0.pkl ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:496c5491d5471c8b259125aac6d453c89b669f87e41cb199b7cdac71d09de86f
+size 15060

checkpoints/Cataract-1K/controlnet_img_graph_vid/checkpoint/scheduler.bin ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:eaa9a799183c7caa950febe94a4dab7ab200474b49179a367833ffed6b68d3c1
+size 1000

checkpoints/Cataract-1K/controlnet_ximg_graph_vid/checkpoint/controlnet/config.json ADDED Viewed

	@@ -0,0 +1,76 @@

+{
+  "_class_name": "ControlNetModel",
+  "_diffusers_version": "0.21.2",
+  "act_fn": "silu",
+  "addition_embed_type": null,
+  "addition_embed_type_num_heads": 64,
+  "addition_time_embed_dim": null,
+  "attention_head_dim": [
+    5,
+    10,
+    20,
+    20
+  ],
+  "attention_type": "default",
+  "augment_temporal_attention": true,
+  "block_out_channels": [
+    320,
+    640,
+    1280,
+    1280
+  ],
+  "class_embed_type": "identity",
+  "class_embeddings_concat": true,
+  "conditioning_channels": 3,
+  "conditioning_embedding_out_channels": [
+    16,
+    32,
+    96,
+    256
+  ],
+  "conv_in_kernel": 3,
+  "cross_attention_dim": 1024,
+  "cross_attention_norm": null,
+  "down_block_types": [
+    "CrossAttnDownBlock2D",
+    "CrossAttnDownBlock2D",
+    "CrossAttnDownBlock2D",
+    "DownBlock2D"
+  ],
+  "downsample_padding": 1,
+  "dropout": 0.0,
+  "dual_cross_attention": false,
+  "encoder_hid_dim": null,
+  "encoder_hid_dim_type": null,
+  "first_frame_condition_mode": "none",
+  "flip_sin_to_cos": true,
+  "freq_shift": 0,
+  "global_pool_conditions": false,
+  "in_channels": 4,
+  "layers_per_block": 2,
+  "mid_block_only_cross_attention": null,
+  "mid_block_scale_factor": 1,
+  "mid_block_type": "UNetMidBlock2DCrossAttn",
+  "n_frames": 16,
+  "n_temp_heads": 8,
+  "norm_eps": 1e-05,
+  "norm_num_groups": 32,
+  "num_attention_heads": null,
+  "num_class_embeds": null,
+  "only_cross_attention": false,
+  "projection_class_embeddings_input_dim": null,
+  "resnet_out_scale_factor": 1.0,
+  "resnet_skip_time_act": false,
+  "resnet_time_scale_shift": "default",
+  "temp_pos_embedding": "rotary",
+  "time_cond_proj_dim": null,
+  "time_embedding_act_fn": null,
+  "time_embedding_dim": 512,
+  "time_embedding_type": "positional",
+  "timestep_post_act": null,
+  "transformer_layers_per_block": 1,
+  "upcast_attention": false,
+  "use_frame_stride_condition": false,
+  "use_linear_projection": true,
+  "use_temporal": true
+}

checkpoints/Cataract-1K/controlnet_ximg_graph_vid/checkpoint/controlnet/diffusion_pytorch_model.safetensors ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:859a5b41e7b2044c643f6677da64ed4dd7b1220e2de20c6a29b4b89cabab4ef1
+size 2102262840

checkpoints/Cataract-1K/controlnet_ximg_graph_vid/checkpoint/optimizer.bin ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:8045adfdaa09aa28b1fa7c556aaa02714d3e0244a78e401e74206b9b5b9c6e69
+size 4165427650

checkpoints/Cataract-1K/controlnet_ximg_graph_vid/checkpoint/random_states_0.pkl ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:9ebb76978b0d6edffa23a13921f66f7f593a0b46ede1ede4cc8dc2e7fd7b3e11
+size 15060

checkpoints/Cataract-1K/controlnet_ximg_graph_vid/checkpoint/scheduler.bin ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:532bd73f2b1d01dc0536daabcec58f40e379e94a680763a6e8bc6c9fc3e6d1c8
+size 1000

checkpoints/Cataract-1K/diffusion_img_graph_xvid/checkpoint/optimizer.bin ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:415b91ff1fe392da4416455500da6eb8d67edefdaf13408c838df9e03dbdb79e
+size 9847488907

checkpoints/Cataract-1K/diffusion_img_graph_xvid/checkpoint/random_states_0.pkl ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:c063c9a457d2f978404daef7c46ab0170e4a81320bd443c6daf6eb1b2dc483d3
+size 15124

checkpoints/Cataract-1K/diffusion_img_graph_xvid/checkpoint/scheduler.bin ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:94f607683c090632e8d779f519774dd0a2133d20ff4299b9edecbd7b1661901e
+size 1000

checkpoints/Cataract-1K/diffusion_img_graph_xvid/checkpoint/unet/config.json ADDED Viewed

	@@ -0,0 +1,79 @@

+{
+  "_class_name": "VideoLDMUNet3DConditionModel",
+  "_diffusers_version": "0.21.2",
+  "_name_or_path": "/gris/gris-f/homestud/ssivakum/SurgSimBridge_Gen/checkpoints/Cataract-1k/video_diffusion/surgsimbridge_training_img_graph_xvid_cataract1k-2026-03-26T20-30-27/checkpoints/checkpoint-245000",
+  "act_fn": "silu",
+  "addition_embed_type": null,
+  "addition_embed_type_num_heads": 64,
+  "addition_time_embed_dim": null,
+  "attention_head_dim": [
+    5,
+    10,
+    20,
+    20
+  ],
+  "attention_type": "default",
+  "augment_temporal_attention": true,
+  "block_out_channels": [
+    320,
+    640,
+    1280,
+    1280
+  ],
+  "center_input_sample": false,
+  "class_embed_type": "identity",
+  "class_embeddings_concat": true,
+  "conv_in_kernel": 3,
+  "conv_out_kernel": 3,
+  "cross_attention_dim": 1024,
+  "cross_attention_norm": null,
+  "down_block_types": [
+    "CrossAttnDownBlock2D",
+    "CrossAttnDownBlock2D",
+    "CrossAttnDownBlock2D",
+    "DownBlock2D"
+  ],
+  "downsample_padding": 1,
+  "dropout": 0.0,
+  "dual_cross_attention": false,
+  "encoder_hid_dim": null,
+  "encoder_hid_dim_type": null,
+  "first_frame_condition_mode": "concat",
+  "flip_sin_to_cos": true,
+  "freq_shift": 0,
+  "in_channels": 4,
+  "layers_per_block": 2,
+  "mid_block_only_cross_attention": null,
+  "mid_block_scale_factor": 1,
+  "mid_block_type": "UNetMidBlock2DCrossAttn",
+  "n_frames": 16,
+  "n_temp_heads": 8,
+  "norm_eps": 1e-05,
+  "norm_num_groups": 32,
+  "num_attention_heads": null,
+  "num_class_embeds": null,
+  "only_cross_attention": false,
+  "out_channels": 4,
+  "projection_class_embeddings_input_dim": null,
+  "resnet_out_scale_factor": 1.0,
+  "resnet_skip_time_act": false,
+  "resnet_time_scale_shift": "default",
+  "sample_size": 64,
+  "temp_pos_embedding": "rotary",
+  "time_cond_proj_dim": null,
+  "time_embedding_act_fn": null,
+  "time_embedding_dim": 512,
+  "time_embedding_type": "positional",
+  "timestep_post_act": null,
+  "transformer_layers_per_block": 1,
+  "up_block_types": [
+    "UpBlock2D",
+    "CrossAttnUpBlock2D",
+    "CrossAttnUpBlock2D",
+    "CrossAttnUpBlock2D"
+  ],
+  "upcast_attention": false,
+  "use_frame_stride_condition": false,
+  "use_linear_projection": true,
+  "use_temporal": true
+}

checkpoints/Cataract-1K/diffusion_img_graph_xvid/checkpoint/unet/diffusion_pytorch_model.safetensors ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:8e5fd513ed200886c036a1da211a097784942a73340d9ddde34645aade9b64d8
+size 4964732628

checkpoints/Cataract-1K/diffusion_ximg_graph_xvid/checkpoint/optimizer.bin ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:37d6c917c05ab185f9d47db0e4fbb96b1c5ce2d47e0cf3ef4f2c01f427f9e1b4
+size 9847488907

checkpoints/Cataract-1K/diffusion_ximg_graph_xvid/checkpoint/random_states_0.pkl ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:4ce6f7a255ed67162de7f4c95beb6c09c9276622d1c43ff280d3c1c1120500cc
+size 15060

checkpoints/Cataract-1K/diffusion_ximg_graph_xvid/checkpoint/scheduler.bin ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:f84e5f00e0f88087868886d1779ea0db653ba13f6a46103160bf4e63f9d73045
+size 1000

checkpoints/Cataract-1K/diffusion_ximg_graph_xvid/checkpoint/unet/config.json ADDED Viewed

	@@ -0,0 +1,79 @@

+{
+  "_class_name": "VideoLDMUNet3DConditionModel",
+  "_diffusers_version": "0.21.2",
+  "_name_or_path": "/gris/gris-f/homestud/ssivakum/SurgSimBridge_Gen/checkpoints/Cataract-1k/video_diffusion/surgsimbridge_training_ximg_graph_xvid_cataract1k-2026-03-29T17-21-00/checkpoints/checkpoint-240000",
+  "act_fn": "silu",
+  "addition_embed_type": null,
+  "addition_embed_type_num_heads": 64,
+  "addition_time_embed_dim": null,
+  "attention_head_dim": [
+    5,
+    10,
+    20,
+    20
+  ],
+  "attention_type": "default",
+  "augment_temporal_attention": true,
+  "block_out_channels": [
+    320,
+    640,
+    1280,
+    1280
+  ],
+  "center_input_sample": false,
+  "class_embed_type": "identity",
+  "class_embeddings_concat": true,
+  "conv_in_kernel": 3,
+  "conv_out_kernel": 3,
+  "cross_attention_dim": 1024,
+  "cross_attention_norm": null,
+  "down_block_types": [
+    "CrossAttnDownBlock2D",
+    "CrossAttnDownBlock2D",
+    "CrossAttnDownBlock2D",
+    "DownBlock2D"
+  ],
+  "downsample_padding": 1,
+  "dropout": 0.0,
+  "dual_cross_attention": false,
+  "encoder_hid_dim": null,
+  "encoder_hid_dim_type": null,
+  "first_frame_condition_mode": "none",
+  "flip_sin_to_cos": true,
+  "freq_shift": 0,
+  "in_channels": 4,
+  "layers_per_block": 2,
+  "mid_block_only_cross_attention": null,
+  "mid_block_scale_factor": 1,
+  "mid_block_type": "UNetMidBlock2DCrossAttn",
+  "n_frames": 16,
+  "n_temp_heads": 8,
+  "norm_eps": 1e-05,
+  "norm_num_groups": 32,
+  "num_attention_heads": null,
+  "num_class_embeds": null,
+  "only_cross_attention": false,
+  "out_channels": 4,
+  "projection_class_embeddings_input_dim": null,
+  "resnet_out_scale_factor": 1.0,
+  "resnet_skip_time_act": false,
+  "resnet_time_scale_shift": "default",
+  "sample_size": 64,
+  "temp_pos_embedding": "rotary",
+  "time_cond_proj_dim": null,
+  "time_embedding_act_fn": null,
+  "time_embedding_dim": 512,
+  "time_embedding_type": "positional",
+  "timestep_post_act": null,
+  "transformer_layers_per_block": 1,
+  "up_block_types": [
+    "UpBlock2D",
+    "CrossAttnUpBlock2D",
+    "CrossAttnUpBlock2D",
+    "CrossAttnUpBlock2D"
+  ],
+  "upcast_attention": false,
+  "use_frame_stride_condition": false,
+  "use_linear_projection": true,
+  "use_temporal": true
+}

checkpoints/Cataract-1K/diffusion_ximg_graph_xvid/checkpoint/unet/diffusion_pytorch_model.safetensors ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:c7b626c753583df2dcbcab69355cb4769876782d990e97b169168195ad66e2e8
+size 4964732628

checkpoints/Cataract-1K/graphencoder_masked/best_val_loss.pth ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:60850527fd42a58b8422c757abfd72198e4b7602d757b74ba14480fc26fa2f86
+size 350312386

checkpoints/Cataract-1K/graphencoder_segclip/best_val_loss.pth ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:63e107df17abb7ae93f6e9f0e7c2192b1e0026de83e75c64f8b14d6bf9332e6c
+size 277281262

checkpoints/Cataract-1K/vae_vid_diffusion/vae/config.json ADDED Viewed

	@@ -0,0 +1,37 @@

+{
+  "_class_name": "AutoencoderKL",
+  "_diffusers_version": "0.31.0",
+  "act_fn": "silu",
+  "block_out_channels": [
+    128,
+    256,
+    512,
+    512
+  ],
+  "down_block_types": [
+    "DownEncoderBlock2D",
+    "DownEncoderBlock2D",
+    "DownEncoderBlock2D",
+    "DownEncoderBlock2D"
+  ],
+  "force_upcast": true,
+  "in_channels": 3,
+  "latent_channels": 4,
+  "latents_mean": null,
+  "latents_std": null,
+  "layers_per_block": 2,
+  "mid_block_add_attention": true,
+  "norm_num_groups": 32,
+  "out_channels": 3,
+  "sample_size": 512,
+  "scaling_factor": 0.18215,
+  "shift_factor": null,
+  "up_block_types": [
+    "UpDecoderBlock2D",
+    "UpDecoderBlock2D",
+    "UpDecoderBlock2D",
+    "UpDecoderBlock2D"
+  ],
+  "use_post_quant_conv": true,
+  "use_quant_conv": true
+}

checkpoints/Cataract-1K/vae_vid_diffusion/vae/diffusion_pytorch_model.safetensors ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:c092d4ddabf78277ce148cf7cbaf7f115119ef79b352a1a44d86f697f7052d51
+size 334643268

checkpoints/Cataract-1K/vqgan_image/checkpoint.ckpt ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:8b02b93c343804b00d63ea69003490a27a7d3bb61825fbfa374c1a8ba14ff1ed
+size 878907278

checkpoints/Cataract-1K/vqgan_image/config.yaml ADDED Viewed

	@@ -0,0 +1,57 @@

+model:
+  base_learning_rate: 4.5e-06
+  target: surgsimbridge.taming.taming.models.vqgan.VQModel
+  params:
+    embed_dim: 1
+    n_embed: 16384
+    image_key: image
+    ddconfig:
+      double_z: false
+      z_channels: 1
+      resolution: 128
+      in_channels: 3
+      out_ch: 3
+      ch: 128
+      ch_mult:
+      - 1
+      - 2
+      - 2
+      - 4
+      num_res_blocks: 2
+      attn_resolutions:
+      - 16
+      dropout: 0.0
+    lossconfig:
+      target: surgsimbridge.taming.taming.modules.losses.vqperceptual.VQLPIPSWithDiscriminator
+      params:
+        disc_conditional: false
+        disc_in_channels: 3
+        disc_num_layers: 2
+        disc_start: 1
+        disc_weight: 0.6
+        codebook_weight: 1.0
+data:
+  target: main.DataModuleFromConfig
+  params:
+    batch_size: 16
+    num_workers: 16
+    train:
+      target: surgsimbridge.taming.taming.data.surgicaldataset.CataractTrain
+      params:
+        size: 128
+        num_label: 14
+        augment: true
+        txt_file:
+        - /gris/scratch-gris-filesrv/sharvien/SurgSimBridge/Cataract-1K/splits/train.txt
+        data_root:
+        - /gris/scratch-gris-filesrv/sharvien/SurgSimBridge/Cataract-1K
+    validation:
+      target: surgsimbridge.taming.taming.data.surgicaldataset.CataractValidation
+      params:
+        size: 128
+        num_label: 14
+        augment: false
+        txt_file:
+        - /gris/scratch-gris-filesrv/sharvien/SurgSimBridge/Cataract-1K/splits/val.txt
+        data_root:
+        - /gris/scratch-gris-filesrv/sharvien/SurgSimBridge/Cataract-1K

checkpoints/Cataract-1K/vqgan_segmentation/checkpoint.ckpt ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:df08b568767b66d718678837320f822184a98d3fd4d1194250cc43b34d77bd17
+size 812256860

checkpoints/Cataract-1K/vqgan_segmentation/config.yaml ADDED Viewed

	@@ -0,0 +1,52 @@

+model:
+  base_learning_rate: 4.5e-06
+  target: surgsimbridge.taming.taming.models.vqgan.VQSegmentationModel
+  params:
+    embed_dim: 1
+    n_embed: 8192
+    image_key: segmentation
+    ddconfig:
+      double_z: false
+      z_channels: 1
+      resolution: 128
+      in_channels: 14
+      out_ch: 14
+      ch: 128
+      ch_mult:
+      - 1
+      - 2
+      - 2
+      - 4
+      num_res_blocks: 2
+      attn_resolutions:
+      - 16
+      dropout: 0.0
+    lossconfig:
+      target: surgsimbridge.taming.taming.modules.losses.segmentation.BCELossWithQuant
+      params:
+        codebook_weight: 1.0
+data:
+  target: main.DataModuleFromConfig
+  params:
+    batch_size: 16
+    num_workers: 16
+    train:
+      target: surgsimbridge.taming.taming.data.surgicaldataset.CataractTrain
+      params:
+        size: 128
+        num_label: 14
+        augment: true
+        txt_file:
+        - /gris/scratch-gris-filesrv/sharvien/SurgSimBridge/Cataract-1K/splits/train.txt
+        data_root:
+        - /gris/scratch-gris-filesrv/sharvien/SurgSimBridge/Cataract-1K
+    validation:
+      target: surgsimbridge.taming.taming.data.surgicaldataset.CataractValidation
+      params:
+        size: 128
+        num_label: 14
+        augment: false
+        txt_file:
+        - /gris/scratch-gris-filesrv/sharvien/SurgSimBridge/Cataract-1K/splits/val.txt
+        data_root:
+        - /gris/scratch-gris-filesrv/sharvien/SurgSimBridge/Cataract-1K