ChenYi99 committed on 21 days ago

Commit

d3b0f6e

verified ·

1 Parent(s): 90cdace

Upload folder using huggingface_hub

Browse files

Files changed (19) hide show

.gitignore +5 -0
DIAL-3B-fewshot/config.json +93 -0
DIAL-3B-fewshot/experiment_cfg/metadata.json +0 -0
DIAL-3B-fewshot/model-00001-of-00005.safetensors +3 -0
DIAL-3B-fewshot/model-00002-of-00005.safetensors +3 -0
DIAL-3B-fewshot/model-00003-of-00005.safetensors +3 -0
DIAL-3B-fewshot/model-00004-of-00005.safetensors +3 -0
DIAL-3B-fewshot/model-00005-of-00005.safetensors +3 -0
DIAL-3B-fewshot/model.safetensors.index.json +0 -0
DIAL-3B-fewshot/trainer_state.json +0 -0
DIAL-3B-fulldata/config.json +93 -0
DIAL-3B-fulldata/experiment_cfg/metadata.json +0 -0
DIAL-3B-fulldata/model-00001-of-00005.safetensors +3 -0
DIAL-3B-fulldata/model-00002-of-00005.safetensors +3 -0
DIAL-3B-fulldata/model-00003-of-00005.safetensors +3 -0
DIAL-3B-fulldata/model-00004-of-00005.safetensors +3 -0
DIAL-3B-fulldata/model-00005-of-00005.safetensors +3 -0
DIAL-3B-fulldata/model.safetensors.index.json +0 -0
DIAL-3B-fulldata/trainer_state.json +0 -0

.gitignore ADDED Viewed

	@@ -0,0 +1,5 @@

+# 1. Exclude first-level subdirectories whose names end with the _wrong suffix (the trailing / marks a directory)
+/*_wrong/
+# 2. Exclude second-level subdirectories whose names start with the evaluation prefix
+/*/evaluation*/

DIAL-3B-fewshot/config.json ADDED Viewed

	@@ -0,0 +1,93 @@

+{
+  "action_dim": 128,
+  "action_head_cfg": {
+    "action_dim": 128,
+    "action_horizon": 16,
+    "add_pos_embed": true,
+    "backbone_embedding_dim": 2048,
+    "correct_vl_mask": false,
+    "diffusion_model_cfg": {
+      "attention_head_dim": 48,
+      "cross_attention_dim": 2048,
+      "dropout": 0.2,
+      "final_dropout": true,
+      "interleave_self_attention": true,
+      "norm_type": "ada_norm",
+      "num_attention_heads": 32,
+      "num_layers": 16,
+      "output_dim": 1024,
+      "positional_embeddings": null
+    },
+    "hidden_size": 1024,
+    "input_embedding_dim": 1536,
+    "max_action_dim": 128,
+    "max_state_dim": 128,
+    "model_dtype": "float32",
+    "noise_beta_alpha": 1.5,
+    "noise_beta_beta": 1.0,
+    "noise_s": 0.999,
+    "num_inference_timesteps": 4,
+    "num_target_vision_tokens": 0,
+    "num_timestep_buckets": 1000,
+    "tune_diffusion_model": true,
+    "tune_projector": true,
+    "use_vl_mask": false,
+    "use_vlln": true,
+    "vl_self_attention_cfg": {
+      "attention_head_dim": 64,
+      "dropout": 0.2,
+      "final_dropout": true,
+      "num_attention_heads": 32,
+      "num_layers": 4,
+      "positional_embeddings": null
+    }
+  },
+  "action_horizon": 16,
+  "architectures": [
+    "GR00T_N1_5_DIAL"
+  ],
+  "attn_implementation": null,
+  "backbone_cfg": {
+    "load_bf16": false,
+    "project_to_dim": null,
+    "reproject_vision": false,
+    "select_layer": 36,
+    "tune_all_llm_embedding": false,
+    "tune_bridge_embedding": true,
+    "tune_llm": true,
+    "tune_visual": false,
+    "use_flash_attention": true,
+    "vlm_path": "Qwen/Qwen2.5-VL-3B-Instruct"
+  },
+  "bridge_cfg": {
+    "action_only_one_obs": false,
+    "bridge_loss_decay_steps": null,
+    "bridge_loss_end_w": null,
+    "bridge_loss_type": "mse",
+    "bridge_type": "end2end",
+    "compute_bridge_loss": true,
+    "goal_image_type": "future",
+    "noise_tau": 0,
+    "num_bridge_tokens": 64,
+    "omit_image_type_embedding_for_goal": false,
+    "reweight_noise": false,
+    "tokenizer_len": 151729,
+    "tune_bridge_goal": false,
+    "tune_bridge_visual": false,
+    "tune_image_type_embedding": true,
+    "unified_embodiment_id": 24,
+    "use_bridge": true,
+    "use_image_type_embedding": true,
+    "use_separate_projector_for_loss": true
+  },
+  "compute_dtype": "bfloat16",
+  "hidden_size": 2048,
+  "ignore_lang_prefix": true,
+  "model_dtype": "float32",
+  "model_type": "gr00t_n1_5_dial",
+  "torch_dtype": "float32",
+  "transformers_version": "4.52.0",
+  "video_delta_indices": [
+    0
+  ]
+}

DIAL-3B-fewshot/experiment_cfg/metadata.json ADDED Viewed

The diff for this file is too large to render. See raw diff

DIAL-3B-fewshot/model-00001-of-00005.safetensors ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:ef4245d424bc0b0fd5be6e2376f731005ea2f6e671f5b351a41c90b51bf76b47
+size 4972313024

DIAL-3B-fewshot/model-00002-of-00005.safetensors ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:66cbc3dc6a4eb9dbf6bd7c87b485da71230b0c05c116d3d0228e76b26a4aea5a
+size 4932954592

DIAL-3B-fewshot/model-00003-of-00005.safetensors ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:4af0074f406239f95f4763423f310ec2c5276e8bcf5414b9edc99e02ca3b1665
+size 4932954680

DIAL-3B-fewshot/model-00004-of-00005.safetensors ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:fe8e39ceca3753aabe113e72aca191b3b57d4c6083046b92de5d1f34fb7c8bbf
+size 4993877584

DIAL-3B-fewshot/model-00005-of-00005.safetensors ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:7cda9532379532b982d26d02b08aa505dee6409b0fbad9056a323acd6b374fa1
+size 2243381472

DIAL-3B-fewshot/model.safetensors.index.json ADDED Viewed

The diff for this file is too large to render. See raw diff

DIAL-3B-fewshot/trainer_state.json ADDED Viewed

The diff for this file is too large to render. See raw diff

DIAL-3B-fulldata/config.json ADDED Viewed

	@@ -0,0 +1,93 @@

+{
+  "action_dim": 128,
+  "action_head_cfg": {
+    "action_dim": 128,
+    "action_horizon": 16,
+    "add_pos_embed": true,
+    "backbone_embedding_dim": 2048,
+    "correct_vl_mask": false,
+    "diffusion_model_cfg": {
+      "attention_head_dim": 48,
+      "cross_attention_dim": 2048,
+      "dropout": 0.2,
+      "final_dropout": true,
+      "interleave_self_attention": true,
+      "norm_type": "ada_norm",
+      "num_attention_heads": 32,
+      "num_layers": 16,
+      "output_dim": 1024,
+      "positional_embeddings": null
+    },
+    "hidden_size": 1024,
+    "input_embedding_dim": 1536,
+    "max_action_dim": 128,
+    "max_state_dim": 128,
+    "model_dtype": "float32",
+    "noise_beta_alpha": 1.5,
+    "noise_beta_beta": 1.0,
+    "noise_s": 0.999,
+    "num_inference_timesteps": 4,
+    "num_target_vision_tokens": 0,
+    "num_timestep_buckets": 1000,
+    "tune_diffusion_model": true,
+    "tune_projector": true,
+    "use_vl_mask": false,
+    "use_vlln": true,
+    "vl_self_attention_cfg": {
+      "attention_head_dim": 64,
+      "dropout": 0.2,
+      "final_dropout": true,
+      "num_attention_heads": 32,
+      "num_layers": 4,
+      "positional_embeddings": null
+    }
+  },
+  "action_horizon": 16,
+  "architectures": [
+    "GR00T_N1_5_DIAL"
+  ],
+  "attn_implementation": null,
+  "backbone_cfg": {
+    "load_bf16": false,
+    "project_to_dim": null,
+    "reproject_vision": false,
+    "select_layer": 36,
+    "tune_all_llm_embedding": false,
+    "tune_bridge_embedding": true,
+    "tune_llm": true,
+    "tune_visual": false,
+    "use_flash_attention": true,
+    "vlm_path": "Qwen/Qwen2.5-VL-3B-Instruct"
+  },
+  "bridge_cfg": {
+    "action_only_one_obs": false,
+    "bridge_loss_decay_steps": null,
+    "bridge_loss_end_w": null,
+    "bridge_loss_type": "mse",
+    "bridge_type": "end2end",
+    "compute_bridge_loss": true,
+    "goal_image_type": "future",
+    "noise_tau": 0,
+    "num_bridge_tokens": 64,
+    "omit_image_type_embedding_for_goal": false,
+    "reweight_noise": false,
+    "tokenizer_len": 151729,
+    "tune_bridge_goal": false,
+    "tune_bridge_visual": false,
+    "tune_image_type_embedding": true,
+    "unified_embodiment_id": null,
+    "use_bridge": true,
+    "use_image_type_embedding": true,
+    "use_separate_projector_for_loss": true
+  },
+  "compute_dtype": "bfloat16",
+  "hidden_size": 2048,
+  "ignore_lang_prefix": true,
+  "model_dtype": "float32",
+  "model_type": "gr00t_n1_5_dial",
+  "torch_dtype": "float32",
+  "transformers_version": "4.52.0",
+  "video_delta_indices": [
+    0
+  ]
+}

DIAL-3B-fulldata/experiment_cfg/metadata.json ADDED Viewed

The diff for this file is too large to render. See raw diff

DIAL-3B-fulldata/model-00001-of-00005.safetensors ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:6e953ca78ef7420f59e66ed55be71c8e13386330fa019eb3a90ed8611e5e9b9a
+size 4972313024

DIAL-3B-fulldata/model-00002-of-00005.safetensors ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:75907124b1c46b02a5a0933757dccbe274e22e6eb617eaff2c1dbb9751511278
+size 4932954592

DIAL-3B-fulldata/model-00003-of-00005.safetensors ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:8561a67a505c4ec674760690bedc257ffbe8f0810e007109b48cc22e460e6809
+size 4932954680

DIAL-3B-fulldata/model-00004-of-00005.safetensors ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:705baaa44572307e4068da7a814dbff170a7cb7ed4f45b43a3cd7e9d38e349fb
+size 4993877584

DIAL-3B-fulldata/model-00005-of-00005.safetensors ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:384d6d9e2e1019bfdf8a1ee998ae93bc50d189e7377f5b1b6587e8e7119238bf
+size 2243381472

DIAL-3B-fulldata/model.safetensors.index.json ADDED Viewed

The diff for this file is too large to render. See raw diff

DIAL-3B-fulldata/trainer_state.json ADDED Viewed

The diff for this file is too large to render. See raw diff