Cognition2ActionLab commited on
Commit
ca3b9b1
·
verified ·
1 Parent(s): 935e526

Upload HEX EAI real-world 2B checkpoint

Browse files
EAI_real_world_2B/hex_ac100_300k_8gpu_state_query_history2/EAI_real_world.log ADDED
The diff for this file is too large to render. See raw diff
 
EAI_real_world_2B/hex_ac100_300k_8gpu_state_query_history2/checkpoints/steps_300000_pytorch_model.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:345ffdda686a5941b6ee0fe4214ed909bdbf7fb2106cdaaef1cfd846be306b2f
3
+ size 5533777864
EAI_real_world_2B/hex_ac100_300k_8gpu_state_query_history2/config.json ADDED
@@ -0,0 +1,169 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "run_id": "hex_ac100_300k_8gpu_state_query_history2",
3
+ "run_root_dir": "./pretrained_models/hex/EAI_real_world_2B",
4
+ "seed": 42,
5
+ "trackers": [
6
+ "jsonl",
7
+ "wandb"
8
+ ],
9
+ "wandb_entity": "HEXTeam",
10
+ "wandb_project": "hex",
11
+ "is_debug": false,
12
+ "enable_mee": false,
13
+ "mee_weight": 0.01,
14
+ "framework": {
15
+ "name": "HEX",
16
+ "qwenvl": {
17
+ "base_vlm": "/mnt/dataset/vnwy44/model/Qwen3-VL-2B-Instruct",
18
+ "attn_implementation": "flash_attention_2",
19
+ "vl_hidden_dim": 2048,
20
+ "add_query": true
21
+ },
22
+ "dino": {
23
+ "dino_backbone": "dinov2_vits14"
24
+ },
25
+ "action_model": {
26
+ "action_model_type": "DiT-B",
27
+ "action_hidden_dim": 2,
28
+ "hidden_size": 1024,
29
+ "add_pos_embed": true,
30
+ "max_seq_len": 1024,
31
+ "action_dim": 32,
32
+ "state_dim": 36,
33
+ "future_action_window_size": 99,
34
+ "action_horizon": 100,
35
+ "past_action_window_size": 0,
36
+ "repeated_diffusion_steps": 8,
37
+ "noise_beta_alpha": 1.5,
38
+ "noise_beta_beta": 1.0,
39
+ "noise_s": 0.999,
40
+ "num_timestep_buckets": 1000,
41
+ "num_inference_timesteps": 4,
42
+ "num_target_vision_tokens": 32,
43
+ "diffusion_model_cfg": {
44
+ "cross_attention_dim": 2048,
45
+ "cross_attention_dim_vl": 2048,
46
+ "cross_attention_dim_state": 768,
47
+ "dropout": 0.2,
48
+ "final_dropout": true,
49
+ "interleave_self_attention": true,
50
+ "norm_type": "ada_norm",
51
+ "num_layers": 16,
52
+ "output_dim": 1024,
53
+ "positional_embeddings": null
54
+ }
55
+ },
56
+ "state_model": {
57
+ "state_horizon": 50,
58
+ "transformer_block": {
59
+ "state_dim": 36,
60
+ "input_dim": 768,
61
+ "hidden_dim": 768,
62
+ "num_layers": 4,
63
+ "num_heads": 8,
64
+ "head_dim": 96,
65
+ "mlp_hidden_size": 256,
66
+ "dropout": 0.1,
67
+ "cross_attention_dim": 2048
68
+ },
69
+ "MoE_block": {
70
+ "num_experts_per_tok": 1,
71
+ "n_routed_experts": 16,
72
+ "scoring_func": "softmax",
73
+ "aux_loss_alpha": 0.01,
74
+ "seq_aux": true,
75
+ "norm_topk_prob": true,
76
+ "condition_dim": 7,
77
+ "moe_intermediate_size": 1536,
78
+ "n_shared_experts": 2,
79
+ "hidden_size": 768,
80
+ "intermediate_size": 1536,
81
+ "hidden_act": "silu",
82
+ "pretraining_tp": 1
83
+ }
84
+ },
85
+ "reduce_in_full_precision": true
86
+ },
87
+ "datasets": {
88
+ "vlm_data": {
89
+ "dataset_py": "vlm_datasets",
90
+ "dataformat": "llava_json",
91
+ "dataset_use": "asv2_conversation_en,asv2_detailed_description_en,asv2_region_captioning_en,coco_internvl_longcap_en,coco_karpathy_train_567_en,coco_negative_gpt4o_en,coco_poetry_zh,coco_rem_en_zh,cocorem_exist_yorn_en,cocotextv2_en,cocotextv2_gpt4o_en,okvqa_en,refcoco_grounding_aug_en,refcoco_grounding_en,tallyqa_coco_en,toloka_grounding_aug_en,vqav2_en,vsr_en",
92
+ "eval_dataset": "aokvqa_cauldron_llava_format",
93
+ "data_flatten": false,
94
+ "base_interval": 2,
95
+ "max_pixels": 12845056,
96
+ "min_pixels": 3136,
97
+ "model_max_length": 2048,
98
+ "model_type": "qwen2.5vl",
99
+ "per_device_batch_size": 4
100
+ },
101
+ "vla_data": {
102
+ "dataset_py": "lerobot_datasets",
103
+ "data_root_dir": "/mnt/dataset/vnwy44/data/eai_real_world",
104
+ "data_mix": "EAI_real_world",
105
+ "action_type": "delta_qpos",
106
+ "CoT_prompt": "Your task is {instruction}. To identify the key objects for your task. Locate their bounding boxes in [x1,y1,x2,y2] format.",
107
+ "CoT_answer": "bbox",
108
+ "default_image_resolution": [
109
+ 3,
110
+ 224,
111
+ 224
112
+ ],
113
+ "per_device_batch_size": 16,
114
+ "load_all_data_for_training": true,
115
+ "obs": [
116
+ "image_0"
117
+ ],
118
+ "delete_pause_frame": false,
119
+ "need_state": true,
120
+ "need_tag": true,
121
+ "vision_history_length": 2,
122
+ "action_chunk_size": 100
123
+ }
124
+ },
125
+ "trainer": {
126
+ "epochs": 100,
127
+ "num_warmup_steps_state": 2000,
128
+ "max_train_steps": 300000,
129
+ "num_warmup_steps": 5000,
130
+ "save_interval": 50000,
131
+ "eval_interval": 10000,
132
+ "learning_rate": {
133
+ "base": 2.5e-05,
134
+ "qwen_vl_interface": 1e-05,
135
+ "state_model": 2e-05,
136
+ "action_model": 2e-05
137
+ },
138
+ "lr_scheduler_type": "cosine_with_min_lr",
139
+ "scheduler_specific_kwargs": {
140
+ "min_lr": 1e-06
141
+ },
142
+ "freeze_modules": null,
143
+ "loss_scale": {
144
+ "vla": 1.0,
145
+ "vlm": 0.1
146
+ },
147
+ "max_grad_norm": 1.0,
148
+ "warmup_ratio": 0.1,
149
+ "weight_decay": 0.0,
150
+ "logging_frequency": 100,
151
+ "gradient_clipping": 1.0,
152
+ "gradient_accumulation_steps": 1,
153
+ "optimizer": {
154
+ "name": "AdamW",
155
+ "betas": [
156
+ 0.9,
157
+ 0.95
158
+ ],
159
+ "eps": 1e-08,
160
+ "weight_decay": 1e-08
161
+ },
162
+ "is_resume": false,
163
+ "resume_epoch": null,
164
+ "resume_step": null,
165
+ "enable_gradient_checkpointing": true,
166
+ "enable_mixed_precision_training": true
167
+ },
168
+ "output_dir": "./pretrained_models/hex/EAI_real_world_2B/hex_ac100_300k_8gpu_state_query_history2"
169
+ }
EAI_real_world_2B/hex_ac100_300k_8gpu_state_query_history2/config.yaml ADDED
@@ -0,0 +1,148 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ run_id: hex_ac100_300k_8gpu_state_query_history2
2
+ run_root_dir: ./pretrained_models/hex/EAI_real_world_2B
3
+ seed: 42
4
+ trackers:
5
+ - jsonl
6
+ - wandb
7
+ wandb_entity: HEXTeam
8
+ wandb_project: hex
9
+ is_debug: false
10
+ enable_mee: false
11
+ mee_weight: 0.01
12
+ framework:
13
+ name: HEX
14
+ qwenvl:
15
+ base_vlm: /mnt/dataset/vnwy44/model/Qwen3-VL-2B-Instruct
16
+ attn_implementation: flash_attention_2
17
+ vl_hidden_dim: 2048
18
+ add_query: true
19
+ dino:
20
+ dino_backbone: dinov2_vits14
21
+ action_model:
22
+ action_model_type: DiT-B
23
+ action_hidden_dim: 2
24
+ hidden_size: 1024
25
+ add_pos_embed: true
26
+ max_seq_len: 1024
27
+ action_dim: 32
28
+ state_dim: 36
29
+ future_action_window_size: 99
30
+ action_horizon: 100
31
+ past_action_window_size: 0
32
+ repeated_diffusion_steps: 8
33
+ noise_beta_alpha: 1.5
34
+ noise_beta_beta: 1.0
35
+ noise_s: 0.999
36
+ num_timestep_buckets: 1000
37
+ num_inference_timesteps: 4
38
+ num_target_vision_tokens: 32
39
+ diffusion_model_cfg:
40
+ cross_attention_dim: 2048
41
+ cross_attention_dim_vl: 2048
42
+ cross_attention_dim_state: 768
43
+ dropout: 0.2
44
+ final_dropout: true
45
+ interleave_self_attention: true
46
+ norm_type: ada_norm
47
+ num_layers: 16
48
+ output_dim: 1024
49
+ positional_embeddings: null
50
+ state_model:
51
+ state_horizon: 50
52
+ transformer_block:
53
+ state_dim: 36
54
+ input_dim: 768
55
+ hidden_dim: 768
56
+ num_layers: 4
57
+ num_heads: 8
58
+ head_dim: 96
59
+ mlp_hidden_size: 256
60
+ dropout: 0.1
61
+ cross_attention_dim: 2048
62
+ MoE_block:
63
+ num_experts_per_tok: 1
64
+ n_routed_experts: 16
65
+ scoring_func: softmax
66
+ aux_loss_alpha: 0.01
67
+ seq_aux: true
68
+ norm_topk_prob: true
69
+ condition_dim: 7
70
+ moe_intermediate_size: 1536
71
+ n_shared_experts: 2
72
+ hidden_size: 768
73
+ intermediate_size: 1536
74
+ hidden_act: silu
75
+ pretraining_tp: 1
76
+ reduce_in_full_precision: true
77
+ datasets:
78
+ vlm_data:
79
+ dataset_py: vlm_datasets
80
+ dataformat: llava_json
81
+ dataset_use: asv2_conversation_en,asv2_detailed_description_en,asv2_region_captioning_en,coco_internvl_longcap_en,coco_karpathy_train_567_en,coco_negative_gpt4o_en,coco_poetry_zh,coco_rem_en_zh,cocorem_exist_yorn_en,cocotextv2_en,cocotextv2_gpt4o_en,okvqa_en,refcoco_grounding_aug_en,refcoco_grounding_en,tallyqa_coco_en,toloka_grounding_aug_en,vqav2_en,vsr_en
82
+ eval_dataset: aokvqa_cauldron_llava_format
83
+ data_flatten: false
84
+ base_interval: 2
85
+ max_pixels: 12845056
86
+ min_pixels: 3136
87
+ model_max_length: 2048
88
+ model_type: qwen2.5vl
89
+ per_device_batch_size: 4
90
+ vla_data:
91
+ dataset_py: lerobot_datasets
92
+ data_root_dir: /mnt/dataset/vnwy44/data/eai_real_world
93
+ data_mix: EAI_real_world
94
+ action_type: delta_qpos
95
+ CoT_prompt: Your task is {instruction}. To identify the key objects for your task.
96
+ Locate their bounding boxes in [x1,y1,x2,y2] format.
97
+ CoT_answer: bbox
98
+ default_image_resolution:
99
+ - 3
100
+ - 224
101
+ - 224
102
+ per_device_batch_size: 16
103
+ load_all_data_for_training: true
104
+ obs:
105
+ - image_0
106
+ delete_pause_frame: false
107
+ need_state: true
108
+ need_tag: true
109
+ vision_history_length: 2
110
+ action_chunk_size: 100
111
+ trainer:
112
+ epochs: 100
113
+ num_warmup_steps_state: 2000
114
+ max_train_steps: 300000
115
+ num_warmup_steps: 5000
116
+ save_interval: 50000
117
+ eval_interval: 10000
118
+ learning_rate:
119
+ base: 2.5e-05
120
+ qwen_vl_interface: 1.0e-05
121
+ state_model: 2.0e-05
122
+ action_model: 2.0e-05
123
+ lr_scheduler_type: cosine_with_min_lr
124
+ scheduler_specific_kwargs:
125
+ min_lr: 1.0e-06
126
+ freeze_modules: null
127
+ loss_scale:
128
+ vla: 1.0
129
+ vlm: 0.1
130
+ max_grad_norm: 1.0
131
+ warmup_ratio: 0.1
132
+ weight_decay: 0.0
133
+ logging_frequency: 100
134
+ gradient_clipping: 1.0
135
+ gradient_accumulation_steps: 1
136
+ optimizer:
137
+ name: AdamW
138
+ betas:
139
+ - 0.9
140
+ - 0.95
141
+ eps: 1.0e-08
142
+ weight_decay: 1.0e-08
143
+ is_resume: false
144
+ resume_epoch: null
145
+ resume_step: null
146
+ enable_gradient_checkpointing: true
147
+ enable_mixed_precision_training: true
148
+ output_dir: ./pretrained_models/hex/EAI_real_world_2B/hex_ac100_300k_8gpu_state_query_history2
EAI_real_world_2B/hex_ac100_300k_8gpu_state_query_history2/dataset_statistics.json ADDED
The diff for this file is too large to render. See raw diff
 
EAI_real_world_2B/hex_ac100_300k_8gpu_state_query_history2/embodiment_registry.json ADDED
@@ -0,0 +1,394 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "state_registry": {
3
+ "tienkung2_v1": {
4
+ "left_arm": {
5
+ "start": 0,
6
+ "end": 7,
7
+ "dim": 7
8
+ },
9
+ "left_hand": {
10
+ "start": 7,
11
+ "end": 13,
12
+ "dim": 6
13
+ },
14
+ "right_arm": {
15
+ "start": 13,
16
+ "end": 20,
17
+ "dim": 7
18
+ },
19
+ "right_hand": {
20
+ "start": 20,
21
+ "end": 26,
22
+ "dim": 6
23
+ },
24
+ "head": {
25
+ "start": 26,
26
+ "end": 29,
27
+ "dim": 3
28
+ },
29
+ "waist": {
30
+ "start": 29,
31
+ "end": 33,
32
+ "dim": 4
33
+ }
34
+ },
35
+ "tienkung2_v2": {
36
+ "left_arm": {
37
+ "start": 0,
38
+ "end": 7,
39
+ "dim": 7
40
+ },
41
+ "left_hand": {
42
+ "start": 7,
43
+ "end": 13,
44
+ "dim": 6
45
+ },
46
+ "right_arm": {
47
+ "start": 13,
48
+ "end": 20,
49
+ "dim": 7
50
+ },
51
+ "right_hand": {
52
+ "start": 20,
53
+ "end": 26,
54
+ "dim": 6
55
+ },
56
+ "waist": {
57
+ "start": 26,
58
+ "end": 30,
59
+ "dim": 4
60
+ }
61
+ },
62
+ "tienkung2_v3": {
63
+ "left_arm": {
64
+ "start": 0,
65
+ "end": 7,
66
+ "dim": 7
67
+ },
68
+ "left_hand": {
69
+ "start": 7,
70
+ "end": 13,
71
+ "dim": 6
72
+ },
73
+ "right_arm": {
74
+ "start": 13,
75
+ "end": 20,
76
+ "dim": 7
77
+ },
78
+ "right_hand": {
79
+ "start": 20,
80
+ "end": 26,
81
+ "dim": 6
82
+ },
83
+ "waist": {
84
+ "start": 26,
85
+ "end": 30,
86
+ "dim": 4
87
+ },
88
+ "others": {
89
+ "start": 30,
90
+ "end": 36,
91
+ "dim": 6
92
+ }
93
+ },
94
+ "tienkung3_v1": {
95
+ "left_arm": {
96
+ "start": 0,
97
+ "end": 7,
98
+ "dim": 7
99
+ },
100
+ "left_hand": {
101
+ "start": 7,
102
+ "end": 13,
103
+ "dim": 6
104
+ },
105
+ "right_arm": {
106
+ "start": 13,
107
+ "end": 20,
108
+ "dim": 7
109
+ },
110
+ "right_hand": {
111
+ "start": 20,
112
+ "end": 26,
113
+ "dim": 6
114
+ },
115
+ "waist": {
116
+ "start": 26,
117
+ "end": 29,
118
+ "dim": 3
119
+ },
120
+ "left_leg": {
121
+ "start": 29,
122
+ "end": 35,
123
+ "dim": 6
124
+ },
125
+ "right_leg": {
126
+ "start": 35,
127
+ "end": 41,
128
+ "dim": 6
129
+ },
130
+ "others": {
131
+ "start": 41,
132
+ "end": 51,
133
+ "dim": 10
134
+ }
135
+ },
136
+ "tienkung3_v2": {
137
+ "left_arm": {
138
+ "start": 0,
139
+ "end": 7,
140
+ "dim": 7
141
+ },
142
+ "left_hand": {
143
+ "start": 7,
144
+ "end": 8,
145
+ "dim": 1
146
+ },
147
+ "right_arm": {
148
+ "start": 8,
149
+ "end": 15,
150
+ "dim": 7
151
+ },
152
+ "right_hand": {
153
+ "start": 15,
154
+ "end": 21,
155
+ "dim": 6
156
+ },
157
+ "waist": {
158
+ "start": 21,
159
+ "end": 24,
160
+ "dim": 3
161
+ },
162
+ "left_leg": {
163
+ "start": 24,
164
+ "end": 30,
165
+ "dim": 6
166
+ },
167
+ "right_leg": {
168
+ "start": 30,
169
+ "end": 36,
170
+ "dim": 6
171
+ },
172
+ "others": {
173
+ "start": 36,
174
+ "end": 46,
175
+ "dim": 10
176
+ }
177
+ },
178
+ "tienkung3_v3": {
179
+ "left_arm": {
180
+ "start": 0,
181
+ "end": 7,
182
+ "dim": 7
183
+ },
184
+ "right_arm": {
185
+ "start": 7,
186
+ "end": 14,
187
+ "dim": 7
188
+ },
189
+ "right_hand": {
190
+ "start": 14,
191
+ "end": 20,
192
+ "dim": 6
193
+ },
194
+ "others": {
195
+ "start": 20,
196
+ "end": 40,
197
+ "dim": 20
198
+ },
199
+ "waist": {
200
+ "start": 40,
201
+ "end": 43,
202
+ "dim": 3
203
+ },
204
+ "head": {
205
+ "start": 43,
206
+ "end": 46,
207
+ "dim": 3
208
+ }
209
+ },
210
+ "tianyi_v1": {
211
+ "left_arm": {
212
+ "start": 0,
213
+ "end": 7,
214
+ "dim": 7
215
+ },
216
+ "left_hand": {
217
+ "start": 7,
218
+ "end": 8,
219
+ "dim": 1
220
+ },
221
+ "right_arm": {
222
+ "start": 8,
223
+ "end": 15,
224
+ "dim": 7
225
+ },
226
+ "right_hand": {
227
+ "start": 15,
228
+ "end": 16,
229
+ "dim": 1
230
+ }
231
+ },
232
+ "unitree_g1_v2": {
233
+ "left_arm": {
234
+ "start": 0,
235
+ "end": 7,
236
+ "dim": 7
237
+ },
238
+ "right_arm": {
239
+ "start": 7,
240
+ "end": 14,
241
+ "dim": 7
242
+ },
243
+ "left_hand": {
244
+ "start": 14,
245
+ "end": 21,
246
+ "dim": 7
247
+ },
248
+ "right_hand": {
249
+ "start": 21,
250
+ "end": 28,
251
+ "dim": 7
252
+ },
253
+ "left_leg": {
254
+ "start": 28,
255
+ "end": 34,
256
+ "dim": 6
257
+ },
258
+ "right_leg": {
259
+ "start": 34,
260
+ "end": 40,
261
+ "dim": 6
262
+ }
263
+ },
264
+ "unitree_g1_v1": {
265
+ "left_arm": {
266
+ "start": 0,
267
+ "end": 7,
268
+ "dim": 7
269
+ },
270
+ "right_arm": {
271
+ "start": 7,
272
+ "end": 14,
273
+ "dim": 7
274
+ },
275
+ "left_hand": {
276
+ "start": 14,
277
+ "end": 21,
278
+ "dim": 7
279
+ },
280
+ "right_hand": {
281
+ "start": 21,
282
+ "end": 28,
283
+ "dim": 7
284
+ },
285
+ "left_leg": {
286
+ "start": 28,
287
+ "end": 34,
288
+ "dim": 6
289
+ },
290
+ "right_leg": {
291
+ "start": 34,
292
+ "end": 40,
293
+ "dim": 6
294
+ },
295
+ "waist": {
296
+ "start": 40,
297
+ "end": 43,
298
+ "dim": 3
299
+ }
300
+ },
301
+ "unitree_h1_v1": {
302
+ "left_arm": {
303
+ "start": 0,
304
+ "end": 7,
305
+ "dim": 7
306
+ },
307
+ "right_arm": {
308
+ "start": 7,
309
+ "end": 14,
310
+ "dim": 7
311
+ },
312
+ "left_hand": {
313
+ "start": 14,
314
+ "end": 20,
315
+ "dim": 6
316
+ },
317
+ "right_hand": {
318
+ "start": 20,
319
+ "end": 26,
320
+ "dim": 6
321
+ },
322
+ "left_leg": {
323
+ "start": 26,
324
+ "end": 32,
325
+ "dim": 6
326
+ },
327
+ "right_leg": {
328
+ "start": 32,
329
+ "end": 38,
330
+ "dim": 6
331
+ },
332
+ "waist": {
333
+ "start": 38,
334
+ "end": 39,
335
+ "dim": 1
336
+ }
337
+ },
338
+ "leju_kuavo_v1": {
339
+ "left_arm": {
340
+ "start": 0,
341
+ "end": 7,
342
+ "dim": 7
343
+ },
344
+ "right_arm": {
345
+ "start": 7,
346
+ "end": 14,
347
+ "dim": 7
348
+ },
349
+ "left_leg": {
350
+ "start": 14,
351
+ "end": 20,
352
+ "dim": 6
353
+ },
354
+ "right_leg": {
355
+ "start": 20,
356
+ "end": 26,
357
+ "dim": 6
358
+ },
359
+ "left_hand": {
360
+ "start": 26,
361
+ "end": 32,
362
+ "dim": 6
363
+ },
364
+ "right_hand": {
365
+ "start": 32,
366
+ "end": 38,
367
+ "dim": 6
368
+ },
369
+ "head": {
370
+ "start": 38,
371
+ "end": 40,
372
+ "dim": 2
373
+ },
374
+ "others": {
375
+ "start": 40,
376
+ "end": 118,
377
+ "dim": 78
378
+ }
379
+ }
380
+ },
381
+ "action_registry": {
382
+ "tienkung2_v1": 23,
383
+ "tienkung2_v2": 20,
384
+ "tienkung2_v3": 32,
385
+ "tienkung3_v1": 20,
386
+ "tienkung3_v2": 20,
387
+ "tienkung3_v3": 8,
388
+ "tianyi_v1": 16,
389
+ "unitree_g1_v2": 32,
390
+ "unitree_g1_v1": 28,
391
+ "unitree_h1_v1": 26,
392
+ "leju_kuavo_v1": 54
393
+ }
394
+ }
EAI_real_world_2B/hex_ac100_300k_8gpu_state_query_history2/summary.jsonl ADDED
@@ -0,0 +1,6 @@
 
 
 
 
 
 
 
1
+ {"steps": 50000}
2
+ {"steps": 100000}
3
+ {"steps": 150000}
4
+ {"steps": 200000}
5
+ {"steps": 250000}
6
+ {"steps": 300000}