usr256864 commited on
Commit
25c33ec
·
verified ·
1 Parent(s): f0e63ad

Upload policy weights, train config and readme

Browse files
Files changed (4) hide show
  1. README.md +6 -14
  2. config.json +37 -31
  3. model.safetensors +2 -2
  4. train_config.json +114 -57
README.md CHANGED
@@ -1,29 +1,21 @@
1
  ---
2
- datasets: rh5_sample_dataset
3
  library_name: lerobot
4
  license: apache-2.0
5
- model_name: pi0
6
  pipeline_tag: robotics
7
  tags:
8
- - pi0
9
- - lerobot
10
  - robotics
 
 
11
  ---
12
 
13
- # Model Card for pi0
14
 
15
  <!-- Provide a quick summary of what the model is/does. -->
16
 
17
 
18
- **π₀ (Pi0)**
19
-
20
- π₀ is a Vision-Language-Action model for general robot control, from Physical Intelligence. The LeRobot implementation is adapted from their open source OpenPI repository.
21
-
22
- **Model Overview**
23
-
24
- π₀ represents a breakthrough in robotics as the first general-purpose robot foundation model developed by Physical Intelligence. Unlike traditional robots that are narrow specialists programmed for repetitive motions, π₀ is designed to be a generalist policy that can understand visual inputs, interpret natural language instructions, and control a variety of different robots across diverse tasks.
25
-
26
- For more details, see the [Physical Intelligence π₀ blog post](https://www.physicalintelligence.company/blog/pi0).
27
 
28
 
29
  This policy has been trained and pushed to the Hub using [LeRobot](https://github.com/huggingface/lerobot).
 
1
  ---
2
+ datasets: usr256864/lr_ds
3
  library_name: lerobot
4
  license: apache-2.0
5
+ model_name: groot
6
  pipeline_tag: robotics
7
  tags:
 
 
8
  - robotics
9
+ - lerobot
10
+ - groot
11
  ---
12
 
13
+ # Model Card for groot
14
 
15
  <!-- Provide a quick summary of what the model is/does. -->
16
 
17
 
18
+ _Model type not recognized — please update this template._
 
 
 
 
 
 
 
 
19
 
20
 
21
  This policy has been trained and pushed to the Hub using [LeRobot](https://github.com/huggingface/lerobot).
config.json CHANGED
@@ -1,5 +1,5 @@
1
  {
2
- "type": "pi0",
3
  "n_obs_steps": 1,
4
  "input_features": {
5
  "observation.image": {
@@ -27,49 +27,55 @@
27
  },
28
  "device": "cuda",
29
  "use_amp": false,
30
- "push_to_hub": false,
 
31
  "repo_id": "usr256864/pi0",
32
  "private": null,
33
  "tags": null,
34
  "license": null,
35
- "pretrained_path": "outputs/train/2025-11-14/01-13-16_pi0_training/checkpoints/080000/pretrained_model",
36
- "paligemma_variant": "gemma_2b",
37
- "action_expert_variant": "gemma_300m",
38
- "dtype": "bfloat16",
39
  "chunk_size": 50,
40
  "n_action_steps": 50,
41
- "max_state_dim": 32,
42
  "max_action_dim": 32,
43
- "num_inference_steps": 10,
44
- "time_sampling_beta_alpha": 1.5,
45
- "time_sampling_beta_beta": 1.0,
46
- "time_sampling_scale": 0.999,
47
- "time_sampling_offset": 0.001,
48
- "min_period": 0.004,
49
- "max_period": 4.0,
50
- "image_resolution": [
51
- 224,
52
- 224
53
- ],
54
- "empty_cameras": 0,
55
  "normalization_mapping": {
56
  "VISUAL": "IDENTITY",
57
  "STATE": "MEAN_STD",
58
  "ACTION": "MEAN_STD"
59
  },
60
- "gradient_checkpointing": true,
61
- "compile_model": false,
62
- "compile_mode": "max-autotune",
63
- "optimizer_lr": 2.5e-05,
 
 
 
 
 
 
 
 
 
 
 
 
64
  "optimizer_betas": [
65
- 0.9,
66
- 0.95
67
  ],
68
  "optimizer_eps": 1e-08,
69
- "optimizer_weight_decay": 0.01,
70
- "optimizer_grad_clip_norm": 1.0,
71
- "scheduler_warmup_steps": 1000,
72
- "scheduler_decay_steps": 30000,
73
- "scheduler_decay_lr": 2.5e-06,
74
- "tokenizer_max_length": 48
 
 
 
 
 
 
 
 
75
  }
 
1
  {
2
+ "type": "groot",
3
  "n_obs_steps": 1,
4
  "input_features": {
5
  "observation.image": {
 
27
  },
28
  "device": "cuda",
29
  "use_amp": false,
30
+ "use_peft": false,
31
+ "push_to_hub": true,
32
  "repo_id": "usr256864/pi0",
33
  "private": null,
34
  "tags": null,
35
  "license": null,
36
+ "pretrained_path": null,
 
 
 
37
  "chunk_size": 50,
38
  "n_action_steps": 50,
39
+ "max_state_dim": 64,
40
  "max_action_dim": 32,
 
 
 
 
 
 
 
 
 
 
 
 
41
  "normalization_mapping": {
42
  "VISUAL": "IDENTITY",
43
  "STATE": "MEAN_STD",
44
  "ACTION": "MEAN_STD"
45
  },
46
+ "image_size": [
47
+ 224,
48
+ 224
49
+ ],
50
+ "base_model_path": "nvidia/GR00T-N1.5-3B",
51
+ "tokenizer_assets_repo": "lerobot/eagle2hg-processor-groot-n1p5",
52
+ "embodiment_tag": "new_embodiment",
53
+ "tune_llm": false,
54
+ "tune_visual": false,
55
+ "tune_projector": true,
56
+ "tune_diffusion_model": true,
57
+ "lora_rank": 0,
58
+ "lora_alpha": 16,
59
+ "lora_dropout": 0.1,
60
+ "lora_full_model": false,
61
+ "optimizer_lr": 0.0001,
62
  "optimizer_betas": [
63
+ 0.95,
64
+ 0.999
65
  ],
66
  "optimizer_eps": 1e-08,
67
+ "optimizer_weight_decay": 1e-05,
68
+ "warmup_ratio": 0.05,
69
+ "use_bf16": true,
70
+ "video_backend": "decord",
71
+ "balance_dataset_weights": true,
72
+ "balance_trajectory_weights": true,
73
+ "dataset_paths": null,
74
+ "output_dir": "./tmp/gr00t",
75
+ "save_steps": 1000,
76
+ "max_steps": 10000,
77
+ "batch_size": 32,
78
+ "dataloader_num_workers": 8,
79
+ "report_to": "wandb",
80
+ "resume": false
81
  }
model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:b7bd1aaac8507f32f420e53e36701f0a3b23fe63a53ef25405384355c1a35e9d
3
- size 7011548640
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:411b556159f0e7518b7ee80cffdc85dc6f5e54c8c5722ae86b30308c349e5b48
3
+ size 6964802952
train_config.json CHANGED
@@ -1,7 +1,7 @@
1
  {
2
  "dataset": {
3
- "repo_id": "rh5_sample_dataset",
4
- "root": "../datasets/RH5_dataset/",
5
  "episodes": null,
6
  "image_transforms": {
7
  "enable": false,
@@ -79,9 +79,48 @@
79
  "video_backend": "torchcodec",
80
  "streaming": false
81
  },
82
- "env": null,
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
83
  "policy": {
84
- "type": "pi0",
85
  "n_obs_steps": 1,
86
  "input_features": {
87
  "observation.image": {
@@ -109,96 +148,114 @@
109
  },
110
  "device": "cuda",
111
  "use_amp": false,
112
- "push_to_hub": false,
 
113
  "repo_id": "usr256864/pi0",
114
  "private": null,
115
  "tags": null,
116
  "license": null,
117
- "pretrained_path": "outputs/train/2025-11-14/01-13-16_pi0_training/checkpoints/080000/pretrained_model",
118
- "paligemma_variant": "gemma_2b",
119
- "action_expert_variant": "gemma_300m",
120
- "dtype": "bfloat16",
121
  "chunk_size": 50,
122
  "n_action_steps": 50,
123
- "max_state_dim": 32,
124
  "max_action_dim": 32,
125
- "num_inference_steps": 10,
126
- "time_sampling_beta_alpha": 1.5,
127
- "time_sampling_beta_beta": 1.0,
128
- "time_sampling_scale": 0.999,
129
- "time_sampling_offset": 0.001,
130
- "min_period": 0.004,
131
- "max_period": 4.0,
132
- "image_resolution": [
133
- 224,
134
- 224
135
- ],
136
- "empty_cameras": 0,
137
  "normalization_mapping": {
138
  "VISUAL": "IDENTITY",
139
  "STATE": "MEAN_STD",
140
  "ACTION": "MEAN_STD"
141
  },
142
- "gradient_checkpointing": true,
143
- "compile_model": false,
144
- "compile_mode": "max-autotune",
145
- "optimizer_lr": 2.5e-05,
 
 
 
 
 
 
 
 
 
 
 
 
146
  "optimizer_betas": [
147
- 0.9,
148
- 0.95
149
  ],
150
  "optimizer_eps": 1e-08,
151
- "optimizer_weight_decay": 0.01,
152
- "optimizer_grad_clip_norm": 1.0,
153
- "scheduler_warmup_steps": 1000,
154
- "scheduler_decay_steps": 30000,
155
- "scheduler_decay_lr": 2.5e-06,
156
- "tokenizer_max_length": 48
 
 
 
 
 
 
 
 
157
  },
158
- "output_dir": "outputs/train/2025-11-14/01-13-16_pi0_training",
159
- "job_name": "pi0_training",
160
- "resume": true,
161
  "seed": 1000,
162
  "num_workers": 4,
163
- "batch_size": 32,
164
- "steps": 200000,
165
- "eval_freq": 20000,
166
- "log_freq": 200,
 
167
  "save_checkpoint": true,
168
- "save_freq": 20000,
169
  "use_policy_training_preset": true,
170
  "optimizer": {
171
  "type": "adamw",
172
- "lr": 2.5e-05,
173
- "weight_decay": 0.01,
174
- "grad_clip_norm": 1.0,
175
  "betas": [
176
- 0.9,
177
- 0.95
178
  ],
179
  "eps": 1e-08
180
  },
181
  "scheduler": {
182
  "type": "cosine_decay_with_warmup",
183
- "num_warmup_steps": 1000,
184
- "num_decay_steps": 30000,
185
- "peak_lr": 2.5e-05,
186
- "decay_lr": 2.5e-06
187
  },
188
  "eval": {
189
- "n_episodes": 50,
190
- "batch_size": 50,
191
  "use_async_envs": false
192
  },
193
  "wandb": {
194
- "enable": true,
195
  "disable_artifact": true,
196
  "project": "lerobot",
197
  "entity": null,
198
  "notes": null,
199
- "run_id": "k9pdbqh0",
200
  "mode": null
201
  },
202
- "checkpoint_path": "outputs/train/2025-11-14/01-13-16_pi0_training/checkpoints/080000",
203
- "rename_map": {}
 
 
 
 
 
 
 
 
 
 
 
204
  }
 
1
  {
2
  "dataset": {
3
+ "repo_id": "usr256864/lr_ds",
4
+ "root": "../datasets/RH5_dataset_qdot/",
5
  "episodes": null,
6
  "image_transforms": {
7
  "enable": false,
 
79
  "video_backend": "torchcodec",
80
  "streaming": false
81
  },
82
+ "env": {
83
+ "type": "rh5",
84
+ "task": "walk",
85
+ "fps": 30,
86
+ "features": {
87
+ "action": {
88
+ "type": "ACTION",
89
+ "shape": [
90
+ 32
91
+ ]
92
+ },
93
+ "agent_pos": {
94
+ "type": "STATE",
95
+ "shape": [
96
+ 63
97
+ ]
98
+ },
99
+ "pixels/top": {
100
+ "type": "VISUAL",
101
+ "shape": [
102
+ 480,
103
+ 640,
104
+ 3
105
+ ]
106
+ }
107
+ },
108
+ "features_map": {
109
+ "action": "action",
110
+ "agent_pos": "observation.state",
111
+ "top": "observation.image",
112
+ "pixels/top": "observation.image"
113
+ },
114
+ "max_parallel_tasks": 1,
115
+ "disable_env_checker": true,
116
+ "config": null,
117
+ "episode_length": 1000,
118
+ "obs_type": "pixels_agent_pos",
119
+ "render_mode": "rgb_array",
120
+ "use_velocity": false
121
+ },
122
  "policy": {
123
+ "type": "groot",
124
  "n_obs_steps": 1,
125
  "input_features": {
126
  "observation.image": {
 
148
  },
149
  "device": "cuda",
150
  "use_amp": false,
151
+ "use_peft": false,
152
+ "push_to_hub": true,
153
  "repo_id": "usr256864/pi0",
154
  "private": null,
155
  "tags": null,
156
  "license": null,
157
+ "pretrained_path": null,
 
 
 
158
  "chunk_size": 50,
159
  "n_action_steps": 50,
160
+ "max_state_dim": 64,
161
  "max_action_dim": 32,
 
 
 
 
 
 
 
 
 
 
 
 
162
  "normalization_mapping": {
163
  "VISUAL": "IDENTITY",
164
  "STATE": "MEAN_STD",
165
  "ACTION": "MEAN_STD"
166
  },
167
+ "image_size": [
168
+ 224,
169
+ 224
170
+ ],
171
+ "base_model_path": "nvidia/GR00T-N1.5-3B",
172
+ "tokenizer_assets_repo": "lerobot/eagle2hg-processor-groot-n1p5",
173
+ "embodiment_tag": "new_embodiment",
174
+ "tune_llm": false,
175
+ "tune_visual": false,
176
+ "tune_projector": true,
177
+ "tune_diffusion_model": true,
178
+ "lora_rank": 0,
179
+ "lora_alpha": 16,
180
+ "lora_dropout": 0.1,
181
+ "lora_full_model": false,
182
+ "optimizer_lr": 0.0001,
183
  "optimizer_betas": [
184
+ 0.95,
185
+ 0.999
186
  ],
187
  "optimizer_eps": 1e-08,
188
+ "optimizer_weight_decay": 1e-05,
189
+ "warmup_ratio": 0.05,
190
+ "use_bf16": true,
191
+ "video_backend": "decord",
192
+ "balance_dataset_weights": true,
193
+ "balance_trajectory_weights": true,
194
+ "dataset_paths": null,
195
+ "output_dir": "./tmp/gr00t",
196
+ "save_steps": 1000,
197
+ "max_steps": 10000,
198
+ "batch_size": 32,
199
+ "dataloader_num_workers": 8,
200
+ "report_to": "wandb",
201
+ "resume": false
202
  },
203
+ "output_dir": "outputs/train/2026-02-11/13-18-22_debug_train",
204
+ "job_name": "debug_train",
205
+ "resume": false,
206
  "seed": 1000,
207
  "num_workers": 4,
208
+ "batch_size": 1,
209
+ "steps": 2,
210
+ "eval_freq": 0,
211
+ "log_freq": 2,
212
+ "tolerance_s": 0.0001,
213
  "save_checkpoint": true,
214
+ "save_freq": 2,
215
  "use_policy_training_preset": true,
216
  "optimizer": {
217
  "type": "adamw",
218
+ "lr": 0.0001,
219
+ "weight_decay": 1e-05,
220
+ "grad_clip_norm": 10.0,
221
  "betas": [
222
+ 0.95,
223
+ 0.999
224
  ],
225
  "eps": 1e-08
226
  },
227
  "scheduler": {
228
  "type": "cosine_decay_with_warmup",
229
+ "num_warmup_steps": 500,
230
+ "num_decay_steps": 10000,
231
+ "peak_lr": 0.0001,
232
+ "decay_lr": 1e-05
233
  },
234
  "eval": {
235
+ "n_episodes": 1,
236
+ "batch_size": 1,
237
  "use_async_envs": false
238
  },
239
  "wandb": {
240
+ "enable": false,
241
  "disable_artifact": true,
242
  "project": "lerobot",
243
  "entity": null,
244
  "notes": null,
245
+ "run_id": null,
246
  "mode": null
247
  },
248
+ "peft": null,
249
+ "use_rabc": false,
250
+ "rabc_progress_path": null,
251
+ "rabc_kappa": 0.01,
252
+ "rabc_epsilon": 1e-06,
253
+ "rabc_head_mode": "sparse",
254
+ "rename_map": {},
255
+ "checkpoint_path": null,
256
+ "eval_ds": "../datasets/RH5_dataset_qdot/",
257
+ "episode_idx": 0,
258
+ "absolute": false,
259
+ "num_eval_samples": 20,
260
+ "use_velocity": true
261
  }