VLyb committed on
Commit
92f6a68
·
verified ·
1 Parent(s): 3986c27

Upload folder using huggingface_hub

Browse files
config.yaml ADDED
@@ -0,0 +1,107 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ datasets:
2
+ vla_data:
3
+ CoT_prompt: '{instruction}'
4
+ data_mix: fourier_gr1_unified_1000
5
+ data_root_dir: playground/Datasets/PhysicalAI-Robotics-GR00T-X-Embodiment-Sim
6
+ delete_pause_frame: false
7
+ image_size:
8
+ - 224
9
+ - 224
10
+ per_device_batch_size: 16
11
+ video_backend: pyav
12
+ frameskip:
13
+ cache_dir: playground/frameskip/frameskip_cache_vac_cr20-100
14
+ default_compression_ratio: 1.0
15
+ enabled: true
16
+ importance:
17
+ allow_backend_fallback: false
18
+ alpha: 0.6
19
+ beta: 0.2
20
+ device: cuda
21
+ enable_vac: true
22
+ gamma: 0.2
23
+ max_vac_frames: 16
24
+ type: gripper_aware
25
+ vac_beta: 0.2
26
+ video_backend: ffmpeg
27
+ visual_encoder_checkpoint: /mnt/project_ai4edu/share/models/timm/vit_large_patch14_dinov2.lvd142m/pytorch_model.bin
28
+ visual_encoder_name: vit_large_patch14_dinov2
29
+ pruning:
30
+ compression_ratios:
31
+ - 0.2
32
+ - 0.3
33
+ - 0.4
34
+ - 0.5
35
+ - 0.6
36
+ - 0.7
37
+ - 0.8
38
+ - 0.9
39
+ - 1.0
40
+ used_compression_ratios:
41
+ - 0.2
42
+ - 0.2
43
+ - 0.2
44
+ - 0.2
45
+ - 0.2
46
+ - 1.0
47
+ training:
48
+ dynamic_ratio: true
49
+ ratio_schedule: uniform
50
+ warmup_steps: 5000
51
+ framework:
52
+ action_model:
53
+ action_dim: 29
54
+ action_horizon: 16
55
+ action_model_type: DiT-B
56
+ add_pos_embed: true
57
+ diffusion_model_cfg:
58
+ cross_attention_dim: 2560
59
+ dropout: 0.2
60
+ final_dropout: true
61
+ interleave_self_attention: true
62
+ norm_type: ada_norm
63
+ num_layers: 16
64
+ output_dim: 2560
65
+ positional_embeddings: null
66
+ future_action_window_size: 15
67
+ hidden_size: 2560
68
+ max_seq_len: 1024
69
+ noise_beta_alpha: 1.5
70
+ noise_beta_beta: 1.0
71
+ noise_s: 0.999
72
+ num_inference_timesteps: 4
73
+ num_target_vision_tokens: 32
74
+ num_timestep_buckets: 1000
75
+ past_action_window_size: 0
76
+ state_dim: 58
77
+ name: QwenGR00T
78
+ qwenvl:
79
+ base_vlm: Qwen/Qwen3-VL-4B-Instruct
80
+ template: qwen3_vl
81
+ run_root_dir: ./results/Checkpoints/FrameSkip/RoboCasa
82
+ seed: 42
83
+ trainer:
84
+ eval_interval: 1000
85
+ freeze_modules: true
86
+ gradient_accumulation_steps: 1
87
+ gradient_clipping: 1.0
88
+ is_resume: true
89
+ learning_rate:
90
+ action_model: 0.0001
91
+ base: 1.0e-05
92
+ qwen_vl_interface: 1.0e-05
93
+ logging_frequency: 100
94
+ lr_scheduler_type: cosine_with_min_lr
95
+ max_train_steps: 100000
96
+ num_warmup_steps: 5000
97
+ optimizer:
98
+ betas:
99
+ - 0.9
100
+ - 0.95
101
+ eps: 1.0e-08
102
+ weight_decay: 1.0e-08
103
+ save_interval: 10000
104
+ scheduler_specific_kwargs:
105
+ min_lr: 5.0e-07
106
+ wandb_entity: jinhuiye
107
+ wandb_project: starVLA
dataset_statistics.json ADDED
@@ -0,0 +1,413 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "gr1": {
3
+ "action": {
4
+ "mean": [
5
+ -0.17387242737175262,
6
+ 0.23178295650795291,
7
+ -0.11246717392234765,
8
+ -1.467058948616805,
9
+ 0.17808004331039098,
10
+ 0.0969788919022288,
11
+ -0.006060623051541402,
12
+ -0.32863660886675217,
13
+ -0.3234929513029891,
14
+ 0.07824063870040202,
15
+ -1.4673328909105674,
16
+ 0.3436010789007535,
17
+ 0.07368239935797284,
18
+ 0.17824148321565236,
19
+ -0.22454509710602624,
20
+ -0.22454509710602624,
21
+ -0.22454509710602624,
22
+ -0.22454509710602624,
23
+ -0.4490901942120525,
24
+ 1.1117459333448283,
25
+ -0.47756699373305467,
26
+ -0.47756699373305467,
27
+ -0.47756699373305467,
28
+ -0.47756699373305467,
29
+ -0.9551339874661093,
30
+ 3.0,
31
+ 0.0036528927656546556,
32
+ 0.006440042419582474,
33
+ -0.0002253371531922458
34
+ ],
35
+ "std": [
36
+ 0.3826029805228521,
37
+ 0.1781406519748235,
38
+ 0.2679951519523225,
39
+ 0.4803346762693267,
40
+ 0.2980327261875639,
41
+ 0.2925941807087268,
42
+ 0.32539785972692925,
43
+ 0.5154880467093165,
44
+ 0.28700745861256066,
45
+ 0.39340010996830976,
46
+ 0.7028232145801553,
47
+ 0.5286632242394153,
48
+ 0.397017790442305,
49
+ 0.6155189029066219,
50
+ 0.8853914917919973,
51
+ 0.8853914917919973,
52
+ 0.8853914917919973,
53
+ 0.8853914917919973,
54
+ 1.7707829835839946,
55
+ 1.4488819067562828,
56
+ 1.421995748357164,
57
+ 1.421995748357164,
58
+ 1.421995748357164,
59
+ 1.421995748357164,
60
+ 2.843991496714328,
61
+ 0.0,
62
+ 0.0695567278029747,
63
+ 0.020305646265368658,
64
+ 0.005463839840361966
65
+ ],
66
+ "max": [
67
+ 1.4058303833007812,
68
+ 1.288877010345459,
69
+ 1.2944501638412476,
70
+ 3.1500876502832398e-06,
71
+ 2.563594102859497,
72
+ 1.5000286102294922,
73
+ 1.4998135566711426,
74
+ 1.564226508140564,
75
+ 0.00015454324602615088,
76
+ 1.7984894514083862,
77
+ 5.365318065742031e-05,
78
+ 3.0000767707824707,
79
+ 1.4954047203063965,
80
+ 1.4975833892822266,
81
+ 1.5,
82
+ 1.5,
83
+ 1.5,
84
+ 1.5,
85
+ 3.0,
86
+ 3.0,
87
+ 1.5,
88
+ 1.5,
89
+ 1.5,
90
+ 1.5,
91
+ 3.0,
92
+ 3.0,
93
+ 0.9750414490699768,
94
+ 0.34772318601608276,
95
+ 0.5310259461402893
96
+ ],
97
+ "min": [
98
+ -1.710237741470337,
99
+ -0.00042632038821466267,
100
+ -1.4035195112228394,
101
+ -2.801373243331909,
102
+ -2.033860445022583,
103
+ -1.4939793348312378,
104
+ -1.3439968824386597,
105
+ -2.1020591259002686,
106
+ -2.2016870975494385,
107
+ -2.3005123138427734,
108
+ -2.848569631576538,
109
+ -3.000068426132202,
110
+ -1.4995447397232056,
111
+ -1.489180326461792,
112
+ -1.5,
113
+ -1.5,
114
+ -1.5,
115
+ -1.5,
116
+ -3.0,
117
+ 0.0,
118
+ -1.5,
119
+ -1.5,
120
+ -1.5,
121
+ -1.5,
122
+ -3.0,
123
+ 3.0,
124
+ -0.5332962870597839,
125
+ -0.4947744905948639,
126
+ -0.4128894805908203
127
+ ],
128
+ "q01": [
129
+ -1.6453754484653473,
130
+ -7.352335887844674e-05,
131
+ -1.1551570868492127,
132
+ -2.7360924339294432,
133
+ -0.8502070605754852,
134
+ -1.0754927098751068,
135
+ -1.2199868965148926,
136
+ -1.699393036365509,
137
+ -1.3113291025161744,
138
+ -0.9920944452285767,
139
+ -2.7749218344688416,
140
+ -0.9589024305343627,
141
+ -1.3624527990818023,
142
+ -1.177962738275528,
143
+ -1.5,
144
+ -1.5,
145
+ -1.5,
146
+ -1.5,
147
+ -3.0,
148
+ 0.0,
149
+ -1.5,
150
+ -1.5,
151
+ -1.5,
152
+ -1.5,
153
+ -3.0,
154
+ 3.0,
155
+ -0.45793325632810594,
156
+ -0.04522607177495956,
157
+ -0.029049276374280453
158
+ ],
159
+ "q99": [
160
+ 1.1092832422256476,
161
+ 1.140557736158371,
162
+ 0.7091880106925965,
163
+ -0.01566793117672205,
164
+ 1.4978188574314117,
165
+ 1.1059463322162628,
166
+ 1.0923435854911796,
167
+ 1.1635798215866089,
168
+ -4.211934747217997e-06,
169
+ 1.1038778030872343,
170
+ -0.03212724145501838,
171
+ 1.9471237277984617,
172
+ 1.2183190023899073,
173
+ 1.4874796867370605,
174
+ 1.5,
175
+ 1.5,
176
+ 1.5,
177
+ 1.5,
178
+ 3.0,
179
+ 3.0,
180
+ 1.5,
181
+ 1.5,
182
+ 1.5,
183
+ 1.5,
184
+ 3.0,
185
+ 3.0,
186
+ 0.2767475765943526,
187
+ 0.11469113424420346,
188
+ 0.014944081632420426
189
+ ],
190
+ "mask": [
191
+ true,
192
+ true,
193
+ true,
194
+ true,
195
+ true,
196
+ true,
197
+ true,
198
+ true,
199
+ true,
200
+ true,
201
+ true,
202
+ true,
203
+ true,
204
+ true,
205
+ true,
206
+ true,
207
+ true,
208
+ true,
209
+ true,
210
+ true,
211
+ true,
212
+ true,
213
+ true,
214
+ true,
215
+ true,
216
+ true,
217
+ true,
218
+ true,
219
+ true
220
+ ]
221
+ },
222
+ "state": {
223
+ "mean": [
224
+ -0.1710260256064159,
225
+ 0.23514010013260706,
226
+ -0.11290985507224512,
227
+ -1.4712710221923215,
228
+ 0.177862105393054,
229
+ 0.10149721653338932,
230
+ -0.00641375726169353,
231
+ -0.3203161980008616,
232
+ -0.3216722056395032,
233
+ 0.0849948406023539,
234
+ -1.472882336935645,
235
+ 0.33776022525175214,
236
+ 0.06909735923601293,
237
+ 0.16150971415455723,
238
+ 0.150227671335535,
239
+ 0.14950177079712157,
240
+ 0.13247238367410155,
241
+ 0.14930497337708834,
242
+ 0.034658935748789574,
243
+ 0.6349662932525478,
244
+ 0.48722118094888556,
245
+ 0.45771242576979354,
246
+ 0.4219110799674228,
247
+ 0.4522155710942671,
248
+ 0.07552173433224176,
249
+ 1.6706057664213183,
250
+ 0.003597618940209368,
251
+ 0.004405942099600034,
252
+ -8.767778306670624e-05
253
+ ],
254
+ "std": [
255
+ 0.37523450948864817,
256
+ 0.17813893782136045,
257
+ 0.26538151147352895,
258
+ 0.4662377915649439,
259
+ 0.2902752765220148,
260
+ 0.28593534005347176,
261
+ 0.31542085507384054,
262
+ 0.5024409297760511,
263
+ 0.2778536773357909,
264
+ 0.37863340646498084,
265
+ 0.6705175321753379,
266
+ 0.5231741476891753,
267
+ 0.3766218649545248,
268
+ 0.5706061777973751,
269
+ 0.41843350452688033,
270
+ 0.40050613293235954,
271
+ 0.35383605559505465,
272
+ 0.4026813894136598,
273
+ 0.13891330928169826,
274
+ 0.8207457531523573,
275
+ 0.593772268328117,
276
+ 0.5514249405930985,
277
+ 0.5070474508560131,
278
+ 0.5440991761001858,
279
+ 0.1703107040669717,
280
+ 0.21296248701379483,
281
+ 0.0662141869051629,
282
+ 0.019639382736588717,
283
+ 0.007552132377497403
284
+ ],
285
+ "max": [
286
+ 1.3502349853515625,
287
+ 1.2633577585220337,
288
+ 1.2589013576507568,
289
+ 0.001734813442453742,
290
+ 2.521491289138794,
291
+ 1.526998519897461,
292
+ 1.496475338935852,
293
+ 1.5148204565048218,
294
+ 0.003278259886428714,
295
+ 1.7851011753082275,
296
+ 0.0016116079641506076,
297
+ 3.0015335083007812,
298
+ 1.4080945253372192,
299
+ 1.4516682624816895,
300
+ 2.0179455280303955,
301
+ 2.009377956390381,
302
+ 2.6196515560150146,
303
+ 1.8978251218795776,
304
+ 3.2151029109954834,
305
+ 2.7924649715423584,
306
+ 2.7859506607055664,
307
+ 2.1664254665374756,
308
+ 3.0131356716156006,
309
+ 2.69866681098938,
310
+ 1.4733597040176392,
311
+ 2.079848289489746,
312
+ 0.937696099281311,
313
+ 0.3457968235015869,
314
+ 0.47687003016471863
315
+ ],
316
+ "min": [
317
+ -1.6789460182189941,
318
+ -0.026101894676685333,
319
+ -1.3480229377746582,
320
+ -2.5160419940948486,
321
+ -1.9940674304962158,
322
+ -1.3795876502990723,
323
+ -1.1958755254745483,
324
+ -2.0664756298065186,
325
+ -2.1021976470947266,
326
+ -2.296651601791382,
327
+ -2.5318210124969482,
328
+ -3.0013694763183594,
329
+ -1.4908946752548218,
330
+ -1.2908861637115479,
331
+ -1.4389894008636475,
332
+ -1.8303323984146118,
333
+ -2.4635109901428223,
334
+ -1.7167329788208008,
335
+ -2.218892812728882,
336
+ -1.526924967765808,
337
+ -1.4716511964797974,
338
+ -2.0171985626220703,
339
+ -2.412123203277588,
340
+ -1.189025640487671,
341
+ -0.8325809836387634,
342
+ -0.21484142541885376,
343
+ -0.5222951769828796,
344
+ -0.42820972204208374,
345
+ -0.39791223406791687
346
+ ],
347
+ "q01": [
348
+ -1.6401696801185608,
349
+ -0.0021117788553237913,
350
+ -1.136602680683136,
351
+ -2.5065788412094117,
352
+ -0.8428557366132736,
353
+ -1.0090796053409576,
354
+ -1.0905668175220489,
355
+ -1.6940901970863342,
356
+ -1.2592608690261842,
357
+ -0.9485023188591003,
358
+ -2.524535834789276,
359
+ -0.9369082593917847,
360
+ -1.2690116608142852,
361
+ -1.070357494354248,
362
+ -0.48410280704498293,
363
+ -0.26667029321193697,
364
+ -0.22677424252033235,
365
+ -0.2616843205690384,
366
+ -0.2044905386865139,
367
+ -0.046128811538219454,
368
+ -0.025738642178475858,
369
+ -0.008413693476468325,
370
+ -0.06011074289679527,
371
+ -0.007438082443550229,
372
+ -0.49244091659784317,
373
+ 0.32079766273498533,
374
+ -0.4424374091625214,
375
+ -0.042612580582499504,
376
+ -0.030681067146360874
377
+ ],
378
+ "q99": [
379
+ 1.1068614256382001,
380
+ 1.135889083147049,
381
+ 0.7082531070709233,
382
+ -0.030924458522349596,
383
+ 1.4936031103134155,
384
+ 1.071806162595749,
385
+ 1.0435830056667328,
386
+ 1.1315186619758606,
387
+ 0.0004920228820992634,
388
+ 1.0889833045005788,
389
+ -0.0453558095544572,
390
+ 1.9339820933341976,
391
+ 1.0967729890346527,
392
+ 1.2506092643737792,
393
+ 1.508325070142746,
394
+ 1.5029944777488708,
395
+ 1.5275386273860931,
396
+ 1.5626549482345582,
397
+ 1.1534690403938292,
398
+ 1.9877541887760162,
399
+ 1.6979391312599157,
400
+ 1.5753892362117767,
401
+ 2.761149823665619,
402
+ 1.699782818555832,
403
+ 0.898365780711174,
404
+ 1.8441466689109802,
405
+ 0.2744007483124733,
406
+ 0.11413956061005591,
407
+ 0.04111658498644853
408
+ ]
409
+ },
410
+ "num_transitions": 6020058,
411
+ "num_trajectories": 24000
412
+ }
413
+ }
final_model/pytorch_model.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:8a1e1bc66e9f3bb3bc9ded5a5a0cc5b17bee5d4a89992a1698358672a9708b08
3
+ size 9993022034