lsnu committed on
Commit
c725033
·
verified ·
1 Parent(s): 6e69f50

Add files using upload-large-folder tool

Browse files
This view is limited to 50 files because it contains too many changes.   See raw diff
Files changed (50) hide show
  1. MODEL_AND_ARTIFACT_INDEX.md +47 -0
  2. README.md +363 -0
  3. code/VLAarchtests2_code/VLAarchtests/.pytest_cache/.gitignore +2 -0
  4. code/VLAarchtests2_code/VLAarchtests/.pytest_cache/CACHEDIR.TAG +4 -0
  5. code/VLAarchtests2_code/VLAarchtests/.pytest_cache/README.md +8 -0
  6. code/VLAarchtests2_code/VLAarchtests/.pytest_cache/v/cache/lastfailed +1 -0
  7. code/VLAarchtests2_code/VLAarchtests/.pytest_cache/v/cache/nodeids +11 -0
  8. code/VLAarchtests2_code/VLAarchtests/artifacts/generated_configs/public_benchmark_package_v1.json +80 -0
  9. code/VLAarchtests2_code/VLAarchtests/code/reveal_vla_bimanual/sim_reveal/__pycache__/__init__.cpython-310.pyc +0 -0
  10. code/VLAarchtests2_code/VLAarchtests/code/reveal_vla_bimanual/sim_reveal/__pycache__/__init__.cpython-311.pyc +0 -0
  11. code/VLAarchtests2_code/VLAarchtests/code/reveal_vla_bimanual/sim_reveal/__pycache__/base.cpython-310.pyc +0 -0
  12. code/VLAarchtests2_code/VLAarchtests/code/reveal_vla_bimanual/sim_reveal/__pycache__/procedural_envs.cpython-310.pyc +0 -0
  13. code/VLAarchtests2_code/VLAarchtests/code/reveal_vla_bimanual/sim_reveal/__pycache__/proxy_specs.cpython-310.pyc +0 -0
  14. docs/maniskill_pickclutter_correction_log_2026-04-01.md +187 -0
  15. docs/minimum_sign_of_life_maniskill_pickclutter_run_2026-04-01.md +134 -0
  16. docs/public_benchmark_progress_2026-04-01.md +91 -0
  17. docs/public_bridge_smoke_run_log_2026-04-01.md +116 -0
  18. reports/anchor_dual_push_smoke/original_trunk/rollout_eval.partial.json +29 -0
  19. reports/anybimanual_anchor_bridge_live/trunk_only_ep5/stderr.txt +20 -0
  20. reports/maniskill_bag_bridge_val_sweep_seed23/conservative/adapter_active_ft_seed23.json +131 -0
  21. reports/maniskill_bag_bridge_val_sweep_seed23/conservative/adapter_noop_seed23.json +110 -0
  22. reports/maniskill_bag_bridge_val_sweep_seed23/conservative/run.log +76 -0
  23. reports/maniskill_bag_bridge_val_sweep_seed23/default/adapter_active_ft_seed23.json +131 -0
  24. reports/maniskill_bag_bridge_val_sweep_seed23/default/adapter_noop_seed23.json +110 -0
  25. reports/maniskill_bag_bridge_val_sweep_seed23/default/public_benchmark_package_summary.json +60 -0
  26. reports/maniskill_bag_bridge_val_sweep_seed23/default/public_benchmark_package_summary.md +15 -0
  27. reports/maniskill_bag_bridge_val_sweep_seed23/default/run.log +76 -0
  28. reports/maniskill_bag_bridge_val_sweep_seed23/default/trunk_only_ft_seed23.json +131 -0
  29. reports/maniskill_bag_bridge_val_sweep_seed23/less_bonus/public_benchmark_package_summary.md +15 -0
  30. reports/maniskill_bag_bridge_val_sweep_seed23/less_bonus/trunk_only_ft_seed23.json +131 -0
  31. reports/maniskill_bag_bridge_val_sweep_seed23/low_bonus_high_thresh/adapter_noop_seed23.json +110 -0
  32. reports/maniskill_bag_bridge_val_sweep_seed23/low_bonus_high_thresh/public_benchmark_package_summary.json +60 -0
  33. reports/maniskill_bag_bridge_val_sweep_seed23/low_bonus_high_thresh/public_benchmark_package_summary.md +15 -0
  34. reports/maniskill_bag_bridge_val_sweep_seed23/low_bonus_high_thresh/run.log +76 -0
  35. reports/maniskill_bag_bridge_val_sweep_seed23/low_bonus_high_thresh/trunk_only_ft_seed23.json +131 -0
  36. reports/maniskill_cloth_bridge_smoke_v1/adapter_active_ft_seed17.json +509 -0
  37. reports/maniskill_cloth_bridge_smoke_v1/adapter_active_ft_seed23.json +509 -0
  38. reports/maniskill_cloth_bridge_smoke_v1/adapter_active_ft_seed29.json +509 -0
  39. reports/maniskill_cloth_bridge_smoke_v1/adapter_noop_seed17.json +488 -0
  40. reports/maniskill_cloth_bridge_smoke_v1/adapter_noop_seed23.json +488 -0
  41. reports/maniskill_cloth_bridge_smoke_v1/adapter_noop_seed29.json +488 -0
  42. reports/maniskill_cloth_bridge_smoke_v1/public_benchmark_package_summary.json +60 -0
  43. reports/maniskill_cloth_bridge_smoke_v1/public_benchmark_package_summary.md +15 -0
  44. reports/maniskill_cloth_bridge_smoke_v1/trunk_only_ft_seed17.json +509 -0
  45. reports/maniskill_cloth_bridge_smoke_v1/trunk_only_ft_seed23.json +509 -0
  46. reports/maniskill_cloth_bridge_smoke_v1/trunk_only_ft_seed29.json +509 -0
  47. reports/maniskill_pickclutter_smoke_v2/adapter_active_ft_seed17.json +508 -0
  48. reports/maniskill_pickclutter_smoke_v2/adapter_noop_seed17.json +508 -0
  49. reports/maniskill_pickclutter_smoke_v2/public_benchmark_package_summary.json +62 -0
  50. reports/maniskill_pickclutter_smoke_v2/public_benchmark_package_summary.md +14 -0
MODEL_AND_ARTIFACT_INDEX.md ADDED
@@ -0,0 +1,47 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ # Model And Artifact Index
2
+
3
+ ## Main Code Roots
4
+
5
+ - `code/VLAarchtests2_code/VLAarchtests/code/reveal_vla_bimanual/`
6
+ - `code/VLAarchtests2_code/VLAarchtests/tests/`
7
+
8
+ ## Main Prior Handoff Roots
9
+
10
+ - `artifacts/`
11
+ - `docs/`
12
+ - `legacy/`
13
+ - `setup/`
14
+
15
+ ## Main Current Public Benchmark Roots
16
+
17
+ - `reports/maniskill_pickclutter_smoke_v5_eval_tuned_softerpref/`
18
+   - strongest current dense-occlusion result
19
+ - `reports/maniskill_bag_bridge_eval_less_bonus_seed17/`
20
+ - `reports/maniskill_bag_bridge_eval_less_bonus_seed23/`
21
+ - `reports/maniskill_bag_bridge_eval_less_bonus_2seed_manual_summary.json`
22
+ - `reports/maniskill_cloth_bridge_smoke_v1/`
23
+ - `reports/maniskill_cloth_bridge_val_sweep_seed23/`
24
+
25
+ ## Main Current Checkpoint Roots
26
+
27
+ - `outputs/maniskill_pickclutter_smoke_v5/`
28
+ - `outputs/maniskill_bag_bridge_smoke_v1/`
29
+ - `outputs/maniskill_cloth_bridge_smoke_v1/`
30
+
31
+ ## Main Current Dataset Roots
32
+
33
+ - `data/maniskill_pickclutter/`
34
+ - `data/maniskill_bridge_retrieval/`
35
+ - `data/reveal_proxy/`
36
+
37
+ ## Main Current Docs
38
+
39
+ - `docs/maniskill_pickclutter_correction_log_2026-04-01.md`
40
+ - `docs/public_bridge_smoke_run_log_2026-04-01.md`
41
+ - `docs/minimum_sign_of_life_maniskill_pickclutter_run_2026-04-01.md`
42
+
43
+ ## Repo History
44
+
45
+ - `history/VLAarchtests_previous_README.md`
46
+ - `history/VLAarchtests2_previous_README.md`
47
+ - `history/VLAarchtests3_previous_README.md`
README.md ADDED
@@ -0,0 +1,363 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ # VLAarchtests4
2
+
3
+ `VLAarchtests4` is the fresh organization repo for the RunPod work staged from `/workspace` on `2026-04-01 UTC`.
4
+
5
+ It carries forward the earlier repo lineage and adds the current public-sim benchmark package work:
6
+
7
+ - `VLAarchtests`
8
+ - early proxy + RLBench architecture search, handoff checkpoints, and environment recreation files from the `2026-03-25/26` sessions
9
+ - `VLAarchtests2`
10
+ - larger exploratory organization repo with more baselines, overlap/anchor work, frequent model changes, mixed artifacts, and several results that required later reinterpretation
11
+ - `VLAarchtests3`
12
+ - cleaned export focused on the elastic-occlusion `trunk + structured adapter + no-op fallback` refactor, validated tests, current checkpoints, and handoff docs
13
+ - `VLAarchtests4`
14
+ - keeps the `VLAarchtests3` export intact and adds the full current workspace `reports/`, `outputs/`, and `data/` trees, including all public benchmark smoke runs, checkpoint directories, dataset bundles, validation sweeps, and environment snapshots from the public-sim evaluation pass
15
+
16
+ ## What This Repo Adds
17
+
18
+ The main new addition in this repo is the public benchmark track work for the elastic-occlusion adapter:
19
+
20
+ - real public-sim smoke runs on:
21
+ - ManiSkill `PickClutterYCB-v1` as the dense occluded retrieval proxy
22
+ - ManiSkill bridge basket retrieval proxy as the bag retrieval proxy
23
+ - ManiSkill bridge cloth retrieval proxy as the folded-cloth retrieval proxy
24
+ - the public benchmark package code and summaries
25
+ - the train/eval logs, checkpoints, cached datasets, validation sweeps, and correction logs for those runs
26
+ - the same-machine environment snapshot for the public benchmark stack used on this RunPod
27
+
28
+ ## Top-Level Contents
29
+
30
+ - `code/`
31
+ - the cleaned code snapshot inherited from `VLAarchtests3`
32
+ - `artifacts/`
33
+ - prior staged checkpoints, proxy data, reports, and generated configs already bundled by `VLAarchtests3`
34
+ - `docs/`
35
+ - prior handoff/audit docs plus the current public benchmark run logs and correction notes
36
+ - `legacy/`
37
+ - older exact artifacts preserved by `VLAarchtests3`
38
+ - `setup/`
39
+ - prior environment files plus a new public benchmark environment snapshot under `setup/public_benchmark/`
40
+ - `history/`
41
+ - copied README history for `VLAarchtests`, `VLAarchtests2`, and `VLAarchtests3`
42
+ - `reports/`
43
+ - the full current `/workspace/workspace/reports` tree from this machine
44
+ - `outputs/`
45
+ - the full current `/workspace/workspace/outputs` tree from this machine
46
+ - `data/`
47
+ - the full current `/workspace/workspace/data` tree from this machine
48
+ - `PUBLIC_BENCHMARK_RESULTS.md`
49
+ - compact index of all public benchmark train/eval results from this session
50
+ - `MODEL_AND_ARTIFACT_INDEX.md`
51
+ - practical map of the main artifact roots to start from
52
+
53
+ ## Architecture State Carried Forward
54
+
55
+ The core model family inherited from `VLAarchtests3` is still:
56
+
57
+ - `trunk_only`
58
+ - `adapter_noop`
59
+ - `adapter_active`
60
+
61
+ The important architectural state carried into the public benchmark work is:
62
+
63
+ - wrapped-policy interface with exact `trunk_only`, `adapter_noop`, and `adapter_active` modes
64
+ - structured reveal/retrieve adapter with:
65
+ - state prediction
66
+ - task-routed proposal families
67
+ - retrieve-feasibility gating
68
+ - lightweight transition model
69
+ - planner/reranker
70
+ - planner fixes that replaced hard vetoes with softer stage penalties in:
71
+ - `code/VLAarchtests2_code/VLAarchtests/code/reveal_vla_bimanual/models/planner.py`
72
+
73
+ ## Public Benchmark Summary
74
+
75
+ Detailed per-run results are in `PUBLIC_BENCHMARK_RESULTS.md`. The short version is:
76
+
77
+ ### 1. Dense occluded retrieval proxy
78
+
79
+ Benchmark:
80
+
81
+ - ManiSkill `PickClutterYCB-v1`
82
+
83
+ Best current held-out result:
84
+
85
+ - directory:
86
+ - `reports/maniskill_pickclutter_smoke_v5_eval_tuned_softerpref/`
87
+ - summary:
88
+ - `trunk_only_ft = 0.04`
89
+ - `adapter_noop = 0.04`
90
+ - `adapter_active_ft = 0.62`
91
+ - `delta_active_vs_trunk = +0.58`
92
+ - `95% CI = [0.44, 0.72]`
93
+ - `intervention_rate = 1.0`
94
+ - `non_base_selection_rate = 1.0`
95
+
96
+ Important caveat:
97
+
98
+ - this was not a new retrain after `smoke_v5`
99
+ - it used the same `smoke_v5` checkpoints with planner hyperparameters selected on the frozen validation split and then applied once to the untouched held-out split
100
+
101
+ ### 2. Bag retrieval proxy
102
+
103
+ Benchmark:
104
+
105
+ - public ManiSkill bridge basket retrieval proxy
106
+
107
+ Current fair read:
108
+
109
+ - seed `17` corrected held-out:
110
+ - `trunk = 0.32`
111
+ - `noop = 0.00`
112
+ - `active = 0.48`
113
+ - seed `23` corrected held-out:
114
+ - `trunk = 0.48`
115
+ - `noop = 0.08`
116
+ - `active = 0.48`
117
+ - corrected 2-seed aggregate:
118
+ - `trunk = 0.40`
119
+ - `noop = 0.04`
120
+ - `active = 0.48`
121
+ - `delta = +0.08`
122
+
123
+ Interpretation:
124
+
125
+ - bag remains modestly positive after using one consistent corrected planner across seeds
126
+ - the effect is smaller and less clean than the best occlusion result
127
+
128
+ ### 3. Cloth retrieval proxy
129
+
130
+ Benchmark:
131
+
132
+ - public ManiSkill bridge cloth retrieval proxy
133
+
134
+ Current read:
135
+
136
+ - seed `17`:
137
+ - `trunk = 0.04`
138
+ - `noop = 0.04`
139
+ - `active = 0.10`
140
+ - seed `23`:
141
+ - `trunk = 0.04`
142
+ - `noop = 0.02`
143
+ - `active = 0.02`
144
+ - seed `29`:
145
+ - `trunk = 0.04`
146
+ - `noop = 0.04`
147
+ - `active = 0.04`
148
+ - 3-seed aggregate:
149
+ - `trunk = 0.0400`
150
+ - `noop = 0.0333`
151
+ - `active = 0.0533`
152
+ - `delta = +0.0133`
153
+
154
+ Interpretation:
155
+
156
+ - cloth is weak and unstable
157
+ - current evidence does not support a strong cloth-specific win
158
+
159
+ ## Important Fairness Notes
160
+
161
+ The fairness story is mixed and should be stated plainly.
162
+
163
+ What is fair in the strongest public benchmark result:
164
+
165
+ - same initialization checkpoint for `trunk_only_ft` and `adapter_active_ft`
166
+ - same train/val/test split within each task
167
+ - same optimizer, LR, batch size, and unfreeze scope within each task
168
+ - `adapter_noop` is evaluated from the same adapter checkpoint as `adapter_active_ft`
169
+ - the held-out test episodes were not hand-picked after seeing outcomes
170
+
171
+ What is not fully paper-clean yet:
172
+
173
+ - most current public benchmark evidence is smoke-scale and low-seed
174
+ - the occlusion headline result depends on validation-selected planner tuning on top of a fixed checkpoint
175
+ - bag required eval-side planner correction for one seed to avoid a collapse
176
+ - cloth remains weak even after additional seeds and val sweeps
177
+
178
+ ### PickClutter Split Fairness
179
+
180
+ The important point for the dense-occlusion track is that the dataset split did not drift across the early smoke versions.
181
+
182
+ - `data/maniskill_pickclutter/smoke_v1/episode_splits.json`
183
+ - `data/maniskill_pickclutter/smoke_v2/episode_splits.json`
184
+ - `data/maniskill_pickclutter/smoke_v3/episode_splits.json`
185
+
186
+ These files contain the same episode ids:
187
+
188
+ - train: `170000..170031`
189
+ - val: `171000..171007`
190
+ - eval: `172000..172049`
191
+
192
+ Also:
193
+
194
+ - there is no `data/maniskill_pickclutter/smoke_v4/`
195
+ - there is no `data/maniskill_pickclutter/smoke_v5/`
196
+
197
+ `smoke_v4` and `smoke_v5` were code/report version labels, not new held-out episode bundles.
198
+
199
+ ### What Changed Across PickClutter Versions
200
+
201
+ The big changes across `smoke_v2`, `smoke_v3`, `smoke_v4`, and `smoke_v5` were:
202
+
203
+ - more benchmark-derived state supervision
204
+ - transition-model training enablement
205
+ - planner bug fixes
206
+ - fairness fixes so the adapter checkpoint did not hide a stronger shared trunk
207
+ - then a frozen-validation planner sweep for the final held-out eval
208
+
209
+ The big occlusion win was not caused by changing the eval episodes.
210
+
211
+ ## Crucial Caveats
212
+
213
+ ### Occlusion result was planner-tuned
214
+
215
+ The large jump in:
216
+
217
+ - `reports/maniskill_pickclutter_smoke_v5_eval_tuned_softerpref/`
218
+
219
+ came from validation-selected planner tuning on top of the same `smoke_v5` checkpoint.
220
+
221
+ The selected override values were:
222
+
223
+ - `mode_preference_bonus = 0.75`
224
+ - `premature_retrieve_penalty = 0.5`
225
+ - `premature_insert_penalty = 0.25`
226
+ - `premature_maintain_penalty = 1.0`
227
+ - `occlusion_maintain_gap_min_access = 0.30`
228
+ - `occlusion_maintain_gap_min_visibility = 0.20`
229
+ - `retrieve_stage_access_threshold = 0.18`
230
+ - `retrieve_stage_reveal_threshold = 0.18`
231
+ - `retrieve_stage_support_threshold = 0.18`
232
+
233
+ That was a validation-only selection step. It was not a fresh retrain.
234
+
235
+ ### Bag and cloth did not use real depth
236
+
237
+ The bridge-task runner for the bag and cloth proxies used:
238
+
239
+ - one real RGB camera
240
+ - copied into all camera slots
241
+ - zero-filled depth channels
242
+
243
+ The runner labels this stack:
244
+
245
+ - `rgb_triplicate_zero_depth`
246
+
247
+ This is a real limitation and it should not be hidden.
248
+
249
+ It happened because the bridge proxy runner used a compatibility shim to satisfy the shared multi-camera tensor interface without plumbing real bridge-scene multiview depth through the stack.
250
+
251
+ Consequences:
252
+
253
+ - bag and cloth are not modality-matched to the PickClutter runs
254
+ - PickClutter used real `rgbd_3cam`
255
+ - bag and cloth used weaker perception input
256
+
257
+ ### Bag and cloth also used a different control wrapper
258
+
259
+ PickClutter:
260
+
261
+ - observation stack: `rgbd_3cam`
262
+ - action space: `bimanual_delta_pose`
263
+
264
+ Bag and cloth:
265
+
266
+ - observation stack: `rgb_triplicate_zero_depth`
267
+ - action space: `widowx_delta_pose`
268
+
269
+ So the cross-track story is architecture-consistent but not fully input/control-identical.
270
+
271
+ ### `smoke_v4_evalprobe_fromv3` is not a clean retrain result
272
+
273
+ This run:
274
+
275
+ - `reports/maniskill_pickclutter_smoke_v4_evalprobe_fromv3/`
276
+
277
+ used corrected planner logic on top of `smoke_v3` weights. It is useful evidence that the active adapter can matter, but it is not a clean end-to-end retrain.
278
+
279
+ ## What Was Actually Learned
280
+
281
+ The current repo supports the following claims:
282
+
283
+ - the structured adapter is still alive
284
+ - the active branch can clearly matter on a real public dense-occlusion benchmark proxy
285
+ - `adapter_noop` remains a useful fairness control
286
+ - bag-like retrieval still shows modest positive evidence
287
+ - cloth-like retrieval is currently the weak link
288
+
289
+ It does not support the following stronger claims yet:
290
+
291
+ - broad superiority on realistic manipulation benchmarks
292
+ - stable multi-seed wins across all three target-like public proxy tracks
293
+ - a clean modality-matched comparison across occlusion, bag, and cloth
294
+
295
+ ## Environment And Setup
296
+
297
+ Two environment stories exist in this repo.
298
+
299
+ ### Prior `VLAarchtests3` / RLBench stack
300
+
301
+ Preserved under:
302
+
303
+ - `setup/ENVIRONMENT.md`
304
+ - `setup/env_vars.sh`
305
+ - `setup/rlbench_pip_freeze.txt`
306
+
307
+ This is the older RLBench/AnyBimanual-oriented environment.
308
+
309
+ ### Current public benchmark stack
310
+
311
+ Preserved under:
312
+
313
+ - `setup/public_benchmark/ENVIRONMENT.md`
314
+ - `setup/public_benchmark/env_vars.sh`
315
+ - `setup/public_benchmark/python_version.txt`
316
+ - `setup/public_benchmark/uname.txt`
317
+ - `setup/public_benchmark/nvidia_smi.txt`
318
+ - `setup/public_benchmark/gpu_short.txt`
319
+ - `setup/public_benchmark/pip_freeze_python311.txt`
320
+ - `setup/public_benchmark/rlbench_env_pip_freeze.txt`
321
+ - `setup/public_benchmark/hf_env.txt`
322
+
323
+ The public benchmark runs in this session were executed on:
324
+
325
+ - GPU: `NVIDIA L40S`
326
+ - VRAM: `46068 MiB`
327
+ - driver: `580.126.09`
328
+ - Python: `3.11.10`
329
+ - kernel: `Linux 6.8.0-88-generic`
330
+
331
+ ## Recommended Starting Points
332
+
333
+ If you want the strongest current public benchmark evidence, start here:
334
+
335
+ - `docs/maniskill_pickclutter_correction_log_2026-04-01.md`
336
+ - `reports/maniskill_pickclutter_smoke_v5_eval_tuned_softerpref/public_benchmark_package_summary.json`
337
+
338
+ If you want the bag/cloth public bridge follow-up, start here:
339
+
340
+ - `docs/public_bridge_smoke_run_log_2026-04-01.md`
341
+ - `reports/maniskill_bag_bridge_eval_less_bonus_2seed_manual_summary.json`
342
+ - `reports/maniskill_cloth_bridge_val_sweep_seed23/summary.json`
343
+
344
+ If you want the repo lineage context, start here:
345
+
346
+ - `history/VLAarchtests_previous_README.md`
347
+ - `history/VLAarchtests2_previous_README.md`
348
+ - `history/VLAarchtests3_previous_README.md`
349
+
350
+ ## Bottom Line
351
+
352
+ This repo is the complete organization package for the current workspace state.
353
+
354
+ It includes:
355
+
356
+ - the `VLAarchtests3` export base
357
+ - the full current machine `reports/`, `outputs/`, and `data/` trees
358
+ - the public benchmark code, datasets, checkpoints, and results
359
+ - the environment files needed to stand up the same stack on similar hardware
360
+
361
+ Use it as the archival handoff state for continuing the elastic-occlusion adapter work.
362
+
363
+ Do not cite it as if all three target-like public proxy tracks are already cleanly solved. The occlusion track is the strongest current evidence; bag is modest; cloth remains weak; and the bridge-task perception stack still needs a proper real-depth rewrite.
code/VLAarchtests2_code/VLAarchtests/.pytest_cache/.gitignore ADDED
@@ -0,0 +1,2 @@
 
 
 
1
+ # Created by pytest automatically.
2
+ *
code/VLAarchtests2_code/VLAarchtests/.pytest_cache/CACHEDIR.TAG ADDED
@@ -0,0 +1,4 @@
 
 
 
 
 
1
+ Signature: 8a477f597d28d172789f06886806bc55
2
+ # This file is a cache directory tag created by pytest.
3
+ # For information about cache directory tags, see:
4
+ # https://bford.info/cachedir/spec.html
code/VLAarchtests2_code/VLAarchtests/.pytest_cache/README.md ADDED
@@ -0,0 +1,8 @@
 
 
 
 
 
 
 
 
 
1
+ # pytest cache directory #
2
+
3
+ This directory contains data from the pytest's cache plugin,
4
+ which provides the `--lf` and `--ff` options, as well as the `cache` fixture.
5
+
6
+ **Do not** commit this to version control.
7
+
8
+ See [the docs](https://docs.pytest.org/en/stable/how-to/cache.html) for more information.
code/VLAarchtests2_code/VLAarchtests/.pytest_cache/v/cache/lastfailed ADDED
@@ -0,0 +1 @@
 
 
1
+ {}
code/VLAarchtests2_code/VLAarchtests/.pytest_cache/v/cache/nodeids ADDED
@@ -0,0 +1,11 @@
 
 
 
 
 
 
 
 
 
 
 
 
1
+ [
2
+ "tests/test_eval_toggle_paths_work.py::test_eval_toggle_paths_work",
3
+ "tests/test_general_eval_protocol_is_identical.py::test_general_eval_protocol_is_identical_across_modes",
4
+ "tests/test_public_benchmark_package_summary.py::test_public_benchmark_package_detects_training_mismatch",
5
+ "tests/test_public_benchmark_package_summary.py::test_public_benchmark_package_summary_passes_with_clear_gain",
6
+ "tests/test_public_benchmark_package_tracks.py::test_public_anchor_protocol_identity_is_mode_invariant",
7
+ "tests/test_public_benchmark_package_tracks.py::test_public_benchmark_package_contains_expected_tracks",
8
+ "tests/test_public_benchmark_package_tracks.py::test_public_target_protocol_identity_is_mode_invariant",
9
+ "tests/test_public_benchmark_package_tracks.py::test_public_track_roles_are_partitioned",
10
+ "tests/test_public_benchmark_package_tracks.py::test_training_fairness_signature_matches_for_trunk_and_adapter"
11
+ ]
code/VLAarchtests2_code/VLAarchtests/artifacts/generated_configs/public_benchmark_package_v1.json ADDED
@@ -0,0 +1,80 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "anchor_eval_modes": [
3
+ "trunk_only",
4
+ "adapter_noop",
5
+ "adapter_active"
6
+ ],
7
+ "anchor_track_ids": [
8
+ "anchor_track"
9
+ ],
10
+ "defaults": {
11
+ "anchor_episodes": 25,
12
+ "resolution": 256,
13
+ "target_test_episodes": 100,
14
+ "target_train_demos": 64,
15
+ "target_val_demos": 16
16
+ },
17
+ "package_name": "public_reveal_retrieve_package_v1",
18
+ "target_eval_modes": [
19
+ "trunk_only_ft",
20
+ "adapter_noop",
21
+ "adapter_active_ft"
22
+ ],
23
+ "target_track_ids": [
24
+ "bag_track",
25
+ "occlusion_track",
26
+ "cloth_track"
27
+ ],
28
+ "thresholds": {
29
+ "anchor_tolerance": 0.02,
30
+ "sign_of_life_intervention_rate": 0.15,
31
+ "sign_of_life_non_base_selection_rate": 0.15,
32
+ "sign_of_life_success_gain": 0.05
33
+ },
34
+ "tracks": [
35
+ {
36
+ "benchmark_task": "unpacking_childs_bag-0",
37
+ "notes": "Closest public bag retrieval task. Treat as the benchmark-standard bag opening / retrieval slice.",
38
+ "public_source": "https://behavior.stanford.edu/knowledgebase/tasks/",
39
+ "role": "target",
40
+ "success_metric": "success_rate",
41
+ "suite": "behavior1k",
42
+ "target_behavior": "retrieve target objects from an opened compliant bag or backpack",
43
+ "task_family": "bag_retrieval",
44
+ "track_id": "bag_track"
45
+ },
46
+ {
47
+ "benchmark_task": "PickClutterYCB-v1",
48
+ "notes": "Closest maintained public occluded retrieval task. Treat as the canopy / dense occlusion proxy.",
49
+ "public_source": "https://maniskill.readthedocs.io/en/latest/tasks/table_top_gripper/index.html",
50
+ "role": "target",
51
+ "success_metric": "success_rate",
52
+ "suite": "maniskill3",
53
+ "target_behavior": "retrieve a target object from dense occluding clutter",
54
+ "task_family": "dense_occluded_retrieval",
55
+ "track_id": "occlusion_track"
56
+ },
57
+ {
58
+ "benchmark_task": "grasp_protocol_stacked_garment",
59
+ "notes": "Use the GarmentLab grasp protocol in stacked/clutter layouts as the closest public cloth retrieval benchmark slice.",
60
+ "public_source": "https://garmentlab.readthedocs.io/en/latest/tutorial/realworldbenchmark/index.html",
61
+ "role": "target",
62
+ "success_metric": "success_rate",
63
+ "suite": "garmentlab",
64
+ "target_behavior": "retrieve a hidden or partially covered object from stacked or cluttered garments",
65
+ "task_family": "cloth_retrieval",
66
+ "track_id": "cloth_track"
67
+ },
68
+ {
69
+ "benchmark_task": "dual_push_buttons",
70
+ "notes": "Trusted public anchor on this setup. Keep as a no-regression track only.",
71
+ "public_source": "https://arxiv.org/abs/2412.06779",
72
+ "role": "anchor",
73
+ "success_metric": "success_rate",
74
+ "suite": "anybimanual",
75
+ "target_behavior": "generic bimanual control regression anchor",
76
+ "task_family": "generic_anchor",
77
+ "track_id": "anchor_track"
78
+ }
79
+ ]
80
+ }
code/VLAarchtests2_code/VLAarchtests/code/reveal_vla_bimanual/sim_reveal/__pycache__/__init__.cpython-310.pyc ADDED
Binary file (615 Bytes). View file
 
code/VLAarchtests2_code/VLAarchtests/code/reveal_vla_bimanual/sim_reveal/__pycache__/__init__.cpython-311.pyc ADDED
Binary file (726 Bytes). View file
 
code/VLAarchtests2_code/VLAarchtests/code/reveal_vla_bimanual/sim_reveal/__pycache__/base.cpython-310.pyc ADDED
Binary file (1.41 kB). View file
 
code/VLAarchtests2_code/VLAarchtests/code/reveal_vla_bimanual/sim_reveal/__pycache__/procedural_envs.cpython-310.pyc ADDED
Binary file (42.5 kB). View file
 
code/VLAarchtests2_code/VLAarchtests/code/reveal_vla_bimanual/sim_reveal/__pycache__/proxy_specs.cpython-310.pyc ADDED
Binary file (4.28 kB). View file
 
docs/maniskill_pickclutter_correction_log_2026-04-01.md ADDED
@@ -0,0 +1,187 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ # ManiSkill PickClutter Correction Log (2026-04-01)
2
+
3
+ ## Scope
4
+
5
+ Public benchmark:
6
+
7
+ - ManiSkill 3 `PickClutterYCB-v1`
8
+
9
+ Frozen public split reused across all runs:
10
+
11
+ - train demos: `32` episodes
12
+ - val demos: `8` episodes
13
+ - eval episodes: `50`
14
+ - seed: `17`
15
+ - data bundle: `/workspace/workspace/data/maniskill_pickclutter/smoke_v3`
16
+
17
+ Fair comparison modes:
18
+
19
+ - `trunk_only_ft`
20
+ - `adapter_noop`
21
+ - `adapter_active_ft`
22
+
23
+ ## Code Changes
24
+
25
+ Runner changes:
26
+
27
+ - enabled candidate rollout supervision from real ManiSkill states
28
+ - enabled adapter transition-model training/eval
29
+ - unfroze `adapter.transition_model`
30
+ - set non-zero transition loss weight
31
+ - added ManiSkill smoke planner overrides for the occlusion proxy:
32
+ - `adapter_confidence_threshold=0.50`
33
+ - `retrieve_access_threshold=0.08`
34
+ - `retrieve_persistence_threshold=0.12`
35
+ - `retrieve_support_threshold=0.08`
36
+ - `retrieve_reocclusion_threshold=0.92`
37
+
38
+ Planner correction:
39
+
40
+ - changed adapter stage rules from hard vetoes to soft penalties in
41
+ `/workspace/workspace/VLAarchtests3_export/code/VLAarchtests2_code/VLAarchtests/code/reveal_vla_bimanual/models/planner.py`
42
+
43
+ ## Runs
44
+
45
+ ### 1. `smoke_v3` corrected-train baseline
46
+
47
+ Artifacts:
48
+
49
+ - summary: `/workspace/workspace/reports/maniskill_pickclutter_smoke_v3/public_benchmark_package_summary.json`
50
+
51
+ Result:
52
+
53
+ - `trunk_only_ft=0.06`
54
+ - `adapter_noop=0.06`
55
+ - `adapter_active_ft=0.06`
56
+ - `intervention_rate=0.0`
57
+ - `non_base_selection_rate=0.0`
58
+
59
+ Interpretation:
60
+
61
+ - rollout supervision and transition-model training alone were not enough
62
+ - the adapter remained inert
63
+
64
+ ### 2. `smoke_v4_evalprobe_fromv3` corrected-planner eval on `smoke_v3` weights
65
+
66
+ Artifacts:
67
+
68
+ - summary: `/workspace/workspace/reports/maniskill_pickclutter_smoke_v4_evalprobe_fromv3/public_benchmark_package_summary.json`
69
+
70
+ Result:
71
+
72
+ - `trunk_only_ft=0.06`
73
+ - `adapter_noop=0.06`
74
+ - `adapter_active_ft=0.62`
75
+ - `delta_active_vs_trunk=+0.56`
76
+ - `95% CI=[+0.40, +0.70]`
77
+ - `intervention_rate=1.0`
78
+ - `non_base_selection_rate=1.0`
79
+
80
+ Interpretation:
81
+
82
+ - this is the first real adapter-specific sign of life on the public benchmark
83
+ - the corrected planner logic is doing the work
84
+ - the improvement is not coming from the shared trunk, because `adapter_noop` stayed at `0.06`
85
+
86
+ ### 3. `smoke_v4` clean retrain with corrected planner active during train and eval
87
+
88
+ Artifacts:
89
+
90
+ - summary: `/workspace/workspace/reports/maniskill_pickclutter_smoke_v4/public_benchmark_package_summary.json`
91
+
92
+ Result:
93
+
94
+ - `trunk_only_ft=0.48`
95
+ - `adapter_noop=0.04`
96
+ - `adapter_active_ft=0.04`
97
+ - `intervention_rate=1.0`
98
+ - `non_base_selection_rate=1.0`
99
+ - `delta_active_vs_trunk=-0.44`
100
+
101
+ Interpretation:
102
+
103
+ - the clean retrain under corrected planner logic is unstable / regressive
104
+ - the adapter-trained checkpoint collapsed even though active mode intervened
105
+ - current evidence supports the corrected planner as a real eval-time model fix, but not yet as a stable retrain recipe
106
+
107
+ ### 4. `smoke_v5` fair retrain with trunk-action supervision preserved inside adapter training
108
+
109
+ Artifacts:
110
+
111
+ - summary: `/workspace/workspace/reports/maniskill_pickclutter_smoke_v5/public_benchmark_package_summary.json`
112
+
113
+ Result:
114
+
115
+ - `trunk_only_ft=0.04`
116
+ - `adapter_noop=0.04`
117
+ - `adapter_active_ft=0.04`
118
+ - `intervention_rate=1.0`
119
+ - `non_base_selection_rate=1.0`
120
+ - `delta_active_vs_trunk=0.00`
121
+
122
+ Interpretation:
123
+
124
+ - this fixed the fairness problem from `smoke_v4`: the adapter-trained checkpoint no longer hid a stronger trunk, because `adapter_noop` matched `trunk_only_ft`
125
+ - but the active branch still failed because the planner collapsed to `maintain_gap` on every decision
126
+
127
+ ### 5. `smoke_v5_val_sweep` and held-out `smoke_v5_eval_tuned_softerpref`
128
+
129
+ Artifacts:
130
+
131
+ - val sweep: `/workspace/workspace/reports/maniskill_pickclutter_smoke_v5_val_sweep/summary.json`
132
+ - held-out summary: `/workspace/workspace/reports/maniskill_pickclutter_smoke_v5_eval_tuned_softerpref/public_benchmark_package_summary.json`
133
+
134
+ Val-selected planner override:
135
+
136
+ - `mode_preference_bonus=0.75`
137
+ - `premature_retrieve_penalty=0.5`
138
+ - `premature_insert_penalty=0.25`
139
+ - `premature_maintain_penalty=1.0`
140
+ - `occlusion_maintain_gap_min_access=0.30`
141
+ - `occlusion_maintain_gap_min_visibility=0.20`
142
+ - `retrieve_stage_access_threshold=0.18`
143
+ - `retrieve_stage_reveal_threshold=0.18`
144
+ - `retrieve_stage_support_threshold=0.18`
145
+
146
+ Validation result:
147
+
148
+ - `baseline_corrected=0.00`
149
+ - `soft_pref=0.00`
150
+ - `softer_pref=0.625`
151
+ - `retrieve_open=0.625`
152
+
153
+ Held-out result:
154
+
155
+ - `trunk_only_ft=0.04`
156
+ - `adapter_noop=0.04`
157
+ - `adapter_active_ft=0.62`
158
+ - `delta_active_vs_trunk=+0.58`
159
+ - `95% CI=[+0.44, +0.72]`
160
+ - `intervention_rate=1.0`
161
+ - `non_base_selection_rate=1.0`
162
+ - `steps_to_retrieve=1.0`
163
+ - `signs_of_life=true`
164
+
165
+ Interpretation:
166
+
167
+ - this is a fair held-out public-benchmark win on the dense-occlusion proxy
168
+ - the gain is adapter-specific because `adapter_noop` stayed flat with the trunk baseline
169
+ - the fixed checkpoint from `smoke_v5` was viable; the missing piece was planner-stage calibration on the frozen validation split
170
+
171
+ ## Current Best Public-Benchmark Evidence
172
+
173
+ Best adapter-specific evidence currently available:
174
+
175
+ - `/workspace/workspace/reports/maniskill_pickclutter_smoke_v5_eval_tuned_softerpref/public_benchmark_package_summary.json`
176
+
177
+ Why this is the strongest result:
178
+
179
+ - same frozen public train/val/eval split
180
+ - same trained trunk baseline and adapter checkpoint
181
+ - planner override selected on the frozen validation split before the held-out eval run
182
+ - `adapter_noop` isolates the shared-trunk effect and stays flat
183
+ - only `adapter_active_ft` improves, so the gain is caused by live adapter intervention
184
+
185
+ ## Open Problem
186
+
187
+ The dense-occlusion proxy now has a fair held-out win, but bag-style and cloth-style public proxy tracks are still missing. The next work item is to bring up one of those remaining public proxy benchmarks instead of running more occlusion-only sweeps.
docs/minimum_sign_of_life_maniskill_pickclutter_run_2026-04-01.md ADDED
@@ -0,0 +1,134 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ # Minimum Sign-of-Life Runbook: ManiSkill PickClutterYCB-v1
2
+
3
+ Date: 2026-04-01
4
+
5
+ ## Goal
6
+
7
+ Run one real public-benchmark smoke on ManiSkill `PickClutterYCB-v1` that fairly compares:
8
+
9
+ - `trunk_only_ft`
10
+ - `adapter_noop`
11
+ - `adapter_active_ft`
12
+
13
+ The target claim for this run is narrow:
14
+
15
+ - on dense occluded retrieval, the adapter should visibly intervene and beat the trunk-only control trained on the same data;
16
+ - this is a minimum-sign-of-life run, not the full 3-track package.
17
+
18
+ ## Correction After First Failed Smoke
19
+
20
+ The first smoke run confirmed that the real ManiSkill benchmark path worked, but the adapter stayed inert because the smoke dataset only supervised proposal ranking. The corrected run keeps the same benchmark and fairness contract and restarts both trained variants from the same init on the same frozen split, but adds benchmark-derived current-state supervision for the adapter:
21
+
22
+ - `support_mode`
23
+ - `corridor_feasible`
24
+ - `persistence_horizon`
25
+ - `disturbance_cost`
26
+ - selected task metrics that feed the adapter gate and mode bias
27
+ - `state_confidence_target`
28
+
29
+ This corrected artifact set is versioned as `smoke_v2`.
30
+
31
+ ## Fixed Protocol
32
+
33
+ ### Benchmark
34
+
35
+ - Public benchmark: ManiSkill `PickClutterYCB-v1`
36
+ - Track id: `occlusion_track`
37
+ - Task family label inside the adapter stack: `foliage`
38
+ - Resolution: `224`
39
+ - One seed for training: `17`
40
+
41
+ ### Data
42
+
43
+ - One benchmark-native scripted macro teacher collects the dataset once.
44
+ - The teacher also writes per-step scene-state labels from the same public benchmark state and candidate sweep.
45
+ - Train demos: `32`
46
+ - Val demos: `8`
47
+ - Held-out eval episodes: `50`
48
+ - The exact train, val, and eval episode ids/seeds are frozen once generated and written to disk.
49
+
50
+ ### Fairness Constraints
51
+
52
+ - Both trained conditions start from the same initialization checkpoint.
53
+ - Both use the same train/val split.
54
+ - Both use the same held-out eval episodes.
55
+ - Both use the same optimizer, batch size, LR, epoch budget, and random seed.
56
+ - Both fine-tune the same trunk submodules:
57
+ - fusion
58
+ - memory
59
+ - decoder
60
+ - The backbone stays frozen for both conditions.
61
+ - The only architectural difference is the presence of the structured adapter.
62
+ - `candidate0` remains the raw trunk action.
63
+ - `adapter_noop` is eval-only and is produced from the `adapter_active_ft` checkpoint.
64
+
65
+ ### Initialization
66
+
67
+ - Shared init checkpoint:
68
+ - `/workspace/workspace/VLAarchtests2/VLAarchtests/artifacts/outputs/r3d_handoff_phase/proxy_interaction_r3d_stage3_clip_rgbd_handoff_compact_phase_seed17/checkpoint_best.pt`
69
+ - Load with shape filtering / `init_strict: false`.
70
+
71
+ ### Training Conditions
72
+
73
+ #### `trunk_only_ft`
74
+
75
+ - Policy type: `foundation_trunk`
76
+ - Trainable prefixes:
77
+ - `fusion`
78
+ - `memory`
79
+ - `decoder`
80
+
81
+ #### `adapter_active_ft`
82
+
83
+ - Policy type: `adapter_wrapped`
84
+ - Trainable prefixes:
85
+ - `trunk.fusion`
86
+ - `trunk.memory`
87
+ - `trunk.decoder`
88
+ - `adapter.state_head`
89
+ - `adapter.proposal_prior`
90
+ - `adapter.planner`
91
+ - Transition model: off for the smoke run
92
+
93
+ ### Evaluation Conditions
94
+
95
+ - `trunk_only_ft`: trained trunk checkpoint
96
+ - `adapter_noop`: adapter checkpoint in no-op mode
97
+ - `adapter_active_ft`: adapter checkpoint in active mode
98
+
99
+ ### Success Criteria
100
+
101
+ - Adapter success rate exceeds trunk-only success rate by at least `5` absolute percentage points (`0.05`) on the held-out `50` episodes.
102
+ - Adapter intervention rate is at least `15%`.
103
+ - Non-base selection rate is at least `15%`.
104
+ - Results are summarized through the public benchmark package reporter under the `occlusion_track`.
105
+
106
+ ## Planned Artifacts
107
+
108
+ ### Data
109
+
110
+ - `/workspace/workspace/data/maniskill_pickclutter/smoke_v2/train.pt`
111
+ - `/workspace/workspace/data/maniskill_pickclutter/smoke_v2/val.pt`
112
+ - `/workspace/workspace/data/maniskill_pickclutter/smoke_v2/episode_splits.json`
113
+
114
+ ### Train Outputs
115
+
116
+ - `/workspace/workspace/outputs/maniskill_pickclutter_smoke_v2/trunk_only_ft_seed17/`
117
+ - `/workspace/workspace/outputs/maniskill_pickclutter_smoke_v2/adapter_active_ft_seed17/`
118
+
119
+ ### Eval Outputs
120
+
121
+ - `/workspace/workspace/reports/maniskill_pickclutter_smoke_v2/trunk_only_ft_seed17.json`
122
+ - `/workspace/workspace/reports/maniskill_pickclutter_smoke_v2/adapter_noop_seed17.json`
123
+ - `/workspace/workspace/reports/maniskill_pickclutter_smoke_v2/adapter_active_ft_seed17.json`
124
+
125
+ ### Package Summary
126
+
127
+ - `/workspace/workspace/reports/maniskill_pickclutter_smoke_v2/public_benchmark_package_summary.json`
128
+ - `/workspace/workspace/reports/maniskill_pickclutter_smoke_v2/public_benchmark_package_summary.md`
129
+
130
+ ## Notes
131
+
132
+ - This run is intentionally limited to the fastest credible public target track.
133
+ - No custom benchmark or custom teleop suite is allowed for this smoke.
134
+ - If the ManiSkill runtime or macro controller requires repairs, the repairs must preserve the fairness constraints above.
docs/public_benchmark_progress_2026-04-01.md ADDED
@@ -0,0 +1,91 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ ## Public Benchmark Progress
2
+
3
+ Date: 2026-04-01 UTC
4
+
5
+ ### Confirmed Real Public Benchmark Result
6
+
7
+ - Public occlusion proxy: `ManiSkill PickClutterYCB-v1`
8
+ - Strongest adapter-specific result so far:
9
+ - summary: `/workspace/workspace/reports/maniskill_pickclutter_smoke_v5_eval_tuned_softerpref/public_benchmark_package_summary.json`
10
+ - `trunk_only_ft = 0.04`
11
+ - `adapter_noop = 0.04`
12
+ - `adapter_active_ft = 0.62`
13
+ - `delta_active_vs_trunk = +0.58`
14
+ - `95% CI on delta_active_vs_trunk = [0.44, 0.72]`
15
+ - `intervention_rate = 1.0`
16
+ - `non_base_selection_rate = 1.0`
17
+ - Interpretation:
18
+ - this is real adapter-specific sign of life on a public occlusion benchmark
19
+ - the gain is not coming from a stronger shared trunk, because `adapter_noop` stays flat
20
+
21
+ ### BEHAVIOR Bag Proxy Investigation
22
+
23
+ Target public task family:
24
+ - official BEHAVIOR grocery-store bag/container retrieval proxy
25
+ - primary candidate: `paying_for_purchases`
26
+ - stricter but currently unusable candidate: `buy_basic_garden_tools`
27
+
28
+ Environment used:
29
+ - BEHAVIOR assets: `/workspace/workspace/BEHAVIOR-1K`
30
+ - venv used for probes: `/workspace/envs/behavior`
31
+
32
+ Findings:
33
+ - `buy_basic_garden_tools` is blocked by official scene-task geometry:
34
+ - repeated failure on `ontop ['rake.n.03_1', 'grocery_shelf.n.01_1']`
35
+ - even with whitelist attempts, the sampler never found a valid shelf placement
36
+ - `paying_for_purchases` is much healthier:
37
+ - `grocery_store_convenience`, `grocery_store_cafe`, and `grocery_store_asian` all load
38
+ - object scope binds the real task objects:
39
+ - `shopping_basket.n.01_1`
40
+ - `money.n.01_1`
41
+ - `checkout.n.03_1`
42
+ - `floor.n.01_1`
43
+ - Root sampler bug:
44
+ - official online sampling fails on the floor / agent chain
45
+ - without patching, the blocking warning is:
46
+ - `Room type [grocery_store] ... floor.n.01_1: , checkout.n.03_1: grocery_store_0`
47
+ - after removing the agent-on-floor condition from the sampler pipeline, the next blocker is:
48
+ - `ontop ['shopping_basket.n.01_1', 'floor.n.01_1'] False`
49
+ - Critical state-probe result:
50
+ - even when object bindings exist, the sampled movable objects remain parked at their far-away import positions
51
+ - observed example on `grocery_store_asian`:
52
+ - basket position near `[120, 120, -80]`
53
+ - money position near `[115, 115, -85]`
54
+ - apple positions near `[110, 110, -90]` and `[105, 105, -95]`
55
+ - `money inside basket = False`
56
+ - `apple1 inside basket = False`
57
+ - `apple2 inside basket = False`
58
+ - Conclusion:
59
+ - as of 2026-04-01, the BEHAVIOR bag proxy is not yet a usable fair evaluation track in this workspace
60
+ - the public task objects bind, but the online sampler does not materialize a valid initial scene for training or evaluation
61
+
62
+ ### Garment / Cloth Proxy Status
63
+
64
+ - GarmentLab repo cloned:
65
+ - `/workspace/workspace/GarmentLab`
66
+ - Immediate constraint:
67
+ - the repo expects Isaac Sim 4.0.0 plus external Google Drive assets
68
+ - Current status:
69
+ - code inspected only
70
+ - no runnable public cloth benchmark execution completed yet in this workspace
71
+
72
+ ### Next Public Proxy Candidates
73
+
74
+ Given the BEHAVIOR blocker, the next-lightest public candidates already available locally are:
75
+
76
+ - `OpenCabinetDrawer-v1`
77
+ - public ManiSkill task
78
+ - good container reveal / access proxy
79
+ - `PutEggplantInBasketScene-v1`
80
+ - public ManiSkill bridge-dataset task
81
+ - public basket / container interaction proxy
82
+ - `PutSpoonOnTableClothInScene-v1`
83
+ - public ManiSkill bridge-dataset cloth interaction proxy
84
+
85
+ ### Immediate Recommendation
86
+
87
+ - Keep the confirmed `PickClutterYCB-v1` result as the anchor public success case.
88
+ - Do not spend more time on BEHAVIOR online sampling until either:
89
+ - a cached valid scene instance is created, or
90
+ - the sampler is patched deeply enough to place container objects correctly instead of leaving them at far-away import positions.
91
+ - Pivot the next train/eval smoke to a lighter public ManiSkill proxy before returning to BEHAVIOR.
docs/public_bridge_smoke_run_log_2026-04-01.md ADDED
@@ -0,0 +1,116 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ # Public Bridge Smoke Run Log
2
+
3
+ Date: 2026-04-01 UTC
4
+
5
+ ## Completed public proxy evidence
6
+
7
+ - Occlusion proxy already completed earlier on `PickClutterYCB-v1`.
8
+ - Best current occlusion report:
9
+ - `/workspace/workspace/reports/maniskill_pickclutter_smoke_v5_eval_tuned_softerpref/public_benchmark_package_summary.json`
10
+ - `trunk_only_ft=0.04`
11
+ - `adapter_noop=0.04`
12
+ - `adapter_active_ft=0.62`
13
+ - `delta_active_vs_trunk=+0.58`
14
+ - `delta_active_vs_trunk_ci95=[0.44, 0.72]`
15
+ - `intervention_rate=1.0`
16
+ - `non_base_selection_rate=1.0`
17
+
18
+ - Bag proxy completed on the public ManiSkill bridge basket scene proxy.
19
+ - Bag report directory:
20
+ - `/workspace/workspace/reports/maniskill_bag_bridge_smoke_v1`
21
+ - Bag result summary:
22
+ - `trunk_only_ft=0.32`
23
+ - `adapter_noop=0.00`
24
+ - `adapter_active_ft=0.48`
25
+ - `delta_active_vs_trunk=+0.16`
26
+ - `delta_active_vs_trunk_ci95=[-0.04, 0.34]`
27
+ - `intervention_rate=1.0`
28
+ - `non_base_selection_rate=1.0`
29
+ - bag track `signs_of_life=true`
30
+ - package-level headline gate remains false at this single-seed smoke scale
31
+
32
+ ## Cloth proxy definition
33
+
34
+ - Public scene proxy:
35
+ - `PutSpoonOnTableClothInScene-v1`
36
+ - Fixed hidden-state initialization:
37
+ - spoon pose `[-0.235, -0.094, 0.8748]`
38
+ - cloth pose `[-0.235, -0.075, 0.885]`
39
+ - Deterministic valid-seed filter:
40
+ - accept only seeds whose initialized hidden state is below the visibility gate and solvable by scripted reveal+retrieve
41
+ - Reveal macros corrected to push-style actions:
42
+ - `lift_edge` = front push in `+y`
43
+ - `separate_layer` = side push in `+x`
44
+ - Cloth success metric corrected:
45
+ - based on spoon displacement from its own hidden start plus visibility
46
+ - no longer credits success merely because the cloth flies away
47
+
48
+ ## Important runner fixes already landed
49
+
50
+ - File:
51
+ - `/workspace/workspace/VLAarchtests3_export/code/VLAarchtests2_code/VLAarchtests/code/reveal_vla_bimanual/eval/run_maniskill_bridge_retrieval_smoke.py`
52
+ - Fixed:
53
+ - cloth hidden-state initialization
54
+ - cloth seed filtering and split reuse via `episode_splits.json`
55
+ - `post_bundle` missing in cloth collect success check
56
+ - bridge smoke loss weights aligned to current `LossWeights`
57
+ - adapter trainable parameter prefixes aligned to working pickclutter runner
58
+ - zero-depth layout changed to channel-first
59
+ - cached dataset normalizer added for old channel-last depth tensors
60
+
61
+ ## Live status when this note was written
62
+
63
+ - Bag process is complete.
64
+ - Cloth process is still collecting the train split in the original long-running session.
65
+ - The long-running cloth process was started before the later loss-weight and depth-layout fixes, so it is expected to finish collection and then crash at training start.
66
+ - After it writes `train.pt` and `val.pt`, restart cloth with:
67
+
68
+ ```bash
69
+ python /workspace/workspace/VLAarchtests3_export/code/VLAarchtests2_code/VLAarchtests/code/reveal_vla_bimanual/eval/run_maniskill_bridge_retrieval_smoke.py --task cloth --skip-collection
70
+ ```
71
+
72
+ - If trunk checkpoint already exists by that point and only adapter needs rerun:
73
+
74
+ ```bash
75
+ python /workspace/workspace/VLAarchtests3_export/code/VLAarchtests2_code/VLAarchtests/code/reveal_vla_bimanual/eval/run_maniskill_bridge_retrieval_smoke.py --task cloth --skip-collection --reuse-checkpoints
76
+ ```
77
+
78
+ ## Cloth restart correction
79
+
80
+ - The corrected cloth restart reached adapter training and failed in rollout supervision because the cached cloth public proxy authored `7` candidate targets while the decoder always allocates `8` proposal slots.
81
+ - Fix landed in:
82
+ - `/workspace/workspace/VLAarchtests3_export/code/VLAarchtests2_code/VLAarchtests/code/reveal_vla_bimanual/eval/run_maniskill_bridge_retrieval_smoke.py`
83
+ - Correction:
84
+ - cached bridge samples still have their old channel-last depth tensors normalized to channel-first, as before
85
+ - cached candidate-aligned tensors now also pad from `7 -> 8` slots before loading
86
+ - padding cycles the non-base candidates first, which preserves the collected cloth episodes and avoids recollection
87
+ - Verified locally before restart:
88
+ - normalized cloth `candidate_action_chunks` is `(8, 8, 14)`
89
+ - normalized cloth `candidate_rollout_support_mode` is `(8, 5)`
90
+ - one real `adapter_active_ft` training step and one real validation loss pass both completed without the previous shape error
91
+
92
+ ## Cloth result
93
+
94
+ - Report directory:
95
+ - `/workspace/workspace/reports/maniskill_cloth_bridge_smoke_v1`
96
+ - Final cloth smoke summary:
97
+ - `trunk_only_ft = 0.04`
98
+ - `adapter_noop = 0.04`
99
+ - `adapter_active_ft = 0.10`
100
+ - `delta_active_vs_trunk = +0.06`
101
+ - `delta_active_vs_trunk_ci95 = [-0.04, 0.16]`
102
+ - `intervention_rate = 0.3369`
103
+ - `non_base_selection_rate = 0.2674`
104
+ - Interpretation:
105
+ - cloth proxy is positive and adapter-specific in this single-seed smoke because `adapter_noop` stayed flat while `adapter_active_ft` improved
106
+ - effect size is modest and not yet statistically clean in this smoke protocol
107
+
108
+ ## Combined three-track proxy suite
109
+
110
+ - Combined report:
111
+ - `/workspace/workspace/reports/public_proxy_suite_smoke_v1/combined_summary.json`
112
+ - `/workspace/workspace/reports/public_proxy_suite_smoke_v1/combined_summary.md`
113
+ - Current three-track smoke evidence:
114
+ - occlusion proxy positive and adapter-specific
115
+ - bag proxy positive and adapter-specific (single-seed smoke; the 95% CI on the delta, `[-0.04, 0.34]`, still includes zero)
116
+ - cloth proxy positive and adapter-specific (single-seed smoke; the 95% CI on the delta, `[-0.04, 0.16]`, still includes zero)
reports/anchor_dual_push_smoke/original_trunk/rollout_eval.partial.json ADDED
@@ -0,0 +1,29 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "checkpoint": "/workspace/workspace/VLAarchtests2/outputs/rlbench_dual_push/rlbench_dual_push_backbone_only_clip_chunk8_weighted_seed17/checkpoint_best.pt",
3
+ "plan_requested": false,
4
+ "plan_applied": false,
5
+ "planner_mode": "trainable",
6
+ "support_mode_conditioning": true,
7
+ "task_conditioning": true,
8
+ "geometry_enabled": true,
9
+ "world_model_mode": "checkpoint_default",
10
+ "episodes_per_task": 5,
11
+ "episode_length": 120,
12
+ "resolution": 256,
13
+ "reset_retries": 20,
14
+ "arm_mode": "planning",
15
+ "delta_scale": 1.0,
16
+ "cameras": [
17
+ "front",
18
+ "wrist_left",
19
+ "wrist_right"
20
+ ],
21
+ "tasks": {
22
+ "bimanual_dual_push_buttons": {
23
+ "error": "The call failed on the V-REP side. Return value: -1",
24
+ "mean_success": 0.0,
25
+ "mean_return": 0.0
26
+ }
27
+ },
28
+ "mean_success": 0.0
29
+ }
reports/anybimanual_anchor_bridge_live/trunk_only_ep5/stderr.txt ADDED
@@ -0,0 +1,20 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ /workspace/third_party/AnyBimanual/eval.py:183: UserWarning:
2
+ The version_base parameter is not specified.
3
+ Please specify a compatability version level, or None.
4
+ Will assume defaults for version 1.1
5
+ @hydra.main(config_name="eval", config_path="conf")
6
+ /workspace/envs/rlbench/lib/python3.10/site-packages/hydra/_internal/defaults_list.py:251: UserWarning: In 'eval': Defaults list is missing `_self_`. See https://hydra.cc/docs/1.2/upgrades/1.0_to_1.1/default_composition_order for more information
7
+ warnings.warn(msg, UserWarning)
8
+ /workspace/envs/rlbench/lib/python3.10/site-packages/hydra/core/default_element.py:124: UserWarning: In 'method/PERACT_BC': Usage of deprecated keyword in package header '# @package _group_'.
9
+ See https://hydra.cc/docs/1.2/upgrades/1.0_to_1.1/changes_to_package_header for more information
10
+ deprecation_warning(
11
+ /workspace/envs/rlbench/lib/python3.10/site-packages/hydra/_internal/hydra.py:119: UserWarning: Future Hydra versions will no longer change working directory at job runtime by default.
12
+ See https://hydra.cc/docs/1.2/upgrades/1.1_to_1.2/changes_to_job_working_dir/ for more information.
13
+ ret = run_job(
14
+ Error executing job with overrides: ['method=PERACT_BC', 'framework.logdir=/workspace/workspace/reports/anybimanual_anchor_bridge_live/trunk_only_ep5/anybimanual_logdir', 'framework.start_seed=0', 'framework.eval_type=60000', 'framework.eval_episodes=5', 'framework.eval_envs=1', 'framework.gpu=0', 'rlbench.task_name=perlf_release_dual_push_buttons_smoke5', 'rlbench.tasks=[dual_push_buttons]', 'rlbench.demo_path=/workspace/baselines/AnyBimanual_subset3_demo_root', 'rlbench.headless=True', 'rlbench.gripper_mode=BimanualDiscrete', 'rlbench.arm_action_mode=BimanualEndEffectorPoseViaPlanning', 'rlbench.action_mode=BimanualMoveArmThenGripper']
15
+ Traceback (most recent call last):
16
+ File "/workspace/third_party/AnyBimanual/eval.py", line 201, in main
17
+ raise Exception(f"Missing seed{start_seed}/config.yaml. Logdir is {logdir}")
18
+ Exception: Missing seed0/config.yaml. Logdir is /workspace/workspace/reports/anybimanual_anchor_bridge_live/trunk_only_ep5/anybimanual_logdir/perlf_release_dual_push_buttons_smoke5/PERACT_BC/seed0
19
+
20
+ Set the environment variable HYDRA_FULL_ERROR=1 for a complete stack trace.
reports/maniskill_bag_bridge_val_sweep_seed23/conservative/adapter_active_ft_seed23.json ADDED
@@ -0,0 +1,131 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "track_id": "bag_track",
3
+ "suite": "maniskill3",
4
+ "benchmark_task": "PutEggplantInBasketRetrievalProxy-v1",
5
+ "role": "target",
6
+ "adapter_mode": "adapter_active_ft",
7
+ "episodes": 8,
8
+ "successes": [
9
+ 0,
10
+ 0,
11
+ 0,
12
+ 1,
13
+ 0,
14
+ 0,
15
+ 0,
16
+ 0
17
+ ],
18
+ "success_rate": 0.125,
19
+ "intervention_rate": 0.0,
20
+ "non_base_selection_rate": 0.0,
21
+ "steps_to_first_reveal_or_access": 1.0,
22
+ "steps_to_retrieve": 4.0,
23
+ "disturbance_proxy": 0.0,
24
+ "episode_records": [
25
+ {
26
+ "episode_seed": 171000,
27
+ "success": false,
28
+ "steps": 4,
29
+ "first_reveal_step": 1,
30
+ "first_retrieve_step": null,
31
+ "episode_disturbance": 0.0
32
+ },
33
+ {
34
+ "episode_seed": 171001,
35
+ "success": false,
36
+ "steps": 4,
37
+ "first_reveal_step": 1,
38
+ "first_retrieve_step": null,
39
+ "episode_disturbance": 0.0
40
+ },
41
+ {
42
+ "episode_seed": 171002,
43
+ "success": false,
44
+ "steps": 4,
45
+ "first_reveal_step": 1,
46
+ "first_retrieve_step": null,
47
+ "episode_disturbance": 0.0
48
+ },
49
+ {
50
+ "episode_seed": 171003,
51
+ "success": true,
52
+ "steps": 1,
53
+ "first_reveal_step": 1,
54
+ "first_retrieve_step": null,
55
+ "episode_disturbance": 0.0
56
+ },
57
+ {
58
+ "episode_seed": 171004,
59
+ "success": false,
60
+ "steps": 4,
61
+ "first_reveal_step": 1,
62
+ "first_retrieve_step": null,
63
+ "episode_disturbance": 0.0
64
+ },
65
+ {
66
+ "episode_seed": 171005,
67
+ "success": false,
68
+ "steps": 4,
69
+ "first_reveal_step": 1,
70
+ "first_retrieve_step": null,
71
+ "episode_disturbance": 0.0
72
+ },
73
+ {
74
+ "episode_seed": 171006,
75
+ "success": false,
76
+ "steps": 4,
77
+ "first_reveal_step": 1,
78
+ "first_retrieve_step": null,
79
+ "episode_disturbance": 0.0
80
+ },
81
+ {
82
+ "episode_seed": 171007,
83
+ "success": false,
84
+ "steps": 4,
85
+ "first_reveal_step": 1,
86
+ "first_retrieve_step": null,
87
+ "episode_disturbance": 0.0
88
+ }
89
+ ],
90
+ "eval_protocol": {
91
+ "track_id": "bag_track",
92
+ "suite": "maniskill3",
93
+ "benchmark_task": "PutEggplantInBasketRetrievalProxy-v1",
94
+ "role": "target",
95
+ "eval_mode": "adapter_active_ft",
96
+ "seed": 17,
97
+ "episodes": 8,
98
+ "resolution": 224,
99
+ "cameras": [
100
+ "front",
101
+ "left",
102
+ "right"
103
+ ],
104
+ "observation_stack": "rgb_triplicate_zero_depth",
105
+ "action_horizon": 8,
106
+ "action_space": "widowx_delta_pose",
107
+ "same_test_episodes": true
108
+ },
109
+ "proxy_notes": "Public ManiSkill bridge scene with custom retrieval initialization. The eggplant is placed inside the basket region and must be pulled back out to a staging zone.",
110
+ "train_spec": {
111
+ "track_id": "bag_track",
112
+ "suite": "maniskill3",
113
+ "benchmark_task": "PutEggplantInBasketRetrievalProxy-v1",
114
+ "model_variant": "adapter_active_ft",
115
+ "seed": 23,
116
+ "train_demos": 32,
117
+ "val_demos": 8,
118
+ "init_checkpoint_group": "/workspace/workspace/VLAarchtests2/VLAarchtests/artifacts/outputs/r3d_handoff_phase/proxy_interaction_r3d_stage3_clip_rgbd_handoff_compact_phase_seed17/checkpoint_best.pt",
119
+ "optimizer": "adamw",
120
+ "learning_rate": 0.0001,
121
+ "lr_schedule": "constant",
122
+ "batch_size": 4,
123
+ "augmentations": "none",
124
+ "early_stopping_metric": "val_total",
125
+ "max_gradient_steps": 114,
126
+ "unfreeze_scope": "fusion_memory_decoder",
127
+ "dataset_split_id": "bag_bridge_smoke_v1_dataset_seed17",
128
+ "same_data_policy": true,
129
+ "same_init_policy": true
130
+ }
131
+ }
reports/maniskill_bag_bridge_val_sweep_seed23/conservative/adapter_noop_seed23.json ADDED
@@ -0,0 +1,110 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "track_id": "bag_track",
3
+ "suite": "maniskill3",
4
+ "benchmark_task": "PutEggplantInBasketRetrievalProxy-v1",
5
+ "role": "target",
6
+ "adapter_mode": "adapter_noop",
7
+ "episodes": 8,
8
+ "successes": [
9
+ 0,
10
+ 0,
11
+ 0,
12
+ 1,
13
+ 0,
14
+ 0,
15
+ 0,
16
+ 0
17
+ ],
18
+ "success_rate": 0.125,
19
+ "intervention_rate": 0.0,
20
+ "non_base_selection_rate": 0.0,
21
+ "steps_to_first_reveal_or_access": 1.0,
22
+ "steps_to_retrieve": 4.0,
23
+ "disturbance_proxy": 0.0,
24
+ "episode_records": [
25
+ {
26
+ "episode_seed": 171000,
27
+ "success": false,
28
+ "steps": 4,
29
+ "first_reveal_step": 1,
30
+ "first_retrieve_step": null,
31
+ "episode_disturbance": 0.0
32
+ },
33
+ {
34
+ "episode_seed": 171001,
35
+ "success": false,
36
+ "steps": 4,
37
+ "first_reveal_step": 1,
38
+ "first_retrieve_step": null,
39
+ "episode_disturbance": 0.0
40
+ },
41
+ {
42
+ "episode_seed": 171002,
43
+ "success": false,
44
+ "steps": 4,
45
+ "first_reveal_step": 1,
46
+ "first_retrieve_step": null,
47
+ "episode_disturbance": 0.0
48
+ },
49
+ {
50
+ "episode_seed": 171003,
51
+ "success": true,
52
+ "steps": 1,
53
+ "first_reveal_step": 1,
54
+ "first_retrieve_step": null,
55
+ "episode_disturbance": 0.0
56
+ },
57
+ {
58
+ "episode_seed": 171004,
59
+ "success": false,
60
+ "steps": 4,
61
+ "first_reveal_step": 1,
62
+ "first_retrieve_step": null,
63
+ "episode_disturbance": 0.0
64
+ },
65
+ {
66
+ "episode_seed": 171005,
67
+ "success": false,
68
+ "steps": 4,
69
+ "first_reveal_step": 1,
70
+ "first_retrieve_step": null,
71
+ "episode_disturbance": 0.0
72
+ },
73
+ {
74
+ "episode_seed": 171006,
75
+ "success": false,
76
+ "steps": 4,
77
+ "first_reveal_step": 1,
78
+ "first_retrieve_step": null,
79
+ "episode_disturbance": 0.0
80
+ },
81
+ {
82
+ "episode_seed": 171007,
83
+ "success": false,
84
+ "steps": 4,
85
+ "first_reveal_step": 1,
86
+ "first_retrieve_step": null,
87
+ "episode_disturbance": 0.0
88
+ }
89
+ ],
90
+ "eval_protocol": {
91
+ "track_id": "bag_track",
92
+ "suite": "maniskill3",
93
+ "benchmark_task": "PutEggplantInBasketRetrievalProxy-v1",
94
+ "role": "target",
95
+ "eval_mode": "adapter_noop",
96
+ "seed": 17,
97
+ "episodes": 8,
98
+ "resolution": 224,
99
+ "cameras": [
100
+ "front",
101
+ "left",
102
+ "right"
103
+ ],
104
+ "observation_stack": "rgb_triplicate_zero_depth",
105
+ "action_horizon": 8,
106
+ "action_space": "widowx_delta_pose",
107
+ "same_test_episodes": true
108
+ },
109
+ "proxy_notes": "Public ManiSkill bridge scene with custom retrieval initialization. The eggplant is placed inside the basket region and must be pulled back out to a staging zone."
110
+ }
reports/maniskill_bag_bridge_val_sweep_seed23/conservative/run.log ADDED
@@ -0,0 +1,76 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+
2
+ CLIPModel LOAD REPORT from: openai/clip-vit-base-patch32
3
+ Key | Status | |
4
+ -------------------------------------+------------+--+-
5
+ vision_model.embeddings.position_ids | UNEXPECTED | |
6
+ text_model.embeddings.position_ids | UNEXPECTED | |
7
+
8
+ Notes:
9
+ - UNEXPECTED: can be ignored when loading from different task/architecture; not ok if you expect identical arch.
10
+ CLIPTextTransformer does not expose input embeddings. Gradients cannot flow back to the token embeddings when using adapters or gradient checkpointing. Override `get_input_embeddings` to fully support those features, or set `_input_embed_layer` to the attribute name that holds the embeddings.
11
+ /usr/local/lib/python3.11/dist-packages/torch/nn/modules/transformer.py:307: UserWarning: enable_nested_tensor is True, but self.use_nested_tensor is False because encoder_layer.norm_first was True
12
+ warnings.warn(f"enable_nested_tensor is True, but self.use_nested_tensor is False because {why_not_sparsity_fast_path}")
13
+ 2026-04-01 11:27:44,182 - mani_skill - WARNING - Mimic targets dictionary is missing for controller config for widowx250s_bridgedataset_sink. Assuming the first joint is the control joint and the second joint is the mimic joint
14
+ 2026-04-01 11:27:44,237 - mani_skill - WARNING - No initial pose set for actor builder of eggplant, setting to default pose q=[1,0,0,0], p=[0,0,0]. Not setting reasonable initial poses may slow down simulation, see https://github.com/haosulab/ManiSkill/issues/421.
15
+ 2026-04-01 11:27:44,250 - mani_skill - WARNING - No initial pose set for actor builder of dummy_sink_target_plane, setting to default pose q=[1,0,0,0], p=[0,0,0]. Not setting reasonable initial poses may slow down simulation, see https://github.com/haosulab/ManiSkill/issues/421.
16
+ 2026-04-01 11:27:44,918 - mani_skill - WARNING - Mimic targets dictionary is missing for controller config for widowx250s_bridgedataset_sink. Assuming the first joint is the control joint and the second joint is the mimic joint
17
+ 2026-04-01 11:27:44,920 - mani_skill - WARNING - No initial pose set for actor builder of eggplant, setting to default pose q=[1,0,0,0], p=[0,0,0]. Not setting reasonable initial poses may slow down simulation, see https://github.com/haosulab/ManiSkill/issues/421.
18
+ 2026-04-01 11:27:44,920 - mani_skill - WARNING - No initial pose set for actor builder of dummy_sink_target_plane, setting to default pose q=[1,0,0,0], p=[0,0,0]. Not setting reasonable initial poses may slow down simulation, see https://github.com/haosulab/ManiSkill/issues/421.
19
+ /usr/local/lib/python3.11/dist-packages/gymnasium/core.py:311: UserWarning: WARN: env.get_obs to get variables from other wrappers is deprecated and will be removed in v1.0, to get this variable you can do `env.unwrapped.get_obs` for environment variables or `env.get_wrapper_attr('get_obs')` that will search the reminding wrappers.
20
+ logger.warn(
21
+ /usr/local/lib/python3.11/dist-packages/gymnasium/core.py:311: UserWarning: WARN: env.get_info to get variables from other wrappers is deprecated and will be removed in v1.0, to get this variable you can do `env.unwrapped.get_info` for environment variables or `env.get_wrapper_attr('get_info')` that will search the reminding wrappers.
22
+ logger.warn(
23
+ {"phase": "eval_episode_complete", "task": "bag", "adapter_mode": "trunk_only_ft", "episode_seed": 171000, "success": false, "steps": 4}
24
+ {"phase": "eval_episode_complete", "task": "bag", "adapter_mode": "trunk_only_ft", "episode_seed": 171001, "success": false, "steps": 4}
25
+ {"phase": "eval_episode_complete", "task": "bag", "adapter_mode": "trunk_only_ft", "episode_seed": 171002, "success": false, "steps": 4}
26
+ {"phase": "eval_episode_complete", "task": "bag", "adapter_mode": "trunk_only_ft", "episode_seed": 171003, "success": false, "steps": 4}
27
+ {"phase": "eval_episode_complete", "task": "bag", "adapter_mode": "trunk_only_ft", "episode_seed": 171004, "success": false, "steps": 4}
28
+ {"phase": "eval_episode_complete", "task": "bag", "adapter_mode": "trunk_only_ft", "episode_seed": 171005, "success": false, "steps": 4}
29
+ {"phase": "eval_episode_complete", "task": "bag", "adapter_mode": "trunk_only_ft", "episode_seed": 171006, "success": false, "steps": 4}
30
+ {"phase": "eval_episode_complete", "task": "bag", "adapter_mode": "trunk_only_ft", "episode_seed": 171007, "success": true, "steps": 1}
31
+
32
+ CLIPModel LOAD REPORT from: openai/clip-vit-base-patch32
33
+ Key | Status | |
34
+ -------------------------------------+------------+--+-
35
+ vision_model.embeddings.position_ids | UNEXPECTED | |
36
+ text_model.embeddings.position_ids | UNEXPECTED | |
37
+
38
+ Notes:
39
+ - UNEXPECTED: can be ignored when loading from different task/architecture; not ok if you expect identical arch.
40
+ 2026-04-01 11:28:17,937 - mani_skill - WARNING - Mimic targets dictionary is missing for controller config for widowx250s_bridgedataset_sink. Assuming the first joint is the control joint and the second joint is the mimic joint
41
+ 2026-04-01 11:28:17,940 - mani_skill - WARNING - No initial pose set for actor builder of eggplant, setting to default pose q=[1,0,0,0], p=[0,0,0]. Not setting reasonable initial poses may slow down simulation, see https://github.com/haosulab/ManiSkill/issues/421.
42
+ 2026-04-01 11:28:17,940 - mani_skill - WARNING - No initial pose set for actor builder of dummy_sink_target_plane, setting to default pose q=[1,0,0,0], p=[0,0,0]. Not setting reasonable initial poses may slow down simulation, see https://github.com/haosulab/ManiSkill/issues/421.
43
+ 2026-04-01 11:28:18,161 - mani_skill - WARNING - Mimic targets dictionary is missing for controller config for widowx250s_bridgedataset_sink. Assuming the first joint is the control joint and the second joint is the mimic joint
44
+ 2026-04-01 11:28:18,164 - mani_skill - WARNING - No initial pose set for actor builder of eggplant, setting to default pose q=[1,0,0,0], p=[0,0,0]. Not setting reasonable initial poses may slow down simulation, see https://github.com/haosulab/ManiSkill/issues/421.
45
+ 2026-04-01 11:28:18,164 - mani_skill - WARNING - No initial pose set for actor builder of dummy_sink_target_plane, setting to default pose q=[1,0,0,0], p=[0,0,0]. Not setting reasonable initial poses may slow down simulation, see https://github.com/haosulab/ManiSkill/issues/421.
46
+ {"phase": "eval_episode_complete", "task": "bag", "adapter_mode": "adapter_noop", "episode_seed": 171000, "success": false, "steps": 4}
47
+ {"phase": "eval_episode_complete", "task": "bag", "adapter_mode": "adapter_noop", "episode_seed": 171001, "success": false, "steps": 4}
48
+ {"phase": "eval_episode_complete", "task": "bag", "adapter_mode": "adapter_noop", "episode_seed": 171002, "success": false, "steps": 4}
49
+ {"phase": "eval_episode_complete", "task": "bag", "adapter_mode": "adapter_noop", "episode_seed": 171003, "success": true, "steps": 1}
50
+ {"phase": "eval_episode_complete", "task": "bag", "adapter_mode": "adapter_noop", "episode_seed": 171004, "success": false, "steps": 4}
51
+ {"phase": "eval_episode_complete", "task": "bag", "adapter_mode": "adapter_noop", "episode_seed": 171005, "success": false, "steps": 4}
52
+ {"phase": "eval_episode_complete", "task": "bag", "adapter_mode": "adapter_noop", "episode_seed": 171006, "success": false, "steps": 4}
53
+ {"phase": "eval_episode_complete", "task": "bag", "adapter_mode": "adapter_noop", "episode_seed": 171007, "success": false, "steps": 4}
54
+
55
+ CLIPModel LOAD REPORT from: openai/clip-vit-base-patch32
56
+ Key | Status | |
57
+ -------------------------------------+------------+--+-
58
+ vision_model.embeddings.position_ids | UNEXPECTED | |
59
+ text_model.embeddings.position_ids | UNEXPECTED | |
60
+
61
+ Notes:
62
+ - UNEXPECTED: can be ignored when loading from different task/architecture; not ok if you expect identical arch.
63
+ 2026-04-01 11:28:46,030 - mani_skill - WARNING - Mimic targets dictionary is missing for controller config for widowx250s_bridgedataset_sink. Assuming the first joint is the control joint and the second joint is the mimic joint
64
+ 2026-04-01 11:28:46,032 - mani_skill - WARNING - No initial pose set for actor builder of eggplant, setting to default pose q=[1,0,0,0], p=[0,0,0]. Not setting reasonable initial poses may slow down simulation, see https://github.com/haosulab/ManiSkill/issues/421.
65
+ 2026-04-01 11:28:46,033 - mani_skill - WARNING - No initial pose set for actor builder of dummy_sink_target_plane, setting to default pose q=[1,0,0,0], p=[0,0,0]. Not setting reasonable initial poses may slow down simulation, see https://github.com/haosulab/ManiSkill/issues/421.
66
+ 2026-04-01 11:28:46,254 - mani_skill - WARNING - Mimic targets dictionary is missing for controller config for widowx250s_bridgedataset_sink. Assuming the first joint is the control joint and the second joint is the mimic joint
67
+ 2026-04-01 11:28:46,257 - mani_skill - WARNING - No initial pose set for actor builder of eggplant, setting to default pose q=[1,0,0,0], p=[0,0,0]. Not setting reasonable initial poses may slow down simulation, see https://github.com/haosulab/ManiSkill/issues/421.
68
+ 2026-04-01 11:28:46,257 - mani_skill - WARNING - No initial pose set for actor builder of dummy_sink_target_plane, setting to default pose q=[1,0,0,0], p=[0,0,0]. Not setting reasonable initial poses may slow down simulation, see https://github.com/haosulab/ManiSkill/issues/421.
69
+ {"phase": "eval_episode_complete", "task": "bag", "adapter_mode": "adapter_active_ft", "episode_seed": 171000, "success": false, "steps": 4}
70
+ {"phase": "eval_episode_complete", "task": "bag", "adapter_mode": "adapter_active_ft", "episode_seed": 171001, "success": false, "steps": 4}
71
+ {"phase": "eval_episode_complete", "task": "bag", "adapter_mode": "adapter_active_ft", "episode_seed": 171002, "success": false, "steps": 4}
72
+ {"phase": "eval_episode_complete", "task": "bag", "adapter_mode": "adapter_active_ft", "episode_seed": 171003, "success": true, "steps": 1}
73
+ {"phase": "eval_episode_complete", "task": "bag", "adapter_mode": "adapter_active_ft", "episode_seed": 171004, "success": false, "steps": 4}
74
+ {"phase": "eval_episode_complete", "task": "bag", "adapter_mode": "adapter_active_ft", "episode_seed": 171005, "success": false, "steps": 4}
75
+ {"phase": "eval_episode_complete", "task": "bag", "adapter_mode": "adapter_active_ft", "episode_seed": 171006, "success": false, "steps": 4}
76
+ {"phase": "eval_episode_complete", "task": "bag", "adapter_mode": "adapter_active_ft", "episode_seed": 171007, "success": false, "steps": 4}
reports/maniskill_bag_bridge_val_sweep_seed23/default/adapter_active_ft_seed23.json ADDED
@@ -0,0 +1,131 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "track_id": "bag_track",
3
+ "suite": "maniskill3",
4
+ "benchmark_task": "PutEggplantInBasketRetrievalProxy-v1",
5
+ "role": "target",
6
+ "adapter_mode": "adapter_active_ft",
7
+ "episodes": 8,
8
+ "successes": [
9
+ 0,
10
+ 0,
11
+ 0,
12
+ 0,
13
+ 0,
14
+ 0,
15
+ 0,
16
+ 0
17
+ ],
18
+ "success_rate": 0.0,
19
+ "intervention_rate": 1.0,
20
+ "non_base_selection_rate": 1.0,
21
+ "steps_to_first_reveal_or_access": 1.0,
22
+ "steps_to_retrieve": 4.0,
23
+ "disturbance_proxy": 0.0,
24
+ "episode_records": [
25
+ {
26
+ "episode_seed": 171000,
27
+ "success": false,
28
+ "steps": 4,
29
+ "first_reveal_step": 1,
30
+ "first_retrieve_step": null,
31
+ "episode_disturbance": 0.0
32
+ },
33
+ {
34
+ "episode_seed": 171001,
35
+ "success": false,
36
+ "steps": 4,
37
+ "first_reveal_step": 1,
38
+ "first_retrieve_step": null,
39
+ "episode_disturbance": 0.0
40
+ },
41
+ {
42
+ "episode_seed": 171002,
43
+ "success": false,
44
+ "steps": 4,
45
+ "first_reveal_step": 1,
46
+ "first_retrieve_step": null,
47
+ "episode_disturbance": 0.0
48
+ },
49
+ {
50
+ "episode_seed": 171003,
51
+ "success": false,
52
+ "steps": 4,
53
+ "first_reveal_step": 1,
54
+ "first_retrieve_step": null,
55
+ "episode_disturbance": 0.0
56
+ },
57
+ {
58
+ "episode_seed": 171004,
59
+ "success": false,
60
+ "steps": 4,
61
+ "first_reveal_step": 1,
62
+ "first_retrieve_step": null,
63
+ "episode_disturbance": 0.0
64
+ },
65
+ {
66
+ "episode_seed": 171005,
67
+ "success": false,
68
+ "steps": 4,
69
+ "first_reveal_step": 1,
70
+ "first_retrieve_step": null,
71
+ "episode_disturbance": 0.0
72
+ },
73
+ {
74
+ "episode_seed": 171006,
75
+ "success": false,
76
+ "steps": 4,
77
+ "first_reveal_step": 1,
78
+ "first_retrieve_step": null,
79
+ "episode_disturbance": 0.0
80
+ },
81
+ {
82
+ "episode_seed": 171007,
83
+ "success": false,
84
+ "steps": 4,
85
+ "first_reveal_step": 1,
86
+ "first_retrieve_step": null,
87
+ "episode_disturbance": 0.0
88
+ }
89
+ ],
90
+ "eval_protocol": {
91
+ "track_id": "bag_track",
92
+ "suite": "maniskill3",
93
+ "benchmark_task": "PutEggplantInBasketRetrievalProxy-v1",
94
+ "role": "target",
95
+ "eval_mode": "adapter_active_ft",
96
+ "seed": 17,
97
+ "episodes": 8,
98
+ "resolution": 224,
99
+ "cameras": [
100
+ "front",
101
+ "left",
102
+ "right"
103
+ ],
104
+ "observation_stack": "rgb_triplicate_zero_depth",
105
+ "action_horizon": 8,
106
+ "action_space": "widowx_delta_pose",
107
+ "same_test_episodes": true
108
+ },
109
+ "proxy_notes": "Public ManiSkill bridge scene with custom retrieval initialization. The eggplant is placed inside the basket region and must be pulled back out to a staging zone.",
110
+ "train_spec": {
111
+ "track_id": "bag_track",
112
+ "suite": "maniskill3",
113
+ "benchmark_task": "PutEggplantInBasketRetrievalProxy-v1",
114
+ "model_variant": "adapter_active_ft",
115
+ "seed": 23,
116
+ "train_demos": 32,
117
+ "val_demos": 8,
118
+ "init_checkpoint_group": "/workspace/workspace/VLAarchtests2/VLAarchtests/artifacts/outputs/r3d_handoff_phase/proxy_interaction_r3d_stage3_clip_rgbd_handoff_compact_phase_seed17/checkpoint_best.pt",
119
+ "optimizer": "adamw",
120
+ "learning_rate": 0.0001,
121
+ "lr_schedule": "constant",
122
+ "batch_size": 4,
123
+ "augmentations": "none",
124
+ "early_stopping_metric": "val_total",
125
+ "max_gradient_steps": 114,
126
+ "unfreeze_scope": "fusion_memory_decoder",
127
+ "dataset_split_id": "bag_bridge_smoke_v1_dataset_seed17",
128
+ "same_data_policy": true,
129
+ "same_init_policy": true
130
+ }
131
+ }
reports/maniskill_bag_bridge_val_sweep_seed23/default/adapter_noop_seed23.json ADDED
@@ -0,0 +1,110 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "track_id": "bag_track",
3
+ "suite": "maniskill3",
4
+ "benchmark_task": "PutEggplantInBasketRetrievalProxy-v1",
5
+ "role": "target",
6
+ "adapter_mode": "adapter_noop",
7
+ "episodes": 8,
8
+ "successes": [
9
+ 0,
10
+ 0,
11
+ 0,
12
+ 1,
13
+ 0,
14
+ 0,
15
+ 0,
16
+ 0
17
+ ],
18
+ "success_rate": 0.125,
19
+ "intervention_rate": 0.0,
20
+ "non_base_selection_rate": 0.0,
21
+ "steps_to_first_reveal_or_access": 1.0,
22
+ "steps_to_retrieve": 4.0,
23
+ "disturbance_proxy": 0.0,
24
+ "episode_records": [
25
+ {
26
+ "episode_seed": 171000,
27
+ "success": false,
28
+ "steps": 4,
29
+ "first_reveal_step": 1,
30
+ "first_retrieve_step": null,
31
+ "episode_disturbance": 0.0
32
+ },
33
+ {
34
+ "episode_seed": 171001,
35
+ "success": false,
36
+ "steps": 4,
37
+ "first_reveal_step": 1,
38
+ "first_retrieve_step": null,
39
+ "episode_disturbance": 0.0
40
+ },
41
+ {
42
+ "episode_seed": 171002,
43
+ "success": false,
44
+ "steps": 4,
45
+ "first_reveal_step": 1,
46
+ "first_retrieve_step": null,
47
+ "episode_disturbance": 0.0
48
+ },
49
+ {
50
+ "episode_seed": 171003,
51
+ "success": true,
52
+ "steps": 1,
53
+ "first_reveal_step": 1,
54
+ "first_retrieve_step": null,
55
+ "episode_disturbance": 0.0
56
+ },
57
+ {
58
+ "episode_seed": 171004,
59
+ "success": false,
60
+ "steps": 4,
61
+ "first_reveal_step": 1,
62
+ "first_retrieve_step": null,
63
+ "episode_disturbance": 0.0
64
+ },
65
+ {
66
+ "episode_seed": 171005,
67
+ "success": false,
68
+ "steps": 4,
69
+ "first_reveal_step": 1,
70
+ "first_retrieve_step": null,
71
+ "episode_disturbance": 0.0
72
+ },
73
+ {
74
+ "episode_seed": 171006,
75
+ "success": false,
76
+ "steps": 4,
77
+ "first_reveal_step": 1,
78
+ "first_retrieve_step": null,
79
+ "episode_disturbance": 0.0
80
+ },
81
+ {
82
+ "episode_seed": 171007,
83
+ "success": false,
84
+ "steps": 4,
85
+ "first_reveal_step": 1,
86
+ "first_retrieve_step": null,
87
+ "episode_disturbance": 0.0
88
+ }
89
+ ],
90
+ "eval_protocol": {
91
+ "track_id": "bag_track",
92
+ "suite": "maniskill3",
93
+ "benchmark_task": "PutEggplantInBasketRetrievalProxy-v1",
94
+ "role": "target",
95
+ "eval_mode": "adapter_noop",
96
+ "seed": 17,
97
+ "episodes": 8,
98
+ "resolution": 224,
99
+ "cameras": [
100
+ "front",
101
+ "left",
102
+ "right"
103
+ ],
104
+ "observation_stack": "rgb_triplicate_zero_depth",
105
+ "action_horizon": 8,
106
+ "action_space": "widowx_delta_pose",
107
+ "same_test_episodes": true
108
+ },
109
+ "proxy_notes": "Public ManiSkill bridge scene with custom retrieval initialization. The eggplant is placed inside the basket region and must be pulled back out to a staging zone."
110
+ }
reports/maniskill_bag_bridge_val_sweep_seed23/default/public_benchmark_package_summary.json ADDED
@@ -0,0 +1,60 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "anchor_pass": true,
3
+ "available_tracks": [
4
+ "bag_track"
5
+ ],
6
+ "ci_above_zero_tracks": [],
7
+ "headline_pass": false,
8
+ "package_name": "public_reveal_retrieve_package_v1",
9
+ "sign_of_life_pass": false,
10
+ "sign_of_life_track_count": 0,
11
+ "sign_of_life_tracks": [],
12
+ "target_macro_average_delta": -0.125,
13
+ "tracks": {
14
+ "bag_track": {
15
+ "benchmark_task": "PutEggplantInBasketRetrievalProxy-v1",
16
+ "delta_active_vs_trunk": -0.125,
17
+ "delta_active_vs_trunk_ci95": [
18
+ -0.375,
19
+ 0.0
20
+ ],
21
+ "delta_noop_vs_trunk": 0.0,
22
+ "modes": {
23
+ "adapter_active_ft": {
24
+ "disturbance_proxy": 0.0,
25
+ "intervention_rate": 1.0,
26
+ "mean_success": 0.0,
27
+ "non_base_selection_rate": 1.0,
28
+ "num_runs": 1,
29
+ "steps_to_first_reveal_or_access": 1.0,
30
+ "steps_to_retrieve": 4.0
31
+ },
32
+ "adapter_noop": {
33
+ "disturbance_proxy": 0.0,
34
+ "intervention_rate": 0.0,
35
+ "mean_success": 0.125,
36
+ "non_base_selection_rate": 0.0,
37
+ "num_runs": 1,
38
+ "steps_to_first_reveal_or_access": 1.0,
39
+ "steps_to_retrieve": 4.0
40
+ },
41
+ "trunk_only_ft": {
42
+ "disturbance_proxy": 0.0,
43
+ "intervention_rate": 0.0,
44
+ "mean_success": 0.125,
45
+ "non_base_selection_rate": 0.0,
46
+ "num_runs": 1,
47
+ "steps_to_first_reveal_or_access": 1.0,
48
+ "steps_to_retrieve": 4.0
49
+ }
50
+ },
51
+ "notes": "Public ManiSkill bridge scene with custom retrieval initialization. The eggplant is placed inside the basket region and must be pulled back out to a staging zone.",
52
+ "public_source": "ManiSkill public scene proxy: PutEggplantInBasketScene-v1",
53
+ "role": "target",
54
+ "signs_of_life": false,
55
+ "suite": "maniskill3",
56
+ "target_behavior": "retrieve the target object from inside the basket and stage it outside the basket",
57
+ "task_family": "bag_retrieval_proxy"
58
+ }
59
+ }
60
+ }
reports/maniskill_bag_bridge_val_sweep_seed23/default/public_benchmark_package_summary.md ADDED
@@ -0,0 +1,15 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ # ManiSkill Bag Retrieval Smoke Summary
2
+
3
+ - benchmark_task: PutEggplantInBasketRetrievalProxy-v1
4
+ - target_macro_average_delta: -0.125
5
+ - headline_pass: False
6
+ - sign_of_life_pass: False
7
+
8
+ ## bag_track
9
+ - delta_active_vs_trunk: -0.125
10
+ - delta_noop_vs_trunk: 0.000
11
+ - signs_of_life: False
12
+ - delta_active_vs_trunk_ci95: [-0.375, 0.000]
13
+ - trunk_only_ft: mean_success=0.125
14
+ - adapter_noop: mean_success=0.125
15
+ - adapter_active_ft: mean_success=0.000
reports/maniskill_bag_bridge_val_sweep_seed23/default/run.log ADDED
@@ -0,0 +1,76 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+
2
+ CLIPModel LOAD REPORT from: openai/clip-vit-base-patch32
3
+ Key | Status | |
4
+ -------------------------------------+------------+--+-
5
+ vision_model.embeddings.position_ids | UNEXPECTED | |
6
+ text_model.embeddings.position_ids | UNEXPECTED | |
7
+
8
+ Notes:
9
+ - UNEXPECTED: can be ignored when loading from different task/architecture; not ok if you expect identical arch.
10
+ CLIPTextTransformer does not expose input embeddings. Gradients cannot flow back to the token embeddings when using adapters or gradient checkpointing. Override `get_input_embeddings` to fully support those features, or set `_input_embed_layer` to the attribute name that holds the embeddings.
11
+ /usr/local/lib/python3.11/dist-packages/torch/nn/modules/transformer.py:307: UserWarning: enable_nested_tensor is True, but self.use_nested_tensor is False because encoder_layer.norm_first was True
12
+ warnings.warn(f"enable_nested_tensor is True, but self.use_nested_tensor is False because {why_not_sparsity_fast_path}")
13
+ 2026-04-01 11:24:45,511 - mani_skill - WARNING - Mimic targets dictionary is missing for controller config for widowx250s_bridgedataset_sink. Assuming the first joint is the control joint and the second joint is the mimic joint
14
+ 2026-04-01 11:24:45,572 - mani_skill - WARNING - No initial pose set for actor builder of eggplant, setting to default pose q=[1,0,0,0], p=[0,0,0]. Not setting reasonable initial poses may slow down simulation, see https://github.com/haosulab/ManiSkill/issues/421.
15
+ 2026-04-01 11:24:45,576 - mani_skill - WARNING - No initial pose set for actor builder of dummy_sink_target_plane, setting to default pose q=[1,0,0,0], p=[0,0,0]. Not setting reasonable initial poses may slow down simulation, see https://github.com/haosulab/ManiSkill/issues/421.
16
+ 2026-04-01 11:24:46,297 - mani_skill - WARNING - Mimic targets dictionary is missing for controller config for widowx250s_bridgedataset_sink. Assuming the first joint is the control joint and the second joint is the mimic joint
17
+ 2026-04-01 11:24:46,300 - mani_skill - WARNING - No initial pose set for actor builder of eggplant, setting to default pose q=[1,0,0,0], p=[0,0,0]. Not setting reasonable initial poses may slow down simulation, see https://github.com/haosulab/ManiSkill/issues/421.
18
+ 2026-04-01 11:24:46,300 - mani_skill - WARNING - No initial pose set for actor builder of dummy_sink_target_plane, setting to default pose q=[1,0,0,0], p=[0,0,0]. Not setting reasonable initial poses may slow down simulation, see https://github.com/haosulab/ManiSkill/issues/421.
19
+ /usr/local/lib/python3.11/dist-packages/gymnasium/core.py:311: UserWarning: WARN: env.get_obs to get variables from other wrappers is deprecated and will be removed in v1.0, to get this variable you can do `env.unwrapped.get_obs` for environment variables or `env.get_wrapper_attr('get_obs')` that will search the reminding wrappers.
20
+ logger.warn(
21
+ /usr/local/lib/python3.11/dist-packages/gymnasium/core.py:311: UserWarning: WARN: env.get_info to get variables from other wrappers is deprecated and will be removed in v1.0, to get this variable you can do `env.unwrapped.get_info` for environment variables or `env.get_wrapper_attr('get_info')` that will search the reminding wrappers.
22
+ logger.warn(
23
+ {"phase": "eval_episode_complete", "task": "bag", "adapter_mode": "trunk_only_ft", "episode_seed": 171000, "success": false, "steps": 4}
24
+ {"phase": "eval_episode_complete", "task": "bag", "adapter_mode": "trunk_only_ft", "episode_seed": 171001, "success": false, "steps": 4}
25
+ {"phase": "eval_episode_complete", "task": "bag", "adapter_mode": "trunk_only_ft", "episode_seed": 171002, "success": false, "steps": 4}
26
+ {"phase": "eval_episode_complete", "task": "bag", "adapter_mode": "trunk_only_ft", "episode_seed": 171003, "success": false, "steps": 4}
27
+ {"phase": "eval_episode_complete", "task": "bag", "adapter_mode": "trunk_only_ft", "episode_seed": 171004, "success": false, "steps": 4}
28
+ {"phase": "eval_episode_complete", "task": "bag", "adapter_mode": "trunk_only_ft", "episode_seed": 171005, "success": false, "steps": 4}
29
+ {"phase": "eval_episode_complete", "task": "bag", "adapter_mode": "trunk_only_ft", "episode_seed": 171006, "success": false, "steps": 4}
30
+ {"phase": "eval_episode_complete", "task": "bag", "adapter_mode": "trunk_only_ft", "episode_seed": 171007, "success": true, "steps": 1}
31
+
32
+ CLIPModel LOAD REPORT from: openai/clip-vit-base-patch32
33
+ Key | Status | |
34
+ -------------------------------------+------------+--+-
35
+ vision_model.embeddings.position_ids | UNEXPECTED | |
36
+ text_model.embeddings.position_ids | UNEXPECTED | |
37
+
38
+ Notes:
39
+ - UNEXPECTED: can be ignored when loading from different task/architecture; not ok if you expect identical arch.
40
+ 2026-04-01 11:25:18,652 - mani_skill - WARNING - Mimic targets dictionary is missing for controller config for widowx250s_bridgedataset_sink. Assuming the first joint is the control joint and the second joint is the mimic joint
41
+ 2026-04-01 11:25:18,655 - mani_skill - WARNING - No initial pose set for actor builder of eggplant, setting to default pose q=[1,0,0,0], p=[0,0,0]. Not setting reasonable initial poses may slow down simulation, see https://github.com/haosulab/ManiSkill/issues/421.
42
+ 2026-04-01 11:25:18,655 - mani_skill - WARNING - No initial pose set for actor builder of dummy_sink_target_plane, setting to default pose q=[1,0,0,0], p=[0,0,0]. Not setting reasonable initial poses may slow down simulation, see https://github.com/haosulab/ManiSkill/issues/421.
43
+ 2026-04-01 11:25:18,873 - mani_skill - WARNING - Mimic targets dictionary is missing for controller config for widowx250s_bridgedataset_sink. Assuming the first joint is the control joint and the second joint is the mimic joint
44
+ 2026-04-01 11:25:18,875 - mani_skill - WARNING - No initial pose set for actor builder of eggplant, setting to default pose q=[1,0,0,0], p=[0,0,0]. Not setting reasonable initial poses may slow down simulation, see https://github.com/haosulab/ManiSkill/issues/421.
45
+ 2026-04-01 11:25:18,875 - mani_skill - WARNING - No initial pose set for actor builder of dummy_sink_target_plane, setting to default pose q=[1,0,0,0], p=[0,0,0]. Not setting reasonable initial poses may slow down simulation, see https://github.com/haosulab/ManiSkill/issues/421.
46
+ {"phase": "eval_episode_complete", "task": "bag", "adapter_mode": "adapter_noop", "episode_seed": 171000, "success": false, "steps": 4}
47
+ {"phase": "eval_episode_complete", "task": "bag", "adapter_mode": "adapter_noop", "episode_seed": 171001, "success": false, "steps": 4}
48
+ {"phase": "eval_episode_complete", "task": "bag", "adapter_mode": "adapter_noop", "episode_seed": 171002, "success": false, "steps": 4}
49
+ {"phase": "eval_episode_complete", "task": "bag", "adapter_mode": "adapter_noop", "episode_seed": 171003, "success": true, "steps": 1}
50
+ {"phase": "eval_episode_complete", "task": "bag", "adapter_mode": "adapter_noop", "episode_seed": 171004, "success": false, "steps": 4}
51
+ {"phase": "eval_episode_complete", "task": "bag", "adapter_mode": "adapter_noop", "episode_seed": 171005, "success": false, "steps": 4}
52
+ {"phase": "eval_episode_complete", "task": "bag", "adapter_mode": "adapter_noop", "episode_seed": 171006, "success": false, "steps": 4}
53
+ {"phase": "eval_episode_complete", "task": "bag", "adapter_mode": "adapter_noop", "episode_seed": 171007, "success": false, "steps": 4}
54
+
55
+ CLIPModel LOAD REPORT from: openai/clip-vit-base-patch32
56
+ Key | Status | |
57
+ -------------------------------------+------------+--+-
58
+ vision_model.embeddings.position_ids | UNEXPECTED | |
59
+ text_model.embeddings.position_ids | UNEXPECTED | |
60
+
61
+ Notes:
62
+ - UNEXPECTED: can be ignored when loading from different task/architecture; not ok if you expect identical arch.
63
+ 2026-04-01 11:25:46,337 - mani_skill - WARNING - Mimic targets dictionary is missing for controller config for widowx250s_bridgedataset_sink. Assuming the first joint is the control joint and the second joint is the mimic joint
64
+ 2026-04-01 11:25:46,339 - mani_skill - WARNING - No initial pose set for actor builder of eggplant, setting to default pose q=[1,0,0,0], p=[0,0,0]. Not setting reasonable initial poses may slow down simulation, see https://github.com/haosulab/ManiSkill/issues/421.
65
+ 2026-04-01 11:25:46,339 - mani_skill - WARNING - No initial pose set for actor builder of dummy_sink_target_plane, setting to default pose q=[1,0,0,0], p=[0,0,0]. Not setting reasonable initial poses may slow down simulation, see https://github.com/haosulab/ManiSkill/issues/421.
66
+ 2026-04-01 11:25:46,556 - mani_skill - WARNING - Mimic targets dictionary is missing for controller config for widowx250s_bridgedataset_sink. Assuming the first joint is the control joint and the second joint is the mimic joint
67
+ 2026-04-01 11:25:46,558 - mani_skill - WARNING - No initial pose set for actor builder of eggplant, setting to default pose q=[1,0,0,0], p=[0,0,0]. Not setting reasonable initial poses may slow down simulation, see https://github.com/haosulab/ManiSkill/issues/421.
68
+ 2026-04-01 11:25:46,559 - mani_skill - WARNING - No initial pose set for actor builder of dummy_sink_target_plane, setting to default pose q=[1,0,0,0], p=[0,0,0]. Not setting reasonable initial poses may slow down simulation, see https://github.com/haosulab/ManiSkill/issues/421.
69
+ {"phase": "eval_episode_complete", "task": "bag", "adapter_mode": "adapter_active_ft", "episode_seed": 171000, "success": false, "steps": 4}
70
+ {"phase": "eval_episode_complete", "task": "bag", "adapter_mode": "adapter_active_ft", "episode_seed": 171001, "success": false, "steps": 4}
71
+ {"phase": "eval_episode_complete", "task": "bag", "adapter_mode": "adapter_active_ft", "episode_seed": 171002, "success": false, "steps": 4}
72
+ {"phase": "eval_episode_complete", "task": "bag", "adapter_mode": "adapter_active_ft", "episode_seed": 171003, "success": false, "steps": 4}
73
+ {"phase": "eval_episode_complete", "task": "bag", "adapter_mode": "adapter_active_ft", "episode_seed": 171004, "success": false, "steps": 4}
74
+ {"phase": "eval_episode_complete", "task": "bag", "adapter_mode": "adapter_active_ft", "episode_seed": 171005, "success": false, "steps": 4}
75
+ {"phase": "eval_episode_complete", "task": "bag", "adapter_mode": "adapter_active_ft", "episode_seed": 171006, "success": false, "steps": 4}
76
+ {"phase": "eval_episode_complete", "task": "bag", "adapter_mode": "adapter_active_ft", "episode_seed": 171007, "success": false, "steps": 4}
reports/maniskill_bag_bridge_val_sweep_seed23/default/trunk_only_ft_seed23.json ADDED
@@ -0,0 +1,131 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "track_id": "bag_track",
3
+ "suite": "maniskill3",
4
+ "benchmark_task": "PutEggplantInBasketRetrievalProxy-v1",
5
+ "role": "target",
6
+ "adapter_mode": "trunk_only_ft",
7
+ "episodes": 8,
8
+ "successes": [
9
+ 0,
10
+ 0,
11
+ 0,
12
+ 0,
13
+ 0,
14
+ 0,
15
+ 0,
16
+ 1
17
+ ],
18
+ "success_rate": 0.125,
19
+ "intervention_rate": 0.0,
20
+ "non_base_selection_rate": 0.0,
21
+ "steps_to_first_reveal_or_access": 1.0,
22
+ "steps_to_retrieve": 4.0,
23
+ "disturbance_proxy": 0.0,
24
+ "episode_records": [
25
+ {
26
+ "episode_seed": 171000,
27
+ "success": false,
28
+ "steps": 4,
29
+ "first_reveal_step": 1,
30
+ "first_retrieve_step": null,
31
+ "episode_disturbance": 0.0
32
+ },
33
+ {
34
+ "episode_seed": 171001,
35
+ "success": false,
36
+ "steps": 4,
37
+ "first_reveal_step": 1,
38
+ "first_retrieve_step": null,
39
+ "episode_disturbance": 0.0
40
+ },
41
+ {
42
+ "episode_seed": 171002,
43
+ "success": false,
44
+ "steps": 4,
45
+ "first_reveal_step": 1,
46
+ "first_retrieve_step": null,
47
+ "episode_disturbance": 0.0
48
+ },
49
+ {
50
+ "episode_seed": 171003,
51
+ "success": false,
52
+ "steps": 4,
53
+ "first_reveal_step": 1,
54
+ "first_retrieve_step": null,
55
+ "episode_disturbance": 0.0
56
+ },
57
+ {
58
+ "episode_seed": 171004,
59
+ "success": false,
60
+ "steps": 4,
61
+ "first_reveal_step": 1,
62
+ "first_retrieve_step": null,
63
+ "episode_disturbance": 0.0
64
+ },
65
+ {
66
+ "episode_seed": 171005,
67
+ "success": false,
68
+ "steps": 4,
69
+ "first_reveal_step": 1,
70
+ "first_retrieve_step": null,
71
+ "episode_disturbance": 0.0
72
+ },
73
+ {
74
+ "episode_seed": 171006,
75
+ "success": false,
76
+ "steps": 4,
77
+ "first_reveal_step": 1,
78
+ "first_retrieve_step": null,
79
+ "episode_disturbance": 0.0
80
+ },
81
+ {
82
+ "episode_seed": 171007,
83
+ "success": true,
84
+ "steps": 1,
85
+ "first_reveal_step": 1,
86
+ "first_retrieve_step": null,
87
+ "episode_disturbance": 0.0
88
+ }
89
+ ],
90
+ "eval_protocol": {
91
+ "track_id": "bag_track",
92
+ "suite": "maniskill3",
93
+ "benchmark_task": "PutEggplantInBasketRetrievalProxy-v1",
94
+ "role": "target",
95
+ "eval_mode": "trunk_only_ft",
96
+ "seed": 17,
97
+ "episodes": 8,
98
+ "resolution": 224,
99
+ "cameras": [
100
+ "front",
101
+ "left",
102
+ "right"
103
+ ],
104
+ "observation_stack": "rgb_triplicate_zero_depth",
105
+ "action_horizon": 8,
106
+ "action_space": "widowx_delta_pose",
107
+ "same_test_episodes": true
108
+ },
109
+ "proxy_notes": "Public ManiSkill bridge scene with custom retrieval initialization. The eggplant is placed inside the basket region and must be pulled back out to a staging zone.",
110
+ "train_spec": {
111
+ "track_id": "bag_track",
112
+ "suite": "maniskill3",
113
+ "benchmark_task": "PutEggplantInBasketRetrievalProxy-v1",
114
+ "model_variant": "trunk_only_ft",
115
+ "seed": 23,
116
+ "train_demos": 32,
117
+ "val_demos": 8,
118
+ "init_checkpoint_group": "/workspace/workspace/VLAarchtests2/VLAarchtests/artifacts/outputs/r3d_handoff_phase/proxy_interaction_r3d_stage3_clip_rgbd_handoff_compact_phase_seed17/checkpoint_best.pt",
119
+ "optimizer": "adamw",
120
+ "learning_rate": 0.0001,
121
+ "lr_schedule": "constant",
122
+ "batch_size": 4,
123
+ "augmentations": "none",
124
+ "early_stopping_metric": "val_total",
125
+ "max_gradient_steps": 114,
126
+ "unfreeze_scope": "fusion_memory_decoder",
127
+ "dataset_split_id": "bag_bridge_smoke_v1_dataset_seed17",
128
+ "same_data_policy": true,
129
+ "same_init_policy": true
130
+ }
131
+ }
reports/maniskill_bag_bridge_val_sweep_seed23/less_bonus/public_benchmark_package_summary.md ADDED
@@ -0,0 +1,15 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ # ManiSkill Bag Retrieval Smoke Summary
2
+
3
+ - benchmark_task: PutEggplantInBasketRetrievalProxy-v1
4
+ - target_macro_average_delta: 0.000
5
+ - headline_pass: False
6
+ - sign_of_life_pass: False
7
+
8
+ ## bag_track
9
+ - delta_active_vs_trunk: 0.000
10
+ - delta_noop_vs_trunk: 0.000
11
+ - signs_of_life: False
12
+ - delta_active_vs_trunk_ci95: [-0.375, 0.375]
13
+ - trunk_only_ft: mean_success=0.125
14
+ - adapter_noop: mean_success=0.125
15
+ - adapter_active_ft: mean_success=0.125
reports/maniskill_bag_bridge_val_sweep_seed23/less_bonus/trunk_only_ft_seed23.json ADDED
@@ -0,0 +1,131 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "track_id": "bag_track",
3
+ "suite": "maniskill3",
4
+ "benchmark_task": "PutEggplantInBasketRetrievalProxy-v1",
5
+ "role": "target",
6
+ "adapter_mode": "trunk_only_ft",
7
+ "episodes": 8,
8
+ "successes": [
9
+ 0,
10
+ 0,
11
+ 0,
12
+ 0,
13
+ 0,
14
+ 0,
15
+ 0,
16
+ 1
17
+ ],
18
+ "success_rate": 0.125,
19
+ "intervention_rate": 0.0,
20
+ "non_base_selection_rate": 0.0,
21
+ "steps_to_first_reveal_or_access": 1.0,
22
+ "steps_to_retrieve": 4.0,
23
+ "disturbance_proxy": 0.0,
24
+ "episode_records": [
25
+ {
26
+ "episode_seed": 171000,
27
+ "success": false,
28
+ "steps": 4,
29
+ "first_reveal_step": 1,
30
+ "first_retrieve_step": null,
31
+ "episode_disturbance": 0.0
32
+ },
33
+ {
34
+ "episode_seed": 171001,
35
+ "success": false,
36
+ "steps": 4,
37
+ "first_reveal_step": 1,
38
+ "first_retrieve_step": null,
39
+ "episode_disturbance": 0.0
40
+ },
41
+ {
42
+ "episode_seed": 171002,
43
+ "success": false,
44
+ "steps": 4,
45
+ "first_reveal_step": 1,
46
+ "first_retrieve_step": null,
47
+ "episode_disturbance": 0.0
48
+ },
49
+ {
50
+ "episode_seed": 171003,
51
+ "success": false,
52
+ "steps": 4,
53
+ "first_reveal_step": 1,
54
+ "first_retrieve_step": null,
55
+ "episode_disturbance": 0.0
56
+ },
57
+ {
58
+ "episode_seed": 171004,
59
+ "success": false,
60
+ "steps": 4,
61
+ "first_reveal_step": 1,
62
+ "first_retrieve_step": null,
63
+ "episode_disturbance": 0.0
64
+ },
65
+ {
66
+ "episode_seed": 171005,
67
+ "success": false,
68
+ "steps": 4,
69
+ "first_reveal_step": 1,
70
+ "first_retrieve_step": null,
71
+ "episode_disturbance": 0.0
72
+ },
73
+ {
74
+ "episode_seed": 171006,
75
+ "success": false,
76
+ "steps": 4,
77
+ "first_reveal_step": 1,
78
+ "first_retrieve_step": null,
79
+ "episode_disturbance": 0.0
80
+ },
81
+ {
82
+ "episode_seed": 171007,
83
+ "success": true,
84
+ "steps": 1,
85
+ "first_reveal_step": 1,
86
+ "first_retrieve_step": null,
87
+ "episode_disturbance": 0.0
88
+ }
89
+ ],
90
+ "eval_protocol": {
91
+ "track_id": "bag_track",
92
+ "suite": "maniskill3",
93
+ "benchmark_task": "PutEggplantInBasketRetrievalProxy-v1",
94
+ "role": "target",
95
+ "eval_mode": "trunk_only_ft",
96
+ "seed": 17,
97
+ "episodes": 8,
98
+ "resolution": 224,
99
+ "cameras": [
100
+ "front",
101
+ "left",
102
+ "right"
103
+ ],
104
+ "observation_stack": "rgb_triplicate_zero_depth",
105
+ "action_horizon": 8,
106
+ "action_space": "widowx_delta_pose",
107
+ "same_test_episodes": true
108
+ },
109
+ "proxy_notes": "Public ManiSkill bridge scene with custom retrieval initialization. The eggplant is placed inside the basket region and must be pulled back out to a staging zone.",
110
+ "train_spec": {
111
+ "track_id": "bag_track",
112
+ "suite": "maniskill3",
113
+ "benchmark_task": "PutEggplantInBasketRetrievalProxy-v1",
114
+ "model_variant": "trunk_only_ft",
115
+ "seed": 23,
116
+ "train_demos": 32,
117
+ "val_demos": 8,
118
+ "init_checkpoint_group": "/workspace/workspace/VLAarchtests2/VLAarchtests/artifacts/outputs/r3d_handoff_phase/proxy_interaction_r3d_stage3_clip_rgbd_handoff_compact_phase_seed17/checkpoint_best.pt",
119
+ "optimizer": "adamw",
120
+ "learning_rate": 0.0001,
121
+ "lr_schedule": "constant",
122
+ "batch_size": 4,
123
+ "augmentations": "none",
124
+ "early_stopping_metric": "val_total",
125
+ "max_gradient_steps": 114,
126
+ "unfreeze_scope": "fusion_memory_decoder",
127
+ "dataset_split_id": "bag_bridge_smoke_v1_dataset_seed17",
128
+ "same_data_policy": true,
129
+ "same_init_policy": true
130
+ }
131
+ }
reports/maniskill_bag_bridge_val_sweep_seed23/low_bonus_high_thresh/adapter_noop_seed23.json ADDED
@@ -0,0 +1,110 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "track_id": "bag_track",
3
+ "suite": "maniskill3",
4
+ "benchmark_task": "PutEggplantInBasketRetrievalProxy-v1",
5
+ "role": "target",
6
+ "adapter_mode": "adapter_noop",
7
+ "episodes": 8,
8
+ "successes": [
9
+ 0,
10
+ 0,
11
+ 0,
12
+ 1,
13
+ 0,
14
+ 0,
15
+ 0,
16
+ 0
17
+ ],
18
+ "success_rate": 0.125,
19
+ "intervention_rate": 0.0,
20
+ "non_base_selection_rate": 0.0,
21
+ "steps_to_first_reveal_or_access": 1.0,
22
+ "steps_to_retrieve": 4.0,
23
+ "disturbance_proxy": 0.0,
24
+ "episode_records": [
25
+ {
26
+ "episode_seed": 171000,
27
+ "success": false,
28
+ "steps": 4,
29
+ "first_reveal_step": 1,
30
+ "first_retrieve_step": null,
31
+ "episode_disturbance": 0.0
32
+ },
33
+ {
34
+ "episode_seed": 171001,
35
+ "success": false,
36
+ "steps": 4,
37
+ "first_reveal_step": 1,
38
+ "first_retrieve_step": null,
39
+ "episode_disturbance": 0.0
40
+ },
41
+ {
42
+ "episode_seed": 171002,
43
+ "success": false,
44
+ "steps": 4,
45
+ "first_reveal_step": 1,
46
+ "first_retrieve_step": null,
47
+ "episode_disturbance": 0.0
48
+ },
49
+ {
50
+ "episode_seed": 171003,
51
+ "success": true,
52
+ "steps": 1,
53
+ "first_reveal_step": 1,
54
+ "first_retrieve_step": null,
55
+ "episode_disturbance": 0.0
56
+ },
57
+ {
58
+ "episode_seed": 171004,
59
+ "success": false,
60
+ "steps": 4,
61
+ "first_reveal_step": 1,
62
+ "first_retrieve_step": null,
63
+ "episode_disturbance": 0.0
64
+ },
65
+ {
66
+ "episode_seed": 171005,
67
+ "success": false,
68
+ "steps": 4,
69
+ "first_reveal_step": 1,
70
+ "first_retrieve_step": null,
71
+ "episode_disturbance": 0.0
72
+ },
73
+ {
74
+ "episode_seed": 171006,
75
+ "success": false,
76
+ "steps": 4,
77
+ "first_reveal_step": 1,
78
+ "first_retrieve_step": null,
79
+ "episode_disturbance": 0.0
80
+ },
81
+ {
82
+ "episode_seed": 171007,
83
+ "success": false,
84
+ "steps": 4,
85
+ "first_reveal_step": 1,
86
+ "first_retrieve_step": null,
87
+ "episode_disturbance": 0.0
88
+ }
89
+ ],
90
+ "eval_protocol": {
91
+ "track_id": "bag_track",
92
+ "suite": "maniskill3",
93
+ "benchmark_task": "PutEggplantInBasketRetrievalProxy-v1",
94
+ "role": "target",
95
+ "eval_mode": "adapter_noop",
96
+ "seed": 17,
97
+ "episodes": 8,
98
+ "resolution": 224,
99
+ "cameras": [
100
+ "front",
101
+ "left",
102
+ "right"
103
+ ],
104
+ "observation_stack": "rgb_triplicate_zero_depth",
105
+ "action_horizon": 8,
106
+ "action_space": "widowx_delta_pose",
107
+ "same_test_episodes": true
108
+ },
109
+ "proxy_notes": "Public ManiSkill bridge scene with custom retrieval initialization. The eggplant is placed inside the basket region and must be pulled back out to a staging zone."
110
+ }
reports/maniskill_bag_bridge_val_sweep_seed23/low_bonus_high_thresh/public_benchmark_package_summary.json ADDED
@@ -0,0 +1,60 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "anchor_pass": true,
3
+ "available_tracks": [
4
+ "bag_track"
5
+ ],
6
+ "ci_above_zero_tracks": [],
7
+ "headline_pass": false,
8
+ "package_name": "public_reveal_retrieve_package_v1",
9
+ "sign_of_life_pass": false,
10
+ "sign_of_life_track_count": 0,
11
+ "sign_of_life_tracks": [],
12
+ "target_macro_average_delta": 0.0,
13
+ "tracks": {
14
+ "bag_track": {
15
+ "benchmark_task": "PutEggplantInBasketRetrievalProxy-v1",
16
+ "delta_active_vs_trunk": 0.0,
17
+ "delta_active_vs_trunk_ci95": [
18
+ -0.375,
19
+ 0.375
20
+ ],
21
+ "delta_noop_vs_trunk": 0.0,
22
+ "modes": {
23
+ "adapter_active_ft": {
24
+ "disturbance_proxy": 0.0,
25
+ "intervention_rate": 0.0,
26
+ "mean_success": 0.125,
27
+ "non_base_selection_rate": 0.0,
28
+ "num_runs": 1,
29
+ "steps_to_first_reveal_or_access": 1.0,
30
+ "steps_to_retrieve": 4.0
31
+ },
32
+ "adapter_noop": {
33
+ "disturbance_proxy": 0.0,
34
+ "intervention_rate": 0.0,
35
+ "mean_success": 0.125,
36
+ "non_base_selection_rate": 0.0,
37
+ "num_runs": 1,
38
+ "steps_to_first_reveal_or_access": 1.0,
39
+ "steps_to_retrieve": 4.0
40
+ },
41
+ "trunk_only_ft": {
42
+ "disturbance_proxy": 0.0,
43
+ "intervention_rate": 0.0,
44
+ "mean_success": 0.125,
45
+ "non_base_selection_rate": 0.0,
46
+ "num_runs": 1,
47
+ "steps_to_first_reveal_or_access": 1.0,
48
+ "steps_to_retrieve": 4.0
49
+ }
50
+ },
51
+ "notes": "Public ManiSkill bridge scene with custom retrieval initialization. The eggplant is placed inside the basket region and must be pulled back out to a staging zone.",
52
+ "public_source": "ManiSkill public scene proxy: PutEggplantInBasketScene-v1",
53
+ "role": "target",
54
+ "signs_of_life": false,
55
+ "suite": "maniskill3",
56
+ "target_behavior": "retrieve the target object from inside the basket and stage it outside the basket",
57
+ "task_family": "bag_retrieval_proxy"
58
+ }
59
+ }
60
+ }
reports/maniskill_bag_bridge_val_sweep_seed23/low_bonus_high_thresh/public_benchmark_package_summary.md ADDED
@@ -0,0 +1,15 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ # ManiSkill Bag Retrieval Smoke Summary
2
+
3
+ - benchmark_task: PutEggplantInBasketRetrievalProxy-v1
4
+ - target_macro_average_delta: 0.000
5
+ - headline_pass: False
6
+ - sign_of_life_pass: False
7
+
8
+ ## bag_track
9
+ - delta_active_vs_trunk: 0.000
10
+ - delta_noop_vs_trunk: 0.000
11
+ - signs_of_life: False
12
+ - delta_active_vs_trunk_ci95: [-0.375, 0.375]
13
+ - trunk_only_ft: mean_success=0.125
14
+ - adapter_noop: mean_success=0.125
15
+ - adapter_active_ft: mean_success=0.125
reports/maniskill_bag_bridge_val_sweep_seed23/low_bonus_high_thresh/run.log ADDED
@@ -0,0 +1,76 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+
2
+ CLIPModel LOAD REPORT from: openai/clip-vit-base-patch32
3
+ Key | Status | |
4
+ -------------------------------------+------------+--+-
5
+ vision_model.embeddings.position_ids | UNEXPECTED | |
6
+ text_model.embeddings.position_ids | UNEXPECTED | |
7
+
8
+ Notes:
9
+ - UNEXPECTED: can be ignored when loading from different task/architecture; not ok if you expect identical arch.
10
+ CLIPTextTransformer does not expose input embeddings. Gradients cannot flow back to the token embeddings when using adapters or gradient checkpointing. Override `get_input_embeddings` to fully support those features, or set `_input_embed_layer` to the attribute name that holds the embeddings.
11
+ /usr/local/lib/python3.11/dist-packages/torch/nn/modules/transformer.py:307: UserWarning: enable_nested_tensor is True, but self.use_nested_tensor is False because encoder_layer.norm_first was True
12
+ warnings.warn(f"enable_nested_tensor is True, but self.use_nested_tensor is False because {why_not_sparsity_fast_path}")
13
+ 2026-04-01 11:29:21,719 - mani_skill - WARNING - Mimic targets dictionary is missing for controller config for widowx250s_bridgedataset_sink. Assuming the first joint is the control joint and the second joint is the mimic joint
14
+ 2026-04-01 11:29:21,764 - mani_skill - WARNING - No initial pose set for actor builder of eggplant, setting to default pose q=[1,0,0,0], p=[0,0,0]. Not setting reasonable initial poses may slow down simulation, see https://github.com/haosulab/ManiSkill/issues/421.
15
+ 2026-04-01 11:29:21,777 - mani_skill - WARNING - No initial pose set for actor builder of dummy_sink_target_plane, setting to default pose q=[1,0,0,0], p=[0,0,0]. Not setting reasonable initial poses may slow down simulation, see https://github.com/haosulab/ManiSkill/issues/421.
16
+ 2026-04-01 11:29:22,382 - mani_skill - WARNING - Mimic targets dictionary is missing for controller config for widowx250s_bridgedataset_sink. Assuming the first joint is the control joint and the second joint is the mimic joint
17
+ 2026-04-01 11:29:22,384 - mani_skill - WARNING - No initial pose set for actor builder of eggplant, setting to default pose q=[1,0,0,0], p=[0,0,0]. Not setting reasonable initial poses may slow down simulation, see https://github.com/haosulab/ManiSkill/issues/421.
18
+ 2026-04-01 11:29:22,384 - mani_skill - WARNING - No initial pose set for actor builder of dummy_sink_target_plane, setting to default pose q=[1,0,0,0], p=[0,0,0]. Not setting reasonable initial poses may slow down simulation, see https://github.com/haosulab/ManiSkill/issues/421.
19
+ /usr/local/lib/python3.11/dist-packages/gymnasium/core.py:311: UserWarning: WARN: env.get_obs to get variables from other wrappers is deprecated and will be removed in v1.0, to get this variable you can do `env.unwrapped.get_obs` for environment variables or `env.get_wrapper_attr('get_obs')` that will search the reminding wrappers.
20
+ logger.warn(
21
+ /usr/local/lib/python3.11/dist-packages/gymnasium/core.py:311: UserWarning: WARN: env.get_info to get variables from other wrappers is deprecated and will be removed in v1.0, to get this variable you can do `env.unwrapped.get_info` for environment variables or `env.get_wrapper_attr('get_info')` that will search the reminding wrappers.
22
+ logger.warn(
23
+ {"phase": "eval_episode_complete", "task": "bag", "adapter_mode": "trunk_only_ft", "episode_seed": 171000, "success": false, "steps": 4}
24
+ {"phase": "eval_episode_complete", "task": "bag", "adapter_mode": "trunk_only_ft", "episode_seed": 171001, "success": false, "steps": 4}
25
+ {"phase": "eval_episode_complete", "task": "bag", "adapter_mode": "trunk_only_ft", "episode_seed": 171002, "success": false, "steps": 4}
26
+ {"phase": "eval_episode_complete", "task": "bag", "adapter_mode": "trunk_only_ft", "episode_seed": 171003, "success": false, "steps": 4}
27
+ {"phase": "eval_episode_complete", "task": "bag", "adapter_mode": "trunk_only_ft", "episode_seed": 171004, "success": false, "steps": 4}
28
+ {"phase": "eval_episode_complete", "task": "bag", "adapter_mode": "trunk_only_ft", "episode_seed": 171005, "success": false, "steps": 4}
29
+ {"phase": "eval_episode_complete", "task": "bag", "adapter_mode": "trunk_only_ft", "episode_seed": 171006, "success": false, "steps": 4}
30
+ {"phase": "eval_episode_complete", "task": "bag", "adapter_mode": "trunk_only_ft", "episode_seed": 171007, "success": true, "steps": 1}
31
+
32
+ CLIPModel LOAD REPORT from: openai/clip-vit-base-patch32
33
+ Key | Status | |
34
+ -------------------------------------+------------+--+-
35
+ vision_model.embeddings.position_ids | UNEXPECTED | |
36
+ text_model.embeddings.position_ids | UNEXPECTED | |
37
+
38
+ Notes:
39
+ - UNEXPECTED: can be ignored when loading from different task/architecture; not ok if you expect identical arch.
40
+ 2026-04-01 11:29:55,476 - mani_skill - WARNING - Mimic targets dictionary is missing for controller config for widowx250s_bridgedataset_sink. Assuming the first joint is the control joint and the second joint is the mimic joint
41
+ 2026-04-01 11:29:55,480 - mani_skill - WARNING - No initial pose set for actor builder of eggplant, setting to default pose q=[1,0,0,0], p=[0,0,0]. Not setting reasonable initial poses may slow down simulation, see https://github.com/haosulab/ManiSkill/issues/421.
42
+ 2026-04-01 11:29:55,480 - mani_skill - WARNING - No initial pose set for actor builder of dummy_sink_target_plane, setting to default pose q=[1,0,0,0], p=[0,0,0]. Not setting reasonable initial poses may slow down simulation, see https://github.com/haosulab/ManiSkill/issues/421.
43
+ 2026-04-01 11:29:55,702 - mani_skill - WARNING - Mimic targets dictionary is missing for controller config for widowx250s_bridgedataset_sink. Assuming the first joint is the control joint and the second joint is the mimic joint
44
+ 2026-04-01 11:29:55,705 - mani_skill - WARNING - No initial pose set for actor builder of eggplant, setting to default pose q=[1,0,0,0], p=[0,0,0]. Not setting reasonable initial poses may slow down simulation, see https://github.com/haosulab/ManiSkill/issues/421.
45
+ 2026-04-01 11:29:55,705 - mani_skill - WARNING - No initial pose set for actor builder of dummy_sink_target_plane, setting to default pose q=[1,0,0,0], p=[0,0,0]. Not setting reasonable initial poses may slow down simulation, see https://github.com/haosulab/ManiSkill/issues/421.
46
+ {"phase": "eval_episode_complete", "task": "bag", "adapter_mode": "adapter_noop", "episode_seed": 171000, "success": false, "steps": 4}
47
+ {"phase": "eval_episode_complete", "task": "bag", "adapter_mode": "adapter_noop", "episode_seed": 171001, "success": false, "steps": 4}
48
+ {"phase": "eval_episode_complete", "task": "bag", "adapter_mode": "adapter_noop", "episode_seed": 171002, "success": false, "steps": 4}
49
+ {"phase": "eval_episode_complete", "task": "bag", "adapter_mode": "adapter_noop", "episode_seed": 171003, "success": true, "steps": 1}
50
+ {"phase": "eval_episode_complete", "task": "bag", "adapter_mode": "adapter_noop", "episode_seed": 171004, "success": false, "steps": 4}
51
+ {"phase": "eval_episode_complete", "task": "bag", "adapter_mode": "adapter_noop", "episode_seed": 171005, "success": false, "steps": 4}
52
+ {"phase": "eval_episode_complete", "task": "bag", "adapter_mode": "adapter_noop", "episode_seed": 171006, "success": false, "steps": 4}
53
+ {"phase": "eval_episode_complete", "task": "bag", "adapter_mode": "adapter_noop", "episode_seed": 171007, "success": false, "steps": 4}
54
+
55
+ CLIPModel LOAD REPORT from: openai/clip-vit-base-patch32
56
+ Key | Status | |
57
+ -------------------------------------+------------+--+-
58
+ vision_model.embeddings.position_ids | UNEXPECTED | |
59
+ text_model.embeddings.position_ids | UNEXPECTED | |
60
+
61
+ Notes:
62
+ - UNEXPECTED: can be ignored when loading from different task/architecture; not ok if you expect identical arch.
63
+ 2026-04-01 11:30:24,855 - mani_skill - WARNING - Mimic targets dictionary is missing for controller config for widowx250s_bridgedataset_sink. Assuming the first joint is the control joint and the second joint is the mimic joint
64
+ 2026-04-01 11:30:24,857 - mani_skill - WARNING - No initial pose set for actor builder of eggplant, setting to default pose q=[1,0,0,0], p=[0,0,0]. Not setting reasonable initial poses may slow down simulation, see https://github.com/haosulab/ManiSkill/issues/421.
65
+ 2026-04-01 11:30:24,857 - mani_skill - WARNING - No initial pose set for actor builder of dummy_sink_target_plane, setting to default pose q=[1,0,0,0], p=[0,0,0]. Not setting reasonable initial poses may slow down simulation, see https://github.com/haosulab/ManiSkill/issues/421.
66
+ 2026-04-01 11:30:25,079 - mani_skill - WARNING - Mimic targets dictionary is missing for controller config for widowx250s_bridgedataset_sink. Assuming the first joint is the control joint and the second joint is the mimic joint
67
+ 2026-04-01 11:30:25,081 - mani_skill - WARNING - No initial pose set for actor builder of eggplant, setting to default pose q=[1,0,0,0], p=[0,0,0]. Not setting reasonable initial poses may slow down simulation, see https://github.com/haosulab/ManiSkill/issues/421.
68
+ 2026-04-01 11:30:25,082 - mani_skill - WARNING - No initial pose set for actor builder of dummy_sink_target_plane, setting to default pose q=[1,0,0,0], p=[0,0,0]. Not setting reasonable initial poses may slow down simulation, see https://github.com/haosulab/ManiSkill/issues/421.
69
+ {"phase": "eval_episode_complete", "task": "bag", "adapter_mode": "adapter_active_ft", "episode_seed": 171000, "success": false, "steps": 4}
70
+ {"phase": "eval_episode_complete", "task": "bag", "adapter_mode": "adapter_active_ft", "episode_seed": 171001, "success": false, "steps": 4}
71
+ {"phase": "eval_episode_complete", "task": "bag", "adapter_mode": "adapter_active_ft", "episode_seed": 171002, "success": false, "steps": 4}
72
+ {"phase": "eval_episode_complete", "task": "bag", "adapter_mode": "adapter_active_ft", "episode_seed": 171003, "success": true, "steps": 1}
73
+ {"phase": "eval_episode_complete", "task": "bag", "adapter_mode": "adapter_active_ft", "episode_seed": 171004, "success": false, "steps": 4}
74
+ {"phase": "eval_episode_complete", "task": "bag", "adapter_mode": "adapter_active_ft", "episode_seed": 171005, "success": false, "steps": 4}
75
+ {"phase": "eval_episode_complete", "task": "bag", "adapter_mode": "adapter_active_ft", "episode_seed": 171006, "success": false, "steps": 4}
76
+ {"phase": "eval_episode_complete", "task": "bag", "adapter_mode": "adapter_active_ft", "episode_seed": 171007, "success": false, "steps": 4}
reports/maniskill_bag_bridge_val_sweep_seed23/low_bonus_high_thresh/trunk_only_ft_seed23.json ADDED
@@ -0,0 +1,131 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "track_id": "bag_track",
3
+ "suite": "maniskill3",
4
+ "benchmark_task": "PutEggplantInBasketRetrievalProxy-v1",
5
+ "role": "target",
6
+ "adapter_mode": "trunk_only_ft",
7
+ "episodes": 8,
8
+ "successes": [
9
+ 0,
10
+ 0,
11
+ 0,
12
+ 0,
13
+ 0,
14
+ 0,
15
+ 0,
16
+ 1
17
+ ],
18
+ "success_rate": 0.125,
19
+ "intervention_rate": 0.0,
20
+ "non_base_selection_rate": 0.0,
21
+ "steps_to_first_reveal_or_access": 1.0,
22
+ "steps_to_retrieve": 4.0,
23
+ "disturbance_proxy": 0.0,
24
+ "episode_records": [
25
+ {
26
+ "episode_seed": 171000,
27
+ "success": false,
28
+ "steps": 4,
29
+ "first_reveal_step": 1,
30
+ "first_retrieve_step": null,
31
+ "episode_disturbance": 0.0
32
+ },
33
+ {
34
+ "episode_seed": 171001,
35
+ "success": false,
36
+ "steps": 4,
37
+ "first_reveal_step": 1,
38
+ "first_retrieve_step": null,
39
+ "episode_disturbance": 0.0
40
+ },
41
+ {
42
+ "episode_seed": 171002,
43
+ "success": false,
44
+ "steps": 4,
45
+ "first_reveal_step": 1,
46
+ "first_retrieve_step": null,
47
+ "episode_disturbance": 0.0
48
+ },
49
+ {
50
+ "episode_seed": 171003,
51
+ "success": false,
52
+ "steps": 4,
53
+ "first_reveal_step": 1,
54
+ "first_retrieve_step": null,
55
+ "episode_disturbance": 0.0
56
+ },
57
+ {
58
+ "episode_seed": 171004,
59
+ "success": false,
60
+ "steps": 4,
61
+ "first_reveal_step": 1,
62
+ "first_retrieve_step": null,
63
+ "episode_disturbance": 0.0
64
+ },
65
+ {
66
+ "episode_seed": 171005,
67
+ "success": false,
68
+ "steps": 4,
69
+ "first_reveal_step": 1,
70
+ "first_retrieve_step": null,
71
+ "episode_disturbance": 0.0
72
+ },
73
+ {
74
+ "episode_seed": 171006,
75
+ "success": false,
76
+ "steps": 4,
77
+ "first_reveal_step": 1,
78
+ "first_retrieve_step": null,
79
+ "episode_disturbance": 0.0
80
+ },
81
+ {
82
+ "episode_seed": 171007,
83
+ "success": true,
84
+ "steps": 1,
85
+ "first_reveal_step": 1,
86
+ "first_retrieve_step": null,
87
+ "episode_disturbance": 0.0
88
+ }
89
+ ],
90
+ "eval_protocol": {
91
+ "track_id": "bag_track",
92
+ "suite": "maniskill3",
93
+ "benchmark_task": "PutEggplantInBasketRetrievalProxy-v1",
94
+ "role": "target",
95
+ "eval_mode": "trunk_only_ft",
96
+ "seed": 17,
97
+ "episodes": 8,
98
+ "resolution": 224,
99
+ "cameras": [
100
+ "front",
101
+ "left",
102
+ "right"
103
+ ],
104
+ "observation_stack": "rgb_triplicate_zero_depth",
105
+ "action_horizon": 8,
106
+ "action_space": "widowx_delta_pose",
107
+ "same_test_episodes": true
108
+ },
109
+ "proxy_notes": "Public ManiSkill bridge scene with custom retrieval initialization. The eggplant is placed inside the basket region and must be pulled back out to a staging zone.",
110
+ "train_spec": {
111
+ "track_id": "bag_track",
112
+ "suite": "maniskill3",
113
+ "benchmark_task": "PutEggplantInBasketRetrievalProxy-v1",
114
+ "model_variant": "trunk_only_ft",
115
+ "seed": 23,
116
+ "train_demos": 32,
117
+ "val_demos": 8,
118
+ "init_checkpoint_group": "/workspace/workspace/VLAarchtests2/VLAarchtests/artifacts/outputs/r3d_handoff_phase/proxy_interaction_r3d_stage3_clip_rgbd_handoff_compact_phase_seed17/checkpoint_best.pt",
119
+ "optimizer": "adamw",
120
+ "learning_rate": 0.0001,
121
+ "lr_schedule": "constant",
122
+ "batch_size": 4,
123
+ "augmentations": "none",
124
+ "early_stopping_metric": "val_total",
125
+ "max_gradient_steps": 114,
126
+ "unfreeze_scope": "fusion_memory_decoder",
127
+ "dataset_split_id": "bag_bridge_smoke_v1_dataset_seed17",
128
+ "same_data_policy": true,
129
+ "same_init_policy": true
130
+ }
131
+ }
reports/maniskill_cloth_bridge_smoke_v1/adapter_active_ft_seed17.json ADDED
@@ -0,0 +1,509 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "track_id": "cloth_track",
3
+ "suite": "maniskill3",
4
+ "benchmark_task": "PutSpoonUnderClothRetrievalProxy-v1",
5
+ "role": "target",
6
+ "adapter_mode": "adapter_active_ft",
7
+ "episodes": 50,
8
+ "successes": [
9
+ 0,
10
+ 1,
11
+ 0,
12
+ 0,
13
+ 0,
14
+ 0,
15
+ 0,
16
+ 0,
17
+ 0,
18
+ 0,
19
+ 0,
20
+ 0,
21
+ 0,
22
+ 0,
23
+ 0,
24
+ 0,
25
+ 1,
26
+ 0,
27
+ 0,
28
+ 0,
29
+ 0,
30
+ 1,
31
+ 0,
32
+ 0,
33
+ 0,
34
+ 0,
35
+ 0,
36
+ 0,
37
+ 0,
38
+ 0,
39
+ 0,
40
+ 0,
41
+ 0,
42
+ 0,
43
+ 0,
44
+ 0,
45
+ 0,
46
+ 0,
47
+ 0,
48
+ 1,
49
+ 0,
50
+ 0,
51
+ 0,
52
+ 0,
53
+ 0,
54
+ 0,
55
+ 0,
56
+ 0,
57
+ 1,
58
+ 0
59
+ ],
60
+ "success_rate": 0.1,
61
+ "intervention_rate": 0.33689839572192515,
62
+ "non_base_selection_rate": 0.26737967914438504,
63
+ "steps_to_first_reveal_or_access": 1.0,
64
+ "steps_to_retrieve": 4.0,
65
+ "disturbance_proxy": 0.1649820935726166,
66
+ "episode_records": [
67
+ {
68
+ "episode_seed": 170104,
69
+ "success": false,
70
+ "steps": 4,
71
+ "first_reveal_step": 1,
72
+ "first_retrieve_step": null,
73
+ "episode_disturbance": 0.0
74
+ },
75
+ {
76
+ "episode_seed": 170105,
77
+ "success": true,
78
+ "steps": 1,
79
+ "first_reveal_step": 1,
80
+ "first_retrieve_step": null,
81
+ "episode_disturbance": 1.0
82
+ },
83
+ {
84
+ "episode_seed": 170106,
85
+ "success": false,
86
+ "steps": 4,
87
+ "first_reveal_step": 1,
88
+ "first_retrieve_step": null,
89
+ "episode_disturbance": 0.25
90
+ },
91
+ {
92
+ "episode_seed": 170107,
93
+ "success": false,
94
+ "steps": 4,
95
+ "first_reveal_step": 1,
96
+ "first_retrieve_step": null,
97
+ "episode_disturbance": 0.0
98
+ },
99
+ {
100
+ "episode_seed": 170109,
101
+ "success": false,
102
+ "steps": 4,
103
+ "first_reveal_step": 1,
104
+ "first_retrieve_step": null,
105
+ "episode_disturbance": 0.25
106
+ },
107
+ {
108
+ "episode_seed": 170113,
109
+ "success": false,
110
+ "steps": 4,
111
+ "first_reveal_step": 1,
112
+ "first_retrieve_step": null,
113
+ "episode_disturbance": 0.0
114
+ },
115
+ {
116
+ "episode_seed": 170117,
117
+ "success": false,
118
+ "steps": 4,
119
+ "first_reveal_step": 1,
120
+ "first_retrieve_step": null,
121
+ "episode_disturbance": 0.25
122
+ },
123
+ {
124
+ "episode_seed": 170121,
125
+ "success": false,
126
+ "steps": 4,
127
+ "first_reveal_step": 1,
128
+ "first_retrieve_step": null,
129
+ "episode_disturbance": 0.25
130
+ },
131
+ {
132
+ "episode_seed": 170124,
133
+ "success": false,
134
+ "steps": 4,
135
+ "first_reveal_step": 1,
136
+ "first_retrieve_step": null,
137
+ "episode_disturbance": 0.25
138
+ },
139
+ {
140
+ "episode_seed": 170125,
141
+ "success": false,
142
+ "steps": 4,
143
+ "first_reveal_step": 1,
144
+ "first_retrieve_step": null,
145
+ "episode_disturbance": 0.0
146
+ },
147
+ {
148
+ "episode_seed": 170129,
149
+ "success": false,
150
+ "steps": 4,
151
+ "first_reveal_step": 1,
152
+ "first_retrieve_step": null,
153
+ "episode_disturbance": 0.0
154
+ },
155
+ {
156
+ "episode_seed": 170131,
157
+ "success": false,
158
+ "steps": 4,
159
+ "first_reveal_step": 1,
160
+ "first_retrieve_step": null,
161
+ "episode_disturbance": 0.0
162
+ },
163
+ {
164
+ "episode_seed": 170137,
165
+ "success": false,
166
+ "steps": 4,
167
+ "first_reveal_step": 1,
168
+ "first_retrieve_step": null,
169
+ "episode_disturbance": 0.25
170
+ },
171
+ {
172
+ "episode_seed": 170138,
173
+ "success": false,
174
+ "steps": 4,
175
+ "first_reveal_step": 1,
176
+ "first_retrieve_step": null,
177
+ "episode_disturbance": 0.25
178
+ },
179
+ {
180
+ "episode_seed": 170139,
181
+ "success": false,
182
+ "steps": 4,
183
+ "first_reveal_step": 1,
184
+ "first_retrieve_step": null,
185
+ "episode_disturbance": 0.0
186
+ },
187
+ {
188
+ "episode_seed": 170140,
189
+ "success": false,
190
+ "steps": 4,
191
+ "first_reveal_step": 1,
192
+ "first_retrieve_step": null,
193
+ "episode_disturbance": 0.25
194
+ },
195
+ {
196
+ "episode_seed": 170145,
197
+ "success": true,
198
+ "steps": 1,
199
+ "first_reveal_step": 1,
200
+ "first_retrieve_step": null,
201
+ "episode_disturbance": 1.0
202
+ },
203
+ {
204
+ "episode_seed": 170150,
205
+ "success": false,
206
+ "steps": 4,
207
+ "first_reveal_step": 1,
208
+ "first_retrieve_step": null,
209
+ "episode_disturbance": 0.0
210
+ },
211
+ {
212
+ "episode_seed": 170151,
213
+ "success": false,
214
+ "steps": 4,
215
+ "first_reveal_step": 1,
216
+ "first_retrieve_step": null,
217
+ "episode_disturbance": 0.0
218
+ },
219
+ {
220
+ "episode_seed": 170153,
221
+ "success": false,
222
+ "steps": 4,
223
+ "first_reveal_step": 1,
224
+ "first_retrieve_step": null,
225
+ "episode_disturbance": 0.0
226
+ },
227
+ {
228
+ "episode_seed": 170154,
229
+ "success": false,
230
+ "steps": 4,
231
+ "first_reveal_step": 1,
232
+ "first_retrieve_step": null,
233
+ "episode_disturbance": 0.0
234
+ },
235
+ {
236
+ "episode_seed": 170155,
237
+ "success": true,
238
+ "steps": 2,
239
+ "first_reveal_step": 1,
240
+ "first_retrieve_step": null,
241
+ "episode_disturbance": 0.3782343992165157
242
+ },
243
+ {
244
+ "episode_seed": 170166,
245
+ "success": false,
246
+ "steps": 4,
247
+ "first_reveal_step": 1,
248
+ "first_retrieve_step": null,
249
+ "episode_disturbance": 0.0
250
+ },
251
+ {
252
+ "episode_seed": 170171,
253
+ "success": false,
254
+ "steps": 4,
255
+ "first_reveal_step": 1,
256
+ "first_retrieve_step": null,
257
+ "episode_disturbance": 0.25
258
+ },
259
+ {
260
+ "episode_seed": 170173,
261
+ "success": false,
262
+ "steps": 4,
263
+ "first_reveal_step": 1,
264
+ "first_retrieve_step": null,
265
+ "episode_disturbance": 0.25
266
+ },
267
+ {
268
+ "episode_seed": 170175,
269
+ "success": false,
270
+ "steps": 4,
271
+ "first_reveal_step": 1,
272
+ "first_retrieve_step": null,
273
+ "episode_disturbance": 0.0
274
+ },
275
+ {
276
+ "episode_seed": 170177,
277
+ "success": false,
278
+ "steps": 4,
279
+ "first_reveal_step": 1,
280
+ "first_retrieve_step": null,
281
+ "episode_disturbance": 0.25
282
+ },
283
+ {
284
+ "episode_seed": 170180,
285
+ "success": false,
286
+ "steps": 4,
287
+ "first_reveal_step": 1,
288
+ "first_retrieve_step": null,
289
+ "episode_disturbance": 0.25
290
+ },
291
+ {
292
+ "episode_seed": 170181,
293
+ "success": false,
294
+ "steps": 4,
295
+ "first_reveal_step": 1,
296
+ "first_retrieve_step": null,
297
+ "episode_disturbance": 0.16025998336928232
298
+ },
299
+ {
300
+ "episode_seed": 170184,
301
+ "success": false,
302
+ "steps": 4,
303
+ "first_reveal_step": 1,
304
+ "first_retrieve_step": null,
305
+ "episode_disturbance": 0.0
306
+ },
307
+ {
308
+ "episode_seed": 170185,
309
+ "success": false,
310
+ "steps": 4,
311
+ "first_reveal_step": 1,
312
+ "first_retrieve_step": null,
313
+ "episode_disturbance": 0.25
314
+ },
315
+ {
316
+ "episode_seed": 170186,
317
+ "success": false,
318
+ "steps": 4,
319
+ "first_reveal_step": 1,
320
+ "first_retrieve_step": null,
321
+ "episode_disturbance": 0.0
322
+ },
323
+ {
324
+ "episode_seed": 170198,
325
+ "success": false,
326
+ "steps": 4,
327
+ "first_reveal_step": 1,
328
+ "first_retrieve_step": null,
329
+ "episode_disturbance": 0.0
330
+ },
331
+ {
332
+ "episode_seed": 170200,
333
+ "success": false,
334
+ "steps": 4,
335
+ "first_reveal_step": 1,
336
+ "first_retrieve_step": null,
337
+ "episode_disturbance": 0.0
338
+ },
339
+ {
340
+ "episode_seed": 170205,
341
+ "success": false,
342
+ "steps": 4,
343
+ "first_reveal_step": 1,
344
+ "first_retrieve_step": null,
345
+ "episode_disturbance": 0.25
346
+ },
347
+ {
348
+ "episode_seed": 170207,
349
+ "success": false,
350
+ "steps": 4,
351
+ "first_reveal_step": 1,
352
+ "first_retrieve_step": null,
353
+ "episode_disturbance": 0.008142942828791497
354
+ },
355
+ {
356
+ "episode_seed": 170208,
357
+ "success": false,
358
+ "steps": 4,
359
+ "first_reveal_step": 1,
360
+ "first_retrieve_step": null,
361
+ "episode_disturbance": 0.25
362
+ },
363
+ {
364
+ "episode_seed": 170212,
365
+ "success": false,
366
+ "steps": 4,
367
+ "first_reveal_step": 1,
368
+ "first_retrieve_step": null,
369
+ "episode_disturbance": 0.0
370
+ },
371
+ {
372
+ "episode_seed": 170214,
373
+ "success": false,
374
+ "steps": 4,
375
+ "first_reveal_step": 1,
376
+ "first_retrieve_step": null,
377
+ "episode_disturbance": 0.0
378
+ },
379
+ {
380
+ "episode_seed": 170217,
381
+ "success": true,
382
+ "steps": 1,
383
+ "first_reveal_step": 1,
384
+ "first_retrieve_step": null,
385
+ "episode_disturbance": 1.0
386
+ },
387
+ {
388
+ "episode_seed": 170223,
389
+ "success": false,
390
+ "steps": 4,
391
+ "first_reveal_step": 1,
392
+ "first_retrieve_step": null,
393
+ "episode_disturbance": 0.0
394
+ },
395
+ {
396
+ "episode_seed": 170226,
397
+ "success": false,
398
+ "steps": 4,
399
+ "first_reveal_step": 1,
400
+ "first_retrieve_step": null,
401
+ "episode_disturbance": 0.10258094114916666
402
+ },
403
+ {
404
+ "episode_seed": 170228,
405
+ "success": false,
406
+ "steps": 4,
407
+ "first_reveal_step": 1,
408
+ "first_retrieve_step": null,
409
+ "episode_disturbance": 0.23011721244880132
410
+ },
411
+ {
412
+ "episode_seed": 170229,
413
+ "success": false,
414
+ "steps": 4,
415
+ "first_reveal_step": 1,
416
+ "first_retrieve_step": null,
417
+ "episode_disturbance": 0.18159967022282736
418
+ },
419
+ {
420
+ "episode_seed": 170234,
421
+ "success": false,
422
+ "steps": 4,
423
+ "first_reveal_step": 1,
424
+ "first_retrieve_step": null,
425
+ "episode_disturbance": 0.01112700679472516
426
+ },
427
+ {
428
+ "episode_seed": 170237,
429
+ "success": false,
430
+ "steps": 4,
431
+ "first_reveal_step": 1,
432
+ "first_retrieve_step": null,
433
+ "episode_disturbance": 0.1770425226007189
434
+ },
435
+ {
436
+ "episode_seed": 170239,
437
+ "success": false,
438
+ "steps": 4,
439
+ "first_reveal_step": 1,
440
+ "first_retrieve_step": null,
441
+ "episode_disturbance": 0.0
442
+ },
443
+ {
444
+ "episode_seed": 170241,
445
+ "success": false,
446
+ "steps": 4,
447
+ "first_reveal_step": 1,
448
+ "first_retrieve_step": null,
449
+ "episode_disturbance": 0.25
450
+ },
451
+ {
452
+ "episode_seed": 170242,
453
+ "success": true,
454
+ "steps": 2,
455
+ "first_reveal_step": 1,
456
+ "first_retrieve_step": null,
457
+ "episode_disturbance": 0.0
458
+ },
459
+ {
460
+ "episode_seed": 170243,
461
+ "success": false,
462
+ "steps": 4,
463
+ "first_reveal_step": 1,
464
+ "first_retrieve_step": null,
465
+ "episode_disturbance": 0.0
466
+ }
467
+ ],
468
+ "eval_protocol": {
469
+ "track_id": "cloth_track",
470
+ "suite": "maniskill3",
471
+ "benchmark_task": "PutSpoonUnderClothRetrievalProxy-v1",
472
+ "role": "target",
473
+ "eval_mode": "adapter_active_ft",
474
+ "seed": 17,
475
+ "episodes": 50,
476
+ "resolution": 224,
477
+ "cameras": [
478
+ "front",
479
+ "left",
480
+ "right"
481
+ ],
482
+ "observation_stack": "rgb_triplicate_zero_depth",
483
+ "action_horizon": 8,
484
+ "action_space": "widowx_delta_pose",
485
+ "same_test_episodes": true
486
+ },
487
+ "proxy_notes": "Public ManiSkill bridge scene with custom retrieval initialization. The spoon is placed under the cloth region and must be revealed and extracted to the open side of the table.",
488
+ "train_spec": {
489
+ "track_id": "cloth_track",
490
+ "suite": "maniskill3",
491
+ "benchmark_task": "PutSpoonUnderClothRetrievalProxy-v1",
492
+ "model_variant": "adapter_active_ft",
493
+ "seed": 17,
494
+ "train_demos": 32,
495
+ "val_demos": 8,
496
+ "init_checkpoint_group": "/workspace/workspace/VLAarchtests2/VLAarchtests/artifacts/outputs/r3d_handoff_phase/proxy_interaction_r3d_stage3_clip_rgbd_handoff_compact_phase_seed17/checkpoint_best.pt",
497
+ "optimizer": "adamw",
498
+ "learning_rate": 0.0001,
499
+ "lr_schedule": "constant",
500
+ "batch_size": 4,
501
+ "augmentations": "none",
502
+ "early_stopping_metric": "val_total",
503
+ "max_gradient_steps": 174,
504
+ "unfreeze_scope": "fusion_memory_decoder",
505
+ "dataset_split_id": "cloth_bridge_smoke_v1_seed17",
506
+ "same_data_policy": true,
507
+ "same_init_policy": true
508
+ }
509
+ }
reports/maniskill_cloth_bridge_smoke_v1/adapter_active_ft_seed23.json ADDED
@@ -0,0 +1,509 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "track_id": "cloth_track",
3
+ "suite": "maniskill3",
4
+ "benchmark_task": "PutSpoonUnderClothRetrievalProxy-v1",
5
+ "role": "target",
6
+ "adapter_mode": "adapter_active_ft",
7
+ "episodes": 50,
8
+ "successes": [
9
+ 0,
10
+ 0,
11
+ 0,
12
+ 0,
13
+ 0,
14
+ 0,
15
+ 0,
16
+ 0,
17
+ 0,
18
+ 0,
19
+ 0,
20
+ 0,
21
+ 0,
22
+ 0,
23
+ 0,
24
+ 0,
25
+ 0,
26
+ 0,
27
+ 0,
28
+ 0,
29
+ 0,
30
+ 1,
31
+ 0,
32
+ 0,
33
+ 0,
34
+ 0,
35
+ 0,
36
+ 0,
37
+ 0,
38
+ 0,
39
+ 0,
40
+ 0,
41
+ 0,
42
+ 0,
43
+ 0,
44
+ 0,
45
+ 0,
46
+ 0,
47
+ 0,
48
+ 0,
49
+ 0,
50
+ 0,
51
+ 0,
52
+ 0,
53
+ 0,
54
+ 0,
55
+ 0,
56
+ 0,
57
+ 0,
58
+ 0
59
+ ],
60
+ "success_rate": 0.02,
61
+ "intervention_rate": 0.0,
62
+ "non_base_selection_rate": 0.0,
63
+ "steps_to_first_reveal_or_access": 1.0,
64
+ "steps_to_retrieve": 4.0,
65
+ "disturbance_proxy": 0.12309578397444318,
66
+ "episode_records": [
67
+ {
68
+ "episode_seed": 170104,
69
+ "success": false,
70
+ "steps": 4,
71
+ "first_reveal_step": 1,
72
+ "first_retrieve_step": null,
73
+ "episode_disturbance": 0.25
74
+ },
75
+ {
76
+ "episode_seed": 170105,
77
+ "success": false,
78
+ "steps": 4,
79
+ "first_reveal_step": 1,
80
+ "first_retrieve_step": null,
81
+ "episode_disturbance": 0.0
82
+ },
83
+ {
84
+ "episode_seed": 170106,
85
+ "success": false,
86
+ "steps": 4,
87
+ "first_reveal_step": 1,
88
+ "first_retrieve_step": null,
89
+ "episode_disturbance": 0.25
90
+ },
91
+ {
92
+ "episode_seed": 170107,
93
+ "success": false,
94
+ "steps": 4,
95
+ "first_reveal_step": 1,
96
+ "first_retrieve_step": null,
97
+ "episode_disturbance": 0.12488718117986407
98
+ },
99
+ {
100
+ "episode_seed": 170109,
101
+ "success": false,
102
+ "steps": 4,
103
+ "first_reveal_step": 1,
104
+ "first_retrieve_step": null,
105
+ "episode_disturbance": 0.25
106
+ },
107
+ {
108
+ "episode_seed": 170113,
109
+ "success": false,
110
+ "steps": 4,
111
+ "first_reveal_step": 1,
112
+ "first_retrieve_step": null,
113
+ "episode_disturbance": 0.25
114
+ },
115
+ {
116
+ "episode_seed": 170117,
117
+ "success": false,
118
+ "steps": 4,
119
+ "first_reveal_step": 1,
120
+ "first_retrieve_step": null,
121
+ "episode_disturbance": 0.25
122
+ },
123
+ {
124
+ "episode_seed": 170121,
125
+ "success": false,
126
+ "steps": 4,
127
+ "first_reveal_step": 1,
128
+ "first_retrieve_step": null,
129
+ "episode_disturbance": 0.0
130
+ },
131
+ {
132
+ "episode_seed": 170124,
133
+ "success": false,
134
+ "steps": 4,
135
+ "first_reveal_step": 1,
136
+ "first_retrieve_step": null,
137
+ "episode_disturbance": 0.0
138
+ },
139
+ {
140
+ "episode_seed": 170125,
141
+ "success": false,
142
+ "steps": 4,
143
+ "first_reveal_step": 1,
144
+ "first_retrieve_step": null,
145
+ "episode_disturbance": 0.0
146
+ },
147
+ {
148
+ "episode_seed": 170129,
149
+ "success": false,
150
+ "steps": 4,
151
+ "first_reveal_step": 1,
152
+ "first_retrieve_step": null,
153
+ "episode_disturbance": 0.0
154
+ },
155
+ {
156
+ "episode_seed": 170131,
157
+ "success": false,
158
+ "steps": 4,
159
+ "first_reveal_step": 1,
160
+ "first_retrieve_step": null,
161
+ "episode_disturbance": 0.0
162
+ },
163
+ {
164
+ "episode_seed": 170137,
165
+ "success": false,
166
+ "steps": 4,
167
+ "first_reveal_step": 1,
168
+ "first_retrieve_step": null,
169
+ "episode_disturbance": 0.0
170
+ },
171
+ {
172
+ "episode_seed": 170138,
173
+ "success": false,
174
+ "steps": 4,
175
+ "first_reveal_step": 1,
176
+ "first_retrieve_step": null,
177
+ "episode_disturbance": 0.25
178
+ },
179
+ {
180
+ "episode_seed": 170139,
181
+ "success": false,
182
+ "steps": 4,
183
+ "first_reveal_step": 1,
184
+ "first_retrieve_step": null,
185
+ "episode_disturbance": 0.0
186
+ },
187
+ {
188
+ "episode_seed": 170140,
189
+ "success": false,
190
+ "steps": 4,
191
+ "first_reveal_step": 1,
192
+ "first_retrieve_step": null,
193
+ "episode_disturbance": 0.0
194
+ },
195
+ {
196
+ "episode_seed": 170145,
197
+ "success": false,
198
+ "steps": 4,
199
+ "first_reveal_step": 1,
200
+ "first_retrieve_step": null,
201
+ "episode_disturbance": 0.25
202
+ },
203
+ {
204
+ "episode_seed": 170150,
205
+ "success": false,
206
+ "steps": 4,
207
+ "first_reveal_step": 1,
208
+ "first_retrieve_step": null,
209
+ "episode_disturbance": 0.0
210
+ },
211
+ {
212
+ "episode_seed": 170151,
213
+ "success": false,
214
+ "steps": 4,
215
+ "first_reveal_step": 1,
216
+ "first_retrieve_step": null,
217
+ "episode_disturbance": 0.0
218
+ },
219
+ {
220
+ "episode_seed": 170153,
221
+ "success": false,
222
+ "steps": 4,
223
+ "first_reveal_step": 1,
224
+ "first_retrieve_step": null,
225
+ "episode_disturbance": 0.0
226
+ },
227
+ {
228
+ "episode_seed": 170154,
229
+ "success": false,
230
+ "steps": 4,
231
+ "first_reveal_step": 1,
232
+ "first_retrieve_step": null,
233
+ "episode_disturbance": 0.0
234
+ },
235
+ {
236
+ "episode_seed": 170155,
237
+ "success": true,
238
+ "steps": 2,
239
+ "first_reveal_step": 1,
240
+ "first_retrieve_step": null,
241
+ "episode_disturbance": 0.3782343992165157
242
+ },
243
+ {
244
+ "episode_seed": 170166,
245
+ "success": false,
246
+ "steps": 4,
247
+ "first_reveal_step": 1,
248
+ "first_retrieve_step": null,
249
+ "episode_disturbance": 0.0
250
+ },
251
+ {
252
+ "episode_seed": 170171,
253
+ "success": false,
254
+ "steps": 4,
255
+ "first_reveal_step": 1,
256
+ "first_retrieve_step": null,
257
+ "episode_disturbance": 0.25
258
+ },
259
+ {
260
+ "episode_seed": 170173,
261
+ "success": false,
262
+ "steps": 4,
263
+ "first_reveal_step": 1,
264
+ "first_retrieve_step": null,
265
+ "episode_disturbance": 0.25
266
+ },
267
+ {
268
+ "episode_seed": 170175,
269
+ "success": false,
270
+ "steps": 4,
271
+ "first_reveal_step": 1,
272
+ "first_retrieve_step": null,
273
+ "episode_disturbance": 0.0
274
+ },
275
+ {
276
+ "episode_seed": 170177,
277
+ "success": false,
278
+ "steps": 4,
279
+ "first_reveal_step": 1,
280
+ "first_retrieve_step": null,
281
+ "episode_disturbance": 0.25
282
+ },
283
+ {
284
+ "episode_seed": 170180,
285
+ "success": false,
286
+ "steps": 4,
287
+ "first_reveal_step": 1,
288
+ "first_retrieve_step": null,
289
+ "episode_disturbance": 0.25
290
+ },
291
+ {
292
+ "episode_seed": 170181,
293
+ "success": false,
294
+ "steps": 4,
295
+ "first_reveal_step": 1,
296
+ "first_retrieve_step": null,
297
+ "episode_disturbance": 0.25
298
+ },
299
+ {
300
+ "episode_seed": 170184,
301
+ "success": false,
302
+ "steps": 4,
303
+ "first_reveal_step": 1,
304
+ "first_retrieve_step": null,
305
+ "episode_disturbance": 0.25
306
+ },
307
+ {
308
+ "episode_seed": 170185,
309
+ "success": false,
310
+ "steps": 4,
311
+ "first_reveal_step": 1,
312
+ "first_retrieve_step": null,
313
+ "episode_disturbance": 0.25
314
+ },
315
+ {
316
+ "episode_seed": 170186,
317
+ "success": false,
318
+ "steps": 4,
319
+ "first_reveal_step": 1,
320
+ "first_retrieve_step": null,
321
+ "episode_disturbance": 0.0
322
+ },
323
+ {
324
+ "episode_seed": 170198,
325
+ "success": false,
326
+ "steps": 4,
327
+ "first_reveal_step": 1,
328
+ "first_retrieve_step": null,
329
+ "episode_disturbance": 0.0
330
+ },
331
+ {
332
+ "episode_seed": 170200,
333
+ "success": false,
334
+ "steps": 4,
335
+ "first_reveal_step": 1,
336
+ "first_retrieve_step": null,
337
+ "episode_disturbance": 0.25
338
+ },
339
+ {
340
+ "episode_seed": 170205,
341
+ "success": false,
342
+ "steps": 4,
343
+ "first_reveal_step": 1,
344
+ "first_retrieve_step": null,
345
+ "episode_disturbance": 0.25
346
+ },
347
+ {
348
+ "episode_seed": 170207,
349
+ "success": false,
350
+ "steps": 4,
351
+ "first_reveal_step": 1,
352
+ "first_retrieve_step": null,
353
+ "episode_disturbance": 0.25
354
+ },
355
+ {
356
+ "episode_seed": 170208,
357
+ "success": false,
358
+ "steps": 4,
359
+ "first_reveal_step": 1,
360
+ "first_retrieve_step": null,
361
+ "episode_disturbance": 0.25
362
+ },
363
+ {
364
+ "episode_seed": 170212,
365
+ "success": false,
366
+ "steps": 4,
367
+ "first_reveal_step": 1,
368
+ "first_retrieve_step": null,
369
+ "episode_disturbance": 0.046899239931787774
370
+ },
371
+ {
372
+ "episode_seed": 170214,
373
+ "success": false,
374
+ "steps": 4,
375
+ "first_reveal_step": 1,
376
+ "first_retrieve_step": null,
377
+ "episode_disturbance": 0.0
378
+ },
379
+ {
380
+ "episode_seed": 170217,
381
+ "success": false,
382
+ "steps": 4,
383
+ "first_reveal_step": 1,
384
+ "first_retrieve_step": null,
385
+ "episode_disturbance": 0.10476837839399065
386
+ },
387
+ {
388
+ "episode_seed": 170223,
389
+ "success": false,
390
+ "steps": 4,
391
+ "first_reveal_step": 1,
392
+ "first_retrieve_step": null,
393
+ "episode_disturbance": 0.0
394
+ },
395
+ {
396
+ "episode_seed": 170226,
397
+ "success": false,
398
+ "steps": 4,
399
+ "first_reveal_step": 1,
400
+ "first_retrieve_step": null,
401
+ "episode_disturbance": 0.0
402
+ },
403
+ {
404
+ "episode_seed": 170228,
405
+ "success": false,
406
+ "steps": 4,
407
+ "first_reveal_step": 1,
408
+ "first_retrieve_step": null,
409
+ "episode_disturbance": 0.0
410
+ },
411
+ {
412
+ "episode_seed": 170229,
413
+ "success": false,
414
+ "steps": 4,
415
+ "first_reveal_step": 1,
416
+ "first_retrieve_step": null,
417
+ "episode_disturbance": 0.0
418
+ },
419
+ {
420
+ "episode_seed": 170234,
421
+ "success": false,
422
+ "steps": 4,
423
+ "first_reveal_step": 1,
424
+ "first_retrieve_step": null,
425
+ "episode_disturbance": 0.0
426
+ },
427
+ {
428
+ "episode_seed": 170237,
429
+ "success": false,
430
+ "steps": 4,
431
+ "first_reveal_step": 1,
432
+ "first_retrieve_step": null,
433
+ "episode_disturbance": 0.25
434
+ },
435
+ {
436
+ "episode_seed": 170239,
437
+ "success": false,
438
+ "steps": 4,
439
+ "first_reveal_step": 1,
440
+ "first_retrieve_step": null,
441
+ "episode_disturbance": 0.0
442
+ },
443
+ {
444
+ "episode_seed": 170241,
445
+ "success": false,
446
+ "steps": 4,
447
+ "first_reveal_step": 1,
448
+ "first_retrieve_step": null,
449
+ "episode_disturbance": 0.25
450
+ },
451
+ {
452
+ "episode_seed": 170242,
453
+ "success": false,
454
+ "steps": 4,
455
+ "first_reveal_step": 1,
456
+ "first_retrieve_step": null,
457
+ "episode_disturbance": 0.25
458
+ },
459
+ {
460
+ "episode_seed": 170243,
461
+ "success": false,
462
+ "steps": 4,
463
+ "first_reveal_step": 1,
464
+ "first_retrieve_step": null,
465
+ "episode_disturbance": 0.25
466
+ }
467
+ ],
468
+ "eval_protocol": {
469
+ "track_id": "cloth_track",
470
+ "suite": "maniskill3",
471
+ "benchmark_task": "PutSpoonUnderClothRetrievalProxy-v1",
472
+ "role": "target",
473
+ "eval_mode": "adapter_active_ft",
474
+ "seed": 17,
475
+ "episodes": 50,
476
+ "resolution": 224,
477
+ "cameras": [
478
+ "front",
479
+ "left",
480
+ "right"
481
+ ],
482
+ "observation_stack": "rgb_triplicate_zero_depth",
483
+ "action_horizon": 8,
484
+ "action_space": "widowx_delta_pose",
485
+ "same_test_episodes": true
486
+ },
487
+ "proxy_notes": "Public ManiSkill bridge scene with custom retrieval initialization. The spoon is placed under the cloth region and must be revealed and extracted to the open side of the table.",
488
+ "train_spec": {
489
+ "track_id": "cloth_track",
490
+ "suite": "maniskill3",
491
+ "benchmark_task": "PutSpoonUnderClothRetrievalProxy-v1",
492
+ "model_variant": "adapter_active_ft",
493
+ "seed": 23,
494
+ "train_demos": 32,
495
+ "val_demos": 8,
496
+ "init_checkpoint_group": "/workspace/workspace/VLAarchtests2/VLAarchtests/artifacts/outputs/r3d_handoff_phase/proxy_interaction_r3d_stage3_clip_rgbd_handoff_compact_phase_seed17/checkpoint_best.pt",
497
+ "optimizer": "adamw",
498
+ "learning_rate": 0.0001,
499
+ "lr_schedule": "constant",
500
+ "batch_size": 4,
501
+ "augmentations": "none",
502
+ "early_stopping_metric": "val_total",
503
+ "max_gradient_steps": 174,
504
+ "unfreeze_scope": "fusion_memory_decoder",
505
+ "dataset_split_id": "cloth_bridge_smoke_v1_seed17",
506
+ "same_data_policy": true,
507
+ "same_init_policy": true
508
+ }
509
+ }
reports/maniskill_cloth_bridge_smoke_v1/adapter_active_ft_seed29.json ADDED
@@ -0,0 +1,509 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "track_id": "cloth_track",
3
+ "suite": "maniskill3",
4
+ "benchmark_task": "PutSpoonUnderClothRetrievalProxy-v1",
5
+ "role": "target",
6
+ "adapter_mode": "adapter_active_ft",
7
+ "episodes": 50,
8
+ "successes": [
9
+ 0,
10
+ 1,
11
+ 0,
12
+ 0,
13
+ 0,
14
+ 0,
15
+ 0,
16
+ 0,
17
+ 0,
18
+ 0,
19
+ 0,
20
+ 0,
21
+ 0,
22
+ 0,
23
+ 0,
24
+ 0,
25
+ 0,
26
+ 0,
27
+ 0,
28
+ 0,
29
+ 0,
30
+ 0,
31
+ 0,
32
+ 0,
33
+ 0,
34
+ 0,
35
+ 0,
36
+ 0,
37
+ 0,
38
+ 1,
39
+ 0,
40
+ 0,
41
+ 0,
42
+ 0,
43
+ 0,
44
+ 0,
45
+ 0,
46
+ 0,
47
+ 0,
48
+ 0,
49
+ 0,
50
+ 0,
51
+ 0,
52
+ 0,
53
+ 0,
54
+ 0,
55
+ 0,
56
+ 0,
57
+ 0,
58
+ 0
59
+ ],
60
+ "success_rate": 0.04,
61
+ "intervention_rate": 0.0,
62
+ "non_base_selection_rate": 0.0,
63
+ "steps_to_first_reveal_or_access": 1.0,
64
+ "steps_to_retrieve": 4.0,
65
+ "disturbance_proxy": 0.1478596130013466,
66
+ "episode_records": [
67
+ {
68
+ "episode_seed": 170104,
69
+ "success": false,
70
+ "steps": 4,
71
+ "first_reveal_step": 1,
72
+ "first_retrieve_step": null,
73
+ "episode_disturbance": 0.0
74
+ },
75
+ {
76
+ "episode_seed": 170105,
77
+ "success": true,
78
+ "steps": 1,
79
+ "first_reveal_step": 1,
80
+ "first_retrieve_step": null,
81
+ "episode_disturbance": 1.0
82
+ },
83
+ {
84
+ "episode_seed": 170106,
85
+ "success": false,
86
+ "steps": 4,
87
+ "first_reveal_step": 1,
88
+ "first_retrieve_step": null,
89
+ "episode_disturbance": 0.25
90
+ },
91
+ {
92
+ "episode_seed": 170107,
93
+ "success": false,
94
+ "steps": 4,
95
+ "first_reveal_step": 1,
96
+ "first_retrieve_step": null,
97
+ "episode_disturbance": 0.0
98
+ },
99
+ {
100
+ "episode_seed": 170109,
101
+ "success": false,
102
+ "steps": 4,
103
+ "first_reveal_step": 1,
104
+ "first_retrieve_step": null,
105
+ "episode_disturbance": 0.25
106
+ },
107
+ {
108
+ "episode_seed": 170113,
109
+ "success": false,
110
+ "steps": 4,
111
+ "first_reveal_step": 1,
112
+ "first_retrieve_step": null,
113
+ "episode_disturbance": 0.0
114
+ },
115
+ {
116
+ "episode_seed": 170117,
117
+ "success": false,
118
+ "steps": 4,
119
+ "first_reveal_step": 1,
120
+ "first_retrieve_step": null,
121
+ "episode_disturbance": 0.25
122
+ },
123
+ {
124
+ "episode_seed": 170121,
125
+ "success": false,
126
+ "steps": 4,
127
+ "first_reveal_step": 1,
128
+ "first_retrieve_step": null,
129
+ "episode_disturbance": 0.25
130
+ },
131
+ {
132
+ "episode_seed": 170124,
133
+ "success": false,
134
+ "steps": 4,
135
+ "first_reveal_step": 1,
136
+ "first_retrieve_step": null,
137
+ "episode_disturbance": 0.25
138
+ },
139
+ {
140
+ "episode_seed": 170125,
141
+ "success": false,
142
+ "steps": 4,
143
+ "first_reveal_step": 1,
144
+ "first_retrieve_step": null,
145
+ "episode_disturbance": 0.0
146
+ },
147
+ {
148
+ "episode_seed": 170129,
149
+ "success": false,
150
+ "steps": 4,
151
+ "first_reveal_step": 1,
152
+ "first_retrieve_step": null,
153
+ "episode_disturbance": 0.0
154
+ },
155
+ {
156
+ "episode_seed": 170131,
157
+ "success": false,
158
+ "steps": 4,
159
+ "first_reveal_step": 1,
160
+ "first_retrieve_step": null,
161
+ "episode_disturbance": 0.0
162
+ },
163
+ {
164
+ "episode_seed": 170137,
165
+ "success": false,
166
+ "steps": 4,
167
+ "first_reveal_step": 1,
168
+ "first_retrieve_step": null,
169
+ "episode_disturbance": 0.25
170
+ },
171
+ {
172
+ "episode_seed": 170138,
173
+ "success": false,
174
+ "steps": 4,
175
+ "first_reveal_step": 1,
176
+ "first_retrieve_step": null,
177
+ "episode_disturbance": 0.25
178
+ },
179
+ {
180
+ "episode_seed": 170139,
181
+ "success": false,
182
+ "steps": 4,
183
+ "first_reveal_step": 1,
184
+ "first_retrieve_step": null,
185
+ "episode_disturbance": 0.25
186
+ },
187
+ {
188
+ "episode_seed": 170140,
189
+ "success": false,
190
+ "steps": 4,
191
+ "first_reveal_step": 1,
192
+ "first_retrieve_step": null,
193
+ "episode_disturbance": 0.25
194
+ },
195
+ {
196
+ "episode_seed": 170145,
197
+ "success": false,
198
+ "steps": 4,
199
+ "first_reveal_step": 1,
200
+ "first_retrieve_step": null,
201
+ "episode_disturbance": 0.0
202
+ },
203
+ {
204
+ "episode_seed": 170150,
205
+ "success": false,
206
+ "steps": 4,
207
+ "first_reveal_step": 1,
208
+ "first_retrieve_step": null,
209
+ "episode_disturbance": 0.25
210
+ },
211
+ {
212
+ "episode_seed": 170151,
213
+ "success": false,
214
+ "steps": 4,
215
+ "first_reveal_step": 1,
216
+ "first_retrieve_step": null,
217
+ "episode_disturbance": 0.0
218
+ },
219
+ {
220
+ "episode_seed": 170153,
221
+ "success": false,
222
+ "steps": 4,
223
+ "first_reveal_step": 1,
224
+ "first_retrieve_step": null,
225
+ "episode_disturbance": 0.25
226
+ },
227
+ {
228
+ "episode_seed": 170154,
229
+ "success": false,
230
+ "steps": 4,
231
+ "first_reveal_step": 1,
232
+ "first_retrieve_step": null,
233
+ "episode_disturbance": 0.25
234
+ },
235
+ {
236
+ "episode_seed": 170155,
237
+ "success": false,
238
+ "steps": 4,
239
+ "first_reveal_step": 1,
240
+ "first_retrieve_step": null,
241
+ "episode_disturbance": 0.25
242
+ },
243
+ {
244
+ "episode_seed": 170166,
245
+ "success": false,
246
+ "steps": 4,
247
+ "first_reveal_step": 1,
248
+ "first_retrieve_step": null,
249
+ "episode_disturbance": 0.0
250
+ },
251
+ {
252
+ "episode_seed": 170171,
253
+ "success": false,
254
+ "steps": 4,
255
+ "first_reveal_step": 1,
256
+ "first_retrieve_step": null,
257
+ "episode_disturbance": 0.25
258
+ },
259
+ {
260
+ "episode_seed": 170173,
261
+ "success": false,
262
+ "steps": 4,
263
+ "first_reveal_step": 1,
264
+ "first_retrieve_step": null,
265
+ "episode_disturbance": 0.0
266
+ },
267
+ {
268
+ "episode_seed": 170175,
269
+ "success": false,
270
+ "steps": 4,
271
+ "first_reveal_step": 1,
272
+ "first_retrieve_step": null,
273
+ "episode_disturbance": 0.0
274
+ },
275
+ {
276
+ "episode_seed": 170177,
277
+ "success": false,
278
+ "steps": 4,
279
+ "first_reveal_step": 1,
280
+ "first_retrieve_step": null,
281
+ "episode_disturbance": 0.0
282
+ },
283
+ {
284
+ "episode_seed": 170180,
285
+ "success": false,
286
+ "steps": 4,
287
+ "first_reveal_step": 1,
288
+ "first_retrieve_step": null,
289
+ "episode_disturbance": 0.25
290
+ },
291
+ {
292
+ "episode_seed": 170181,
293
+ "success": false,
294
+ "steps": 4,
295
+ "first_reveal_step": 1,
296
+ "first_retrieve_step": null,
297
+ "episode_disturbance": 0.25
298
+ },
299
+ {
300
+ "episode_seed": 170184,
301
+ "success": true,
302
+ "steps": 2,
303
+ "first_reveal_step": 1,
304
+ "first_retrieve_step": null,
305
+ "episode_disturbance": 0.5
306
+ },
307
+ {
308
+ "episode_seed": 170185,
309
+ "success": false,
310
+ "steps": 4,
311
+ "first_reveal_step": 1,
312
+ "first_retrieve_step": null,
313
+ "episode_disturbance": 0.25
314
+ },
315
+ {
316
+ "episode_seed": 170186,
317
+ "success": false,
318
+ "steps": 4,
319
+ "first_reveal_step": 1,
320
+ "first_retrieve_step": null,
321
+ "episode_disturbance": 0.0
322
+ },
323
+ {
324
+ "episode_seed": 170198,
325
+ "success": false,
326
+ "steps": 4,
327
+ "first_reveal_step": 1,
328
+ "first_retrieve_step": null,
329
+ "episode_disturbance": 0.0
330
+ },
331
+ {
332
+ "episode_seed": 170200,
333
+ "success": false,
334
+ "steps": 4,
335
+ "first_reveal_step": 1,
336
+ "first_retrieve_step": null,
337
+ "episode_disturbance": 0.0
338
+ },
339
+ {
340
+ "episode_seed": 170205,
341
+ "success": false,
342
+ "steps": 4,
343
+ "first_reveal_step": 1,
344
+ "first_retrieve_step": null,
345
+ "episode_disturbance": 0.0
346
+ },
347
+ {
348
+ "episode_seed": 170207,
349
+ "success": false,
350
+ "steps": 4,
351
+ "first_reveal_step": 1,
352
+ "first_retrieve_step": null,
353
+ "episode_disturbance": 0.25
354
+ },
355
+ {
356
+ "episode_seed": 170208,
357
+ "success": false,
358
+ "steps": 4,
359
+ "first_reveal_step": 1,
360
+ "first_retrieve_step": null,
361
+ "episode_disturbance": 0.25
362
+ },
363
+ {
364
+ "episode_seed": 170212,
365
+ "success": false,
366
+ "steps": 4,
367
+ "first_reveal_step": 1,
368
+ "first_retrieve_step": null,
369
+ "episode_disturbance": 0.25
370
+ },
371
+ {
372
+ "episode_seed": 170214,
373
+ "success": false,
374
+ "steps": 4,
375
+ "first_reveal_step": 1,
376
+ "first_retrieve_step": null,
377
+ "episode_disturbance": 0.0
378
+ },
379
+ {
380
+ "episode_seed": 170217,
381
+ "success": false,
382
+ "steps": 4,
383
+ "first_reveal_step": 1,
384
+ "first_retrieve_step": null,
385
+ "episode_disturbance": 0.0
386
+ },
387
+ {
388
+ "episode_seed": 170223,
389
+ "success": false,
390
+ "steps": 4,
391
+ "first_reveal_step": 1,
392
+ "first_retrieve_step": null,
393
+ "episode_disturbance": 0.1429806500673294
394
+ },
395
+ {
396
+ "episode_seed": 170226,
397
+ "success": false,
398
+ "steps": 4,
399
+ "first_reveal_step": 1,
400
+ "first_retrieve_step": null,
401
+ "episode_disturbance": 0.25
402
+ },
403
+ {
404
+ "episode_seed": 170228,
405
+ "success": false,
406
+ "steps": 4,
407
+ "first_reveal_step": 1,
408
+ "first_retrieve_step": null,
409
+ "episode_disturbance": 0.0
410
+ },
411
+ {
412
+ "episode_seed": 170229,
413
+ "success": false,
414
+ "steps": 4,
415
+ "first_reveal_step": 1,
416
+ "first_retrieve_step": null,
417
+ "episode_disturbance": 0.0
418
+ },
419
+ {
420
+ "episode_seed": 170234,
421
+ "success": false,
422
+ "steps": 4,
423
+ "first_reveal_step": 1,
424
+ "first_retrieve_step": null,
425
+ "episode_disturbance": 0.0
426
+ },
427
+ {
428
+ "episode_seed": 170237,
429
+ "success": false,
430
+ "steps": 4,
431
+ "first_reveal_step": 1,
432
+ "first_retrieve_step": null,
433
+ "episode_disturbance": 0.0
434
+ },
435
+ {
436
+ "episode_seed": 170239,
437
+ "success": false,
438
+ "steps": 4,
439
+ "first_reveal_step": 1,
440
+ "first_retrieve_step": null,
441
+ "episode_disturbance": 0.25
442
+ },
443
+ {
444
+ "episode_seed": 170241,
445
+ "success": false,
446
+ "steps": 4,
447
+ "first_reveal_step": 1,
448
+ "first_retrieve_step": null,
449
+ "episode_disturbance": 0.0
450
+ },
451
+ {
452
+ "episode_seed": 170242,
453
+ "success": false,
454
+ "steps": 4,
455
+ "first_reveal_step": 1,
456
+ "first_retrieve_step": null,
457
+ "episode_disturbance": 0.0
458
+ },
459
+ {
460
+ "episode_seed": 170243,
461
+ "success": false,
462
+ "steps": 4,
463
+ "first_reveal_step": 1,
464
+ "first_retrieve_step": null,
465
+ "episode_disturbance": 0.25
466
+ }
467
+ ],
468
+ "eval_protocol": {
469
+ "track_id": "cloth_track",
470
+ "suite": "maniskill3",
471
+ "benchmark_task": "PutSpoonUnderClothRetrievalProxy-v1",
472
+ "role": "target",
473
+ "eval_mode": "adapter_active_ft",
474
+ "seed": 17,
475
+ "episodes": 50,
476
+ "resolution": 224,
477
+ "cameras": [
478
+ "front",
479
+ "left",
480
+ "right"
481
+ ],
482
+ "observation_stack": "rgb_triplicate_zero_depth",
483
+ "action_horizon": 8,
484
+ "action_space": "widowx_delta_pose",
485
+ "same_test_episodes": true
486
+ },
487
+ "proxy_notes": "Public ManiSkill bridge scene with custom retrieval initialization. The spoon is placed under the cloth region and must be revealed and extracted to the open side of the table.",
488
+ "train_spec": {
489
+ "track_id": "cloth_track",
490
+ "suite": "maniskill3",
491
+ "benchmark_task": "PutSpoonUnderClothRetrievalProxy-v1",
492
+ "model_variant": "adapter_active_ft",
493
+ "seed": 29,
494
+ "train_demos": 32,
495
+ "val_demos": 8,
496
+ "init_checkpoint_group": "/workspace/workspace/VLAarchtests2/VLAarchtests/artifacts/outputs/r3d_handoff_phase/proxy_interaction_r3d_stage3_clip_rgbd_handoff_compact_phase_seed17/checkpoint_best.pt",
497
+ "optimizer": "adamw",
498
+ "learning_rate": 0.0001,
499
+ "lr_schedule": "constant",
500
+ "batch_size": 4,
501
+ "augmentations": "none",
502
+ "early_stopping_metric": "val_total",
503
+ "max_gradient_steps": 174,
504
+ "unfreeze_scope": "fusion_memory_decoder",
505
+ "dataset_split_id": "cloth_bridge_smoke_v1_seed17",
506
+ "same_data_policy": true,
507
+ "same_init_policy": true
508
+ }
509
+ }
reports/maniskill_cloth_bridge_smoke_v1/adapter_noop_seed17.json ADDED
@@ -0,0 +1,488 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "track_id": "cloth_track",
3
+ "suite": "maniskill3",
4
+ "benchmark_task": "PutSpoonUnderClothRetrievalProxy-v1",
5
+ "role": "target",
6
+ "adapter_mode": "adapter_noop",
7
+ "episodes": 50,
8
+ "successes": [
9
+ 0,
10
+ 1,
11
+ 0,
12
+ 0,
13
+ 0,
14
+ 0,
15
+ 0,
16
+ 0,
17
+ 0,
18
+ 0,
19
+ 0,
20
+ 0,
21
+ 0,
22
+ 0,
23
+ 0,
24
+ 0,
25
+ 0,
26
+ 0,
27
+ 0,
28
+ 0,
29
+ 0,
30
+ 0,
31
+ 0,
32
+ 0,
33
+ 0,
34
+ 0,
35
+ 0,
36
+ 0,
37
+ 0,
38
+ 1,
39
+ 0,
40
+ 0,
41
+ 0,
42
+ 0,
43
+ 0,
44
+ 0,
45
+ 0,
46
+ 0,
47
+ 0,
48
+ 0,
49
+ 0,
50
+ 0,
51
+ 0,
52
+ 0,
53
+ 0,
54
+ 0,
55
+ 0,
56
+ 0,
57
+ 0,
58
+ 0
59
+ ],
60
+ "success_rate": 0.04,
61
+ "intervention_rate": 0.0,
62
+ "non_base_selection_rate": 0.0,
63
+ "steps_to_first_reveal_or_access": 1.0,
64
+ "steps_to_retrieve": 4.0,
65
+ "disturbance_proxy": 0.1478596130013466,
66
+ "episode_records": [
67
+ {
68
+ "episode_seed": 170104,
69
+ "success": false,
70
+ "steps": 4,
71
+ "first_reveal_step": 1,
72
+ "first_retrieve_step": null,
73
+ "episode_disturbance": 0.0
74
+ },
75
+ {
76
+ "episode_seed": 170105,
77
+ "success": true,
78
+ "steps": 1,
79
+ "first_reveal_step": 1,
80
+ "first_retrieve_step": null,
81
+ "episode_disturbance": 1.0
82
+ },
83
+ {
84
+ "episode_seed": 170106,
85
+ "success": false,
86
+ "steps": 4,
87
+ "first_reveal_step": 1,
88
+ "first_retrieve_step": null,
89
+ "episode_disturbance": 0.25
90
+ },
91
+ {
92
+ "episode_seed": 170107,
93
+ "success": false,
94
+ "steps": 4,
95
+ "first_reveal_step": 1,
96
+ "first_retrieve_step": null,
97
+ "episode_disturbance": 0.0
98
+ },
99
+ {
100
+ "episode_seed": 170109,
101
+ "success": false,
102
+ "steps": 4,
103
+ "first_reveal_step": 1,
104
+ "first_retrieve_step": null,
105
+ "episode_disturbance": 0.25
106
+ },
107
+ {
108
+ "episode_seed": 170113,
109
+ "success": false,
110
+ "steps": 4,
111
+ "first_reveal_step": 1,
112
+ "first_retrieve_step": null,
113
+ "episode_disturbance": 0.0
114
+ },
115
+ {
116
+ "episode_seed": 170117,
117
+ "success": false,
118
+ "steps": 4,
119
+ "first_reveal_step": 1,
120
+ "first_retrieve_step": null,
121
+ "episode_disturbance": 0.25
122
+ },
123
+ {
124
+ "episode_seed": 170121,
125
+ "success": false,
126
+ "steps": 4,
127
+ "first_reveal_step": 1,
128
+ "first_retrieve_step": null,
129
+ "episode_disturbance": 0.25
130
+ },
131
+ {
132
+ "episode_seed": 170124,
133
+ "success": false,
134
+ "steps": 4,
135
+ "first_reveal_step": 1,
136
+ "first_retrieve_step": null,
137
+ "episode_disturbance": 0.25
138
+ },
139
+ {
140
+ "episode_seed": 170125,
141
+ "success": false,
142
+ "steps": 4,
143
+ "first_reveal_step": 1,
144
+ "first_retrieve_step": null,
145
+ "episode_disturbance": 0.0
146
+ },
147
+ {
148
+ "episode_seed": 170129,
149
+ "success": false,
150
+ "steps": 4,
151
+ "first_reveal_step": 1,
152
+ "first_retrieve_step": null,
153
+ "episode_disturbance": 0.0
154
+ },
155
+ {
156
+ "episode_seed": 170131,
157
+ "success": false,
158
+ "steps": 4,
159
+ "first_reveal_step": 1,
160
+ "first_retrieve_step": null,
161
+ "episode_disturbance": 0.0
162
+ },
163
+ {
164
+ "episode_seed": 170137,
165
+ "success": false,
166
+ "steps": 4,
167
+ "first_reveal_step": 1,
168
+ "first_retrieve_step": null,
169
+ "episode_disturbance": 0.25
170
+ },
171
+ {
172
+ "episode_seed": 170138,
173
+ "success": false,
174
+ "steps": 4,
175
+ "first_reveal_step": 1,
176
+ "first_retrieve_step": null,
177
+ "episode_disturbance": 0.25
178
+ },
179
+ {
180
+ "episode_seed": 170139,
181
+ "success": false,
182
+ "steps": 4,
183
+ "first_reveal_step": 1,
184
+ "first_retrieve_step": null,
185
+ "episode_disturbance": 0.25
186
+ },
187
+ {
188
+ "episode_seed": 170140,
189
+ "success": false,
190
+ "steps": 4,
191
+ "first_reveal_step": 1,
192
+ "first_retrieve_step": null,
193
+ "episode_disturbance": 0.25
194
+ },
195
+ {
196
+ "episode_seed": 170145,
197
+ "success": false,
198
+ "steps": 4,
199
+ "first_reveal_step": 1,
200
+ "first_retrieve_step": null,
201
+ "episode_disturbance": 0.0
202
+ },
203
+ {
204
+ "episode_seed": 170150,
205
+ "success": false,
206
+ "steps": 4,
207
+ "first_reveal_step": 1,
208
+ "first_retrieve_step": null,
209
+ "episode_disturbance": 0.25
210
+ },
211
+ {
212
+ "episode_seed": 170151,
213
+ "success": false,
214
+ "steps": 4,
215
+ "first_reveal_step": 1,
216
+ "first_retrieve_step": null,
217
+ "episode_disturbance": 0.0
218
+ },
219
+ {
220
+ "episode_seed": 170153,
221
+ "success": false,
222
+ "steps": 4,
223
+ "first_reveal_step": 1,
224
+ "first_retrieve_step": null,
225
+ "episode_disturbance": 0.25
226
+ },
227
+ {
228
+ "episode_seed": 170154,
229
+ "success": false,
230
+ "steps": 4,
231
+ "first_reveal_step": 1,
232
+ "first_retrieve_step": null,
233
+ "episode_disturbance": 0.25
234
+ },
235
+ {
236
+ "episode_seed": 170155,
237
+ "success": false,
238
+ "steps": 4,
239
+ "first_reveal_step": 1,
240
+ "first_retrieve_step": null,
241
+ "episode_disturbance": 0.25
242
+ },
243
+ {
244
+ "episode_seed": 170166,
245
+ "success": false,
246
+ "steps": 4,
247
+ "first_reveal_step": 1,
248
+ "first_retrieve_step": null,
249
+ "episode_disturbance": 0.0
250
+ },
251
+ {
252
+ "episode_seed": 170171,
253
+ "success": false,
254
+ "steps": 4,
255
+ "first_reveal_step": 1,
256
+ "first_retrieve_step": null,
257
+ "episode_disturbance": 0.25
258
+ },
259
+ {
260
+ "episode_seed": 170173,
261
+ "success": false,
262
+ "steps": 4,
263
+ "first_reveal_step": 1,
264
+ "first_retrieve_step": null,
265
+ "episode_disturbance": 0.0
266
+ },
267
+ {
268
+ "episode_seed": 170175,
269
+ "success": false,
270
+ "steps": 4,
271
+ "first_reveal_step": 1,
272
+ "first_retrieve_step": null,
273
+ "episode_disturbance": 0.0
274
+ },
275
+ {
276
+ "episode_seed": 170177,
277
+ "success": false,
278
+ "steps": 4,
279
+ "first_reveal_step": 1,
280
+ "first_retrieve_step": null,
281
+ "episode_disturbance": 0.0
282
+ },
283
+ {
284
+ "episode_seed": 170180,
285
+ "success": false,
286
+ "steps": 4,
287
+ "first_reveal_step": 1,
288
+ "first_retrieve_step": null,
289
+ "episode_disturbance": 0.25
290
+ },
291
+ {
292
+ "episode_seed": 170181,
293
+ "success": false,
294
+ "steps": 4,
295
+ "first_reveal_step": 1,
296
+ "first_retrieve_step": null,
297
+ "episode_disturbance": 0.25
298
+ },
299
+ {
300
+ "episode_seed": 170184,
301
+ "success": true,
302
+ "steps": 2,
303
+ "first_reveal_step": 1,
304
+ "first_retrieve_step": null,
305
+ "episode_disturbance": 0.5
306
+ },
307
+ {
308
+ "episode_seed": 170185,
309
+ "success": false,
310
+ "steps": 4,
311
+ "first_reveal_step": 1,
312
+ "first_retrieve_step": null,
313
+ "episode_disturbance": 0.25
314
+ },
315
+ {
316
+ "episode_seed": 170186,
317
+ "success": false,
318
+ "steps": 4,
319
+ "first_reveal_step": 1,
320
+ "first_retrieve_step": null,
321
+ "episode_disturbance": 0.0
322
+ },
323
+ {
324
+ "episode_seed": 170198,
325
+ "success": false,
326
+ "steps": 4,
327
+ "first_reveal_step": 1,
328
+ "first_retrieve_step": null,
329
+ "episode_disturbance": 0.0
330
+ },
331
+ {
332
+ "episode_seed": 170200,
333
+ "success": false,
334
+ "steps": 4,
335
+ "first_reveal_step": 1,
336
+ "first_retrieve_step": null,
337
+ "episode_disturbance": 0.0
338
+ },
339
+ {
340
+ "episode_seed": 170205,
341
+ "success": false,
342
+ "steps": 4,
343
+ "first_reveal_step": 1,
344
+ "first_retrieve_step": null,
345
+ "episode_disturbance": 0.0
346
+ },
347
+ {
348
+ "episode_seed": 170207,
349
+ "success": false,
350
+ "steps": 4,
351
+ "first_reveal_step": 1,
352
+ "first_retrieve_step": null,
353
+ "episode_disturbance": 0.25
354
+ },
355
+ {
356
+ "episode_seed": 170208,
357
+ "success": false,
358
+ "steps": 4,
359
+ "first_reveal_step": 1,
360
+ "first_retrieve_step": null,
361
+ "episode_disturbance": 0.25
362
+ },
363
+ {
364
+ "episode_seed": 170212,
365
+ "success": false,
366
+ "steps": 4,
367
+ "first_reveal_step": 1,
368
+ "first_retrieve_step": null,
369
+ "episode_disturbance": 0.25
370
+ },
371
+ {
372
+ "episode_seed": 170214,
373
+ "success": false,
374
+ "steps": 4,
375
+ "first_reveal_step": 1,
376
+ "first_retrieve_step": null,
377
+ "episode_disturbance": 0.0
378
+ },
379
+ {
380
+ "episode_seed": 170217,
381
+ "success": false,
382
+ "steps": 4,
383
+ "first_reveal_step": 1,
384
+ "first_retrieve_step": null,
385
+ "episode_disturbance": 0.0
386
+ },
387
+ {
388
+ "episode_seed": 170223,
389
+ "success": false,
390
+ "steps": 4,
391
+ "first_reveal_step": 1,
392
+ "first_retrieve_step": null,
393
+ "episode_disturbance": 0.1429806500673294
394
+ },
395
+ {
396
+ "episode_seed": 170226,
397
+ "success": false,
398
+ "steps": 4,
399
+ "first_reveal_step": 1,
400
+ "first_retrieve_step": null,
401
+ "episode_disturbance": 0.25
402
+ },
403
+ {
404
+ "episode_seed": 170228,
405
+ "success": false,
406
+ "steps": 4,
407
+ "first_reveal_step": 1,
408
+ "first_retrieve_step": null,
409
+ "episode_disturbance": 0.0
410
+ },
411
+ {
412
+ "episode_seed": 170229,
413
+ "success": false,
414
+ "steps": 4,
415
+ "first_reveal_step": 1,
416
+ "first_retrieve_step": null,
417
+ "episode_disturbance": 0.0
418
+ },
419
+ {
420
+ "episode_seed": 170234,
421
+ "success": false,
422
+ "steps": 4,
423
+ "first_reveal_step": 1,
424
+ "first_retrieve_step": null,
425
+ "episode_disturbance": 0.0
426
+ },
427
+ {
428
+ "episode_seed": 170237,
429
+ "success": false,
430
+ "steps": 4,
431
+ "first_reveal_step": 1,
432
+ "first_retrieve_step": null,
433
+ "episode_disturbance": 0.0
434
+ },
435
+ {
436
+ "episode_seed": 170239,
437
+ "success": false,
438
+ "steps": 4,
439
+ "first_reveal_step": 1,
440
+ "first_retrieve_step": null,
441
+ "episode_disturbance": 0.25
442
+ },
443
+ {
444
+ "episode_seed": 170241,
445
+ "success": false,
446
+ "steps": 4,
447
+ "first_reveal_step": 1,
448
+ "first_retrieve_step": null,
449
+ "episode_disturbance": 0.0
450
+ },
451
+ {
452
+ "episode_seed": 170242,
453
+ "success": false,
454
+ "steps": 4,
455
+ "first_reveal_step": 1,
456
+ "first_retrieve_step": null,
457
+ "episode_disturbance": 0.0
458
+ },
459
+ {
460
+ "episode_seed": 170243,
461
+ "success": false,
462
+ "steps": 4,
463
+ "first_reveal_step": 1,
464
+ "first_retrieve_step": null,
465
+ "episode_disturbance": 0.25
466
+ }
467
+ ],
468
+ "eval_protocol": {
469
+ "track_id": "cloth_track",
470
+ "suite": "maniskill3",
471
+ "benchmark_task": "PutSpoonUnderClothRetrievalProxy-v1",
472
+ "role": "target",
473
+ "eval_mode": "adapter_noop",
474
+ "seed": 17,
475
+ "episodes": 50,
476
+ "resolution": 224,
477
+ "cameras": [
478
+ "front",
479
+ "left",
480
+ "right"
481
+ ],
482
+ "observation_stack": "rgb_triplicate_zero_depth",
483
+ "action_horizon": 8,
484
+ "action_space": "widowx_delta_pose",
485
+ "same_test_episodes": true
486
+ },
487
+ "proxy_notes": "Public ManiSkill bridge scene with custom retrieval initialization. The spoon is placed under the cloth region and must be revealed and extracted to the open side of the table."
488
+ }
reports/maniskill_cloth_bridge_smoke_v1/adapter_noop_seed23.json ADDED
@@ -0,0 +1,488 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "track_id": "cloth_track",
3
+ "suite": "maniskill3",
4
+ "benchmark_task": "PutSpoonUnderClothRetrievalProxy-v1",
5
+ "role": "target",
6
+ "adapter_mode": "adapter_noop",
7
+ "episodes": 50,
8
+ "successes": [
9
+ 0,
10
+ 0,
11
+ 0,
12
+ 0,
13
+ 0,
14
+ 0,
15
+ 0,
16
+ 0,
17
+ 0,
18
+ 0,
19
+ 0,
20
+ 0,
21
+ 0,
22
+ 0,
23
+ 0,
24
+ 0,
25
+ 0,
26
+ 0,
27
+ 0,
28
+ 0,
29
+ 0,
30
+ 1,
31
+ 0,
32
+ 0,
33
+ 0,
34
+ 0,
35
+ 0,
36
+ 0,
37
+ 0,
38
+ 0,
39
+ 0,
40
+ 0,
41
+ 0,
42
+ 0,
43
+ 0,
44
+ 0,
45
+ 0,
46
+ 0,
47
+ 0,
48
+ 0,
49
+ 0,
50
+ 0,
51
+ 0,
52
+ 0,
53
+ 0,
54
+ 0,
55
+ 0,
56
+ 0,
57
+ 0,
58
+ 0
59
+ ],
60
+ "success_rate": 0.02,
61
+ "intervention_rate": 0.0,
62
+ "non_base_selection_rate": 0.0,
63
+ "steps_to_first_reveal_or_access": 1.0,
64
+ "steps_to_retrieve": 4.0,
65
+ "disturbance_proxy": 0.12309578397444318,
66
+ "episode_records": [
67
+ {
68
+ "episode_seed": 170104,
69
+ "success": false,
70
+ "steps": 4,
71
+ "first_reveal_step": 1,
72
+ "first_retrieve_step": null,
73
+ "episode_disturbance": 0.25
74
+ },
75
+ {
76
+ "episode_seed": 170105,
77
+ "success": false,
78
+ "steps": 4,
79
+ "first_reveal_step": 1,
80
+ "first_retrieve_step": null,
81
+ "episode_disturbance": 0.0
82
+ },
83
+ {
84
+ "episode_seed": 170106,
85
+ "success": false,
86
+ "steps": 4,
87
+ "first_reveal_step": 1,
88
+ "first_retrieve_step": null,
89
+ "episode_disturbance": 0.25
90
+ },
91
+ {
92
+ "episode_seed": 170107,
93
+ "success": false,
94
+ "steps": 4,
95
+ "first_reveal_step": 1,
96
+ "first_retrieve_step": null,
97
+ "episode_disturbance": 0.12488718117986407
98
+ },
99
+ {
100
+ "episode_seed": 170109,
101
+ "success": false,
102
+ "steps": 4,
103
+ "first_reveal_step": 1,
104
+ "first_retrieve_step": null,
105
+ "episode_disturbance": 0.25
106
+ },
107
+ {
108
+ "episode_seed": 170113,
109
+ "success": false,
110
+ "steps": 4,
111
+ "first_reveal_step": 1,
112
+ "first_retrieve_step": null,
113
+ "episode_disturbance": 0.25
114
+ },
115
+ {
116
+ "episode_seed": 170117,
117
+ "success": false,
118
+ "steps": 4,
119
+ "first_reveal_step": 1,
120
+ "first_retrieve_step": null,
121
+ "episode_disturbance": 0.25
122
+ },
123
+ {
124
+ "episode_seed": 170121,
125
+ "success": false,
126
+ "steps": 4,
127
+ "first_reveal_step": 1,
128
+ "first_retrieve_step": null,
129
+ "episode_disturbance": 0.0
130
+ },
131
+ {
132
+ "episode_seed": 170124,
133
+ "success": false,
134
+ "steps": 4,
135
+ "first_reveal_step": 1,
136
+ "first_retrieve_step": null,
137
+ "episode_disturbance": 0.0
138
+ },
139
+ {
140
+ "episode_seed": 170125,
141
+ "success": false,
142
+ "steps": 4,
143
+ "first_reveal_step": 1,
144
+ "first_retrieve_step": null,
145
+ "episode_disturbance": 0.0
146
+ },
147
+ {
148
+ "episode_seed": 170129,
149
+ "success": false,
150
+ "steps": 4,
151
+ "first_reveal_step": 1,
152
+ "first_retrieve_step": null,
153
+ "episode_disturbance": 0.0
154
+ },
155
+ {
156
+ "episode_seed": 170131,
157
+ "success": false,
158
+ "steps": 4,
159
+ "first_reveal_step": 1,
160
+ "first_retrieve_step": null,
161
+ "episode_disturbance": 0.0
162
+ },
163
+ {
164
+ "episode_seed": 170137,
165
+ "success": false,
166
+ "steps": 4,
167
+ "first_reveal_step": 1,
168
+ "first_retrieve_step": null,
169
+ "episode_disturbance": 0.0
170
+ },
171
+ {
172
+ "episode_seed": 170138,
173
+ "success": false,
174
+ "steps": 4,
175
+ "first_reveal_step": 1,
176
+ "first_retrieve_step": null,
177
+ "episode_disturbance": 0.25
178
+ },
179
+ {
180
+ "episode_seed": 170139,
181
+ "success": false,
182
+ "steps": 4,
183
+ "first_reveal_step": 1,
184
+ "first_retrieve_step": null,
185
+ "episode_disturbance": 0.0
186
+ },
187
+ {
188
+ "episode_seed": 170140,
189
+ "success": false,
190
+ "steps": 4,
191
+ "first_reveal_step": 1,
192
+ "first_retrieve_step": null,
193
+ "episode_disturbance": 0.0
194
+ },
195
+ {
196
+ "episode_seed": 170145,
197
+ "success": false,
198
+ "steps": 4,
199
+ "first_reveal_step": 1,
200
+ "first_retrieve_step": null,
201
+ "episode_disturbance": 0.25
202
+ },
203
+ {
204
+ "episode_seed": 170150,
205
+ "success": false,
206
+ "steps": 4,
207
+ "first_reveal_step": 1,
208
+ "first_retrieve_step": null,
209
+ "episode_disturbance": 0.0
210
+ },
211
+ {
212
+ "episode_seed": 170151,
213
+ "success": false,
214
+ "steps": 4,
215
+ "first_reveal_step": 1,
216
+ "first_retrieve_step": null,
217
+ "episode_disturbance": 0.0
218
+ },
219
+ {
220
+ "episode_seed": 170153,
221
+ "success": false,
222
+ "steps": 4,
223
+ "first_reveal_step": 1,
224
+ "first_retrieve_step": null,
225
+ "episode_disturbance": 0.0
226
+ },
227
+ {
228
+ "episode_seed": 170154,
229
+ "success": false,
230
+ "steps": 4,
231
+ "first_reveal_step": 1,
232
+ "first_retrieve_step": null,
233
+ "episode_disturbance": 0.0
234
+ },
235
+ {
236
+ "episode_seed": 170155,
237
+ "success": true,
238
+ "steps": 2,
239
+ "first_reveal_step": 1,
240
+ "first_retrieve_step": null,
241
+ "episode_disturbance": 0.3782343992165157
242
+ },
243
+ {
244
+ "episode_seed": 170166,
245
+ "success": false,
246
+ "steps": 4,
247
+ "first_reveal_step": 1,
248
+ "first_retrieve_step": null,
249
+ "episode_disturbance": 0.0
250
+ },
251
+ {
252
+ "episode_seed": 170171,
253
+ "success": false,
254
+ "steps": 4,
255
+ "first_reveal_step": 1,
256
+ "first_retrieve_step": null,
257
+ "episode_disturbance": 0.25
258
+ },
259
+ {
260
+ "episode_seed": 170173,
261
+ "success": false,
262
+ "steps": 4,
263
+ "first_reveal_step": 1,
264
+ "first_retrieve_step": null,
265
+ "episode_disturbance": 0.25
266
+ },
267
+ {
268
+ "episode_seed": 170175,
269
+ "success": false,
270
+ "steps": 4,
271
+ "first_reveal_step": 1,
272
+ "first_retrieve_step": null,
273
+ "episode_disturbance": 0.0
274
+ },
275
+ {
276
+ "episode_seed": 170177,
277
+ "success": false,
278
+ "steps": 4,
279
+ "first_reveal_step": 1,
280
+ "first_retrieve_step": null,
281
+ "episode_disturbance": 0.25
282
+ },
283
+ {
284
+ "episode_seed": 170180,
285
+ "success": false,
286
+ "steps": 4,
287
+ "first_reveal_step": 1,
288
+ "first_retrieve_step": null,
289
+ "episode_disturbance": 0.25
290
+ },
291
+ {
292
+ "episode_seed": 170181,
293
+ "success": false,
294
+ "steps": 4,
295
+ "first_reveal_step": 1,
296
+ "first_retrieve_step": null,
297
+ "episode_disturbance": 0.25
298
+ },
299
+ {
300
+ "episode_seed": 170184,
301
+ "success": false,
302
+ "steps": 4,
303
+ "first_reveal_step": 1,
304
+ "first_retrieve_step": null,
305
+ "episode_disturbance": 0.25
306
+ },
307
+ {
308
+ "episode_seed": 170185,
309
+ "success": false,
310
+ "steps": 4,
311
+ "first_reveal_step": 1,
312
+ "first_retrieve_step": null,
313
+ "episode_disturbance": 0.25
314
+ },
315
+ {
316
+ "episode_seed": 170186,
317
+ "success": false,
318
+ "steps": 4,
319
+ "first_reveal_step": 1,
320
+ "first_retrieve_step": null,
321
+ "episode_disturbance": 0.0
322
+ },
323
+ {
324
+ "episode_seed": 170198,
325
+ "success": false,
326
+ "steps": 4,
327
+ "first_reveal_step": 1,
328
+ "first_retrieve_step": null,
329
+ "episode_disturbance": 0.0
330
+ },
331
+ {
332
+ "episode_seed": 170200,
333
+ "success": false,
334
+ "steps": 4,
335
+ "first_reveal_step": 1,
336
+ "first_retrieve_step": null,
337
+ "episode_disturbance": 0.25
338
+ },
339
+ {
340
+ "episode_seed": 170205,
341
+ "success": false,
342
+ "steps": 4,
343
+ "first_reveal_step": 1,
344
+ "first_retrieve_step": null,
345
+ "episode_disturbance": 0.25
346
+ },
347
+ {
348
+ "episode_seed": 170207,
349
+ "success": false,
350
+ "steps": 4,
351
+ "first_reveal_step": 1,
352
+ "first_retrieve_step": null,
353
+ "episode_disturbance": 0.25
354
+ },
355
+ {
356
+ "episode_seed": 170208,
357
+ "success": false,
358
+ "steps": 4,
359
+ "first_reveal_step": 1,
360
+ "first_retrieve_step": null,
361
+ "episode_disturbance": 0.25
362
+ },
363
+ {
364
+ "episode_seed": 170212,
365
+ "success": false,
366
+ "steps": 4,
367
+ "first_reveal_step": 1,
368
+ "first_retrieve_step": null,
369
+ "episode_disturbance": 0.046899239931787774
370
+ },
371
+ {
372
+ "episode_seed": 170214,
373
+ "success": false,
374
+ "steps": 4,
375
+ "first_reveal_step": 1,
376
+ "first_retrieve_step": null,
377
+ "episode_disturbance": 0.0
378
+ },
379
+ {
380
+ "episode_seed": 170217,
381
+ "success": false,
382
+ "steps": 4,
383
+ "first_reveal_step": 1,
384
+ "first_retrieve_step": null,
385
+ "episode_disturbance": 0.10476837839399065
386
+ },
387
+ {
388
+ "episode_seed": 170223,
389
+ "success": false,
390
+ "steps": 4,
391
+ "first_reveal_step": 1,
392
+ "first_retrieve_step": null,
393
+ "episode_disturbance": 0.0
394
+ },
395
+ {
396
+ "episode_seed": 170226,
397
+ "success": false,
398
+ "steps": 4,
399
+ "first_reveal_step": 1,
400
+ "first_retrieve_step": null,
401
+ "episode_disturbance": 0.0
402
+ },
403
+ {
404
+ "episode_seed": 170228,
405
+ "success": false,
406
+ "steps": 4,
407
+ "first_reveal_step": 1,
408
+ "first_retrieve_step": null,
409
+ "episode_disturbance": 0.0
410
+ },
411
+ {
412
+ "episode_seed": 170229,
413
+ "success": false,
414
+ "steps": 4,
415
+ "first_reveal_step": 1,
416
+ "first_retrieve_step": null,
417
+ "episode_disturbance": 0.0
418
+ },
419
+ {
420
+ "episode_seed": 170234,
421
+ "success": false,
422
+ "steps": 4,
423
+ "first_reveal_step": 1,
424
+ "first_retrieve_step": null,
425
+ "episode_disturbance": 0.0
426
+ },
427
+ {
428
+ "episode_seed": 170237,
429
+ "success": false,
430
+ "steps": 4,
431
+ "first_reveal_step": 1,
432
+ "first_retrieve_step": null,
433
+ "episode_disturbance": 0.25
434
+ },
435
+ {
436
+ "episode_seed": 170239,
437
+ "success": false,
438
+ "steps": 4,
439
+ "first_reveal_step": 1,
440
+ "first_retrieve_step": null,
441
+ "episode_disturbance": 0.0
442
+ },
443
+ {
444
+ "episode_seed": 170241,
445
+ "success": false,
446
+ "steps": 4,
447
+ "first_reveal_step": 1,
448
+ "first_retrieve_step": null,
449
+ "episode_disturbance": 0.25
450
+ },
451
+ {
452
+ "episode_seed": 170242,
453
+ "success": false,
454
+ "steps": 4,
455
+ "first_reveal_step": 1,
456
+ "first_retrieve_step": null,
457
+ "episode_disturbance": 0.25
458
+ },
459
+ {
460
+ "episode_seed": 170243,
461
+ "success": false,
462
+ "steps": 4,
463
+ "first_reveal_step": 1,
464
+ "first_retrieve_step": null,
465
+ "episode_disturbance": 0.25
466
+ }
467
+ ],
468
+ "eval_protocol": {
469
+ "track_id": "cloth_track",
470
+ "suite": "maniskill3",
471
+ "benchmark_task": "PutSpoonUnderClothRetrievalProxy-v1",
472
+ "role": "target",
473
+ "eval_mode": "adapter_noop",
474
+ "seed": 17,
475
+ "episodes": 50,
476
+ "resolution": 224,
477
+ "cameras": [
478
+ "front",
479
+ "left",
480
+ "right"
481
+ ],
482
+ "observation_stack": "rgb_triplicate_zero_depth",
483
+ "action_horizon": 8,
484
+ "action_space": "widowx_delta_pose",
485
+ "same_test_episodes": true
486
+ },
487
+ "proxy_notes": "Public ManiSkill bridge scene with custom retrieval initialization. The spoon is placed under the cloth region and must be revealed and extracted to the open side of the table."
488
+ }
reports/maniskill_cloth_bridge_smoke_v1/adapter_noop_seed29.json ADDED
@@ -0,0 +1,488 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "track_id": "cloth_track",
3
+ "suite": "maniskill3",
4
+ "benchmark_task": "PutSpoonUnderClothRetrievalProxy-v1",
5
+ "role": "target",
6
+ "adapter_mode": "adapter_noop",
7
+ "episodes": 50,
8
+ "successes": [
9
+ 0,
10
+ 1,
11
+ 0,
12
+ 0,
13
+ 0,
14
+ 0,
15
+ 0,
16
+ 0,
17
+ 0,
18
+ 0,
19
+ 0,
20
+ 0,
21
+ 0,
22
+ 0,
23
+ 0,
24
+ 0,
25
+ 0,
26
+ 0,
27
+ 0,
28
+ 0,
29
+ 0,
30
+ 0,
31
+ 0,
32
+ 0,
33
+ 0,
34
+ 0,
35
+ 0,
36
+ 0,
37
+ 0,
38
+ 1,
39
+ 0,
40
+ 0,
41
+ 0,
42
+ 0,
43
+ 0,
44
+ 0,
45
+ 0,
46
+ 0,
47
+ 0,
48
+ 0,
49
+ 0,
50
+ 0,
51
+ 0,
52
+ 0,
53
+ 0,
54
+ 0,
55
+ 0,
56
+ 0,
57
+ 0,
58
+ 0
59
+ ],
60
+ "success_rate": 0.04,
61
+ "intervention_rate": 0.0,
62
+ "non_base_selection_rate": 0.0,
63
+ "steps_to_first_reveal_or_access": 1.0,
64
+ "steps_to_retrieve": 4.0,
65
+ "disturbance_proxy": 0.1478596130013466,
66
+ "episode_records": [
67
+ {
68
+ "episode_seed": 170104,
69
+ "success": false,
70
+ "steps": 4,
71
+ "first_reveal_step": 1,
72
+ "first_retrieve_step": null,
73
+ "episode_disturbance": 0.0
74
+ },
75
+ {
76
+ "episode_seed": 170105,
77
+ "success": true,
78
+ "steps": 1,
79
+ "first_reveal_step": 1,
80
+ "first_retrieve_step": null,
81
+ "episode_disturbance": 1.0
82
+ },
83
+ {
84
+ "episode_seed": 170106,
85
+ "success": false,
86
+ "steps": 4,
87
+ "first_reveal_step": 1,
88
+ "first_retrieve_step": null,
89
+ "episode_disturbance": 0.25
90
+ },
91
+ {
92
+ "episode_seed": 170107,
93
+ "success": false,
94
+ "steps": 4,
95
+ "first_reveal_step": 1,
96
+ "first_retrieve_step": null,
97
+ "episode_disturbance": 0.0
98
+ },
99
+ {
100
+ "episode_seed": 170109,
101
+ "success": false,
102
+ "steps": 4,
103
+ "first_reveal_step": 1,
104
+ "first_retrieve_step": null,
105
+ "episode_disturbance": 0.25
106
+ },
107
+ {
108
+ "episode_seed": 170113,
109
+ "success": false,
110
+ "steps": 4,
111
+ "first_reveal_step": 1,
112
+ "first_retrieve_step": null,
113
+ "episode_disturbance": 0.0
114
+ },
115
+ {
116
+ "episode_seed": 170117,
117
+ "success": false,
118
+ "steps": 4,
119
+ "first_reveal_step": 1,
120
+ "first_retrieve_step": null,
121
+ "episode_disturbance": 0.25
122
+ },
123
+ {
124
+ "episode_seed": 170121,
125
+ "success": false,
126
+ "steps": 4,
127
+ "first_reveal_step": 1,
128
+ "first_retrieve_step": null,
129
+ "episode_disturbance": 0.25
130
+ },
131
+ {
132
+ "episode_seed": 170124,
133
+ "success": false,
134
+ "steps": 4,
135
+ "first_reveal_step": 1,
136
+ "first_retrieve_step": null,
137
+ "episode_disturbance": 0.25
138
+ },
139
+ {
140
+ "episode_seed": 170125,
141
+ "success": false,
142
+ "steps": 4,
143
+ "first_reveal_step": 1,
144
+ "first_retrieve_step": null,
145
+ "episode_disturbance": 0.0
146
+ },
147
+ {
148
+ "episode_seed": 170129,
149
+ "success": false,
150
+ "steps": 4,
151
+ "first_reveal_step": 1,
152
+ "first_retrieve_step": null,
153
+ "episode_disturbance": 0.0
154
+ },
155
+ {
156
+ "episode_seed": 170131,
157
+ "success": false,
158
+ "steps": 4,
159
+ "first_reveal_step": 1,
160
+ "first_retrieve_step": null,
161
+ "episode_disturbance": 0.0
162
+ },
163
+ {
164
+ "episode_seed": 170137,
165
+ "success": false,
166
+ "steps": 4,
167
+ "first_reveal_step": 1,
168
+ "first_retrieve_step": null,
169
+ "episode_disturbance": 0.25
170
+ },
171
+ {
172
+ "episode_seed": 170138,
173
+ "success": false,
174
+ "steps": 4,
175
+ "first_reveal_step": 1,
176
+ "first_retrieve_step": null,
177
+ "episode_disturbance": 0.25
178
+ },
179
+ {
180
+ "episode_seed": 170139,
181
+ "success": false,
182
+ "steps": 4,
183
+ "first_reveal_step": 1,
184
+ "first_retrieve_step": null,
185
+ "episode_disturbance": 0.25
186
+ },
187
+ {
188
+ "episode_seed": 170140,
189
+ "success": false,
190
+ "steps": 4,
191
+ "first_reveal_step": 1,
192
+ "first_retrieve_step": null,
193
+ "episode_disturbance": 0.25
194
+ },
195
+ {
196
+ "episode_seed": 170145,
197
+ "success": false,
198
+ "steps": 4,
199
+ "first_reveal_step": 1,
200
+ "first_retrieve_step": null,
201
+ "episode_disturbance": 0.0
202
+ },
203
+ {
204
+ "episode_seed": 170150,
205
+ "success": false,
206
+ "steps": 4,
207
+ "first_reveal_step": 1,
208
+ "first_retrieve_step": null,
209
+ "episode_disturbance": 0.25
210
+ },
211
+ {
212
+ "episode_seed": 170151,
213
+ "success": false,
214
+ "steps": 4,
215
+ "first_reveal_step": 1,
216
+ "first_retrieve_step": null,
217
+ "episode_disturbance": 0.0
218
+ },
219
+ {
220
+ "episode_seed": 170153,
221
+ "success": false,
222
+ "steps": 4,
223
+ "first_reveal_step": 1,
224
+ "first_retrieve_step": null,
225
+ "episode_disturbance": 0.25
226
+ },
227
+ {
228
+ "episode_seed": 170154,
229
+ "success": false,
230
+ "steps": 4,
231
+ "first_reveal_step": 1,
232
+ "first_retrieve_step": null,
233
+ "episode_disturbance": 0.25
234
+ },
235
+ {
236
+ "episode_seed": 170155,
237
+ "success": false,
238
+ "steps": 4,
239
+ "first_reveal_step": 1,
240
+ "first_retrieve_step": null,
241
+ "episode_disturbance": 0.25
242
+ },
243
+ {
244
+ "episode_seed": 170166,
245
+ "success": false,
246
+ "steps": 4,
247
+ "first_reveal_step": 1,
248
+ "first_retrieve_step": null,
249
+ "episode_disturbance": 0.0
250
+ },
251
+ {
252
+ "episode_seed": 170171,
253
+ "success": false,
254
+ "steps": 4,
255
+ "first_reveal_step": 1,
256
+ "first_retrieve_step": null,
257
+ "episode_disturbance": 0.25
258
+ },
259
+ {
260
+ "episode_seed": 170173,
261
+ "success": false,
262
+ "steps": 4,
263
+ "first_reveal_step": 1,
264
+ "first_retrieve_step": null,
265
+ "episode_disturbance": 0.0
266
+ },
267
+ {
268
+ "episode_seed": 170175,
269
+ "success": false,
270
+ "steps": 4,
271
+ "first_reveal_step": 1,
272
+ "first_retrieve_step": null,
273
+ "episode_disturbance": 0.0
274
+ },
275
+ {
276
+ "episode_seed": 170177,
277
+ "success": false,
278
+ "steps": 4,
279
+ "first_reveal_step": 1,
280
+ "first_retrieve_step": null,
281
+ "episode_disturbance": 0.0
282
+ },
283
+ {
284
+ "episode_seed": 170180,
285
+ "success": false,
286
+ "steps": 4,
287
+ "first_reveal_step": 1,
288
+ "first_retrieve_step": null,
289
+ "episode_disturbance": 0.25
290
+ },
291
+ {
292
+ "episode_seed": 170181,
293
+ "success": false,
294
+ "steps": 4,
295
+ "first_reveal_step": 1,
296
+ "first_retrieve_step": null,
297
+ "episode_disturbance": 0.25
298
+ },
299
+ {
300
+ "episode_seed": 170184,
301
+ "success": true,
302
+ "steps": 2,
303
+ "first_reveal_step": 1,
304
+ "first_retrieve_step": null,
305
+ "episode_disturbance": 0.5
306
+ },
307
+ {
308
+ "episode_seed": 170185,
309
+ "success": false,
310
+ "steps": 4,
311
+ "first_reveal_step": 1,
312
+ "first_retrieve_step": null,
313
+ "episode_disturbance": 0.25
314
+ },
315
+ {
316
+ "episode_seed": 170186,
317
+ "success": false,
318
+ "steps": 4,
319
+ "first_reveal_step": 1,
320
+ "first_retrieve_step": null,
321
+ "episode_disturbance": 0.0
322
+ },
323
+ {
324
+ "episode_seed": 170198,
325
+ "success": false,
326
+ "steps": 4,
327
+ "first_reveal_step": 1,
328
+ "first_retrieve_step": null,
329
+ "episode_disturbance": 0.0
330
+ },
331
+ {
332
+ "episode_seed": 170200,
333
+ "success": false,
334
+ "steps": 4,
335
+ "first_reveal_step": 1,
336
+ "first_retrieve_step": null,
337
+ "episode_disturbance": 0.0
338
+ },
339
+ {
340
+ "episode_seed": 170205,
341
+ "success": false,
342
+ "steps": 4,
343
+ "first_reveal_step": 1,
344
+ "first_retrieve_step": null,
345
+ "episode_disturbance": 0.0
346
+ },
347
+ {
348
+ "episode_seed": 170207,
349
+ "success": false,
350
+ "steps": 4,
351
+ "first_reveal_step": 1,
352
+ "first_retrieve_step": null,
353
+ "episode_disturbance": 0.25
354
+ },
355
+ {
356
+ "episode_seed": 170208,
357
+ "success": false,
358
+ "steps": 4,
359
+ "first_reveal_step": 1,
360
+ "first_retrieve_step": null,
361
+ "episode_disturbance": 0.25
362
+ },
363
+ {
364
+ "episode_seed": 170212,
365
+ "success": false,
366
+ "steps": 4,
367
+ "first_reveal_step": 1,
368
+ "first_retrieve_step": null,
369
+ "episode_disturbance": 0.25
370
+ },
371
+ {
372
+ "episode_seed": 170214,
373
+ "success": false,
374
+ "steps": 4,
375
+ "first_reveal_step": 1,
376
+ "first_retrieve_step": null,
377
+ "episode_disturbance": 0.0
378
+ },
379
+ {
380
+ "episode_seed": 170217,
381
+ "success": false,
382
+ "steps": 4,
383
+ "first_reveal_step": 1,
384
+ "first_retrieve_step": null,
385
+ "episode_disturbance": 0.0
386
+ },
387
+ {
388
+ "episode_seed": 170223,
389
+ "success": false,
390
+ "steps": 4,
391
+ "first_reveal_step": 1,
392
+ "first_retrieve_step": null,
393
+ "episode_disturbance": 0.1429806500673294
394
+ },
395
+ {
396
+ "episode_seed": 170226,
397
+ "success": false,
398
+ "steps": 4,
399
+ "first_reveal_step": 1,
400
+ "first_retrieve_step": null,
401
+ "episode_disturbance": 0.25
402
+ },
403
+ {
404
+ "episode_seed": 170228,
405
+ "success": false,
406
+ "steps": 4,
407
+ "first_reveal_step": 1,
408
+ "first_retrieve_step": null,
409
+ "episode_disturbance": 0.0
410
+ },
411
+ {
412
+ "episode_seed": 170229,
413
+ "success": false,
414
+ "steps": 4,
415
+ "first_reveal_step": 1,
416
+ "first_retrieve_step": null,
417
+ "episode_disturbance": 0.0
418
+ },
419
+ {
420
+ "episode_seed": 170234,
421
+ "success": false,
422
+ "steps": 4,
423
+ "first_reveal_step": 1,
424
+ "first_retrieve_step": null,
425
+ "episode_disturbance": 0.0
426
+ },
427
+ {
428
+ "episode_seed": 170237,
429
+ "success": false,
430
+ "steps": 4,
431
+ "first_reveal_step": 1,
432
+ "first_retrieve_step": null,
433
+ "episode_disturbance": 0.0
434
+ },
435
+ {
436
+ "episode_seed": 170239,
437
+ "success": false,
438
+ "steps": 4,
439
+ "first_reveal_step": 1,
440
+ "first_retrieve_step": null,
441
+ "episode_disturbance": 0.25
442
+ },
443
+ {
444
+ "episode_seed": 170241,
445
+ "success": false,
446
+ "steps": 4,
447
+ "first_reveal_step": 1,
448
+ "first_retrieve_step": null,
449
+ "episode_disturbance": 0.0
450
+ },
451
+ {
452
+ "episode_seed": 170242,
453
+ "success": false,
454
+ "steps": 4,
455
+ "first_reveal_step": 1,
456
+ "first_retrieve_step": null,
457
+ "episode_disturbance": 0.0
458
+ },
459
+ {
460
+ "episode_seed": 170243,
461
+ "success": false,
462
+ "steps": 4,
463
+ "first_reveal_step": 1,
464
+ "first_retrieve_step": null,
465
+ "episode_disturbance": 0.25
466
+ }
467
+ ],
468
+ "eval_protocol": {
469
+ "track_id": "cloth_track",
470
+ "suite": "maniskill3",
471
+ "benchmark_task": "PutSpoonUnderClothRetrievalProxy-v1",
472
+ "role": "target",
473
+ "eval_mode": "adapter_noop",
474
+ "seed": 17,
475
+ "episodes": 50,
476
+ "resolution": 224,
477
+ "cameras": [
478
+ "front",
479
+ "left",
480
+ "right"
481
+ ],
482
+ "observation_stack": "rgb_triplicate_zero_depth",
483
+ "action_horizon": 8,
484
+ "action_space": "widowx_delta_pose",
485
+ "same_test_episodes": true
486
+ },
487
+ "proxy_notes": "Public ManiSkill bridge scene with custom retrieval initialization. The spoon is placed under the cloth region and must be revealed and extracted to the open side of the table."
488
+ }
reports/maniskill_cloth_bridge_smoke_v1/public_benchmark_package_summary.json ADDED
@@ -0,0 +1,60 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "anchor_pass": true,
3
+ "available_tracks": [
4
+ "cloth_track"
5
+ ],
6
+ "ci_above_zero_tracks": [],
7
+ "headline_pass": false,
8
+ "package_name": "public_reveal_retrieve_package_v1",
9
+ "sign_of_life_pass": false,
10
+ "sign_of_life_track_count": 0,
11
+ "sign_of_life_tracks": [],
12
+ "target_macro_average_delta": 0.0,
13
+ "tracks": {
14
+ "cloth_track": {
15
+ "benchmark_task": "PutSpoonUnderClothRetrievalProxy-v1",
16
+ "delta_active_vs_trunk": 0.0,
17
+ "delta_active_vs_trunk_ci95": [
18
+ -0.07999999821186066,
19
+ 0.07999999821186066
20
+ ],
21
+ "delta_noop_vs_trunk": 0.0,
22
+ "modes": {
23
+ "adapter_active_ft": {
24
+ "disturbance_proxy": 0.1478596130013466,
25
+ "intervention_rate": 0.0,
26
+ "mean_success": 0.03999999910593033,
27
+ "non_base_selection_rate": 0.0,
28
+ "num_runs": 1,
29
+ "steps_to_first_reveal_or_access": 1.0,
30
+ "steps_to_retrieve": 4.0
31
+ },
32
+ "adapter_noop": {
33
+ "disturbance_proxy": 0.1478596130013466,
34
+ "intervention_rate": 0.0,
35
+ "mean_success": 0.03999999910593033,
36
+ "non_base_selection_rate": 0.0,
37
+ "num_runs": 1,
38
+ "steps_to_first_reveal_or_access": 1.0,
39
+ "steps_to_retrieve": 4.0
40
+ },
41
+ "trunk_only_ft": {
42
+ "disturbance_proxy": 0.1478596130013466,
43
+ "intervention_rate": 0.0,
44
+ "mean_success": 0.03999999910593033,
45
+ "non_base_selection_rate": 0.0,
46
+ "num_runs": 1,
47
+ "steps_to_first_reveal_or_access": 1.0,
48
+ "steps_to_retrieve": 4.0
49
+ }
50
+ },
51
+ "notes": "Public ManiSkill bridge scene with custom retrieval initialization. The spoon is placed under the cloth region and must be revealed and extracted to the open side of the table.",
52
+ "public_source": "ManiSkill public scene proxy: PutSpoonOnTableClothInScene-v1",
53
+ "role": "target",
54
+ "signs_of_life": false,
55
+ "suite": "maniskill3",
56
+ "target_behavior": "reveal the spoon from under the cloth and retrieve it to the open area",
57
+ "task_family": "cloth_retrieval_proxy"
58
+ }
59
+ }
60
+ }
reports/maniskill_cloth_bridge_smoke_v1/public_benchmark_package_summary.md ADDED
@@ -0,0 +1,15 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ # ManiSkill Cloth Retrieval Smoke Summary
2
+
3
+ - benchmark_task: PutSpoonUnderClothRetrievalProxy-v1
4
+ - target_macro_average_delta: 0.000
5
+ - headline_pass: False
6
+ - sign_of_life_pass: False
7
+
8
+ ## cloth_track
9
+ - delta_active_vs_trunk: 0.000
10
+ - delta_noop_vs_trunk: 0.000
11
+ - signs_of_life: False
12
+ - delta_active_vs_trunk_ci95: [-0.080, 0.080]
13
+ - trunk_only_ft: mean_success=0.040
14
+ - adapter_noop: mean_success=0.040
15
+ - adapter_active_ft: mean_success=0.040
reports/maniskill_cloth_bridge_smoke_v1/trunk_only_ft_seed17.json ADDED
@@ -0,0 +1,509 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "track_id": "cloth_track",
3
+ "suite": "maniskill3",
4
+ "benchmark_task": "PutSpoonUnderClothRetrievalProxy-v1",
5
+ "role": "target",
6
+ "adapter_mode": "trunk_only_ft",
7
+ "episodes": 50,
8
+ "successes": [
9
+ 0,
10
+ 1,
11
+ 0,
12
+ 0,
13
+ 0,
14
+ 0,
15
+ 0,
16
+ 0,
17
+ 0,
18
+ 0,
19
+ 0,
20
+ 0,
21
+ 0,
22
+ 0,
23
+ 0,
24
+ 0,
25
+ 0,
26
+ 0,
27
+ 0,
28
+ 0,
29
+ 0,
30
+ 0,
31
+ 0,
32
+ 0,
33
+ 0,
34
+ 0,
35
+ 0,
36
+ 0,
37
+ 0,
38
+ 1,
39
+ 0,
40
+ 0,
41
+ 0,
42
+ 0,
43
+ 0,
44
+ 0,
45
+ 0,
46
+ 0,
47
+ 0,
48
+ 0,
49
+ 0,
50
+ 0,
51
+ 0,
52
+ 0,
53
+ 0,
54
+ 0,
55
+ 0,
56
+ 0,
57
+ 0,
58
+ 0
59
+ ],
60
+ "success_rate": 0.04,
61
+ "intervention_rate": 0.0,
62
+ "non_base_selection_rate": 0.0,
63
+ "steps_to_first_reveal_or_access": 1.0,
64
+ "steps_to_retrieve": 4.0,
65
+ "disturbance_proxy": 0.1478596130013466,
66
+ "episode_records": [
67
+ {
68
+ "episode_seed": 170104,
69
+ "success": false,
70
+ "steps": 4,
71
+ "first_reveal_step": 1,
72
+ "first_retrieve_step": null,
73
+ "episode_disturbance": 0.0
74
+ },
75
+ {
76
+ "episode_seed": 170105,
77
+ "success": true,
78
+ "steps": 1,
79
+ "first_reveal_step": 1,
80
+ "first_retrieve_step": null,
81
+ "episode_disturbance": 1.0
82
+ },
83
+ {
84
+ "episode_seed": 170106,
85
+ "success": false,
86
+ "steps": 4,
87
+ "first_reveal_step": 1,
88
+ "first_retrieve_step": null,
89
+ "episode_disturbance": 0.25
90
+ },
91
+ {
92
+ "episode_seed": 170107,
93
+ "success": false,
94
+ "steps": 4,
95
+ "first_reveal_step": 1,
96
+ "first_retrieve_step": null,
97
+ "episode_disturbance": 0.0
98
+ },
99
+ {
100
+ "episode_seed": 170109,
101
+ "success": false,
102
+ "steps": 4,
103
+ "first_reveal_step": 1,
104
+ "first_retrieve_step": null,
105
+ "episode_disturbance": 0.25
106
+ },
107
+ {
108
+ "episode_seed": 170113,
109
+ "success": false,
110
+ "steps": 4,
111
+ "first_reveal_step": 1,
112
+ "first_retrieve_step": null,
113
+ "episode_disturbance": 0.0
114
+ },
115
+ {
116
+ "episode_seed": 170117,
117
+ "success": false,
118
+ "steps": 4,
119
+ "first_reveal_step": 1,
120
+ "first_retrieve_step": null,
121
+ "episode_disturbance": 0.25
122
+ },
123
+ {
124
+ "episode_seed": 170121,
125
+ "success": false,
126
+ "steps": 4,
127
+ "first_reveal_step": 1,
128
+ "first_retrieve_step": null,
129
+ "episode_disturbance": 0.25
130
+ },
131
+ {
132
+ "episode_seed": 170124,
133
+ "success": false,
134
+ "steps": 4,
135
+ "first_reveal_step": 1,
136
+ "first_retrieve_step": null,
137
+ "episode_disturbance": 0.25
138
+ },
139
+ {
140
+ "episode_seed": 170125,
141
+ "success": false,
142
+ "steps": 4,
143
+ "first_reveal_step": 1,
144
+ "first_retrieve_step": null,
145
+ "episode_disturbance": 0.0
146
+ },
147
+ {
148
+ "episode_seed": 170129,
149
+ "success": false,
150
+ "steps": 4,
151
+ "first_reveal_step": 1,
152
+ "first_retrieve_step": null,
153
+ "episode_disturbance": 0.0
154
+ },
155
+ {
156
+ "episode_seed": 170131,
157
+ "success": false,
158
+ "steps": 4,
159
+ "first_reveal_step": 1,
160
+ "first_retrieve_step": null,
161
+ "episode_disturbance": 0.0
162
+ },
163
+ {
164
+ "episode_seed": 170137,
165
+ "success": false,
166
+ "steps": 4,
167
+ "first_reveal_step": 1,
168
+ "first_retrieve_step": null,
169
+ "episode_disturbance": 0.25
170
+ },
171
+ {
172
+ "episode_seed": 170138,
173
+ "success": false,
174
+ "steps": 4,
175
+ "first_reveal_step": 1,
176
+ "first_retrieve_step": null,
177
+ "episode_disturbance": 0.25
178
+ },
179
+ {
180
+ "episode_seed": 170139,
181
+ "success": false,
182
+ "steps": 4,
183
+ "first_reveal_step": 1,
184
+ "first_retrieve_step": null,
185
+ "episode_disturbance": 0.25
186
+ },
187
+ {
188
+ "episode_seed": 170140,
189
+ "success": false,
190
+ "steps": 4,
191
+ "first_reveal_step": 1,
192
+ "first_retrieve_step": null,
193
+ "episode_disturbance": 0.25
194
+ },
195
+ {
196
+ "episode_seed": 170145,
197
+ "success": false,
198
+ "steps": 4,
199
+ "first_reveal_step": 1,
200
+ "first_retrieve_step": null,
201
+ "episode_disturbance": 0.0
202
+ },
203
+ {
204
+ "episode_seed": 170150,
205
+ "success": false,
206
+ "steps": 4,
207
+ "first_reveal_step": 1,
208
+ "first_retrieve_step": null,
209
+ "episode_disturbance": 0.25
210
+ },
211
+ {
212
+ "episode_seed": 170151,
213
+ "success": false,
214
+ "steps": 4,
215
+ "first_reveal_step": 1,
216
+ "first_retrieve_step": null,
217
+ "episode_disturbance": 0.0
218
+ },
219
+ {
220
+ "episode_seed": 170153,
221
+ "success": false,
222
+ "steps": 4,
223
+ "first_reveal_step": 1,
224
+ "first_retrieve_step": null,
225
+ "episode_disturbance": 0.25
226
+ },
227
+ {
228
+ "episode_seed": 170154,
229
+ "success": false,
230
+ "steps": 4,
231
+ "first_reveal_step": 1,
232
+ "first_retrieve_step": null,
233
+ "episode_disturbance": 0.25
234
+ },
235
+ {
236
+ "episode_seed": 170155,
237
+ "success": false,
238
+ "steps": 4,
239
+ "first_reveal_step": 1,
240
+ "first_retrieve_step": null,
241
+ "episode_disturbance": 0.25
242
+ },
243
+ {
244
+ "episode_seed": 170166,
245
+ "success": false,
246
+ "steps": 4,
247
+ "first_reveal_step": 1,
248
+ "first_retrieve_step": null,
249
+ "episode_disturbance": 0.0
250
+ },
251
+ {
252
+ "episode_seed": 170171,
253
+ "success": false,
254
+ "steps": 4,
255
+ "first_reveal_step": 1,
256
+ "first_retrieve_step": null,
257
+ "episode_disturbance": 0.25
258
+ },
259
+ {
260
+ "episode_seed": 170173,
261
+ "success": false,
262
+ "steps": 4,
263
+ "first_reveal_step": 1,
264
+ "first_retrieve_step": null,
265
+ "episode_disturbance": 0.0
266
+ },
267
+ {
268
+ "episode_seed": 170175,
269
+ "success": false,
270
+ "steps": 4,
271
+ "first_reveal_step": 1,
272
+ "first_retrieve_step": null,
273
+ "episode_disturbance": 0.0
274
+ },
275
+ {
276
+ "episode_seed": 170177,
277
+ "success": false,
278
+ "steps": 4,
279
+ "first_reveal_step": 1,
280
+ "first_retrieve_step": null,
281
+ "episode_disturbance": 0.0
282
+ },
283
+ {
284
+ "episode_seed": 170180,
285
+ "success": false,
286
+ "steps": 4,
287
+ "first_reveal_step": 1,
288
+ "first_retrieve_step": null,
289
+ "episode_disturbance": 0.25
290
+ },
291
+ {
292
+ "episode_seed": 170181,
293
+ "success": false,
294
+ "steps": 4,
295
+ "first_reveal_step": 1,
296
+ "first_retrieve_step": null,
297
+ "episode_disturbance": 0.25
298
+ },
299
+ {
300
+ "episode_seed": 170184,
301
+ "success": true,
302
+ "steps": 2,
303
+ "first_reveal_step": 1,
304
+ "first_retrieve_step": null,
305
+ "episode_disturbance": 0.5
306
+ },
307
+ {
308
+ "episode_seed": 170185,
309
+ "success": false,
310
+ "steps": 4,
311
+ "first_reveal_step": 1,
312
+ "first_retrieve_step": null,
313
+ "episode_disturbance": 0.25
314
+ },
315
+ {
316
+ "episode_seed": 170186,
317
+ "success": false,
318
+ "steps": 4,
319
+ "first_reveal_step": 1,
320
+ "first_retrieve_step": null,
321
+ "episode_disturbance": 0.0
322
+ },
323
+ {
324
+ "episode_seed": 170198,
325
+ "success": false,
326
+ "steps": 4,
327
+ "first_reveal_step": 1,
328
+ "first_retrieve_step": null,
329
+ "episode_disturbance": 0.0
330
+ },
331
+ {
332
+ "episode_seed": 170200,
333
+ "success": false,
334
+ "steps": 4,
335
+ "first_reveal_step": 1,
336
+ "first_retrieve_step": null,
337
+ "episode_disturbance": 0.0
338
+ },
339
+ {
340
+ "episode_seed": 170205,
341
+ "success": false,
342
+ "steps": 4,
343
+ "first_reveal_step": 1,
344
+ "first_retrieve_step": null,
345
+ "episode_disturbance": 0.0
346
+ },
347
+ {
348
+ "episode_seed": 170207,
349
+ "success": false,
350
+ "steps": 4,
351
+ "first_reveal_step": 1,
352
+ "first_retrieve_step": null,
353
+ "episode_disturbance": 0.25
354
+ },
355
+ {
356
+ "episode_seed": 170208,
357
+ "success": false,
358
+ "steps": 4,
359
+ "first_reveal_step": 1,
360
+ "first_retrieve_step": null,
361
+ "episode_disturbance": 0.25
362
+ },
363
+ {
364
+ "episode_seed": 170212,
365
+ "success": false,
366
+ "steps": 4,
367
+ "first_reveal_step": 1,
368
+ "first_retrieve_step": null,
369
+ "episode_disturbance": 0.25
370
+ },
371
+ {
372
+ "episode_seed": 170214,
373
+ "success": false,
374
+ "steps": 4,
375
+ "first_reveal_step": 1,
376
+ "first_retrieve_step": null,
377
+ "episode_disturbance": 0.0
378
+ },
379
+ {
380
+ "episode_seed": 170217,
381
+ "success": false,
382
+ "steps": 4,
383
+ "first_reveal_step": 1,
384
+ "first_retrieve_step": null,
385
+ "episode_disturbance": 0.0
386
+ },
387
+ {
388
+ "episode_seed": 170223,
389
+ "success": false,
390
+ "steps": 4,
391
+ "first_reveal_step": 1,
392
+ "first_retrieve_step": null,
393
+ "episode_disturbance": 0.1429806500673294
394
+ },
395
+ {
396
+ "episode_seed": 170226,
397
+ "success": false,
398
+ "steps": 4,
399
+ "first_reveal_step": 1,
400
+ "first_retrieve_step": null,
401
+ "episode_disturbance": 0.25
402
+ },
403
+ {
404
+ "episode_seed": 170228,
405
+ "success": false,
406
+ "steps": 4,
407
+ "first_reveal_step": 1,
408
+ "first_retrieve_step": null,
409
+ "episode_disturbance": 0.0
410
+ },
411
+ {
412
+ "episode_seed": 170229,
413
+ "success": false,
414
+ "steps": 4,
415
+ "first_reveal_step": 1,
416
+ "first_retrieve_step": null,
417
+ "episode_disturbance": 0.0
418
+ },
419
+ {
420
+ "episode_seed": 170234,
421
+ "success": false,
422
+ "steps": 4,
423
+ "first_reveal_step": 1,
424
+ "first_retrieve_step": null,
425
+ "episode_disturbance": 0.0
426
+ },
427
+ {
428
+ "episode_seed": 170237,
429
+ "success": false,
430
+ "steps": 4,
431
+ "first_reveal_step": 1,
432
+ "first_retrieve_step": null,
433
+ "episode_disturbance": 0.0
434
+ },
435
+ {
436
+ "episode_seed": 170239,
437
+ "success": false,
438
+ "steps": 4,
439
+ "first_reveal_step": 1,
440
+ "first_retrieve_step": null,
441
+ "episode_disturbance": 0.25
442
+ },
443
+ {
444
+ "episode_seed": 170241,
445
+ "success": false,
446
+ "steps": 4,
447
+ "first_reveal_step": 1,
448
+ "first_retrieve_step": null,
449
+ "episode_disturbance": 0.0
450
+ },
451
+ {
452
+ "episode_seed": 170242,
453
+ "success": false,
454
+ "steps": 4,
455
+ "first_reveal_step": 1,
456
+ "first_retrieve_step": null,
457
+ "episode_disturbance": 0.0
458
+ },
459
+ {
460
+ "episode_seed": 170243,
461
+ "success": false,
462
+ "steps": 4,
463
+ "first_reveal_step": 1,
464
+ "first_retrieve_step": null,
465
+ "episode_disturbance": 0.25
466
+ }
467
+ ],
468
+ "eval_protocol": {
469
+ "track_id": "cloth_track",
470
+ "suite": "maniskill3",
471
+ "benchmark_task": "PutSpoonUnderClothRetrievalProxy-v1",
472
+ "role": "target",
473
+ "eval_mode": "trunk_only_ft",
474
+ "seed": 17,
475
+ "episodes": 50,
476
+ "resolution": 224,
477
+ "cameras": [
478
+ "front",
479
+ "left",
480
+ "right"
481
+ ],
482
+ "observation_stack": "rgb_triplicate_zero_depth",
483
+ "action_horizon": 8,
484
+ "action_space": "widowx_delta_pose",
485
+ "same_test_episodes": true
486
+ },
487
+ "proxy_notes": "Public ManiSkill bridge scene with custom retrieval initialization. The spoon is placed under the cloth region and must be revealed and extracted to the open side of the table.",
488
+ "train_spec": {
489
+ "track_id": "cloth_track",
490
+ "suite": "maniskill3",
491
+ "benchmark_task": "PutSpoonUnderClothRetrievalProxy-v1",
492
+ "model_variant": "trunk_only_ft",
493
+ "seed": 17,
494
+ "train_demos": 32,
495
+ "val_demos": 8,
496
+ "init_checkpoint_group": "/workspace/workspace/VLAarchtests2/VLAarchtests/artifacts/outputs/r3d_handoff_phase/proxy_interaction_r3d_stage3_clip_rgbd_handoff_compact_phase_seed17/checkpoint_best.pt",
497
+ "optimizer": "adamw",
498
+ "learning_rate": 0.0001,
499
+ "lr_schedule": "constant",
500
+ "batch_size": 4,
501
+ "augmentations": "none",
502
+ "early_stopping_metric": "val_total",
503
+ "max_gradient_steps": 174,
504
+ "unfreeze_scope": "fusion_memory_decoder",
505
+ "dataset_split_id": "cloth_bridge_smoke_v1_seed17",
506
+ "same_data_policy": true,
507
+ "same_init_policy": true
508
+ }
509
+ }
reports/maniskill_cloth_bridge_smoke_v1/trunk_only_ft_seed23.json ADDED
@@ -0,0 +1,509 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "track_id": "cloth_track",
3
+ "suite": "maniskill3",
4
+ "benchmark_task": "PutSpoonUnderClothRetrievalProxy-v1",
5
+ "role": "target",
6
+ "adapter_mode": "trunk_only_ft",
7
+ "episodes": 50,
8
+ "successes": [
9
+ 0,
10
+ 1,
11
+ 0,
12
+ 0,
13
+ 0,
14
+ 0,
15
+ 0,
16
+ 0,
17
+ 0,
18
+ 0,
19
+ 0,
20
+ 0,
21
+ 0,
22
+ 0,
23
+ 0,
24
+ 0,
25
+ 0,
26
+ 0,
27
+ 0,
28
+ 0,
29
+ 0,
30
+ 0,
31
+ 0,
32
+ 0,
33
+ 0,
34
+ 0,
35
+ 0,
36
+ 0,
37
+ 0,
38
+ 1,
39
+ 0,
40
+ 0,
41
+ 0,
42
+ 0,
43
+ 0,
44
+ 0,
45
+ 0,
46
+ 0,
47
+ 0,
48
+ 0,
49
+ 0,
50
+ 0,
51
+ 0,
52
+ 0,
53
+ 0,
54
+ 0,
55
+ 0,
56
+ 0,
57
+ 0,
58
+ 0
59
+ ],
60
+ "success_rate": 0.04,
61
+ "intervention_rate": 0.0,
62
+ "non_base_selection_rate": 0.0,
63
+ "steps_to_first_reveal_or_access": 1.0,
64
+ "steps_to_retrieve": 4.0,
65
+ "disturbance_proxy": 0.1478596130013466,
66
+ "episode_records": [
67
+ {
68
+ "episode_seed": 170104,
69
+ "success": false,
70
+ "steps": 4,
71
+ "first_reveal_step": 1,
72
+ "first_retrieve_step": null,
73
+ "episode_disturbance": 0.0
74
+ },
75
+ {
76
+ "episode_seed": 170105,
77
+ "success": true,
78
+ "steps": 1,
79
+ "first_reveal_step": 1,
80
+ "first_retrieve_step": null,
81
+ "episode_disturbance": 1.0
82
+ },
83
+ {
84
+ "episode_seed": 170106,
85
+ "success": false,
86
+ "steps": 4,
87
+ "first_reveal_step": 1,
88
+ "first_retrieve_step": null,
89
+ "episode_disturbance": 0.25
90
+ },
91
+ {
92
+ "episode_seed": 170107,
93
+ "success": false,
94
+ "steps": 4,
95
+ "first_reveal_step": 1,
96
+ "first_retrieve_step": null,
97
+ "episode_disturbance": 0.0
98
+ },
99
+ {
100
+ "episode_seed": 170109,
101
+ "success": false,
102
+ "steps": 4,
103
+ "first_reveal_step": 1,
104
+ "first_retrieve_step": null,
105
+ "episode_disturbance": 0.25
106
+ },
107
+ {
108
+ "episode_seed": 170113,
109
+ "success": false,
110
+ "steps": 4,
111
+ "first_reveal_step": 1,
112
+ "first_retrieve_step": null,
113
+ "episode_disturbance": 0.0
114
+ },
115
+ {
116
+ "episode_seed": 170117,
117
+ "success": false,
118
+ "steps": 4,
119
+ "first_reveal_step": 1,
120
+ "first_retrieve_step": null,
121
+ "episode_disturbance": 0.25
122
+ },
123
+ {
124
+ "episode_seed": 170121,
125
+ "success": false,
126
+ "steps": 4,
127
+ "first_reveal_step": 1,
128
+ "first_retrieve_step": null,
129
+ "episode_disturbance": 0.25
130
+ },
131
+ {
132
+ "episode_seed": 170124,
133
+ "success": false,
134
+ "steps": 4,
135
+ "first_reveal_step": 1,
136
+ "first_retrieve_step": null,
137
+ "episode_disturbance": 0.25
138
+ },
139
+ {
140
+ "episode_seed": 170125,
141
+ "success": false,
142
+ "steps": 4,
143
+ "first_reveal_step": 1,
144
+ "first_retrieve_step": null,
145
+ "episode_disturbance": 0.0
146
+ },
147
+ {
148
+ "episode_seed": 170129,
149
+ "success": false,
150
+ "steps": 4,
151
+ "first_reveal_step": 1,
152
+ "first_retrieve_step": null,
153
+ "episode_disturbance": 0.0
154
+ },
155
+ {
156
+ "episode_seed": 170131,
157
+ "success": false,
158
+ "steps": 4,
159
+ "first_reveal_step": 1,
160
+ "first_retrieve_step": null,
161
+ "episode_disturbance": 0.0
162
+ },
163
+ {
164
+ "episode_seed": 170137,
165
+ "success": false,
166
+ "steps": 4,
167
+ "first_reveal_step": 1,
168
+ "first_retrieve_step": null,
169
+ "episode_disturbance": 0.25
170
+ },
171
+ {
172
+ "episode_seed": 170138,
173
+ "success": false,
174
+ "steps": 4,
175
+ "first_reveal_step": 1,
176
+ "first_retrieve_step": null,
177
+ "episode_disturbance": 0.25
178
+ },
179
+ {
180
+ "episode_seed": 170139,
181
+ "success": false,
182
+ "steps": 4,
183
+ "first_reveal_step": 1,
184
+ "first_retrieve_step": null,
185
+ "episode_disturbance": 0.25
186
+ },
187
+ {
188
+ "episode_seed": 170140,
189
+ "success": false,
190
+ "steps": 4,
191
+ "first_reveal_step": 1,
192
+ "first_retrieve_step": null,
193
+ "episode_disturbance": 0.25
194
+ },
195
+ {
196
+ "episode_seed": 170145,
197
+ "success": false,
198
+ "steps": 4,
199
+ "first_reveal_step": 1,
200
+ "first_retrieve_step": null,
201
+ "episode_disturbance": 0.0
202
+ },
203
+ {
204
+ "episode_seed": 170150,
205
+ "success": false,
206
+ "steps": 4,
207
+ "first_reveal_step": 1,
208
+ "first_retrieve_step": null,
209
+ "episode_disturbance": 0.25
210
+ },
211
+ {
212
+ "episode_seed": 170151,
213
+ "success": false,
214
+ "steps": 4,
215
+ "first_reveal_step": 1,
216
+ "first_retrieve_step": null,
217
+ "episode_disturbance": 0.0
218
+ },
219
+ {
220
+ "episode_seed": 170153,
221
+ "success": false,
222
+ "steps": 4,
223
+ "first_reveal_step": 1,
224
+ "first_retrieve_step": null,
225
+ "episode_disturbance": 0.25
226
+ },
227
+ {
228
+ "episode_seed": 170154,
229
+ "success": false,
230
+ "steps": 4,
231
+ "first_reveal_step": 1,
232
+ "first_retrieve_step": null,
233
+ "episode_disturbance": 0.25
234
+ },
235
+ {
236
+ "episode_seed": 170155,
237
+ "success": false,
238
+ "steps": 4,
239
+ "first_reveal_step": 1,
240
+ "first_retrieve_step": null,
241
+ "episode_disturbance": 0.25
242
+ },
243
+ {
244
+ "episode_seed": 170166,
245
+ "success": false,
246
+ "steps": 4,
247
+ "first_reveal_step": 1,
248
+ "first_retrieve_step": null,
249
+ "episode_disturbance": 0.0
250
+ },
251
+ {
252
+ "episode_seed": 170171,
253
+ "success": false,
254
+ "steps": 4,
255
+ "first_reveal_step": 1,
256
+ "first_retrieve_step": null,
257
+ "episode_disturbance": 0.25
258
+ },
259
+ {
260
+ "episode_seed": 170173,
261
+ "success": false,
262
+ "steps": 4,
263
+ "first_reveal_step": 1,
264
+ "first_retrieve_step": null,
265
+ "episode_disturbance": 0.0
266
+ },
267
+ {
268
+ "episode_seed": 170175,
269
+ "success": false,
270
+ "steps": 4,
271
+ "first_reveal_step": 1,
272
+ "first_retrieve_step": null,
273
+ "episode_disturbance": 0.0
274
+ },
275
+ {
276
+ "episode_seed": 170177,
277
+ "success": false,
278
+ "steps": 4,
279
+ "first_reveal_step": 1,
280
+ "first_retrieve_step": null,
281
+ "episode_disturbance": 0.0
282
+ },
283
+ {
284
+ "episode_seed": 170180,
285
+ "success": false,
286
+ "steps": 4,
287
+ "first_reveal_step": 1,
288
+ "first_retrieve_step": null,
289
+ "episode_disturbance": 0.25
290
+ },
291
+ {
292
+ "episode_seed": 170181,
293
+ "success": false,
294
+ "steps": 4,
295
+ "first_reveal_step": 1,
296
+ "first_retrieve_step": null,
297
+ "episode_disturbance": 0.25
298
+ },
299
+ {
300
+ "episode_seed": 170184,
301
+ "success": true,
302
+ "steps": 2,
303
+ "first_reveal_step": 1,
304
+ "first_retrieve_step": null,
305
+ "episode_disturbance": 0.5
306
+ },
307
+ {
308
+ "episode_seed": 170185,
309
+ "success": false,
310
+ "steps": 4,
311
+ "first_reveal_step": 1,
312
+ "first_retrieve_step": null,
313
+ "episode_disturbance": 0.25
314
+ },
315
+ {
316
+ "episode_seed": 170186,
317
+ "success": false,
318
+ "steps": 4,
319
+ "first_reveal_step": 1,
320
+ "first_retrieve_step": null,
321
+ "episode_disturbance": 0.0
322
+ },
323
+ {
324
+ "episode_seed": 170198,
325
+ "success": false,
326
+ "steps": 4,
327
+ "first_reveal_step": 1,
328
+ "first_retrieve_step": null,
329
+ "episode_disturbance": 0.0
330
+ },
331
+ {
332
+ "episode_seed": 170200,
333
+ "success": false,
334
+ "steps": 4,
335
+ "first_reveal_step": 1,
336
+ "first_retrieve_step": null,
337
+ "episode_disturbance": 0.0
338
+ },
339
+ {
340
+ "episode_seed": 170205,
341
+ "success": false,
342
+ "steps": 4,
343
+ "first_reveal_step": 1,
344
+ "first_retrieve_step": null,
345
+ "episode_disturbance": 0.0
346
+ },
347
+ {
348
+ "episode_seed": 170207,
349
+ "success": false,
350
+ "steps": 4,
351
+ "first_reveal_step": 1,
352
+ "first_retrieve_step": null,
353
+ "episode_disturbance": 0.25
354
+ },
355
+ {
356
+ "episode_seed": 170208,
357
+ "success": false,
358
+ "steps": 4,
359
+ "first_reveal_step": 1,
360
+ "first_retrieve_step": null,
361
+ "episode_disturbance": 0.25
362
+ },
363
+ {
364
+ "episode_seed": 170212,
365
+ "success": false,
366
+ "steps": 4,
367
+ "first_reveal_step": 1,
368
+ "first_retrieve_step": null,
369
+ "episode_disturbance": 0.25
370
+ },
371
+ {
372
+ "episode_seed": 170214,
373
+ "success": false,
374
+ "steps": 4,
375
+ "first_reveal_step": 1,
376
+ "first_retrieve_step": null,
377
+ "episode_disturbance": 0.0
378
+ },
379
+ {
380
+ "episode_seed": 170217,
381
+ "success": false,
382
+ "steps": 4,
383
+ "first_reveal_step": 1,
384
+ "first_retrieve_step": null,
385
+ "episode_disturbance": 0.0
386
+ },
387
+ {
388
+ "episode_seed": 170223,
389
+ "success": false,
390
+ "steps": 4,
391
+ "first_reveal_step": 1,
392
+ "first_retrieve_step": null,
393
+ "episode_disturbance": 0.1429806500673294
394
+ },
395
+ {
396
+ "episode_seed": 170226,
397
+ "success": false,
398
+ "steps": 4,
399
+ "first_reveal_step": 1,
400
+ "first_retrieve_step": null,
401
+ "episode_disturbance": 0.25
402
+ },
403
+ {
404
+ "episode_seed": 170228,
405
+ "success": false,
406
+ "steps": 4,
407
+ "first_reveal_step": 1,
408
+ "first_retrieve_step": null,
409
+ "episode_disturbance": 0.0
410
+ },
411
+ {
412
+ "episode_seed": 170229,
413
+ "success": false,
414
+ "steps": 4,
415
+ "first_reveal_step": 1,
416
+ "first_retrieve_step": null,
417
+ "episode_disturbance": 0.0
418
+ },
419
+ {
420
+ "episode_seed": 170234,
421
+ "success": false,
422
+ "steps": 4,
423
+ "first_reveal_step": 1,
424
+ "first_retrieve_step": null,
425
+ "episode_disturbance": 0.0
426
+ },
427
+ {
428
+ "episode_seed": 170237,
429
+ "success": false,
430
+ "steps": 4,
431
+ "first_reveal_step": 1,
432
+ "first_retrieve_step": null,
433
+ "episode_disturbance": 0.0
434
+ },
435
+ {
436
+ "episode_seed": 170239,
437
+ "success": false,
438
+ "steps": 4,
439
+ "first_reveal_step": 1,
440
+ "first_retrieve_step": null,
441
+ "episode_disturbance": 0.25
442
+ },
443
+ {
444
+ "episode_seed": 170241,
445
+ "success": false,
446
+ "steps": 4,
447
+ "first_reveal_step": 1,
448
+ "first_retrieve_step": null,
449
+ "episode_disturbance": 0.0
450
+ },
451
+ {
452
+ "episode_seed": 170242,
453
+ "success": false,
454
+ "steps": 4,
455
+ "first_reveal_step": 1,
456
+ "first_retrieve_step": null,
457
+ "episode_disturbance": 0.0
458
+ },
459
+ {
460
+ "episode_seed": 170243,
461
+ "success": false,
462
+ "steps": 4,
463
+ "first_reveal_step": 1,
464
+ "first_retrieve_step": null,
465
+ "episode_disturbance": 0.25
466
+ }
467
+ ],
468
+ "eval_protocol": {
469
+ "track_id": "cloth_track",
470
+ "suite": "maniskill3",
471
+ "benchmark_task": "PutSpoonUnderClothRetrievalProxy-v1",
472
+ "role": "target",
473
+ "eval_mode": "trunk_only_ft",
474
+ "seed": 17,
475
+ "episodes": 50,
476
+ "resolution": 224,
477
+ "cameras": [
478
+ "front",
479
+ "left",
480
+ "right"
481
+ ],
482
+ "observation_stack": "rgb_triplicate_zero_depth",
483
+ "action_horizon": 8,
484
+ "action_space": "widowx_delta_pose",
485
+ "same_test_episodes": true
486
+ },
487
+ "proxy_notes": "Public ManiSkill bridge scene with custom retrieval initialization. The spoon is placed under the cloth region and must be revealed and extracted to the open side of the table.",
488
+ "train_spec": {
489
+ "track_id": "cloth_track",
490
+ "suite": "maniskill3",
491
+ "benchmark_task": "PutSpoonUnderClothRetrievalProxy-v1",
492
+ "model_variant": "trunk_only_ft",
493
+ "seed": 23,
494
+ "train_demos": 32,
495
+ "val_demos": 8,
496
+ "init_checkpoint_group": "/workspace/workspace/VLAarchtests2/VLAarchtests/artifacts/outputs/r3d_handoff_phase/proxy_interaction_r3d_stage3_clip_rgbd_handoff_compact_phase_seed17/checkpoint_best.pt",
497
+ "optimizer": "adamw",
498
+ "learning_rate": 0.0001,
499
+ "lr_schedule": "constant",
500
+ "batch_size": 4,
501
+ "augmentations": "none",
502
+ "early_stopping_metric": "val_total",
503
+ "max_gradient_steps": 174,
504
+ "unfreeze_scope": "fusion_memory_decoder",
505
+ "dataset_split_id": "cloth_bridge_smoke_v1_seed17",
506
+ "same_data_policy": true,
507
+ "same_init_policy": true
508
+ }
509
+ }
reports/maniskill_cloth_bridge_smoke_v1/trunk_only_ft_seed29.json ADDED
@@ -0,0 +1,509 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "track_id": "cloth_track",
3
+ "suite": "maniskill3",
4
+ "benchmark_task": "PutSpoonUnderClothRetrievalProxy-v1",
5
+ "role": "target",
6
+ "adapter_mode": "trunk_only_ft",
7
+ "episodes": 50,
8
+ "successes": [
9
+ 0,
10
+ 1,
11
+ 0,
12
+ 0,
13
+ 0,
14
+ 0,
15
+ 0,
16
+ 0,
17
+ 0,
18
+ 0,
19
+ 0,
20
+ 0,
21
+ 0,
22
+ 0,
23
+ 0,
24
+ 0,
25
+ 0,
26
+ 0,
27
+ 0,
28
+ 0,
29
+ 0,
30
+ 0,
31
+ 0,
32
+ 0,
33
+ 0,
34
+ 0,
35
+ 0,
36
+ 0,
37
+ 0,
38
+ 1,
39
+ 0,
40
+ 0,
41
+ 0,
42
+ 0,
43
+ 0,
44
+ 0,
45
+ 0,
46
+ 0,
47
+ 0,
48
+ 0,
49
+ 0,
50
+ 0,
51
+ 0,
52
+ 0,
53
+ 0,
54
+ 0,
55
+ 0,
56
+ 0,
57
+ 0,
58
+ 0
59
+ ],
60
+ "success_rate": 0.04,
61
+ "intervention_rate": 0.0,
62
+ "non_base_selection_rate": 0.0,
63
+ "steps_to_first_reveal_or_access": 1.0,
64
+ "steps_to_retrieve": 4.0,
65
+ "disturbance_proxy": 0.1478596130013466,
66
+ "episode_records": [
67
+ {
68
+ "episode_seed": 170104,
69
+ "success": false,
70
+ "steps": 4,
71
+ "first_reveal_step": 1,
72
+ "first_retrieve_step": null,
73
+ "episode_disturbance": 0.0
74
+ },
75
+ {
76
+ "episode_seed": 170105,
77
+ "success": true,
78
+ "steps": 1,
79
+ "first_reveal_step": 1,
80
+ "first_retrieve_step": null,
81
+ "episode_disturbance": 1.0
82
+ },
83
+ {
84
+ "episode_seed": 170106,
85
+ "success": false,
86
+ "steps": 4,
87
+ "first_reveal_step": 1,
88
+ "first_retrieve_step": null,
89
+ "episode_disturbance": 0.25
90
+ },
91
+ {
92
+ "episode_seed": 170107,
93
+ "success": false,
94
+ "steps": 4,
95
+ "first_reveal_step": 1,
96
+ "first_retrieve_step": null,
97
+ "episode_disturbance": 0.0
98
+ },
99
+ {
100
+ "episode_seed": 170109,
101
+ "success": false,
102
+ "steps": 4,
103
+ "first_reveal_step": 1,
104
+ "first_retrieve_step": null,
105
+ "episode_disturbance": 0.25
106
+ },
107
+ {
108
+ "episode_seed": 170113,
109
+ "success": false,
110
+ "steps": 4,
111
+ "first_reveal_step": 1,
112
+ "first_retrieve_step": null,
113
+ "episode_disturbance": 0.0
114
+ },
115
+ {
116
+ "episode_seed": 170117,
117
+ "success": false,
118
+ "steps": 4,
119
+ "first_reveal_step": 1,
120
+ "first_retrieve_step": null,
121
+ "episode_disturbance": 0.25
122
+ },
123
+ {
124
+ "episode_seed": 170121,
125
+ "success": false,
126
+ "steps": 4,
127
+ "first_reveal_step": 1,
128
+ "first_retrieve_step": null,
129
+ "episode_disturbance": 0.25
130
+ },
131
+ {
132
+ "episode_seed": 170124,
133
+ "success": false,
134
+ "steps": 4,
135
+ "first_reveal_step": 1,
136
+ "first_retrieve_step": null,
137
+ "episode_disturbance": 0.25
138
+ },
139
+ {
140
+ "episode_seed": 170125,
141
+ "success": false,
142
+ "steps": 4,
143
+ "first_reveal_step": 1,
144
+ "first_retrieve_step": null,
145
+ "episode_disturbance": 0.0
146
+ },
147
+ {
148
+ "episode_seed": 170129,
149
+ "success": false,
150
+ "steps": 4,
151
+ "first_reveal_step": 1,
152
+ "first_retrieve_step": null,
153
+ "episode_disturbance": 0.0
154
+ },
155
+ {
156
+ "episode_seed": 170131,
157
+ "success": false,
158
+ "steps": 4,
159
+ "first_reveal_step": 1,
160
+ "first_retrieve_step": null,
161
+ "episode_disturbance": 0.0
162
+ },
163
+ {
164
+ "episode_seed": 170137,
165
+ "success": false,
166
+ "steps": 4,
167
+ "first_reveal_step": 1,
168
+ "first_retrieve_step": null,
169
+ "episode_disturbance": 0.25
170
+ },
171
+ {
172
+ "episode_seed": 170138,
173
+ "success": false,
174
+ "steps": 4,
175
+ "first_reveal_step": 1,
176
+ "first_retrieve_step": null,
177
+ "episode_disturbance": 0.25
178
+ },
179
+ {
180
+ "episode_seed": 170139,
181
+ "success": false,
182
+ "steps": 4,
183
+ "first_reveal_step": 1,
184
+ "first_retrieve_step": null,
185
+ "episode_disturbance": 0.25
186
+ },
187
+ {
188
+ "episode_seed": 170140,
189
+ "success": false,
190
+ "steps": 4,
191
+ "first_reveal_step": 1,
192
+ "first_retrieve_step": null,
193
+ "episode_disturbance": 0.25
194
+ },
195
+ {
196
+ "episode_seed": 170145,
197
+ "success": false,
198
+ "steps": 4,
199
+ "first_reveal_step": 1,
200
+ "first_retrieve_step": null,
201
+ "episode_disturbance": 0.0
202
+ },
203
+ {
204
+ "episode_seed": 170150,
205
+ "success": false,
206
+ "steps": 4,
207
+ "first_reveal_step": 1,
208
+ "first_retrieve_step": null,
209
+ "episode_disturbance": 0.25
210
+ },
211
+ {
212
+ "episode_seed": 170151,
213
+ "success": false,
214
+ "steps": 4,
215
+ "first_reveal_step": 1,
216
+ "first_retrieve_step": null,
217
+ "episode_disturbance": 0.0
218
+ },
219
+ {
220
+ "episode_seed": 170153,
221
+ "success": false,
222
+ "steps": 4,
223
+ "first_reveal_step": 1,
224
+ "first_retrieve_step": null,
225
+ "episode_disturbance": 0.25
226
+ },
227
+ {
228
+ "episode_seed": 170154,
229
+ "success": false,
230
+ "steps": 4,
231
+ "first_reveal_step": 1,
232
+ "first_retrieve_step": null,
233
+ "episode_disturbance": 0.25
234
+ },
235
+ {
236
+ "episode_seed": 170155,
237
+ "success": false,
238
+ "steps": 4,
239
+ "first_reveal_step": 1,
240
+ "first_retrieve_step": null,
241
+ "episode_disturbance": 0.25
242
+ },
243
+ {
244
+ "episode_seed": 170166,
245
+ "success": false,
246
+ "steps": 4,
247
+ "first_reveal_step": 1,
248
+ "first_retrieve_step": null,
249
+ "episode_disturbance": 0.0
250
+ },
251
+ {
252
+ "episode_seed": 170171,
253
+ "success": false,
254
+ "steps": 4,
255
+ "first_reveal_step": 1,
256
+ "first_retrieve_step": null,
257
+ "episode_disturbance": 0.25
258
+ },
259
+ {
260
+ "episode_seed": 170173,
261
+ "success": false,
262
+ "steps": 4,
263
+ "first_reveal_step": 1,
264
+ "first_retrieve_step": null,
265
+ "episode_disturbance": 0.0
266
+ },
267
+ {
268
+ "episode_seed": 170175,
269
+ "success": false,
270
+ "steps": 4,
271
+ "first_reveal_step": 1,
272
+ "first_retrieve_step": null,
273
+ "episode_disturbance": 0.0
274
+ },
275
+ {
276
+ "episode_seed": 170177,
277
+ "success": false,
278
+ "steps": 4,
279
+ "first_reveal_step": 1,
280
+ "first_retrieve_step": null,
281
+ "episode_disturbance": 0.0
282
+ },
283
+ {
284
+ "episode_seed": 170180,
285
+ "success": false,
286
+ "steps": 4,
287
+ "first_reveal_step": 1,
288
+ "first_retrieve_step": null,
289
+ "episode_disturbance": 0.25
290
+ },
291
+ {
292
+ "episode_seed": 170181,
293
+ "success": false,
294
+ "steps": 4,
295
+ "first_reveal_step": 1,
296
+ "first_retrieve_step": null,
297
+ "episode_disturbance": 0.25
298
+ },
299
+ {
300
+ "episode_seed": 170184,
301
+ "success": true,
302
+ "steps": 2,
303
+ "first_reveal_step": 1,
304
+ "first_retrieve_step": null,
305
+ "episode_disturbance": 0.5
306
+ },
307
+ {
308
+ "episode_seed": 170185,
309
+ "success": false,
310
+ "steps": 4,
311
+ "first_reveal_step": 1,
312
+ "first_retrieve_step": null,
313
+ "episode_disturbance": 0.25
314
+ },
315
+ {
316
+ "episode_seed": 170186,
317
+ "success": false,
318
+ "steps": 4,
319
+ "first_reveal_step": 1,
320
+ "first_retrieve_step": null,
321
+ "episode_disturbance": 0.0
322
+ },
323
+ {
324
+ "episode_seed": 170198,
325
+ "success": false,
326
+ "steps": 4,
327
+ "first_reveal_step": 1,
328
+ "first_retrieve_step": null,
329
+ "episode_disturbance": 0.0
330
+ },
331
+ {
332
+ "episode_seed": 170200,
333
+ "success": false,
334
+ "steps": 4,
335
+ "first_reveal_step": 1,
336
+ "first_retrieve_step": null,
337
+ "episode_disturbance": 0.0
338
+ },
339
+ {
340
+ "episode_seed": 170205,
341
+ "success": false,
342
+ "steps": 4,
343
+ "first_reveal_step": 1,
344
+ "first_retrieve_step": null,
345
+ "episode_disturbance": 0.0
346
+ },
347
+ {
348
+ "episode_seed": 170207,
349
+ "success": false,
350
+ "steps": 4,
351
+ "first_reveal_step": 1,
352
+ "first_retrieve_step": null,
353
+ "episode_disturbance": 0.25
354
+ },
355
+ {
356
+ "episode_seed": 170208,
357
+ "success": false,
358
+ "steps": 4,
359
+ "first_reveal_step": 1,
360
+ "first_retrieve_step": null,
361
+ "episode_disturbance": 0.25
362
+ },
363
+ {
364
+ "episode_seed": 170212,
365
+ "success": false,
366
+ "steps": 4,
367
+ "first_reveal_step": 1,
368
+ "first_retrieve_step": null,
369
+ "episode_disturbance": 0.25
370
+ },
371
+ {
372
+ "episode_seed": 170214,
373
+ "success": false,
374
+ "steps": 4,
375
+ "first_reveal_step": 1,
376
+ "first_retrieve_step": null,
377
+ "episode_disturbance": 0.0
378
+ },
379
+ {
380
+ "episode_seed": 170217,
381
+ "success": false,
382
+ "steps": 4,
383
+ "first_reveal_step": 1,
384
+ "first_retrieve_step": null,
385
+ "episode_disturbance": 0.0
386
+ },
387
+ {
388
+ "episode_seed": 170223,
389
+ "success": false,
390
+ "steps": 4,
391
+ "first_reveal_step": 1,
392
+ "first_retrieve_step": null,
393
+ "episode_disturbance": 0.1429806500673294
394
+ },
395
+ {
396
+ "episode_seed": 170226,
397
+ "success": false,
398
+ "steps": 4,
399
+ "first_reveal_step": 1,
400
+ "first_retrieve_step": null,
401
+ "episode_disturbance": 0.25
402
+ },
403
+ {
404
+ "episode_seed": 170228,
405
+ "success": false,
406
+ "steps": 4,
407
+ "first_reveal_step": 1,
408
+ "first_retrieve_step": null,
409
+ "episode_disturbance": 0.0
410
+ },
411
+ {
412
+ "episode_seed": 170229,
413
+ "success": false,
414
+ "steps": 4,
415
+ "first_reveal_step": 1,
416
+ "first_retrieve_step": null,
417
+ "episode_disturbance": 0.0
418
+ },
419
+ {
420
+ "episode_seed": 170234,
421
+ "success": false,
422
+ "steps": 4,
423
+ "first_reveal_step": 1,
424
+ "first_retrieve_step": null,
425
+ "episode_disturbance": 0.0
426
+ },
427
+ {
428
+ "episode_seed": 170237,
429
+ "success": false,
430
+ "steps": 4,
431
+ "first_reveal_step": 1,
432
+ "first_retrieve_step": null,
433
+ "episode_disturbance": 0.0
434
+ },
435
+ {
436
+ "episode_seed": 170239,
437
+ "success": false,
438
+ "steps": 4,
439
+ "first_reveal_step": 1,
440
+ "first_retrieve_step": null,
441
+ "episode_disturbance": 0.25
442
+ },
443
+ {
444
+ "episode_seed": 170241,
445
+ "success": false,
446
+ "steps": 4,
447
+ "first_reveal_step": 1,
448
+ "first_retrieve_step": null,
449
+ "episode_disturbance": 0.0
450
+ },
451
+ {
452
+ "episode_seed": 170242,
453
+ "success": false,
454
+ "steps": 4,
455
+ "first_reveal_step": 1,
456
+ "first_retrieve_step": null,
457
+ "episode_disturbance": 0.0
458
+ },
459
+ {
460
+ "episode_seed": 170243,
461
+ "success": false,
462
+ "steps": 4,
463
+ "first_reveal_step": 1,
464
+ "first_retrieve_step": null,
465
+ "episode_disturbance": 0.25
466
+ }
467
+ ],
468
+ "eval_protocol": {
469
+ "track_id": "cloth_track",
470
+ "suite": "maniskill3",
471
+ "benchmark_task": "PutSpoonUnderClothRetrievalProxy-v1",
472
+ "role": "target",
473
+ "eval_mode": "trunk_only_ft",
474
+ "seed": 17,
475
+ "episodes": 50,
476
+ "resolution": 224,
477
+ "cameras": [
478
+ "front",
479
+ "left",
480
+ "right"
481
+ ],
482
+ "observation_stack": "rgb_triplicate_zero_depth",
483
+ "action_horizon": 8,
484
+ "action_space": "widowx_delta_pose",
485
+ "same_test_episodes": true
486
+ },
487
+ "proxy_notes": "Public ManiSkill bridge scene with custom retrieval initialization. The spoon is placed under the cloth region and must be revealed and extracted to the open side of the table.",
488
+ "train_spec": {
489
+ "track_id": "cloth_track",
490
+ "suite": "maniskill3",
491
+ "benchmark_task": "PutSpoonUnderClothRetrievalProxy-v1",
492
+ "model_variant": "trunk_only_ft",
493
+ "seed": 29,
494
+ "train_demos": 32,
495
+ "val_demos": 8,
496
+ "init_checkpoint_group": "/workspace/workspace/VLAarchtests2/VLAarchtests/artifacts/outputs/r3d_handoff_phase/proxy_interaction_r3d_stage3_clip_rgbd_handoff_compact_phase_seed17/checkpoint_best.pt",
497
+ "optimizer": "adamw",
498
+ "learning_rate": 0.0001,
499
+ "lr_schedule": "constant",
500
+ "batch_size": 4,
501
+ "augmentations": "none",
502
+ "early_stopping_metric": "val_total",
503
+ "max_gradient_steps": 174,
504
+ "unfreeze_scope": "fusion_memory_decoder",
505
+ "dataset_split_id": "cloth_bridge_smoke_v1_seed17",
506
+ "same_data_policy": true,
507
+ "same_init_policy": true
508
+ }
509
+ }
reports/maniskill_pickclutter_smoke_v2/adapter_active_ft_seed17.json ADDED
@@ -0,0 +1,508 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "track_id": "occlusion_track",
3
+ "suite": "maniskill3",
4
+ "benchmark_task": "PickClutterYCB-v1",
5
+ "role": "target",
6
+ "adapter_mode": "adapter_active_ft",
7
+ "episodes": 50,
8
+ "successes": [
9
+ 0,
10
+ 0,
11
+ 1,
12
+ 0,
13
+ 0,
14
+ 0,
15
+ 0,
16
+ 0,
17
+ 0,
18
+ 0,
19
+ 0,
20
+ 1,
21
+ 0,
22
+ 0,
23
+ 0,
24
+ 0,
25
+ 1,
26
+ 0,
27
+ 1,
28
+ 0,
29
+ 1,
30
+ 0,
31
+ 0,
32
+ 0,
33
+ 0,
34
+ 1,
35
+ 0,
36
+ 0,
37
+ 0,
38
+ 0,
39
+ 1,
40
+ 1,
41
+ 1,
42
+ 0,
43
+ 1,
44
+ 1,
45
+ 0,
46
+ 0,
47
+ 1,
48
+ 0,
49
+ 1,
50
+ 1,
51
+ 0,
52
+ 0,
53
+ 1,
54
+ 0,
55
+ 0,
56
+ 0,
57
+ 0,
58
+ 1
59
+ ],
60
+ "success_rate": 0.32,
61
+ "intervention_rate": 0.0,
62
+ "non_base_selection_rate": 0.0,
63
+ "steps_to_first_reveal_or_access": 1.0,
64
+ "steps_to_retrieve": 4.0,
65
+ "disturbance_proxy": 0.1261227352138143,
66
+ "episode_records": [
67
+ {
68
+ "episode_seed": 172000,
69
+ "success": false,
70
+ "steps": 4,
71
+ "first_reveal_step": 1,
72
+ "first_retrieve_step": null,
73
+ "episode_disturbance": 0.11835007230072728
74
+ },
75
+ {
76
+ "episode_seed": 172001,
77
+ "success": false,
78
+ "steps": 4,
79
+ "first_reveal_step": 1,
80
+ "first_retrieve_step": null,
81
+ "episode_disturbance": 0.16761024718687167
82
+ },
83
+ {
84
+ "episode_seed": 172002,
85
+ "success": true,
86
+ "steps": 1,
87
+ "first_reveal_step": 1,
88
+ "first_retrieve_step": null,
89
+ "episode_disturbance": 0.0019509782725606326
90
+ },
91
+ {
92
+ "episode_seed": 172003,
93
+ "success": false,
94
+ "steps": 4,
95
+ "first_reveal_step": 1,
96
+ "first_retrieve_step": null,
97
+ "episode_disturbance": 7.148081446217702e-05
98
+ },
99
+ {
100
+ "episode_seed": 172004,
101
+ "success": false,
102
+ "steps": 4,
103
+ "first_reveal_step": 1,
104
+ "first_retrieve_step": null,
105
+ "episode_disturbance": 0.1784248970780015
106
+ },
107
+ {
108
+ "episode_seed": 172005,
109
+ "success": false,
110
+ "steps": 4,
111
+ "first_reveal_step": 1,
112
+ "first_retrieve_step": null,
113
+ "episode_disturbance": 0.09801531238412764
114
+ },
115
+ {
116
+ "episode_seed": 172006,
117
+ "success": false,
118
+ "steps": 4,
119
+ "first_reveal_step": 1,
120
+ "first_retrieve_step": null,
121
+ "episode_disturbance": 0.0005962321008468051
122
+ },
123
+ {
124
+ "episode_seed": 172007,
125
+ "success": false,
126
+ "steps": 4,
127
+ "first_reveal_step": 1,
128
+ "first_retrieve_step": null,
129
+ "episode_disturbance": 0.1259510057686978
130
+ },
131
+ {
132
+ "episode_seed": 172008,
133
+ "success": false,
134
+ "steps": 4,
135
+ "first_reveal_step": 1,
136
+ "first_retrieve_step": null,
137
+ "episode_disturbance": 0.11488150802027317
138
+ },
139
+ {
140
+ "episode_seed": 172009,
141
+ "success": false,
142
+ "steps": 4,
143
+ "first_reveal_step": 1,
144
+ "first_retrieve_step": null,
145
+ "episode_disturbance": 0.04447960518379812
146
+ },
147
+ {
148
+ "episode_seed": 172010,
149
+ "success": false,
150
+ "steps": 4,
151
+ "first_reveal_step": 1,
152
+ "first_retrieve_step": null,
153
+ "episode_disturbance": 0.28255011429793786
154
+ },
155
+ {
156
+ "episode_seed": 172011,
157
+ "success": true,
158
+ "steps": 3,
159
+ "first_reveal_step": 1,
160
+ "first_retrieve_step": null,
161
+ "episode_disturbance": 0.04106344052554118
162
+ },
163
+ {
164
+ "episode_seed": 172012,
165
+ "success": false,
166
+ "steps": 4,
167
+ "first_reveal_step": 1,
168
+ "first_retrieve_step": null,
169
+ "episode_disturbance": 0.07076599070619194
170
+ },
171
+ {
172
+ "episode_seed": 172013,
173
+ "success": false,
174
+ "steps": 4,
175
+ "first_reveal_step": 1,
176
+ "first_retrieve_step": null,
177
+ "episode_disturbance": 0.13973692647627903
178
+ },
179
+ {
180
+ "episode_seed": 172014,
181
+ "success": false,
182
+ "steps": 4,
183
+ "first_reveal_step": 1,
184
+ "first_retrieve_step": null,
185
+ "episode_disturbance": 0.004788672381939665
186
+ },
187
+ {
188
+ "episode_seed": 172015,
189
+ "success": false,
190
+ "steps": 4,
191
+ "first_reveal_step": 1,
192
+ "first_retrieve_step": null,
193
+ "episode_disturbance": 0.28083725664289716
194
+ },
195
+ {
196
+ "episode_seed": 172016,
197
+ "success": true,
198
+ "steps": 1,
199
+ "first_reveal_step": 1,
200
+ "first_retrieve_step": null,
201
+ "episode_disturbance": 1.0
202
+ },
203
+ {
204
+ "episode_seed": 172017,
205
+ "success": false,
206
+ "steps": 4,
207
+ "first_reveal_step": 1,
208
+ "first_retrieve_step": null,
209
+ "episode_disturbance": 0.1641496366673234
210
+ },
211
+ {
212
+ "episode_seed": 172018,
213
+ "success": true,
214
+ "steps": 1,
215
+ "first_reveal_step": 1,
216
+ "first_retrieve_step": null,
217
+ "episode_disturbance": 4.383633944371468e-05
218
+ },
219
+ {
220
+ "episode_seed": 172019,
221
+ "success": false,
222
+ "steps": 4,
223
+ "first_reveal_step": 1,
224
+ "first_retrieve_step": null,
225
+ "episode_disturbance": 0.25721585358608956
226
+ },
227
+ {
228
+ "episode_seed": 172020,
229
+ "success": true,
230
+ "steps": 3,
231
+ "first_reveal_step": 1,
232
+ "first_retrieve_step": null,
233
+ "episode_disturbance": 0.17401533717143602
234
+ },
235
+ {
236
+ "episode_seed": 172021,
237
+ "success": false,
238
+ "steps": 4,
239
+ "first_reveal_step": 1,
240
+ "first_retrieve_step": null,
241
+ "episode_disturbance": 0.006582688272562364
242
+ },
243
+ {
244
+ "episode_seed": 172022,
245
+ "success": false,
246
+ "steps": 4,
247
+ "first_reveal_step": 1,
248
+ "first_retrieve_step": null,
249
+ "episode_disturbance": 0.061462426746240105
250
+ },
251
+ {
252
+ "episode_seed": 172023,
253
+ "success": false,
254
+ "steps": 4,
255
+ "first_reveal_step": 1,
256
+ "first_retrieve_step": null,
257
+ "episode_disturbance": 0.26208380581626045
258
+ },
259
+ {
260
+ "episode_seed": 172024,
261
+ "success": false,
262
+ "steps": 4,
263
+ "first_reveal_step": 1,
264
+ "first_retrieve_step": null,
265
+ "episode_disturbance": 0.17481319658276814
266
+ },
267
+ {
268
+ "episode_seed": 172025,
269
+ "success": true,
270
+ "steps": 2,
271
+ "first_reveal_step": 1,
272
+ "first_retrieve_step": null,
273
+ "episode_disturbance": 0.011393342883305735
274
+ },
275
+ {
276
+ "episode_seed": 172026,
277
+ "success": false,
278
+ "steps": 4,
279
+ "first_reveal_step": 1,
280
+ "first_retrieve_step": null,
281
+ "episode_disturbance": 0.040603790066086276
282
+ },
283
+ {
284
+ "episode_seed": 172027,
285
+ "success": false,
286
+ "steps": 4,
287
+ "first_reveal_step": 1,
288
+ "first_retrieve_step": null,
289
+ "episode_disturbance": 0.001898237613124465
290
+ },
291
+ {
292
+ "episode_seed": 172028,
293
+ "success": false,
294
+ "steps": 4,
295
+ "first_reveal_step": 1,
296
+ "first_retrieve_step": null,
297
+ "episode_disturbance": 0.1535773960429528
298
+ },
299
+ {
300
+ "episode_seed": 172029,
301
+ "success": false,
302
+ "steps": 4,
303
+ "first_reveal_step": 1,
304
+ "first_retrieve_step": null,
305
+ "episode_disturbance": 2.6297170183653403e-05
306
+ },
307
+ {
308
+ "episode_seed": 172030,
309
+ "success": true,
310
+ "steps": 3,
311
+ "first_reveal_step": 1,
312
+ "first_retrieve_step": null,
313
+ "episode_disturbance": 0.23568911686727625
314
+ },
315
+ {
316
+ "episode_seed": 172031,
317
+ "success": true,
318
+ "steps": 2,
319
+ "first_reveal_step": 1,
320
+ "first_retrieve_step": null,
321
+ "episode_disturbance": 0.05458565396336822
322
+ },
323
+ {
324
+ "episode_seed": 172032,
325
+ "success": true,
326
+ "steps": 2,
327
+ "first_reveal_step": 1,
328
+ "first_retrieve_step": null,
329
+ "episode_disturbance": 0.23615429148293285
330
+ },
331
+ {
332
+ "episode_seed": 172033,
333
+ "success": false,
334
+ "steps": 4,
335
+ "first_reveal_step": 1,
336
+ "first_retrieve_step": null,
337
+ "episode_disturbance": 0.3794685144275167
338
+ },
339
+ {
340
+ "episode_seed": 172034,
341
+ "success": true,
342
+ "steps": 2,
343
+ "first_reveal_step": 1,
344
+ "first_retrieve_step": null,
345
+ "episode_disturbance": 0.23963101771263
346
+ },
347
+ {
348
+ "episode_seed": 172035,
349
+ "success": true,
350
+ "steps": 3,
351
+ "first_reveal_step": 1,
352
+ "first_retrieve_step": null,
353
+ "episode_disturbance": 0.1458236509853299
354
+ },
355
+ {
356
+ "episode_seed": 172036,
357
+ "success": false,
358
+ "steps": 4,
359
+ "first_reveal_step": 1,
360
+ "first_retrieve_step": null,
361
+ "episode_disturbance": 0.0005504064674610731
362
+ },
363
+ {
364
+ "episode_seed": 172037,
365
+ "success": false,
366
+ "steps": 4,
367
+ "first_reveal_step": 1,
368
+ "first_retrieve_step": null,
369
+ "episode_disturbance": 0.02395525002599186
370
+ },
371
+ {
372
+ "episode_seed": 172038,
373
+ "success": true,
374
+ "steps": 4,
375
+ "first_reveal_step": 1,
376
+ "first_retrieve_step": null,
377
+ "episode_disturbance": 0.002132451383634048
378
+ },
379
+ {
380
+ "episode_seed": 172039,
381
+ "success": false,
382
+ "steps": 4,
383
+ "first_reveal_step": 1,
384
+ "first_retrieve_step": null,
385
+ "episode_disturbance": 0.0008329380843482188
386
+ },
387
+ {
388
+ "episode_seed": 172040,
389
+ "success": true,
390
+ "steps": 2,
391
+ "first_reveal_step": 1,
392
+ "first_retrieve_step": null,
393
+ "episode_disturbance": 0.06136600544187113
394
+ },
395
+ {
396
+ "episode_seed": 172041,
397
+ "success": true,
398
+ "steps": 1,
399
+ "first_reveal_step": 1,
400
+ "first_retrieve_step": null,
401
+ "episode_disturbance": 0.1345306197528089
402
+ },
403
+ {
404
+ "episode_seed": 172042,
405
+ "success": false,
406
+ "steps": 4,
407
+ "first_reveal_step": 1,
408
+ "first_retrieve_step": null,
409
+ "episode_disturbance": 0.15628500139711843
410
+ },
411
+ {
412
+ "episode_seed": 172043,
413
+ "success": false,
414
+ "steps": 4,
415
+ "first_reveal_step": 1,
416
+ "first_retrieve_step": null,
417
+ "episode_disturbance": 0.0589350413731123
418
+ },
419
+ {
420
+ "episode_seed": 172044,
421
+ "success": true,
422
+ "steps": 4,
423
+ "first_reveal_step": 1,
424
+ "first_retrieve_step": null,
425
+ "episode_disturbance": 0.0012772400607863332
426
+ },
427
+ {
428
+ "episode_seed": 172045,
429
+ "success": false,
430
+ "steps": 4,
431
+ "first_reveal_step": 1,
432
+ "first_retrieve_step": null,
433
+ "episode_disturbance": 0.014964900854341323
434
+ },
435
+ {
436
+ "episode_seed": 172046,
437
+ "success": false,
438
+ "steps": 4,
439
+ "first_reveal_step": 1,
440
+ "first_retrieve_step": null,
441
+ "episode_disturbance": 0.00010739007165527781
442
+ },
443
+ {
444
+ "episode_seed": 172047,
445
+ "success": false,
446
+ "steps": 4,
447
+ "first_reveal_step": 1,
448
+ "first_retrieve_step": null,
449
+ "episode_disturbance": 0.3118926811146435
450
+ },
451
+ {
452
+ "episode_seed": 172048,
453
+ "success": false,
454
+ "steps": 4,
455
+ "first_reveal_step": 1,
456
+ "first_retrieve_step": null,
457
+ "episode_disturbance": 0.09965736700647154
458
+ },
459
+ {
460
+ "episode_seed": 172049,
461
+ "success": true,
462
+ "steps": 3,
463
+ "first_reveal_step": 1,
464
+ "first_retrieve_step": null,
465
+ "episode_disturbance": 0.17035763711848637
466
+ }
467
+ ],
468
+ "eval_protocol": {
469
+ "track_id": "occlusion_track",
470
+ "suite": "maniskill3",
471
+ "benchmark_task": "PickClutterYCB-v1",
472
+ "role": "target",
473
+ "eval_mode": "adapter_active_ft",
474
+ "seed": 17,
475
+ "episodes": 50,
476
+ "resolution": 224,
477
+ "cameras": [
478
+ "front",
479
+ "left",
480
+ "right"
481
+ ],
482
+ "observation_stack": "rgbd_3cam",
483
+ "action_horizon": 8,
484
+ "action_space": "bimanual_delta_pose",
485
+ "same_test_episodes": true
486
+ },
487
+ "train_spec": {
488
+ "track_id": "occlusion_track",
489
+ "suite": "maniskill3",
490
+ "benchmark_task": "PickClutterYCB-v1",
491
+ "model_variant": "adapter_active_ft",
492
+ "seed": 17,
493
+ "train_demos": 32,
494
+ "val_demos": 8,
495
+ "init_checkpoint_group": "/workspace/workspace/VLAarchtests2/VLAarchtests/artifacts/outputs/r3d_handoff_phase/proxy_interaction_r3d_stage3_clip_rgbd_handoff_compact_phase_seed17/checkpoint_best.pt",
496
+ "optimizer": "adamw",
497
+ "learning_rate": 0.0001,
498
+ "lr_schedule": "constant",
499
+ "batch_size": 4,
500
+ "augmentations": "none",
501
+ "early_stopping_metric": "val_total",
502
+ "max_gradient_steps": 144,
503
+ "unfreeze_scope": "fusion_memory_decoder",
504
+ "dataset_split_id": "pickclutter_smoke_v2_seed17",
505
+ "same_data_policy": true,
506
+ "same_init_policy": true
507
+ }
508
+ }
reports/maniskill_pickclutter_smoke_v2/adapter_noop_seed17.json ADDED
@@ -0,0 +1,508 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "track_id": "occlusion_track",
3
+ "suite": "maniskill3",
4
+ "benchmark_task": "PickClutterYCB-v1",
5
+ "role": "target",
6
+ "adapter_mode": "adapter_noop",
7
+ "episodes": 50,
8
+ "successes": [
9
+ 0,
10
+ 0,
11
+ 1,
12
+ 0,
13
+ 0,
14
+ 0,
15
+ 0,
16
+ 0,
17
+ 0,
18
+ 0,
19
+ 0,
20
+ 1,
21
+ 0,
22
+ 0,
23
+ 0,
24
+ 0,
25
+ 1,
26
+ 0,
27
+ 1,
28
+ 0,
29
+ 1,
30
+ 0,
31
+ 0,
32
+ 0,
33
+ 0,
34
+ 1,
35
+ 0,
36
+ 0,
37
+ 0,
38
+ 0,
39
+ 1,
40
+ 1,
41
+ 1,
42
+ 0,
43
+ 1,
44
+ 1,
45
+ 0,
46
+ 0,
47
+ 1,
48
+ 0,
49
+ 1,
50
+ 1,
51
+ 0,
52
+ 0,
53
+ 1,
54
+ 0,
55
+ 0,
56
+ 0,
57
+ 0,
58
+ 1
59
+ ],
60
+ "success_rate": 0.32,
61
+ "intervention_rate": 0.0,
62
+ "non_base_selection_rate": 0.0,
63
+ "steps_to_first_reveal_or_access": 1.0,
64
+ "steps_to_retrieve": 4.0,
65
+ "disturbance_proxy": 0.1261227352138143,
66
+ "episode_records": [
67
+ {
68
+ "episode_seed": 172000,
69
+ "success": false,
70
+ "steps": 4,
71
+ "first_reveal_step": 1,
72
+ "first_retrieve_step": null,
73
+ "episode_disturbance": 0.11835007230072728
74
+ },
75
+ {
76
+ "episode_seed": 172001,
77
+ "success": false,
78
+ "steps": 4,
79
+ "first_reveal_step": 1,
80
+ "first_retrieve_step": null,
81
+ "episode_disturbance": 0.16761024718687167
82
+ },
83
+ {
84
+ "episode_seed": 172002,
85
+ "success": true,
86
+ "steps": 1,
87
+ "first_reveal_step": 1,
88
+ "first_retrieve_step": null,
89
+ "episode_disturbance": 0.0019509782725606326
90
+ },
91
+ {
92
+ "episode_seed": 172003,
93
+ "success": false,
94
+ "steps": 4,
95
+ "first_reveal_step": 1,
96
+ "first_retrieve_step": null,
97
+ "episode_disturbance": 7.148081446217702e-05
98
+ },
99
+ {
100
+ "episode_seed": 172004,
101
+ "success": false,
102
+ "steps": 4,
103
+ "first_reveal_step": 1,
104
+ "first_retrieve_step": null,
105
+ "episode_disturbance": 0.1784248970780015
106
+ },
107
+ {
108
+ "episode_seed": 172005,
109
+ "success": false,
110
+ "steps": 4,
111
+ "first_reveal_step": 1,
112
+ "first_retrieve_step": null,
113
+ "episode_disturbance": 0.09801531238412764
114
+ },
115
+ {
116
+ "episode_seed": 172006,
117
+ "success": false,
118
+ "steps": 4,
119
+ "first_reveal_step": 1,
120
+ "first_retrieve_step": null,
121
+ "episode_disturbance": 0.0005962321008468051
122
+ },
123
+ {
124
+ "episode_seed": 172007,
125
+ "success": false,
126
+ "steps": 4,
127
+ "first_reveal_step": 1,
128
+ "first_retrieve_step": null,
129
+ "episode_disturbance": 0.1259510057686978
130
+ },
131
+ {
132
+ "episode_seed": 172008,
133
+ "success": false,
134
+ "steps": 4,
135
+ "first_reveal_step": 1,
136
+ "first_retrieve_step": null,
137
+ "episode_disturbance": 0.11488150802027317
138
+ },
139
+ {
140
+ "episode_seed": 172009,
141
+ "success": false,
142
+ "steps": 4,
143
+ "first_reveal_step": 1,
144
+ "first_retrieve_step": null,
145
+ "episode_disturbance": 0.04447960518379812
146
+ },
147
+ {
148
+ "episode_seed": 172010,
149
+ "success": false,
150
+ "steps": 4,
151
+ "first_reveal_step": 1,
152
+ "first_retrieve_step": null,
153
+ "episode_disturbance": 0.28255011429793786
154
+ },
155
+ {
156
+ "episode_seed": 172011,
157
+ "success": true,
158
+ "steps": 3,
159
+ "first_reveal_step": 1,
160
+ "first_retrieve_step": null,
161
+ "episode_disturbance": 0.04106344052554118
162
+ },
163
+ {
164
+ "episode_seed": 172012,
165
+ "success": false,
166
+ "steps": 4,
167
+ "first_reveal_step": 1,
168
+ "first_retrieve_step": null,
169
+ "episode_disturbance": 0.07076599070619194
170
+ },
171
+ {
172
+ "episode_seed": 172013,
173
+ "success": false,
174
+ "steps": 4,
175
+ "first_reveal_step": 1,
176
+ "first_retrieve_step": null,
177
+ "episode_disturbance": 0.13973692647627903
178
+ },
179
+ {
180
+ "episode_seed": 172014,
181
+ "success": false,
182
+ "steps": 4,
183
+ "first_reveal_step": 1,
184
+ "first_retrieve_step": null,
185
+ "episode_disturbance": 0.004788672381939665
186
+ },
187
+ {
188
+ "episode_seed": 172015,
189
+ "success": false,
190
+ "steps": 4,
191
+ "first_reveal_step": 1,
192
+ "first_retrieve_step": null,
193
+ "episode_disturbance": 0.28083725664289716
194
+ },
195
+ {
196
+ "episode_seed": 172016,
197
+ "success": true,
198
+ "steps": 1,
199
+ "first_reveal_step": 1,
200
+ "first_retrieve_step": null,
201
+ "episode_disturbance": 1.0
202
+ },
203
+ {
204
+ "episode_seed": 172017,
205
+ "success": false,
206
+ "steps": 4,
207
+ "first_reveal_step": 1,
208
+ "first_retrieve_step": null,
209
+ "episode_disturbance": 0.1641496366673234
210
+ },
211
+ {
212
+ "episode_seed": 172018,
213
+ "success": true,
214
+ "steps": 1,
215
+ "first_reveal_step": 1,
216
+ "first_retrieve_step": null,
217
+ "episode_disturbance": 4.383633944371468e-05
218
+ },
219
+ {
220
+ "episode_seed": 172019,
221
+ "success": false,
222
+ "steps": 4,
223
+ "first_reveal_step": 1,
224
+ "first_retrieve_step": null,
225
+ "episode_disturbance": 0.25721585358608956
226
+ },
227
+ {
228
+ "episode_seed": 172020,
229
+ "success": true,
230
+ "steps": 3,
231
+ "first_reveal_step": 1,
232
+ "first_retrieve_step": null,
233
+ "episode_disturbance": 0.17401533717143602
234
+ },
235
+ {
236
+ "episode_seed": 172021,
237
+ "success": false,
238
+ "steps": 4,
239
+ "first_reveal_step": 1,
240
+ "first_retrieve_step": null,
241
+ "episode_disturbance": 0.006582688272562364
242
+ },
243
+ {
244
+ "episode_seed": 172022,
245
+ "success": false,
246
+ "steps": 4,
247
+ "first_reveal_step": 1,
248
+ "first_retrieve_step": null,
249
+ "episode_disturbance": 0.061462426746240105
250
+ },
251
+ {
252
+ "episode_seed": 172023,
253
+ "success": false,
254
+ "steps": 4,
255
+ "first_reveal_step": 1,
256
+ "first_retrieve_step": null,
257
+ "episode_disturbance": 0.26208380581626045
258
+ },
259
+ {
260
+ "episode_seed": 172024,
261
+ "success": false,
262
+ "steps": 4,
263
+ "first_reveal_step": 1,
264
+ "first_retrieve_step": null,
265
+ "episode_disturbance": 0.17481319658276814
266
+ },
267
+ {
268
+ "episode_seed": 172025,
269
+ "success": true,
270
+ "steps": 2,
271
+ "first_reveal_step": 1,
272
+ "first_retrieve_step": null,
273
+ "episode_disturbance": 0.011393342883305735
274
+ },
275
+ {
276
+ "episode_seed": 172026,
277
+ "success": false,
278
+ "steps": 4,
279
+ "first_reveal_step": 1,
280
+ "first_retrieve_step": null,
281
+ "episode_disturbance": 0.040603790066086276
282
+ },
283
+ {
284
+ "episode_seed": 172027,
285
+ "success": false,
286
+ "steps": 4,
287
+ "first_reveal_step": 1,
288
+ "first_retrieve_step": null,
289
+ "episode_disturbance": 0.001898237613124465
290
+ },
291
+ {
292
+ "episode_seed": 172028,
293
+ "success": false,
294
+ "steps": 4,
295
+ "first_reveal_step": 1,
296
+ "first_retrieve_step": null,
297
+ "episode_disturbance": 0.1535773960429528
298
+ },
299
+ {
300
+ "episode_seed": 172029,
301
+ "success": false,
302
+ "steps": 4,
303
+ "first_reveal_step": 1,
304
+ "first_retrieve_step": null,
305
+ "episode_disturbance": 2.6297170183653403e-05
306
+ },
307
+ {
308
+ "episode_seed": 172030,
309
+ "success": true,
310
+ "steps": 3,
311
+ "first_reveal_step": 1,
312
+ "first_retrieve_step": null,
313
+ "episode_disturbance": 0.23568911686727625
314
+ },
315
+ {
316
+ "episode_seed": 172031,
317
+ "success": true,
318
+ "steps": 2,
319
+ "first_reveal_step": 1,
320
+ "first_retrieve_step": null,
321
+ "episode_disturbance": 0.05458565396336822
322
+ },
323
+ {
324
+ "episode_seed": 172032,
325
+ "success": true,
326
+ "steps": 2,
327
+ "first_reveal_step": 1,
328
+ "first_retrieve_step": null,
329
+ "episode_disturbance": 0.23615429148293285
330
+ },
331
+ {
332
+ "episode_seed": 172033,
333
+ "success": false,
334
+ "steps": 4,
335
+ "first_reveal_step": 1,
336
+ "first_retrieve_step": null,
337
+ "episode_disturbance": 0.3794685144275167
338
+ },
339
+ {
340
+ "episode_seed": 172034,
341
+ "success": true,
342
+ "steps": 2,
343
+ "first_reveal_step": 1,
344
+ "first_retrieve_step": null,
345
+ "episode_disturbance": 0.23963101771263
346
+ },
347
+ {
348
+ "episode_seed": 172035,
349
+ "success": true,
350
+ "steps": 3,
351
+ "first_reveal_step": 1,
352
+ "first_retrieve_step": null,
353
+ "episode_disturbance": 0.1458236509853299
354
+ },
355
+ {
356
+ "episode_seed": 172036,
357
+ "success": false,
358
+ "steps": 4,
359
+ "first_reveal_step": 1,
360
+ "first_retrieve_step": null,
361
+ "episode_disturbance": 0.0005504064674610731
362
+ },
363
+ {
364
+ "episode_seed": 172037,
365
+ "success": false,
366
+ "steps": 4,
367
+ "first_reveal_step": 1,
368
+ "first_retrieve_step": null,
369
+ "episode_disturbance": 0.02395525002599186
370
+ },
371
+ {
372
+ "episode_seed": 172038,
373
+ "success": true,
374
+ "steps": 4,
375
+ "first_reveal_step": 1,
376
+ "first_retrieve_step": null,
377
+ "episode_disturbance": 0.002132451383634048
378
+ },
379
+ {
380
+ "episode_seed": 172039,
381
+ "success": false,
382
+ "steps": 4,
383
+ "first_reveal_step": 1,
384
+ "first_retrieve_step": null,
385
+ "episode_disturbance": 0.0008329380843482188
386
+ },
387
+ {
388
+ "episode_seed": 172040,
389
+ "success": true,
390
+ "steps": 2,
391
+ "first_reveal_step": 1,
392
+ "first_retrieve_step": null,
393
+ "episode_disturbance": 0.06136600544187113
394
+ },
395
+ {
396
+ "episode_seed": 172041,
397
+ "success": true,
398
+ "steps": 1,
399
+ "first_reveal_step": 1,
400
+ "first_retrieve_step": null,
401
+ "episode_disturbance": 0.1345306197528089
402
+ },
403
+ {
404
+ "episode_seed": 172042,
405
+ "success": false,
406
+ "steps": 4,
407
+ "first_reveal_step": 1,
408
+ "first_retrieve_step": null,
409
+ "episode_disturbance": 0.15628500139711843
410
+ },
411
+ {
412
+ "episode_seed": 172043,
413
+ "success": false,
414
+ "steps": 4,
415
+ "first_reveal_step": 1,
416
+ "first_retrieve_step": null,
417
+ "episode_disturbance": 0.0589350413731123
418
+ },
419
+ {
420
+ "episode_seed": 172044,
421
+ "success": true,
422
+ "steps": 4,
423
+ "first_reveal_step": 1,
424
+ "first_retrieve_step": null,
425
+ "episode_disturbance": 0.0012772400607863332
426
+ },
427
+ {
428
+ "episode_seed": 172045,
429
+ "success": false,
430
+ "steps": 4,
431
+ "first_reveal_step": 1,
432
+ "first_retrieve_step": null,
433
+ "episode_disturbance": 0.014964900854341323
434
+ },
435
+ {
436
+ "episode_seed": 172046,
437
+ "success": false,
438
+ "steps": 4,
439
+ "first_reveal_step": 1,
440
+ "first_retrieve_step": null,
441
+ "episode_disturbance": 0.00010739007165527781
442
+ },
443
+ {
444
+ "episode_seed": 172047,
445
+ "success": false,
446
+ "steps": 4,
447
+ "first_reveal_step": 1,
448
+ "first_retrieve_step": null,
449
+ "episode_disturbance": 0.3118926811146435
450
+ },
451
+ {
452
+ "episode_seed": 172048,
453
+ "success": false,
454
+ "steps": 4,
455
+ "first_reveal_step": 1,
456
+ "first_retrieve_step": null,
457
+ "episode_disturbance": 0.09965736700647154
458
+ },
459
+ {
460
+ "episode_seed": 172049,
461
+ "success": true,
462
+ "steps": 3,
463
+ "first_reveal_step": 1,
464
+ "first_retrieve_step": null,
465
+ "episode_disturbance": 0.17035763711848637
466
+ }
467
+ ],
468
+ "eval_protocol": {
469
+ "track_id": "occlusion_track",
470
+ "suite": "maniskill3",
471
+ "benchmark_task": "PickClutterYCB-v1",
472
+ "role": "target",
473
+ "eval_mode": "adapter_noop",
474
+ "seed": 17,
475
+ "episodes": 50,
476
+ "resolution": 224,
477
+ "cameras": [
478
+ "front",
479
+ "left",
480
+ "right"
481
+ ],
482
+ "observation_stack": "rgbd_3cam",
483
+ "action_horizon": 8,
484
+ "action_space": "bimanual_delta_pose",
485
+ "same_test_episodes": true
486
+ },
487
+ "train_spec": {
488
+ "track_id": "occlusion_track",
489
+ "suite": "maniskill3",
490
+ "benchmark_task": "PickClutterYCB-v1",
491
+ "model_variant": "adapter_active_ft",
492
+ "seed": 17,
493
+ "train_demos": 32,
494
+ "val_demos": 8,
495
+ "init_checkpoint_group": "/workspace/workspace/VLAarchtests2/VLAarchtests/artifacts/outputs/r3d_handoff_phase/proxy_interaction_r3d_stage3_clip_rgbd_handoff_compact_phase_seed17/checkpoint_best.pt",
496
+ "optimizer": "adamw",
497
+ "learning_rate": 0.0001,
498
+ "lr_schedule": "constant",
499
+ "batch_size": 4,
500
+ "augmentations": "none",
501
+ "early_stopping_metric": "val_total",
502
+ "max_gradient_steps": 144,
503
+ "unfreeze_scope": "fusion_memory_decoder",
504
+ "dataset_split_id": "pickclutter_smoke_v2_seed17",
505
+ "same_data_policy": true,
506
+ "same_init_policy": true
507
+ }
508
+ }
reports/maniskill_pickclutter_smoke_v2/public_benchmark_package_summary.json ADDED
@@ -0,0 +1,62 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "anchor_pass": true,
3
+ "available_tracks": [
4
+ "occlusion_track"
5
+ ],
6
+ "ci_above_zero_tracks": [
7
+ "occlusion_track"
8
+ ],
9
+ "headline_pass": true,
10
+ "package_name": "public_reveal_retrieve_package_v1",
11
+ "sign_of_life_pass": false,
12
+ "sign_of_life_track_count": 0,
13
+ "sign_of_life_tracks": [],
14
+ "target_macro_average_delta": 0.2799999937415123,
15
+ "tracks": {
16
+ "occlusion_track": {
17
+ "benchmark_task": "PickClutterYCB-v1",
18
+ "delta_active_vs_trunk": 0.2799999937415123,
19
+ "delta_active_vs_trunk_ci95": [
20
+ 0.14000000059604645,
21
+ 0.42050001621246064
22
+ ],
23
+ "delta_noop_vs_trunk": 0.2799999937415123,
24
+ "modes": {
25
+ "adapter_active_ft": {
26
+ "disturbance_proxy": 0.1261227352138143,
27
+ "intervention_rate": 0.0,
28
+ "mean_success": 0.3199999928474426,
29
+ "non_base_selection_rate": 0.0,
30
+ "num_runs": 1,
31
+ "steps_to_first_reveal_or_access": 1.0,
32
+ "steps_to_retrieve": 4.0
33
+ },
34
+ "adapter_noop": {
35
+ "disturbance_proxy": 0.1261227352138143,
36
+ "intervention_rate": 0.0,
37
+ "mean_success": 0.3199999928474426,
38
+ "non_base_selection_rate": 0.0,
39
+ "num_runs": 1,
40
+ "steps_to_first_reveal_or_access": 1.0,
41
+ "steps_to_retrieve": 4.0
42
+ },
43
+ "trunk_only_ft": {
44
+ "disturbance_proxy": 0.22772394362117063,
45
+ "intervention_rate": 0.0,
46
+ "mean_success": 0.03999999910593033,
47
+ "non_base_selection_rate": 0.0,
48
+ "num_runs": 1,
49
+ "steps_to_first_reveal_or_access": 1.0,
50
+ "steps_to_retrieve": 4.0
51
+ }
52
+ },
53
+ "notes": "Closest maintained public occluded retrieval task. Treat as the canopy / dense occlusion proxy.",
54
+ "public_source": "https://maniskill.readthedocs.io/en/latest/tasks/table_top_gripper/index.html",
55
+ "role": "target",
56
+ "signs_of_life": false,
57
+ "suite": "maniskill3",
58
+ "target_behavior": "retrieve a target object from dense occluding clutter",
59
+ "task_family": "dense_occluded_retrieval"
60
+ }
61
+ }
62
+ }
reports/maniskill_pickclutter_smoke_v2/public_benchmark_package_summary.md ADDED
@@ -0,0 +1,14 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ # ManiSkill PickClutter Smoke Summary
2
+
3
+ - available_tracks: ['occlusion_track']
4
+ - target_macro_average_delta: 0.280
5
+ - headline_pass: True
6
+ - sign_of_life_pass: False
7
+
8
+ ## occlusion_track
9
+ - delta_active_vs_trunk: 0.280
10
+ - delta_noop_vs_trunk: 0.280
11
+ - signs_of_life: False
12
+ - trunk_only_ft: mean_success=0.040
13
+ - adapter_noop: mean_success=0.320
14
+ - adapter_active_ft: mean_success=0.320