Add files using upload-large-folder tool
Browse files
This view is limited to 50 files because it contains too many changes. See raw diff
- MODEL_AND_ARTIFACT_INDEX.md +47 -0
- README.md +363 -0
- code/VLAarchtests2_code/VLAarchtests/.pytest_cache/.gitignore +2 -0
- code/VLAarchtests2_code/VLAarchtests/.pytest_cache/CACHEDIR.TAG +4 -0
- code/VLAarchtests2_code/VLAarchtests/.pytest_cache/README.md +8 -0
- code/VLAarchtests2_code/VLAarchtests/.pytest_cache/v/cache/lastfailed +1 -0
- code/VLAarchtests2_code/VLAarchtests/.pytest_cache/v/cache/nodeids +11 -0
- code/VLAarchtests2_code/VLAarchtests/artifacts/generated_configs/public_benchmark_package_v1.json +80 -0
- code/VLAarchtests2_code/VLAarchtests/code/reveal_vla_bimanual/sim_reveal/__pycache__/__init__.cpython-310.pyc +0 -0
- code/VLAarchtests2_code/VLAarchtests/code/reveal_vla_bimanual/sim_reveal/__pycache__/__init__.cpython-311.pyc +0 -0
- code/VLAarchtests2_code/VLAarchtests/code/reveal_vla_bimanual/sim_reveal/__pycache__/base.cpython-310.pyc +0 -0
- code/VLAarchtests2_code/VLAarchtests/code/reveal_vla_bimanual/sim_reveal/__pycache__/procedural_envs.cpython-310.pyc +0 -0
- code/VLAarchtests2_code/VLAarchtests/code/reveal_vla_bimanual/sim_reveal/__pycache__/proxy_specs.cpython-310.pyc +0 -0
- docs/maniskill_pickclutter_correction_log_2026-04-01.md +187 -0
- docs/minimum_sign_of_life_maniskill_pickclutter_run_2026-04-01.md +134 -0
- docs/public_benchmark_progress_2026-04-01.md +91 -0
- docs/public_bridge_smoke_run_log_2026-04-01.md +116 -0
- reports/anchor_dual_push_smoke/original_trunk/rollout_eval.partial.json +29 -0
- reports/anybimanual_anchor_bridge_live/trunk_only_ep5/stderr.txt +20 -0
- reports/maniskill_bag_bridge_val_sweep_seed23/conservative/adapter_active_ft_seed23.json +131 -0
- reports/maniskill_bag_bridge_val_sweep_seed23/conservative/adapter_noop_seed23.json +110 -0
- reports/maniskill_bag_bridge_val_sweep_seed23/conservative/run.log +76 -0
- reports/maniskill_bag_bridge_val_sweep_seed23/default/adapter_active_ft_seed23.json +131 -0
- reports/maniskill_bag_bridge_val_sweep_seed23/default/adapter_noop_seed23.json +110 -0
- reports/maniskill_bag_bridge_val_sweep_seed23/default/public_benchmark_package_summary.json +60 -0
- reports/maniskill_bag_bridge_val_sweep_seed23/default/public_benchmark_package_summary.md +15 -0
- reports/maniskill_bag_bridge_val_sweep_seed23/default/run.log +76 -0
- reports/maniskill_bag_bridge_val_sweep_seed23/default/trunk_only_ft_seed23.json +131 -0
- reports/maniskill_bag_bridge_val_sweep_seed23/less_bonus/public_benchmark_package_summary.md +15 -0
- reports/maniskill_bag_bridge_val_sweep_seed23/less_bonus/trunk_only_ft_seed23.json +131 -0
- reports/maniskill_bag_bridge_val_sweep_seed23/low_bonus_high_thresh/adapter_noop_seed23.json +110 -0
- reports/maniskill_bag_bridge_val_sweep_seed23/low_bonus_high_thresh/public_benchmark_package_summary.json +60 -0
- reports/maniskill_bag_bridge_val_sweep_seed23/low_bonus_high_thresh/public_benchmark_package_summary.md +15 -0
- reports/maniskill_bag_bridge_val_sweep_seed23/low_bonus_high_thresh/run.log +76 -0
- reports/maniskill_bag_bridge_val_sweep_seed23/low_bonus_high_thresh/trunk_only_ft_seed23.json +131 -0
- reports/maniskill_cloth_bridge_smoke_v1/adapter_active_ft_seed17.json +509 -0
- reports/maniskill_cloth_bridge_smoke_v1/adapter_active_ft_seed23.json +509 -0
- reports/maniskill_cloth_bridge_smoke_v1/adapter_active_ft_seed29.json +509 -0
- reports/maniskill_cloth_bridge_smoke_v1/adapter_noop_seed17.json +488 -0
- reports/maniskill_cloth_bridge_smoke_v1/adapter_noop_seed23.json +488 -0
- reports/maniskill_cloth_bridge_smoke_v1/adapter_noop_seed29.json +488 -0
- reports/maniskill_cloth_bridge_smoke_v1/public_benchmark_package_summary.json +60 -0
- reports/maniskill_cloth_bridge_smoke_v1/public_benchmark_package_summary.md +15 -0
- reports/maniskill_cloth_bridge_smoke_v1/trunk_only_ft_seed17.json +509 -0
- reports/maniskill_cloth_bridge_smoke_v1/trunk_only_ft_seed23.json +509 -0
- reports/maniskill_cloth_bridge_smoke_v1/trunk_only_ft_seed29.json +509 -0
- reports/maniskill_pickclutter_smoke_v2/adapter_active_ft_seed17.json +508 -0
- reports/maniskill_pickclutter_smoke_v2/adapter_noop_seed17.json +508 -0
- reports/maniskill_pickclutter_smoke_v2/public_benchmark_package_summary.json +62 -0
- reports/maniskill_pickclutter_smoke_v2/public_benchmark_package_summary.md +14 -0
MODEL_AND_ARTIFACT_INDEX.md
ADDED
|
@@ -0,0 +1,47 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
# Model And Artifact Index
|
| 2 |
+
|
| 3 |
+
## Main Code Roots
|
| 4 |
+
|
| 5 |
+
- `code/VLAarchtests2_code/VLAarchtests/code/reveal_vla_bimanual/`
|
| 6 |
+
- `code/VLAarchtests2_code/VLAarchtests/tests/`
|
| 7 |
+
|
| 8 |
+
## Main Prior Handoff Roots
|
| 9 |
+
|
| 10 |
+
- `artifacts/`
|
| 11 |
+
- `docs/`
|
| 12 |
+
- `legacy/`
|
| 13 |
+
- `setup/`
|
| 14 |
+
|
| 15 |
+
## Main Current Public Benchmark Roots
|
| 16 |
+
|
| 17 |
+
- `reports/maniskill_pickclutter_smoke_v5_eval_tuned_softerpref/`
|
| 18 |
+
- strongest current dense-occlusion result
|
| 19 |
+
- `reports/maniskill_bag_bridge_eval_less_bonus_seed17/`
|
| 20 |
+
- `reports/maniskill_bag_bridge_eval_less_bonus_seed23/`
|
| 21 |
+
- `reports/maniskill_bag_bridge_eval_less_bonus_2seed_manual_summary.json`
|
| 22 |
+
- `reports/maniskill_cloth_bridge_smoke_v1/`
|
| 23 |
+
- `reports/maniskill_cloth_bridge_val_sweep_seed23/`
|
| 24 |
+
|
| 25 |
+
## Main Current Checkpoint Roots
|
| 26 |
+
|
| 27 |
+
- `outputs/maniskill_pickclutter_smoke_v5/`
|
| 28 |
+
- `outputs/maniskill_bag_bridge_smoke_v1/`
|
| 29 |
+
- `outputs/maniskill_cloth_bridge_smoke_v1/`
|
| 30 |
+
|
| 31 |
+
## Main Current Dataset Roots
|
| 32 |
+
|
| 33 |
+
- `data/maniskill_pickclutter/`
|
| 34 |
+
- `data/maniskill_bridge_retrieval/`
|
| 35 |
+
- `data/reveal_proxy/`
|
| 36 |
+
|
| 37 |
+
## Main Current Docs
|
| 38 |
+
|
| 39 |
+
- `docs/maniskill_pickclutter_correction_log_2026-04-01.md`
|
| 40 |
+
- `docs/public_bridge_smoke_run_log_2026-04-01.md`
|
| 41 |
+
- `docs/minimum_sign_of_life_maniskill_pickclutter_run_2026-04-01.md`
|
| 42 |
+
|
| 43 |
+
## Repo History
|
| 44 |
+
|
| 45 |
+
- `history/VLAarchtests_previous_README.md`
|
| 46 |
+
- `history/VLAarchtests2_previous_README.md`
|
| 47 |
+
- `history/VLAarchtests3_previous_README.md`
|
README.md
ADDED
|
@@ -0,0 +1,363 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
# VLAarchtests4
|
| 2 |
+
|
| 3 |
+
`VLAarchtests4` is the fresh organization repo for the RunPod work staged from `/workspace` on `2026-04-01 UTC`.
|
| 4 |
+
|
| 5 |
+
It carries forward the earlier repo lineage and adds the current public-sim benchmark package work:
|
| 6 |
+
|
| 7 |
+
- `VLAarchtests`
|
| 8 |
+
- early proxy + RLBench architecture search, handoff checkpoints, and environment recreation files from the `2026-03-25/26` sessions
|
| 9 |
+
- `VLAarchtests2`
|
| 10 |
+
- larger exploratory organization repo with more baselines, overlap/anchor work, frequent model changes, mixed artifacts, and several results that required later reinterpretation
|
| 11 |
+
- `VLAarchtests3`
|
| 12 |
+
- cleaned export focused on the elastic-occlusion `trunk + structured adapter + no-op fallback` refactor, validated tests, current checkpoints, and handoff docs
|
| 13 |
+
- `VLAarchtests4`
|
| 14 |
+
- keeps the `VLAarchtests3` export intact and adds the full current workspace `reports/`, `outputs/`, and `data/` trees, including all public benchmark smoke runs, checkpoint directories, dataset bundles, validation sweeps, and environment snapshots from the public-sim evaluation pass
|
| 15 |
+
|
| 16 |
+
## What This Repo Adds
|
| 17 |
+
|
| 18 |
+
The main new addition in this repo is the public benchmark track work for the elastic-occlusion adapter:
|
| 19 |
+
|
| 20 |
+
- real public-sim smoke runs on:
|
| 21 |
+
- ManiSkill `PickClutterYCB-v1` as the dense occluded retrieval proxy
|
| 22 |
+
- ManiSkill bridge basket retrieval proxy as the bag retrieval proxy
|
| 23 |
+
- ManiSkill bridge cloth retrieval proxy as the folded-cloth retrieval proxy
|
| 24 |
+
- the public benchmark package code and summaries
|
| 25 |
+
- the train/eval logs, checkpoints, cached datasets, validation sweeps, and correction logs for those runs
|
| 26 |
+
- the same-machine environment snapshot for the public benchmark stack used on this RunPod
|
| 27 |
+
|
| 28 |
+
## Top-Level Contents
|
| 29 |
+
|
| 30 |
+
- `code/`
|
| 31 |
+
- the cleaned code snapshot inherited from `VLAarchtests3`
|
| 32 |
+
- `artifacts/`
|
| 33 |
+
- prior staged checkpoints, proxy data, reports, and generated configs already bundled by `VLAarchtests3`
|
| 34 |
+
- `docs/`
|
| 35 |
+
- prior handoff/audit docs plus the current public benchmark run logs and correction notes
|
| 36 |
+
- `legacy/`
|
| 37 |
+
- older exact artifacts preserved by `VLAarchtests3`
|
| 38 |
+
- `setup/`
|
| 39 |
+
- prior environment files plus a new public benchmark environment snapshot under `setup/public_benchmark/`
|
| 40 |
+
- `history/`
|
| 41 |
+
- copied README history for `VLAarchtests`, `VLAarchtests2`, and `VLAarchtests3`
|
| 42 |
+
- `reports/`
|
| 43 |
+
- the full current `/workspace/workspace/reports` tree from this machine
|
| 44 |
+
- `outputs/`
|
| 45 |
+
- the full current `/workspace/workspace/outputs` tree from this machine
|
| 46 |
+
- `data/`
|
| 47 |
+
- the full current `/workspace/workspace/data` tree from this machine
|
| 48 |
+
- `PUBLIC_BENCHMARK_RESULTS.md`
|
| 49 |
+
- compact index of all public benchmark train/eval results from this session
|
| 50 |
+
- `MODEL_AND_ARTIFACT_INDEX.md`
|
| 51 |
+
- practical map of the main artifact roots to start from
|
| 52 |
+
|
| 53 |
+
## Architecture State Carried Forward
|
| 54 |
+
|
| 55 |
+
The core model family inherited from `VLAarchtests3` is still:
|
| 56 |
+
|
| 57 |
+
- `trunk_only`
|
| 58 |
+
- `adapter_noop`
|
| 59 |
+
- `adapter_active`
|
| 60 |
+
|
| 61 |
+
The important architectural state carried into the public benchmark work is:
|
| 62 |
+
|
| 63 |
+
- wrapped-policy interface with exact `trunk_only`, `adapter_noop`, and `adapter_active` modes
|
| 64 |
+
- structured reveal/retrieve adapter with:
|
| 65 |
+
- state prediction
|
| 66 |
+
- task-routed proposal families
|
| 67 |
+
- retrieve-feasibility gating
|
| 68 |
+
- lightweight transition model
|
| 69 |
+
- planner/reranker
|
| 70 |
+
- planner fixes that replaced hard vetoes with softer stage penalties in:
|
| 71 |
+
- `code/VLAarchtests2_code/VLAarchtests/code/reveal_vla_bimanual/models/planner.py`
|
| 72 |
+
|
| 73 |
+
## Public Benchmark Summary
|
| 74 |
+
|
| 75 |
+
Detailed per-run results are in `PUBLIC_BENCHMARK_RESULTS.md`. The short version is:
|
| 76 |
+
|
| 77 |
+
### 1. Dense occluded retrieval proxy
|
| 78 |
+
|
| 79 |
+
Benchmark:
|
| 80 |
+
|
| 81 |
+
- ManiSkill `PickClutterYCB-v1`
|
| 82 |
+
|
| 83 |
+
Best current held-out result:
|
| 84 |
+
|
| 85 |
+
- directory:
|
| 86 |
+
- `reports/maniskill_pickclutter_smoke_v5_eval_tuned_softerpref/`
|
| 87 |
+
- summary:
|
| 88 |
+
- `trunk_only_ft = 0.04`
|
| 89 |
+
- `adapter_noop = 0.04`
|
| 90 |
+
- `adapter_active_ft = 0.62`
|
| 91 |
+
- `delta_active_vs_trunk = +0.58`
|
| 92 |
+
- `95% CI for delta_active_vs_trunk = [0.44, 0.72]`
|
| 93 |
+
- `intervention_rate = 1.0`
|
| 94 |
+
- `non_base_selection_rate = 1.0`
|
| 95 |
+
|
| 96 |
+
Important caveat:
|
| 97 |
+
|
| 98 |
+
- this was not a new retrain after `smoke_v5`
|
| 99 |
+
- it used the same `smoke_v5` checkpoints with planner hyperparameters selected on the frozen validation split and then applied once to the untouched held-out split
|
| 100 |
+
|
| 101 |
+
### 2. Bag retrieval proxy
|
| 102 |
+
|
| 103 |
+
Benchmark:
|
| 104 |
+
|
| 105 |
+
- public ManiSkill bridge basket retrieval proxy
|
| 106 |
+
|
| 107 |
+
Current fair read:
|
| 108 |
+
|
| 109 |
+
- seed `17` corrected held-out:
|
| 110 |
+
- `trunk = 0.32`
|
| 111 |
+
- `noop = 0.00`
|
| 112 |
+
- `active = 0.48`
|
| 113 |
+
- seed `23` corrected held-out:
|
| 114 |
+
- `trunk = 0.48`
|
| 115 |
+
- `noop = 0.08`
|
| 116 |
+
- `active = 0.48`
|
| 117 |
+
- corrected 2-seed aggregate:
|
| 118 |
+
- `trunk = 0.40`
|
| 119 |
+
- `noop = 0.04`
|
| 120 |
+
- `active = 0.48`
|
| 121 |
+
- `delta = +0.08`
|
| 122 |
+
|
| 123 |
+
Interpretation:
|
| 124 |
+
|
| 125 |
+
- bag remains modestly positive after using one consistent corrected planner across seeds
|
| 126 |
+
- the effect is smaller and less clean than the best occlusion result
|
| 127 |
+
|
| 128 |
+
### 3. Cloth retrieval proxy
|
| 129 |
+
|
| 130 |
+
Benchmark:
|
| 131 |
+
|
| 132 |
+
- public ManiSkill bridge cloth retrieval proxy
|
| 133 |
+
|
| 134 |
+
Current read:
|
| 135 |
+
|
| 136 |
+
- seed `17`:
|
| 137 |
+
- `trunk = 0.04`
|
| 138 |
+
- `noop = 0.04`
|
| 139 |
+
- `active = 0.10`
|
| 140 |
+
- seed `23`:
|
| 141 |
+
- `trunk = 0.04`
|
| 142 |
+
- `noop = 0.02`
|
| 143 |
+
- `active = 0.02`
|
| 144 |
+
- seed `29`:
|
| 145 |
+
- `trunk = 0.04`
|
| 146 |
+
- `noop = 0.04`
|
| 147 |
+
- `active = 0.04`
|
| 148 |
+
- 3-seed aggregate:
|
| 149 |
+
- `trunk = 0.0400`
|
| 150 |
+
- `noop = 0.0333`
|
| 151 |
+
- `active = 0.0533`
|
| 152 |
+
- `delta = +0.0133`
|
| 153 |
+
|
| 154 |
+
Interpretation:
|
| 155 |
+
|
| 156 |
+
- cloth is weak and unstable
|
| 157 |
+
- current evidence does not support a strong cloth-specific win
|
| 158 |
+
|
| 159 |
+
## Important Fairness Notes
|
| 160 |
+
|
| 161 |
+
The fairness story is mixed and should be stated plainly.
|
| 162 |
+
|
| 163 |
+
What is fair in the strongest public benchmark result:
|
| 164 |
+
|
| 165 |
+
- same initialization checkpoint for `trunk_only_ft` and `adapter_active_ft`
|
| 166 |
+
- same train/val/test split within each task
|
| 167 |
+
- same optimizer, LR, batch size, and unfreeze scope within each task
|
| 168 |
+
- `adapter_noop` is evaluated from the same adapter checkpoint as `adapter_active_ft`
|
| 169 |
+
- the held-out test episodes were not hand-picked after seeing outcomes
|
| 170 |
+
|
| 171 |
+
What is not fully paper-clean yet:
|
| 172 |
+
|
| 173 |
+
- most current public benchmark evidence is smoke-scale and low-seed
|
| 174 |
+
- the occlusion headline result depends on validation-selected planner tuning on top of a fixed checkpoint
|
| 175 |
+
- bag required eval-side planner correction for one seed to avoid a collapse
|
| 176 |
+
- cloth remains weak even after additional seeds and val sweeps
|
| 177 |
+
|
| 178 |
+
### PickClutter Split Fairness
|
| 179 |
+
|
| 180 |
+
The important point for the dense-occlusion track is that the dataset split did not drift across the early smoke versions.
|
| 181 |
+
|
| 182 |
+
- `data/maniskill_pickclutter/smoke_v1/episode_splits.json`
|
| 183 |
+
- `data/maniskill_pickclutter/smoke_v2/episode_splits.json`
|
| 184 |
+
- `data/maniskill_pickclutter/smoke_v3/episode_splits.json`
|
| 185 |
+
|
| 186 |
+
These files contain the same episode ids:
|
| 187 |
+
|
| 188 |
+
- train: `170000..170031`
|
| 189 |
+
- val: `171000..171007`
|
| 190 |
+
- eval: `172000..172049`
|
| 191 |
+
|
| 192 |
+
Also:
|
| 193 |
+
|
| 194 |
+
- there is no `data/maniskill_pickclutter/smoke_v4/`
|
| 195 |
+
- there is no `data/maniskill_pickclutter/smoke_v5/`
|
| 196 |
+
|
| 197 |
+
`smoke_v4` and `smoke_v5` were code/report version labels, not new held-out episode bundles.
|
| 198 |
+
|
| 199 |
+
### What Changed Across PickClutter Versions
|
| 200 |
+
|
| 201 |
+
The big changes across `smoke_v2`, `smoke_v3`, `smoke_v4`, and `smoke_v5` were:
|
| 202 |
+
|
| 203 |
+
- more benchmark-derived state supervision
|
| 204 |
+
- transition-model training enablement
|
| 205 |
+
- planner bug fixes
|
| 206 |
+
- fairness fixes so the adapter checkpoint did not hide a stronger shared trunk
|
| 207 |
+
- then a frozen-validation planner sweep for the final held-out eval
|
| 208 |
+
|
| 209 |
+
The big occlusion win was not caused by changing the eval episodes.
|
| 210 |
+
|
| 211 |
+
## Crucial Caveats
|
| 212 |
+
|
| 213 |
+
### Occlusion result was planner-tuned
|
| 214 |
+
|
| 215 |
+
The large jump in:
|
| 216 |
+
|
| 217 |
+
- `reports/maniskill_pickclutter_smoke_v5_eval_tuned_softerpref/`
|
| 218 |
+
|
| 219 |
+
came from validation-selected planner tuning on top of the same `smoke_v5` checkpoint.
|
| 220 |
+
|
| 221 |
+
The selected override values were:
|
| 222 |
+
|
| 223 |
+
- `mode_preference_bonus = 0.75`
|
| 224 |
+
- `premature_retrieve_penalty = 0.5`
|
| 225 |
+
- `premature_insert_penalty = 0.25`
|
| 226 |
+
- `premature_maintain_penalty = 1.0`
|
| 227 |
+
- `occlusion_maintain_gap_min_access = 0.30`
|
| 228 |
+
- `occlusion_maintain_gap_min_visibility = 0.20`
|
| 229 |
+
- `retrieve_stage_access_threshold = 0.18`
|
| 230 |
+
- `retrieve_stage_reveal_threshold = 0.18`
|
| 231 |
+
- `retrieve_stage_support_threshold = 0.18`
|
| 232 |
+
|
| 233 |
+
That was a validation-only selection step. It was not a fresh retrain.
|
| 234 |
+
|
| 235 |
+
### Bag and cloth did not use real depth
|
| 236 |
+
|
| 237 |
+
The bridge-task runner for the bag and cloth proxies used:
|
| 238 |
+
|
| 239 |
+
- one real RGB camera
|
| 240 |
+
- copied into all camera slots
|
| 241 |
+
- zero-filled depth channels
|
| 242 |
+
|
| 243 |
+
The runner labels this stack:
|
| 244 |
+
|
| 245 |
+
- `rgb_triplicate_zero_depth`
|
| 246 |
+
|
| 247 |
+
This is a real limitation and it should not be hidden.
|
| 248 |
+
|
| 249 |
+
It happened because the bridge proxy runner used a compatibility shim to satisfy the shared multi-camera tensor interface without plumbing real bridge-scene multiview depth through the stack.
|
| 250 |
+
|
| 251 |
+
Consequences:
|
| 252 |
+
|
| 253 |
+
- bag and cloth are not modality-matched to the PickClutter runs
|
| 254 |
+
- PickClutter used real `rgbd_3cam`
|
| 255 |
+
- bag and cloth used weaker perception input
|
| 256 |
+
|
| 257 |
+
### Bag and cloth also used a different control wrapper
|
| 258 |
+
|
| 259 |
+
PickClutter:
|
| 260 |
+
|
| 261 |
+
- observation stack: `rgbd_3cam`
|
| 262 |
+
- action space: `bimanual_delta_pose`
|
| 263 |
+
|
| 264 |
+
Bag and cloth:
|
| 265 |
+
|
| 266 |
+
- observation stack: `rgb_triplicate_zero_depth`
|
| 267 |
+
- action space: `widowx_delta_pose`
|
| 268 |
+
|
| 269 |
+
So the cross-track story is architecture-consistent but not fully input/control-identical.
|
| 270 |
+
|
| 271 |
+
### `smoke_v4_evalprobe_fromv3` is not a clean retrain result
|
| 272 |
+
|
| 273 |
+
This run:
|
| 274 |
+
|
| 275 |
+
- `reports/maniskill_pickclutter_smoke_v4_evalprobe_fromv3/`
|
| 276 |
+
|
| 277 |
+
used corrected planner logic on top of `smoke_v3` weights. It is useful evidence that the active adapter can matter, but it is not a clean end-to-end retrain.
|
| 278 |
+
|
| 279 |
+
## What Was Actually Learned
|
| 280 |
+
|
| 281 |
+
The current repo supports the following claims:
|
| 282 |
+
|
| 283 |
+
- the structured adapter remains viable: it still produces a measurable gain on at least one public proxy track
|
| 284 |
+
- the active branch can clearly matter on a real public dense-occlusion benchmark proxy
|
| 285 |
+
- `adapter_noop` remains a useful fairness control
|
| 286 |
+
- bag-like retrieval still shows modest positive evidence
|
| 287 |
+
- cloth-like retrieval is currently the weak link
|
| 288 |
+
|
| 289 |
+
It does not support the following stronger claims yet:
|
| 290 |
+
|
| 291 |
+
- broad superiority on realistic manipulation benchmarks
|
| 292 |
+
- stable multi-seed wins across all three target-like public proxy tracks
|
| 293 |
+
- a clean modality-matched comparison across occlusion, bag, and cloth
|
| 294 |
+
|
| 295 |
+
## Environment And Setup
|
| 296 |
+
|
| 297 |
+
Two environment stories exist in this repo.
|
| 298 |
+
|
| 299 |
+
### Prior `VLAarchtests3` / RLBench stack
|
| 300 |
+
|
| 301 |
+
Preserved under:
|
| 302 |
+
|
| 303 |
+
- `setup/ENVIRONMENT.md`
|
| 304 |
+
- `setup/env_vars.sh`
|
| 305 |
+
- `setup/rlbench_pip_freeze.txt`
|
| 306 |
+
|
| 307 |
+
This is the older RLBench / AnyBimanual oriented environment.
|
| 308 |
+
|
| 309 |
+
### Current public benchmark stack
|
| 310 |
+
|
| 311 |
+
Preserved under:
|
| 312 |
+
|
| 313 |
+
- `setup/public_benchmark/ENVIRONMENT.md`
|
| 314 |
+
- `setup/public_benchmark/env_vars.sh`
|
| 315 |
+
- `setup/public_benchmark/python_version.txt`
|
| 316 |
+
- `setup/public_benchmark/uname.txt`
|
| 317 |
+
- `setup/public_benchmark/nvidia_smi.txt`
|
| 318 |
+
- `setup/public_benchmark/gpu_short.txt`
|
| 319 |
+
- `setup/public_benchmark/pip_freeze_python311.txt`
|
| 320 |
+
- `setup/public_benchmark/rlbench_env_pip_freeze.txt`
|
| 321 |
+
- `setup/public_benchmark/hf_env.txt`
|
| 322 |
+
|
| 323 |
+
The public benchmark runs in this session were assembled on:
|
| 324 |
+
|
| 325 |
+
- GPU: `NVIDIA L40S`
|
| 326 |
+
- VRAM: `46068 MiB`
|
| 327 |
+
- driver: `580.126.09`
|
| 328 |
+
- Python: `3.11.10`
|
| 329 |
+
- kernel: `Linux 6.8.0-88-generic`
|
| 330 |
+
|
| 331 |
+
## Recommended Starting Points
|
| 332 |
+
|
| 333 |
+
If you want the strongest current public benchmark evidence, start here:
|
| 334 |
+
|
| 335 |
+
- `docs/maniskill_pickclutter_correction_log_2026-04-01.md`
|
| 336 |
+
- `reports/maniskill_pickclutter_smoke_v5_eval_tuned_softerpref/public_benchmark_package_summary.json`
|
| 337 |
+
|
| 338 |
+
If you want the bag/cloth public bridge follow-up, start here:
|
| 339 |
+
|
| 340 |
+
- `docs/public_bridge_smoke_run_log_2026-04-01.md`
|
| 341 |
+
- `reports/maniskill_bag_bridge_eval_less_bonus_2seed_manual_summary.json`
|
| 342 |
+
- `reports/maniskill_cloth_bridge_val_sweep_seed23/summary.json`
|
| 343 |
+
|
| 344 |
+
If you want the repo lineage context, start here:
|
| 345 |
+
|
| 346 |
+
- `history/VLAarchtests_previous_README.md`
|
| 347 |
+
- `history/VLAarchtests2_previous_README.md`
|
| 348 |
+
- `history/VLAarchtests3_previous_README.md`
|
| 349 |
+
|
| 350 |
+
## Bottom Line
|
| 351 |
+
|
| 352 |
+
This repo is the complete organization package for the current workspace state.
|
| 353 |
+
|
| 354 |
+
It includes:
|
| 355 |
+
|
| 356 |
+
- the `VLAarchtests3` export base
|
| 357 |
+
- the full current machine `reports/`, `outputs/`, and `data/` trees
|
| 358 |
+
- the public benchmark code, datasets, checkpoints, and results
|
| 359 |
+
- the environment files needed to stand up the same stack on similar hardware
|
| 360 |
+
|
| 361 |
+
Use it as the archival handoff state for continuing the elastic-occlusion adapter work.
|
| 362 |
+
|
| 363 |
+
Do not cite it as if all three target-like public proxy tracks are already cleanly solved. The occlusion track is the strongest current evidence; bag is modest; cloth remains weak; and the bridge-task perception stack still needs a proper real-depth rewrite.
|
code/VLAarchtests2_code/VLAarchtests/.pytest_cache/.gitignore
ADDED
|
@@ -0,0 +1,2 @@
|
|
|
|
|
|
|
|
|
|
| 1 |
+
# Created by pytest automatically.
|
| 2 |
+
*
|
code/VLAarchtests2_code/VLAarchtests/.pytest_cache/CACHEDIR.TAG
ADDED
|
@@ -0,0 +1,4 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
Signature: 8a477f597d28d172789f06886806bc55
|
| 2 |
+
# This file is a cache directory tag created by pytest.
|
| 3 |
+
# For information about cache directory tags, see:
|
| 4 |
+
# https://bford.info/cachedir/spec.html
|
code/VLAarchtests2_code/VLAarchtests/.pytest_cache/README.md
ADDED
|
@@ -0,0 +1,8 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
# pytest cache directory #
|
| 2 |
+
|
| 3 |
+
This directory contains data from pytest's cache plugin,
|
| 4 |
+
which provides the `--lf` and `--ff` options, as well as the `cache` fixture.
|
| 5 |
+
|
| 6 |
+
**Do not** commit this to version control.
|
| 7 |
+
|
| 8 |
+
See [the docs](https://docs.pytest.org/en/stable/how-to/cache.html) for more information.
|
code/VLAarchtests2_code/VLAarchtests/.pytest_cache/v/cache/lastfailed
ADDED
|
@@ -0,0 +1 @@
|
|
|
|
|
|
|
| 1 |
+
{}
|
code/VLAarchtests2_code/VLAarchtests/.pytest_cache/v/cache/nodeids
ADDED
|
@@ -0,0 +1,11 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
[
|
| 2 |
+
"tests/test_eval_toggle_paths_work.py::test_eval_toggle_paths_work",
|
| 3 |
+
"tests/test_general_eval_protocol_is_identical.py::test_general_eval_protocol_is_identical_across_modes",
|
| 4 |
+
"tests/test_public_benchmark_package_summary.py::test_public_benchmark_package_detects_training_mismatch",
|
| 5 |
+
"tests/test_public_benchmark_package_summary.py::test_public_benchmark_package_summary_passes_with_clear_gain",
|
| 6 |
+
"tests/test_public_benchmark_package_tracks.py::test_public_anchor_protocol_identity_is_mode_invariant",
|
| 7 |
+
"tests/test_public_benchmark_package_tracks.py::test_public_benchmark_package_contains_expected_tracks",
|
| 8 |
+
"tests/test_public_benchmark_package_tracks.py::test_public_target_protocol_identity_is_mode_invariant",
|
| 9 |
+
"tests/test_public_benchmark_package_tracks.py::test_public_track_roles_are_partitioned",
|
| 10 |
+
"tests/test_public_benchmark_package_tracks.py::test_training_fairness_signature_matches_for_trunk_and_adapter"
|
| 11 |
+
]
|
code/VLAarchtests2_code/VLAarchtests/artifacts/generated_configs/public_benchmark_package_v1.json
ADDED
|
@@ -0,0 +1,80 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
{
|
| 2 |
+
"anchor_eval_modes": [
|
| 3 |
+
"trunk_only",
|
| 4 |
+
"adapter_noop",
|
| 5 |
+
"adapter_active"
|
| 6 |
+
],
|
| 7 |
+
"anchor_track_ids": [
|
| 8 |
+
"anchor_track"
|
| 9 |
+
],
|
| 10 |
+
"defaults": {
|
| 11 |
+
"anchor_episodes": 25,
|
| 12 |
+
"resolution": 256,
|
| 13 |
+
"target_test_episodes": 100,
|
| 14 |
+
"target_train_demos": 64,
|
| 15 |
+
"target_val_demos": 16
|
| 16 |
+
},
|
| 17 |
+
"package_name": "public_reveal_retrieve_package_v1",
|
| 18 |
+
"target_eval_modes": [
|
| 19 |
+
"trunk_only_ft",
|
| 20 |
+
"adapter_noop",
|
| 21 |
+
"adapter_active_ft"
|
| 22 |
+
],
|
| 23 |
+
"target_track_ids": [
|
| 24 |
+
"bag_track",
|
| 25 |
+
"occlusion_track",
|
| 26 |
+
"cloth_track"
|
| 27 |
+
],
|
| 28 |
+
"thresholds": {
|
| 29 |
+
"anchor_tolerance": 0.02,
|
| 30 |
+
"sign_of_life_intervention_rate": 0.15,
|
| 31 |
+
"sign_of_life_non_base_selection_rate": 0.15,
|
| 32 |
+
"sign_of_life_success_gain": 0.05
|
| 33 |
+
},
|
| 34 |
+
"tracks": [
|
| 35 |
+
{
|
| 36 |
+
"benchmark_task": "unpacking_childs_bag-0",
|
| 37 |
+
"notes": "Closest public bag retrieval task. Treat as the benchmark-standard bag opening / retrieval slice.",
|
| 38 |
+
"public_source": "https://behavior.stanford.edu/knowledgebase/tasks/",
|
| 39 |
+
"role": "target",
|
| 40 |
+
"success_metric": "success_rate",
|
| 41 |
+
"suite": "behavior1k",
|
| 42 |
+
"target_behavior": "retrieve target objects from an opened compliant bag or backpack",
|
| 43 |
+
"task_family": "bag_retrieval",
|
| 44 |
+
"track_id": "bag_track"
|
| 45 |
+
},
|
| 46 |
+
{
|
| 47 |
+
"benchmark_task": "PickClutterYCB-v1",
|
| 48 |
+
"notes": "Closest maintained public occluded retrieval task. Treat as the canopy / dense occlusion proxy.",
|
| 49 |
+
"public_source": "https://maniskill.readthedocs.io/en/latest/tasks/table_top_gripper/index.html",
|
| 50 |
+
"role": "target",
|
| 51 |
+
"success_metric": "success_rate",
|
| 52 |
+
"suite": "maniskill3",
|
| 53 |
+
"target_behavior": "retrieve a target object from dense occluding clutter",
|
| 54 |
+
"task_family": "dense_occluded_retrieval",
|
| 55 |
+
"track_id": "occlusion_track"
|
| 56 |
+
},
|
| 57 |
+
{
|
| 58 |
+
"benchmark_task": "grasp_protocol_stacked_garment",
|
| 59 |
+
"notes": "Use the GarmentLab grasp protocol in stacked/clutter layouts as the closest public cloth retrieval benchmark slice.",
|
| 60 |
+
"public_source": "https://garmentlab.readthedocs.io/en/latest/tutorial/realworldbenchmark/index.html",
|
| 61 |
+
"role": "target",
|
| 62 |
+
"success_metric": "success_rate",
|
| 63 |
+
"suite": "garmentlab",
|
| 64 |
+
"target_behavior": "retrieve a hidden or partially covered object from stacked or cluttered garments",
|
| 65 |
+
"task_family": "cloth_retrieval",
|
| 66 |
+
"track_id": "cloth_track"
|
| 67 |
+
},
|
| 68 |
+
{
|
| 69 |
+
"benchmark_task": "dual_push_buttons",
|
| 70 |
+
"notes": "Trusted public anchor on this setup. Keep as a no-regression track only.",
|
| 71 |
+
"public_source": "https://arxiv.org/abs/2412.06779",
|
| 72 |
+
"role": "anchor",
|
| 73 |
+
"success_metric": "success_rate",
|
| 74 |
+
"suite": "anybimanual",
|
| 75 |
+
"target_behavior": "generic bimanual control regression anchor",
|
| 76 |
+
"task_family": "generic_anchor",
|
| 77 |
+
"track_id": "anchor_track"
|
| 78 |
+
}
|
| 79 |
+
]
|
| 80 |
+
}
|
code/VLAarchtests2_code/VLAarchtests/code/reveal_vla_bimanual/sim_reveal/__pycache__/__init__.cpython-310.pyc
ADDED
|
Binary file (615 Bytes). View file
|
|
|
code/VLAarchtests2_code/VLAarchtests/code/reveal_vla_bimanual/sim_reveal/__pycache__/__init__.cpython-311.pyc
ADDED
|
Binary file (726 Bytes). View file
|
|
|
code/VLAarchtests2_code/VLAarchtests/code/reveal_vla_bimanual/sim_reveal/__pycache__/base.cpython-310.pyc
ADDED
|
Binary file (1.41 kB). View file
|
|
|
code/VLAarchtests2_code/VLAarchtests/code/reveal_vla_bimanual/sim_reveal/__pycache__/procedural_envs.cpython-310.pyc
ADDED
|
Binary file (42.5 kB). View file
|
|
|
code/VLAarchtests2_code/VLAarchtests/code/reveal_vla_bimanual/sim_reveal/__pycache__/proxy_specs.cpython-310.pyc
ADDED
|
Binary file (4.28 kB). View file
|
|
|
docs/maniskill_pickclutter_correction_log_2026-04-01.md
ADDED
|
@@ -0,0 +1,187 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
# ManiSkill PickClutter Correction Log (2026-04-01)
|
| 2 |
+
|
| 3 |
+
## Scope
|
| 4 |
+
|
| 5 |
+
Public benchmark:
|
| 6 |
+
|
| 7 |
+
- ManiSkill 3 `PickClutterYCB-v1`
|
| 8 |
+
|
| 9 |
+
Frozen public split reused across all runs:
|
| 10 |
+
|
| 11 |
+
- train demos: `32` episodes
|
| 12 |
+
- val demos: `8` episodes
|
| 13 |
+
- eval episodes: `50`
|
| 14 |
+
- seed: `17`
|
| 15 |
+
- data bundle: `/workspace/workspace/data/maniskill_pickclutter/smoke_v3`
|
| 16 |
+
|
| 17 |
+
Fair comparison modes:
|
| 18 |
+
|
| 19 |
+
- `trunk_only_ft`
|
| 20 |
+
- `adapter_noop`
|
| 21 |
+
- `adapter_active_ft`
|
| 22 |
+
|
| 23 |
+
## Code Changes
|
| 24 |
+
|
| 25 |
+
Runner changes:
|
| 26 |
+
|
| 27 |
+
- enabled candidate rollout supervision from real ManiSkill states
|
| 28 |
+
- enabled adapter transition-model training/eval
|
| 29 |
+
- unfroze `adapter.transition_model`
|
| 30 |
+
- set non-zero transition loss weight
|
| 31 |
+
- added ManiSkill smoke planner overrides for the occlusion proxy:
|
| 32 |
+
- `adapter_confidence_threshold=0.50`
|
| 33 |
+
- `retrieve_access_threshold=0.08`
|
| 34 |
+
- `retrieve_persistence_threshold=0.12`
|
| 35 |
+
- `retrieve_support_threshold=0.08`
|
| 36 |
+
- `retrieve_reocclusion_threshold=0.92`
|
| 37 |
+
|
| 38 |
+
Planner correction:
|
| 39 |
+
|
| 40 |
+
- changed adapter stage rules from hard vetoes to soft penalties in
|
| 41 |
+
`/workspace/workspace/VLAarchtests3_export/code/VLAarchtests2_code/VLAarchtests/code/reveal_vla_bimanual/models/planner.py`
|
| 42 |
+
|
| 43 |
+
## Runs
|
| 44 |
+
|
| 45 |
+
### 1. `smoke_v3` corrected-train baseline
|
| 46 |
+
|
| 47 |
+
Artifacts:
|
| 48 |
+
|
| 49 |
+
- summary: `/workspace/workspace/reports/maniskill_pickclutter_smoke_v3/public_benchmark_package_summary.json`
|
| 50 |
+
|
| 51 |
+
Result:
|
| 52 |
+
|
| 53 |
+
- `trunk_only_ft=0.06`
|
| 54 |
+
- `adapter_noop=0.06`
|
| 55 |
+
- `adapter_active_ft=0.06`
|
| 56 |
+
- `intervention_rate=0.0`
|
| 57 |
+
- `non_base_selection_rate=0.0`
|
| 58 |
+
|
| 59 |
+
Interpretation:
|
| 60 |
+
|
| 61 |
+
- rollout supervision and transition-model training alone were not enough
|
| 62 |
+
- the adapter remained inert
|
| 63 |
+
|
| 64 |
+
### 2. `smoke_v4_evalprobe_fromv3` corrected-planner eval on `smoke_v3` weights
|
| 65 |
+
|
| 66 |
+
Artifacts:
|
| 67 |
+
|
| 68 |
+
- summary: `/workspace/workspace/reports/maniskill_pickclutter_smoke_v4_evalprobe_fromv3/public_benchmark_package_summary.json`
|
| 69 |
+
|
| 70 |
+
Result:
|
| 71 |
+
|
| 72 |
+
- `trunk_only_ft=0.06`
|
| 73 |
+
- `adapter_noop=0.06`
|
| 74 |
+
- `adapter_active_ft=0.62`
|
| 75 |
+
- `delta_active_vs_trunk=+0.56`
|
| 76 |
+
- `95% CI=[+0.40, +0.70]`
|
| 77 |
+
- `intervention_rate=1.0`
|
| 78 |
+
- `non_base_selection_rate=1.0`
|
| 79 |
+
|
| 80 |
+
Interpretation:
|
| 81 |
+
|
| 82 |
+
- this is the first real adapter-specific sign of life on the public benchmark
|
| 83 |
+
- the corrected planner logic is doing the work
|
| 84 |
+
- the improvement is not coming from the shared trunk, because `adapter_noop` stayed at `0.06`
|
| 85 |
+
|
| 86 |
+
### 3. `smoke_v4` clean retrain with corrected planner active during train and eval
|
| 87 |
+
|
| 88 |
+
Artifacts:
|
| 89 |
+
|
| 90 |
+
- summary: `/workspace/workspace/reports/maniskill_pickclutter_smoke_v4/public_benchmark_package_summary.json`
|
| 91 |
+
|
| 92 |
+
Result:
|
| 93 |
+
|
| 94 |
+
- `trunk_only_ft=0.48`
|
| 95 |
+
- `adapter_noop=0.04`
|
| 96 |
+
- `adapter_active_ft=0.04`
|
| 97 |
+
- `intervention_rate=1.0`
|
| 98 |
+
- `non_base_selection_rate=1.0`
|
| 99 |
+
- `delta_active_vs_trunk=-0.44`
|
| 100 |
+
|
| 101 |
+
Interpretation:
|
| 102 |
+
|
| 103 |
+
- the clean retrain under corrected planner logic is unstable / regressive
|
| 104 |
+
- the adapter-trained checkpoint collapsed even though active mode intervened
|
| 105 |
+
- current evidence supports the corrected planner as a real eval-time model fix, but not yet as a stable retrain recipe
|
| 106 |
+
|
| 107 |
+
### 4. `smoke_v5` fair retrain with trunk-action supervision preserved inside adapter training
|
| 108 |
+
|
| 109 |
+
Artifacts:
|
| 110 |
+
|
| 111 |
+
- summary: `/workspace/workspace/reports/maniskill_pickclutter_smoke_v5/public_benchmark_package_summary.json`
|
| 112 |
+
|
| 113 |
+
Result:
|
| 114 |
+
|
| 115 |
+
- `trunk_only_ft=0.04`
|
| 116 |
+
- `adapter_noop=0.04`
|
| 117 |
+
- `adapter_active_ft=0.04`
|
| 118 |
+
- `intervention_rate=1.0`
|
| 119 |
+
- `non_base_selection_rate=1.0`
|
| 120 |
+
- `delta_active_vs_trunk=0.00`
|
| 121 |
+
|
| 122 |
+
Interpretation:
|
| 123 |
+
|
| 124 |
+
- this fixed the fairness problem from `smoke_v4`: the trunk inside the adapter-trained checkpoint no longer diverges from the trunk-only baseline, as shown by `adapter_noop` matching `trunk_only_ft` (both `0.04`, versus `0.04` against `0.48` in `smoke_v4`)
|
| 125 |
+
- but the active branch still failed because the planner collapsed to `maintain_gap` on every decision
|
| 126 |
+
|
| 127 |
+
### 5. `smoke_v5_val_sweep` and held-out `smoke_v5_eval_tuned_softerpref`
|
| 128 |
+
|
| 129 |
+
Artifacts:
|
| 130 |
+
|
| 131 |
+
- val sweep: `/workspace/workspace/reports/maniskill_pickclutter_smoke_v5_val_sweep/summary.json`
|
| 132 |
+
- held-out summary: `/workspace/workspace/reports/maniskill_pickclutter_smoke_v5_eval_tuned_softerpref/public_benchmark_package_summary.json`
|
| 133 |
+
|
| 134 |
+
Val-selected planner override:
|
| 135 |
+
|
| 136 |
+
- `mode_preference_bonus=0.75`
|
| 137 |
+
- `premature_retrieve_penalty=0.5`
|
| 138 |
+
- `premature_insert_penalty=0.25`
|
| 139 |
+
- `premature_maintain_penalty=1.0`
|
| 140 |
+
- `occlusion_maintain_gap_min_access=0.30`
|
| 141 |
+
- `occlusion_maintain_gap_min_visibility=0.20`
|
| 142 |
+
- `retrieve_stage_access_threshold=0.18`
|
| 143 |
+
- `retrieve_stage_reveal_threshold=0.18`
|
| 144 |
+
- `retrieve_stage_support_threshold=0.18`
|
| 145 |
+
|
| 146 |
+
Validation result:
|
| 147 |
+
|
| 148 |
+
- `baseline_corrected=0.00`
|
| 149 |
+
- `soft_pref=0.00`
|
| 150 |
+
- `softer_pref=0.625`
|
| 151 |
+
- `retrieve_open=0.625`
|
| 152 |
+
|
| 153 |
+
Held-out result:
|
| 154 |
+
|
| 155 |
+
- `trunk_only_ft=0.04`
|
| 156 |
+
- `adapter_noop=0.04`
|
| 157 |
+
- `adapter_active_ft=0.62`
|
| 158 |
+
- `delta_active_vs_trunk=+0.58`
|
| 159 |
+
- `95% CI=[+0.44, +0.72]`
|
| 160 |
+
- `intervention_rate=1.0`
|
| 161 |
+
- `non_base_selection_rate=1.0`
|
| 162 |
+
- `steps_to_retrieve=1.0`
|
| 163 |
+
- `signs_of_life=true`
|
| 164 |
+
|
| 165 |
+
Interpretation:
|
| 166 |
+
|
| 167 |
+
- this is a fair held-out public-benchmark win on the dense-occlusion proxy
|
| 168 |
+
- the gain is adapter-specific because `adapter_noop` stayed flat with the trunk baseline
|
| 169 |
+
- the fixed checkpoint from `smoke_v5` was viable; the missing piece was planner-stage calibration on the frozen validation split
|
| 170 |
+
|
| 171 |
+
## Current Best Public-Benchmark Evidence
|
| 172 |
+
|
| 173 |
+
Best adapter-specific evidence currently available:
|
| 174 |
+
|
| 175 |
+
- `/workspace/workspace/reports/maniskill_pickclutter_smoke_v5_eval_tuned_softerpref/public_benchmark_package_summary.json`
|
| 176 |
+
|
| 177 |
+
Why this is the strongest result:
|
| 178 |
+
|
| 179 |
+
- same frozen public train/val/eval split
|
| 180 |
+
- same trained trunk baseline and adapter checkpoint
|
| 181 |
+
- planner override selected on the frozen validation split before the held-out eval run
|
| 182 |
+
- `adapter_noop` isolates the shared-trunk effect and stays flat
|
| 183 |
+
- only `adapter_active_ft` improves, so the gain is caused by live adapter intervention
|
| 184 |
+
|
| 185 |
+
## Open Problem
|
| 186 |
+
|
| 187 |
+
The dense-occlusion proxy now has a fair held-out win, but bag-style and cloth-style public proxy tracks are still missing. The next work item is to bring up the next public proxy benchmark instead of re-running more occlusion-only sweeps.
|
docs/minimum_sign_of_life_maniskill_pickclutter_run_2026-04-01.md
ADDED
|
@@ -0,0 +1,134 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
# Minimum Sign-of-Life Runbook: ManiSkill PickClutterYCB-v1
|
| 2 |
+
|
| 3 |
+
Date: 2026-04-01
|
| 4 |
+
|
| 5 |
+
## Goal
|
| 6 |
+
|
| 7 |
+
Run one real public-benchmark smoke on ManiSkill `PickClutterYCB-v1` that fairly compares:
|
| 8 |
+
|
| 9 |
+
- `trunk_only_ft`
|
| 10 |
+
- `adapter_noop`
|
| 11 |
+
- `adapter_active_ft`
|
| 12 |
+
|
| 13 |
+
The target claim for this run is narrow:
|
| 14 |
+
|
| 15 |
+
- on dense occluded retrieval, the adapter should visibly intervene and beat the trunk-only control trained on the same data;
|
| 16 |
+
- this is a minimum-sign-of-life run, not the full 3-track package.
|
| 17 |
+
|
| 18 |
+
## Correction After First Failed Smoke
|
| 19 |
+
|
| 20 |
+
The first smoke run confirmed that the real ManiSkill benchmark path worked, but the adapter stayed inert because the smoke dataset only supervised proposal ranking. The corrected run keeps the same benchmark and fairness contract and restarts both trained variants from the same init on the same frozen split, but adds benchmark-derived current-state supervision for the adapter:
|
| 21 |
+
|
| 22 |
+
- `support_mode`
|
| 23 |
+
- `corridor_feasible`
|
| 24 |
+
- `persistence_horizon`
|
| 25 |
+
- `disturbance_cost`
|
| 26 |
+
- selected task metrics that feed the adapter gate and mode bias
|
| 27 |
+
- `state_confidence_target`
|
| 28 |
+
|
| 29 |
+
This corrected artifact set is versioned as `smoke_v2`.
|
| 30 |
+
|
| 31 |
+
## Fixed Protocol
|
| 32 |
+
|
| 33 |
+
### Benchmark
|
| 34 |
+
|
| 35 |
+
- Public benchmark: ManiSkill `PickClutterYCB-v1`
|
| 36 |
+
- Track id: `occlusion_track`
|
| 37 |
+
- Task family label inside the adapter stack: `foliage`
|
| 38 |
+
- Resolution: `224`
|
| 39 |
+
- One seed for training: `17`
|
| 40 |
+
|
| 41 |
+
### Data
|
| 42 |
+
|
| 43 |
+
- One benchmark-native scripted macro teacher collects the dataset once.
|
| 44 |
+
- The teacher also writes per-step scene-state labels from the same public benchmark state and candidate sweep.
|
| 45 |
+
- Train demos: `32`
|
| 46 |
+
- Val demos: `8`
|
| 47 |
+
- Held-out eval episodes: `50`
|
| 48 |
+
- The exact train, val, and eval episode ids/seeds are frozen once generated and written to disk.
|
| 49 |
+
|
| 50 |
+
### Fairness Constraints
|
| 51 |
+
|
| 52 |
+
- Both trained conditions start from the same initialization checkpoint.
|
| 53 |
+
- Both use the same train/val split.
|
| 54 |
+
- Both use the same held-out eval episodes.
|
| 55 |
+
- Both use the same optimizer, batch size, LR, epoch budget, and random seed.
|
| 56 |
+
- Both fine-tune the same trunk submodules:
|
| 57 |
+
- fusion
|
| 58 |
+
- memory
|
| 59 |
+
- decoder
|
| 60 |
+
- The backbone stays frozen for both conditions.
|
| 61 |
+
- The only architectural difference is the presence of the structured adapter.
|
| 62 |
+
- `candidate0` remains the raw trunk action.
|
| 63 |
+
- `adapter_noop` is eval-only and is produced from the `adapter_active_ft` checkpoint.
|
| 64 |
+
|
| 65 |
+
### Initialization
|
| 66 |
+
|
| 67 |
+
- Shared init checkpoint:
|
| 68 |
+
- `/workspace/workspace/VLAarchtests2/VLAarchtests/artifacts/outputs/r3d_handoff_phase/proxy_interaction_r3d_stage3_clip_rgbd_handoff_compact_phase_seed17/checkpoint_best.pt`
|
| 69 |
+
- Load with shape filtering / `init_strict: false`.
|
| 70 |
+
|
| 71 |
+
### Training Conditions
|
| 72 |
+
|
| 73 |
+
#### `trunk_only_ft`
|
| 74 |
+
|
| 75 |
+
- Policy type: `foundation_trunk`
|
| 76 |
+
- Trainable prefixes:
|
| 77 |
+
- `fusion`
|
| 78 |
+
- `memory`
|
| 79 |
+
- `decoder`
|
| 80 |
+
|
| 81 |
+
#### `adapter_active_ft`
|
| 82 |
+
|
| 83 |
+
- Policy type: `adapter_wrapped`
|
| 84 |
+
- Trainable prefixes:
|
| 85 |
+
- `trunk.fusion`
|
| 86 |
+
- `trunk.memory`
|
| 87 |
+
- `trunk.decoder`
|
| 88 |
+
- `adapter.state_head`
|
| 89 |
+
- `adapter.proposal_prior`
|
| 90 |
+
- `adapter.planner`
|
| 91 |
+
- Transition model: off for the smoke run
|
| 92 |
+
|
| 93 |
+
### Evaluation Conditions
|
| 94 |
+
|
| 95 |
+
- `trunk_only_ft`: trained trunk checkpoint
|
| 96 |
+
- `adapter_noop`: adapter checkpoint in no-op mode
|
| 97 |
+
- `adapter_active_ft`: adapter checkpoint in active mode
|
| 98 |
+
|
| 99 |
+
### Success Criteria
|
| 100 |
+
|
| 101 |
+
- Adapter success rate exceeds trunk-only success rate by at least `5` absolute percentage points on the held-out `50` episodes.
|
| 102 |
+
- Adapter intervention rate is at least `15%`.
|
| 103 |
+
- Non-base selection rate is at least `15%`.
|
| 104 |
+
- Results are summarized through the public benchmark package reporter under the `occlusion_track`.
|
| 105 |
+
|
| 106 |
+
## Planned Artifacts
|
| 107 |
+
|
| 108 |
+
### Data
|
| 109 |
+
|
| 110 |
+
- `/workspace/workspace/data/maniskill_pickclutter/smoke_v2/train.pt`
|
| 111 |
+
- `/workspace/workspace/data/maniskill_pickclutter/smoke_v2/val.pt`
|
| 112 |
+
- `/workspace/workspace/data/maniskill_pickclutter/smoke_v2/episode_splits.json`
|
| 113 |
+
|
| 114 |
+
### Train Outputs
|
| 115 |
+
|
| 116 |
+
- `/workspace/workspace/outputs/maniskill_pickclutter_smoke_v2/trunk_only_ft_seed17/`
|
| 117 |
+
- `/workspace/workspace/outputs/maniskill_pickclutter_smoke_v2/adapter_active_ft_seed17/`
|
| 118 |
+
|
| 119 |
+
### Eval Outputs
|
| 120 |
+
|
| 121 |
+
- `/workspace/workspace/reports/maniskill_pickclutter_smoke_v2/trunk_only_ft_seed17.json`
|
| 122 |
+
- `/workspace/workspace/reports/maniskill_pickclutter_smoke_v2/adapter_noop_seed17.json`
|
| 123 |
+
- `/workspace/workspace/reports/maniskill_pickclutter_smoke_v2/adapter_active_ft_seed17.json`
|
| 124 |
+
|
| 125 |
+
### Package Summary
|
| 126 |
+
|
| 127 |
+
- `/workspace/workspace/reports/maniskill_pickclutter_smoke_v2/public_benchmark_package_summary.json`
|
| 128 |
+
- `/workspace/workspace/reports/maniskill_pickclutter_smoke_v2/public_benchmark_package_summary.md`
|
| 129 |
+
|
| 130 |
+
## Notes
|
| 131 |
+
|
| 132 |
+
- This run is intentionally limited to the fastest credible public target track.
|
| 133 |
+
- No custom benchmark or custom teleop suite is allowed for this smoke.
|
| 134 |
+
- If the ManiSkill runtime or macro controller requires repairs, the repairs must preserve the fairness constraints above.
|
docs/public_benchmark_progress_2026-04-01.md
ADDED
|
@@ -0,0 +1,91 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
## Public Benchmark Progress
|
| 2 |
+
|
| 3 |
+
Date: 2026-04-01 UTC
|
| 4 |
+
|
| 5 |
+
### Confirmed Real Public Benchmark Result
|
| 6 |
+
|
| 7 |
+
- Public occlusion proxy: `ManiSkill PickClutterYCB-v1`
|
| 8 |
+
- Strongest adapter-specific result so far:
|
| 9 |
+
- summary: `/workspace/workspace/reports/maniskill_pickclutter_smoke_v5_eval_tuned_softerpref/public_benchmark_package_summary.json`
|
| 10 |
+
- `trunk_only_ft = 0.04`
|
| 11 |
+
- `adapter_noop = 0.04`
|
| 12 |
+
- `adapter_active_ft = 0.62`
|
| 13 |
+
- `delta_active_vs_trunk = +0.58`
|
| 14 |
+
- `95% CI = [0.44, 0.72]`
|
| 15 |
+
- `intervention_rate = 1.0`
|
| 16 |
+
- `non_base_selection_rate = 1.0`
|
| 17 |
+
- Interpretation:
|
| 18 |
+
- this is real adapter-specific sign of life on a public occlusion benchmark
|
| 19 |
+
- the gain is not coming from a stronger shared trunk, because `adapter_noop` stays flat
|
| 20 |
+
|
| 21 |
+
### BEHAVIOR Bag Proxy Investigation
|
| 22 |
+
|
| 23 |
+
Target public task family:
|
| 24 |
+
- official BEHAVIOR grocery-store bag/container retrieval proxy
|
| 25 |
+
- primary candidate: `paying_for_purchases`
|
| 26 |
+
- stricter but currently unusable candidate: `buy_basic_garden_tools`
|
| 27 |
+
|
| 28 |
+
Environment used:
|
| 29 |
+
- BEHAVIOR assets: `/workspace/workspace/BEHAVIOR-1K`
|
| 30 |
+
- venv used for probes: `/workspace/envs/behavior`
|
| 31 |
+
|
| 32 |
+
Findings:
|
| 33 |
+
- `buy_basic_garden_tools` is blocked by official scene-task geometry:
|
| 34 |
+
- repeated failure on `ontop ['rake.n.03_1', 'grocery_shelf.n.01_1']`
|
| 35 |
+
- even with whitelist attempts, the sampler never found a valid shelf placement
|
| 36 |
+
- `paying_for_purchases` is much healthier:
|
| 37 |
+
- `grocery_store_convenience`, `grocery_store_cafe`, and `grocery_store_asian` all load
|
| 38 |
+
- object scope binds the real task objects:
|
| 39 |
+
- `shopping_basket.n.01_1`
|
| 40 |
+
- `money.n.01_1`
|
| 41 |
+
- `checkout.n.03_1`
|
| 42 |
+
- `floor.n.01_1`
|
| 43 |
+
- Root sampler bug:
|
| 44 |
+
- official online sampling fails on the floor / agent chain
|
| 45 |
+
- without patching, the blocking warning is:
|
| 46 |
+
- `Room type [grocery_store] ... floor.n.01_1: , checkout.n.03_1: grocery_store_0`
|
| 47 |
+
- after removing the agent-on-floor condition from the sampler pipeline, the next blocker is:
|
| 48 |
+
- `ontop ['shopping_basket.n.01_1', 'floor.n.01_1'] False`
|
| 49 |
+
- Critical state-probe result:
|
| 50 |
+
- even when object bindings exist, the sampled movable objects remain parked at their far-away import positions
|
| 51 |
+
- observed example on `grocery_store_asian`:
|
| 52 |
+
- basket position near `[120, 120, -80]`
|
| 53 |
+
- money position near `[115, 115, -85]`
|
| 54 |
+
- apple positions near `[110, 110, -90]` and `[105, 105, -95]`
|
| 55 |
+
- `money inside basket = False`
|
| 56 |
+
- `apple1 inside basket = False`
|
| 57 |
+
- `apple2 inside basket = False`
|
| 58 |
+
- Conclusion:
|
| 59 |
+
- as of 2026-04-01, the BEHAVIOR bag proxy is not yet a usable fair evaluation track in this workspace
|
| 60 |
+
- the public task objects bind, but the online sampler does not materialize a valid initial scene for training or evaluation
|
| 61 |
+
|
| 62 |
+
### Garment / Cloth Proxy Status
|
| 63 |
+
|
| 64 |
+
- GarmentLab repo cloned:
|
| 65 |
+
- `/workspace/workspace/GarmentLab`
|
| 66 |
+
- Immediate constraint:
|
| 67 |
+
- the repo expects Isaac Sim 4.0.0 plus external Google Drive assets
|
| 68 |
+
- Current status:
|
| 69 |
+
- code inspected only
|
| 70 |
+
- no runnable public cloth benchmark execution completed yet in this workspace
|
| 71 |
+
|
| 72 |
+
### Next Public Proxy Candidates
|
| 73 |
+
|
| 74 |
+
Given the BEHAVIOR blocker, the next-lightest public candidates already available locally are:
|
| 75 |
+
|
| 76 |
+
- `OpenCabinetDrawer-v1`
|
| 77 |
+
- public ManiSkill task
|
| 78 |
+
- good container reveal / access proxy
|
| 79 |
+
- `PutEggplantInBasketScene-v1`
|
| 80 |
+
- public ManiSkill bridge-dataset task
|
| 81 |
+
- public basket / container interaction proxy
|
| 82 |
+
- `PutSpoonOnTableClothInScene-v1`
|
| 83 |
+
- public ManiSkill bridge-dataset cloth interaction proxy
|
| 84 |
+
|
| 85 |
+
### Immediate Recommendation
|
| 86 |
+
|
| 87 |
+
- Keep the confirmed `PickClutterYCB-v1` result as the anchor public success case.
|
| 88 |
+
- Do not spend more time on BEHAVIOR online sampling until either:
|
| 89 |
+
- a cached valid scene instance is created, or
|
| 90 |
+
- the sampler is patched deeply enough to place container objects correctly instead of leaving them at far-away import positions.
|
| 91 |
+
- Pivot the next train/eval smoke to a lighter public ManiSkill proxy before returning to BEHAVIOR.
|
docs/public_bridge_smoke_run_log_2026-04-01.md
ADDED
|
@@ -0,0 +1,116 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
# Public Bridge Smoke Run Log
|
| 2 |
+
|
| 3 |
+
Date: 2026-04-01 UTC
|
| 4 |
+
|
| 5 |
+
## Completed public proxy evidence
|
| 6 |
+
|
| 7 |
+
- Occlusion proxy already completed earlier on `PickClutterYCB-v1`.
|
| 8 |
+
- Best current occlusion report:
|
| 9 |
+
- `/workspace/workspace/reports/maniskill_pickclutter_smoke_v5_eval_tuned_softerpref/public_benchmark_package_summary.json`
|
| 10 |
+
- `trunk_only_ft=0.04`
|
| 11 |
+
- `adapter_noop=0.04`
|
| 12 |
+
- `adapter_active_ft=0.62`
|
| 13 |
+
- `delta_active_vs_trunk=+0.58`
|
| 14 |
+
- `95% CI=[+0.44, +0.72]`
|
| 15 |
+
- `intervention_rate=1.0`
|
| 16 |
+
- `non_base_selection_rate=1.0`
|
| 17 |
+
|
| 18 |
+
- Bag proxy completed on the public ManiSkill bridge basket scene proxy.
|
| 19 |
+
- Bag report directory:
|
| 20 |
+
- `/workspace/workspace/reports/maniskill_bag_bridge_smoke_v1`
|
| 21 |
+
- Bag result summary:
|
| 22 |
+
- `trunk_only_ft=0.32`
|
| 23 |
+
- `adapter_noop=0.00`
|
| 24 |
+
- `adapter_active_ft=0.48`
|
| 25 |
+
- `delta_active_vs_trunk=+0.16`
|
| 26 |
+
- `delta_active_vs_trunk_ci95=[-0.04, 0.34]`
|
| 27 |
+
- `intervention_rate=1.0`
|
| 28 |
+
- `non_base_selection_rate=1.0`
|
| 29 |
+
- bag track `signs_of_life=true`
|
| 30 |
+
- package-level headline gate remains false at this single-seed smoke scale
|
| 31 |
+
|
| 32 |
+
## Cloth proxy definition
|
| 33 |
+
|
| 34 |
+
- Public scene proxy:
|
| 35 |
+
- `PutSpoonOnTableClothInScene-v1`
|
| 36 |
+
- Fixed hidden-state initialization:
|
| 37 |
+
- spoon pose `[-0.235, -0.094, 0.8748]`
|
| 38 |
+
- cloth pose `[-0.235, -0.075, 0.885]`
|
| 39 |
+
- Deterministic valid-seed filter:
|
| 40 |
+
- accept only seeds whose initialized hidden state is below the visibility gate and solvable by scripted reveal+retrieve
|
| 41 |
+
- Reveal macros corrected to push-style actions:
|
| 42 |
+
- `lift_edge` = front push in `+y`
|
| 43 |
+
- `separate_layer` = side push in `+x`
|
| 44 |
+
- Cloth success metric corrected:
|
| 45 |
+
- based on spoon displacement from its own hidden start plus visibility
|
| 46 |
+
- no longer credits success merely because the cloth flies away
|
| 47 |
+
|
| 48 |
+
## Important runner fixes already landed
|
| 49 |
+
|
| 50 |
+
- File:
|
| 51 |
+
- `/workspace/workspace/VLAarchtests3_export/code/VLAarchtests2_code/VLAarchtests/code/reveal_vla_bimanual/eval/run_maniskill_bridge_retrieval_smoke.py`
|
| 52 |
+
- Fixed:
|
| 53 |
+
- cloth hidden-state initialization
|
| 54 |
+
- cloth seed filtering and split reuse via `episode_splits.json`
|
| 55 |
+
- `post_bundle` missing in cloth collect success check
|
| 56 |
+
- bridge smoke loss weights aligned to current `LossWeights`
|
| 57 |
+
- adapter trainable parameter prefixes aligned to working pickclutter runner
|
| 58 |
+
- zero-depth layout changed to channel-first
|
| 59 |
+
- cached dataset normalizer added for old channel-last depth tensors
|
| 60 |
+
|
| 61 |
+
## Live status when this note was written
|
| 62 |
+
|
| 63 |
+
- Bag process is complete.
|
| 64 |
+
- Cloth process is still collecting the train split in the original long-running session.
|
| 65 |
+
- The long-running cloth process was started before the later loss-weight and depth-layout fixes, so it is expected to finish collection and then crash at training start.
|
| 66 |
+
- After it writes `train.pt` and `val.pt`, restart cloth with:
|
| 67 |
+
|
| 68 |
+
```bash
|
| 69 |
+
python /workspace/workspace/VLAarchtests3_export/code/VLAarchtests2_code/VLAarchtests/code/reveal_vla_bimanual/eval/run_maniskill_bridge_retrieval_smoke.py --task cloth --skip-collection
|
| 70 |
+
```
|
| 71 |
+
|
| 72 |
+
- If trunk checkpoint already exists by that point and only adapter needs rerun:
|
| 73 |
+
|
| 74 |
+
```bash
|
| 75 |
+
python /workspace/workspace/VLAarchtests3_export/code/VLAarchtests2_code/VLAarchtests/code/reveal_vla_bimanual/eval/run_maniskill_bridge_retrieval_smoke.py --task cloth --skip-collection --reuse-checkpoints
|
| 76 |
+
```
|
| 77 |
+
|
| 78 |
+
## Cloth restart correction
|
| 79 |
+
|
| 80 |
+
- The corrected cloth restart reached adapter training and failed in rollout supervision because the cached cloth public proxy authored `7` candidate targets while the decoder always allocates `8` proposal slots.
|
| 81 |
+
- Fix landed in:
|
| 82 |
+
- `/workspace/workspace/VLAarchtests3_export/code/VLAarchtests2_code/VLAarchtests/code/reveal_vla_bimanual/eval/run_maniskill_bridge_retrieval_smoke.py`
|
| 83 |
+
- Correction:
|
| 84 |
+
- cached bridge samples now normalize channel-last depth tensors as before
|
| 85 |
+
- cached candidate-aligned tensors now also pad from `7 -> 8` slots before loading
|
| 86 |
+
- padding cycles the non-base candidates first, which preserves the collected cloth episodes and avoids recollection
|
| 87 |
+
- Verified locally before restart:
|
| 88 |
+
- normalized cloth `candidate_action_chunks` is `(8, 8, 14)`
|
| 89 |
+
- normalized cloth `candidate_rollout_support_mode` is `(8, 5)`
|
| 90 |
+
- one real `adapter_active_ft` training step and one real validation loss pass both completed without the previous shape error
|
| 91 |
+
|
| 92 |
+
## Cloth result
|
| 93 |
+
|
| 94 |
+
- Report directory:
|
| 95 |
+
- `/workspace/workspace/reports/maniskill_cloth_bridge_smoke_v1`
|
| 96 |
+
- Final cloth smoke summary:
|
| 97 |
+
- `trunk_only_ft = 0.04`
|
| 98 |
+
- `adapter_noop = 0.04`
|
| 99 |
+
- `adapter_active_ft = 0.10`
|
| 100 |
+
- `delta_active_vs_trunk = +0.06`
|
| 101 |
+
- `delta_active_vs_trunk_ci95 = [-0.04, 0.16]`
|
| 102 |
+
- `intervention_rate = 0.3369`
|
| 103 |
+
- `non_base_selection_rate = 0.2674`
|
| 104 |
+
- Interpretation:
|
| 105 |
+
- cloth proxy is positive and adapter-specific in this single-seed smoke because `adapter_noop` stayed flat while `adapter_active_ft` improved
|
| 106 |
+
- effect size is modest and not yet statistically clean in this smoke protocol
|
| 107 |
+
|
| 108 |
+
## Combined three-track proxy suite
|
| 109 |
+
|
| 110 |
+
- Combined report:
|
| 111 |
+
- `/workspace/workspace/reports/public_proxy_suite_smoke_v1/combined_summary.json`
|
| 112 |
+
- `/workspace/workspace/reports/public_proxy_suite_smoke_v1/combined_summary.md`
|
| 113 |
+
- Current three-track smoke evidence:
|
| 114 |
+
- occlusion proxy positive and adapter-specific
|
| 115 |
+
- bag proxy positive and adapter-specific
|
| 116 |
+
- cloth proxy positive and adapter-specific
|
reports/anchor_dual_push_smoke/original_trunk/rollout_eval.partial.json
ADDED
|
@@ -0,0 +1,29 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
{
|
| 2 |
+
"checkpoint": "/workspace/workspace/VLAarchtests2/outputs/rlbench_dual_push/rlbench_dual_push_backbone_only_clip_chunk8_weighted_seed17/checkpoint_best.pt",
|
| 3 |
+
"plan_requested": false,
|
| 4 |
+
"plan_applied": false,
|
| 5 |
+
"planner_mode": "trainable",
|
| 6 |
+
"support_mode_conditioning": true,
|
| 7 |
+
"task_conditioning": true,
|
| 8 |
+
"geometry_enabled": true,
|
| 9 |
+
"world_model_mode": "checkpoint_default",
|
| 10 |
+
"episodes_per_task": 5,
|
| 11 |
+
"episode_length": 120,
|
| 12 |
+
"resolution": 256,
|
| 13 |
+
"reset_retries": 20,
|
| 14 |
+
"arm_mode": "planning",
|
| 15 |
+
"delta_scale": 1.0,
|
| 16 |
+
"cameras": [
|
| 17 |
+
"front",
|
| 18 |
+
"wrist_left",
|
| 19 |
+
"wrist_right"
|
| 20 |
+
],
|
| 21 |
+
"tasks": {
|
| 22 |
+
"bimanual_dual_push_buttons": {
|
| 23 |
+
"error": "The call failed on the V-REP side. Return value: -1",
|
| 24 |
+
"mean_success": 0.0,
|
| 25 |
+
"mean_return": 0.0
|
| 26 |
+
}
|
| 27 |
+
},
|
| 28 |
+
"mean_success": 0.0
|
| 29 |
+
}
|
reports/anybimanual_anchor_bridge_live/trunk_only_ep5/stderr.txt
ADDED
|
@@ -0,0 +1,20 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
/workspace/third_party/AnyBimanual/eval.py:183: UserWarning:
|
| 2 |
+
The version_base parameter is not specified.
|
| 3 |
+
Please specify a compatability version level, or None.
|
| 4 |
+
Will assume defaults for version 1.1
|
| 5 |
+
@hydra.main(config_name="eval", config_path="conf")
|
| 6 |
+
/workspace/envs/rlbench/lib/python3.10/site-packages/hydra/_internal/defaults_list.py:251: UserWarning: In 'eval': Defaults list is missing `_self_`. See https://hydra.cc/docs/1.2/upgrades/1.0_to_1.1/default_composition_order for more information
|
| 7 |
+
warnings.warn(msg, UserWarning)
|
| 8 |
+
/workspace/envs/rlbench/lib/python3.10/site-packages/hydra/core/default_element.py:124: UserWarning: In 'method/PERACT_BC': Usage of deprecated keyword in package header '# @package _group_'.
|
| 9 |
+
See https://hydra.cc/docs/1.2/upgrades/1.0_to_1.1/changes_to_package_header for more information
|
| 10 |
+
deprecation_warning(
|
| 11 |
+
/workspace/envs/rlbench/lib/python3.10/site-packages/hydra/_internal/hydra.py:119: UserWarning: Future Hydra versions will no longer change working directory at job runtime by default.
|
| 12 |
+
See https://hydra.cc/docs/1.2/upgrades/1.1_to_1.2/changes_to_job_working_dir/ for more information.
|
| 13 |
+
ret = run_job(
|
| 14 |
+
Error executing job with overrides: ['method=PERACT_BC', 'framework.logdir=/workspace/workspace/reports/anybimanual_anchor_bridge_live/trunk_only_ep5/anybimanual_logdir', 'framework.start_seed=0', 'framework.eval_type=60000', 'framework.eval_episodes=5', 'framework.eval_envs=1', 'framework.gpu=0', 'rlbench.task_name=perlf_release_dual_push_buttons_smoke5', 'rlbench.tasks=[dual_push_buttons]', 'rlbench.demo_path=/workspace/baselines/AnyBimanual_subset3_demo_root', 'rlbench.headless=True', 'rlbench.gripper_mode=BimanualDiscrete', 'rlbench.arm_action_mode=BimanualEndEffectorPoseViaPlanning', 'rlbench.action_mode=BimanualMoveArmThenGripper']
|
| 15 |
+
Traceback (most recent call last):
|
| 16 |
+
File "/workspace/third_party/AnyBimanual/eval.py", line 201, in main
|
| 17 |
+
raise Exception(f"Missing seed{start_seed}/config.yaml. Logdir is {logdir}")
|
| 18 |
+
Exception: Missing seed0/config.yaml. Logdir is /workspace/workspace/reports/anybimanual_anchor_bridge_live/trunk_only_ep5/anybimanual_logdir/perlf_release_dual_push_buttons_smoke5/PERACT_BC/seed0
|
| 19 |
+
|
| 20 |
+
Set the environment variable HYDRA_FULL_ERROR=1 for a complete stack trace.
|
reports/maniskill_bag_bridge_val_sweep_seed23/conservative/adapter_active_ft_seed23.json
ADDED
|
@@ -0,0 +1,131 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
{
|
| 2 |
+
"track_id": "bag_track",
|
| 3 |
+
"suite": "maniskill3",
|
| 4 |
+
"benchmark_task": "PutEggplantInBasketRetrievalProxy-v1",
|
| 5 |
+
"role": "target",
|
| 6 |
+
"adapter_mode": "adapter_active_ft",
|
| 7 |
+
"episodes": 8,
|
| 8 |
+
"successes": [
|
| 9 |
+
0,
|
| 10 |
+
0,
|
| 11 |
+
0,
|
| 12 |
+
1,
|
| 13 |
+
0,
|
| 14 |
+
0,
|
| 15 |
+
0,
|
| 16 |
+
0
|
| 17 |
+
],
|
| 18 |
+
"success_rate": 0.125,
|
| 19 |
+
"intervention_rate": 0.0,
|
| 20 |
+
"non_base_selection_rate": 0.0,
|
| 21 |
+
"steps_to_first_reveal_or_access": 1.0,
|
| 22 |
+
"steps_to_retrieve": 4.0,
|
| 23 |
+
"disturbance_proxy": 0.0,
|
| 24 |
+
"episode_records": [
|
| 25 |
+
{
|
| 26 |
+
"episode_seed": 171000,
|
| 27 |
+
"success": false,
|
| 28 |
+
"steps": 4,
|
| 29 |
+
"first_reveal_step": 1,
|
| 30 |
+
"first_retrieve_step": null,
|
| 31 |
+
"episode_disturbance": 0.0
|
| 32 |
+
},
|
| 33 |
+
{
|
| 34 |
+
"episode_seed": 171001,
|
| 35 |
+
"success": false,
|
| 36 |
+
"steps": 4,
|
| 37 |
+
"first_reveal_step": 1,
|
| 38 |
+
"first_retrieve_step": null,
|
| 39 |
+
"episode_disturbance": 0.0
|
| 40 |
+
},
|
| 41 |
+
{
|
| 42 |
+
"episode_seed": 171002,
|
| 43 |
+
"success": false,
|
| 44 |
+
"steps": 4,
|
| 45 |
+
"first_reveal_step": 1,
|
| 46 |
+
"first_retrieve_step": null,
|
| 47 |
+
"episode_disturbance": 0.0
|
| 48 |
+
},
|
| 49 |
+
{
|
| 50 |
+
"episode_seed": 171003,
|
| 51 |
+
"success": true,
|
| 52 |
+
"steps": 1,
|
| 53 |
+
"first_reveal_step": 1,
|
| 54 |
+
"first_retrieve_step": null,
|
| 55 |
+
"episode_disturbance": 0.0
|
| 56 |
+
},
|
| 57 |
+
{
|
| 58 |
+
"episode_seed": 171004,
|
| 59 |
+
"success": false,
|
| 60 |
+
"steps": 4,
|
| 61 |
+
"first_reveal_step": 1,
|
| 62 |
+
"first_retrieve_step": null,
|
| 63 |
+
"episode_disturbance": 0.0
|
| 64 |
+
},
|
| 65 |
+
{
|
| 66 |
+
"episode_seed": 171005,
|
| 67 |
+
"success": false,
|
| 68 |
+
"steps": 4,
|
| 69 |
+
"first_reveal_step": 1,
|
| 70 |
+
"first_retrieve_step": null,
|
| 71 |
+
"episode_disturbance": 0.0
|
| 72 |
+
},
|
| 73 |
+
{
|
| 74 |
+
"episode_seed": 171006,
|
| 75 |
+
"success": false,
|
| 76 |
+
"steps": 4,
|
| 77 |
+
"first_reveal_step": 1,
|
| 78 |
+
"first_retrieve_step": null,
|
| 79 |
+
"episode_disturbance": 0.0
|
| 80 |
+
},
|
| 81 |
+
{
|
| 82 |
+
"episode_seed": 171007,
|
| 83 |
+
"success": false,
|
| 84 |
+
"steps": 4,
|
| 85 |
+
"first_reveal_step": 1,
|
| 86 |
+
"first_retrieve_step": null,
|
| 87 |
+
"episode_disturbance": 0.0
|
| 88 |
+
}
|
| 89 |
+
],
|
| 90 |
+
"eval_protocol": {
|
| 91 |
+
"track_id": "bag_track",
|
| 92 |
+
"suite": "maniskill3",
|
| 93 |
+
"benchmark_task": "PutEggplantInBasketRetrievalProxy-v1",
|
| 94 |
+
"role": "target",
|
| 95 |
+
"eval_mode": "adapter_active_ft",
|
| 96 |
+
"seed": 17,
|
| 97 |
+
"episodes": 8,
|
| 98 |
+
"resolution": 224,
|
| 99 |
+
"cameras": [
|
| 100 |
+
"front",
|
| 101 |
+
"left",
|
| 102 |
+
"right"
|
| 103 |
+
],
|
| 104 |
+
"observation_stack": "rgb_triplicate_zero_depth",
|
| 105 |
+
"action_horizon": 8,
|
| 106 |
+
"action_space": "widowx_delta_pose",
|
| 107 |
+
"same_test_episodes": true
|
| 108 |
+
},
|
| 109 |
+
"proxy_notes": "Public ManiSkill bridge scene with custom retrieval initialization. The eggplant is placed inside the basket region and must be pulled back out to a staging zone.",
|
| 110 |
+
"train_spec": {
|
| 111 |
+
"track_id": "bag_track",
|
| 112 |
+
"suite": "maniskill3",
|
| 113 |
+
"benchmark_task": "PutEggplantInBasketRetrievalProxy-v1",
|
| 114 |
+
"model_variant": "adapter_active_ft",
|
| 115 |
+
"seed": 23,
|
| 116 |
+
"train_demos": 32,
|
| 117 |
+
"val_demos": 8,
|
| 118 |
+
"init_checkpoint_group": "/workspace/workspace/VLAarchtests2/VLAarchtests/artifacts/outputs/r3d_handoff_phase/proxy_interaction_r3d_stage3_clip_rgbd_handoff_compact_phase_seed17/checkpoint_best.pt",
|
| 119 |
+
"optimizer": "adamw",
|
| 120 |
+
"learning_rate": 0.0001,
|
| 121 |
+
"lr_schedule": "constant",
|
| 122 |
+
"batch_size": 4,
|
| 123 |
+
"augmentations": "none",
|
| 124 |
+
"early_stopping_metric": "val_total",
|
| 125 |
+
"max_gradient_steps": 114,
|
| 126 |
+
"unfreeze_scope": "fusion_memory_decoder",
|
| 127 |
+
"dataset_split_id": "bag_bridge_smoke_v1_dataset_seed17",
|
| 128 |
+
"same_data_policy": true,
|
| 129 |
+
"same_init_policy": true
|
| 130 |
+
}
|
| 131 |
+
}
|
reports/maniskill_bag_bridge_val_sweep_seed23/conservative/adapter_noop_seed23.json
ADDED
|
@@ -0,0 +1,110 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
{
|
| 2 |
+
"track_id": "bag_track",
|
| 3 |
+
"suite": "maniskill3",
|
| 4 |
+
"benchmark_task": "PutEggplantInBasketRetrievalProxy-v1",
|
| 5 |
+
"role": "target",
|
| 6 |
+
"adapter_mode": "adapter_noop",
|
| 7 |
+
"episodes": 8,
|
| 8 |
+
"successes": [
|
| 9 |
+
0,
|
| 10 |
+
0,
|
| 11 |
+
0,
|
| 12 |
+
1,
|
| 13 |
+
0,
|
| 14 |
+
0,
|
| 15 |
+
0,
|
| 16 |
+
0
|
| 17 |
+
],
|
| 18 |
+
"success_rate": 0.125,
|
| 19 |
+
"intervention_rate": 0.0,
|
| 20 |
+
"non_base_selection_rate": 0.0,
|
| 21 |
+
"steps_to_first_reveal_or_access": 1.0,
|
| 22 |
+
"steps_to_retrieve": 4.0,
|
| 23 |
+
"disturbance_proxy": 0.0,
|
| 24 |
+
"episode_records": [
|
| 25 |
+
{
|
| 26 |
+
"episode_seed": 171000,
|
| 27 |
+
"success": false,
|
| 28 |
+
"steps": 4,
|
| 29 |
+
"first_reveal_step": 1,
|
| 30 |
+
"first_retrieve_step": null,
|
| 31 |
+
"episode_disturbance": 0.0
|
| 32 |
+
},
|
| 33 |
+
{
|
| 34 |
+
"episode_seed": 171001,
|
| 35 |
+
"success": false,
|
| 36 |
+
"steps": 4,
|
| 37 |
+
"first_reveal_step": 1,
|
| 38 |
+
"first_retrieve_step": null,
|
| 39 |
+
"episode_disturbance": 0.0
|
| 40 |
+
},
|
| 41 |
+
{
|
| 42 |
+
"episode_seed": 171002,
|
| 43 |
+
"success": false,
|
| 44 |
+
"steps": 4,
|
| 45 |
+
"first_reveal_step": 1,
|
| 46 |
+
"first_retrieve_step": null,
|
| 47 |
+
"episode_disturbance": 0.0
|
| 48 |
+
},
|
| 49 |
+
{
|
| 50 |
+
"episode_seed": 171003,
|
| 51 |
+
"success": true,
|
| 52 |
+
"steps": 1,
|
| 53 |
+
"first_reveal_step": 1,
|
| 54 |
+
"first_retrieve_step": null,
|
| 55 |
+
"episode_disturbance": 0.0
|
| 56 |
+
},
|
| 57 |
+
{
|
| 58 |
+
"episode_seed": 171004,
|
| 59 |
+
"success": false,
|
| 60 |
+
"steps": 4,
|
| 61 |
+
"first_reveal_step": 1,
|
| 62 |
+
"first_retrieve_step": null,
|
| 63 |
+
"episode_disturbance": 0.0
|
| 64 |
+
},
|
| 65 |
+
{
|
| 66 |
+
"episode_seed": 171005,
|
| 67 |
+
"success": false,
|
| 68 |
+
"steps": 4,
|
| 69 |
+
"first_reveal_step": 1,
|
| 70 |
+
"first_retrieve_step": null,
|
| 71 |
+
"episode_disturbance": 0.0
|
| 72 |
+
},
|
| 73 |
+
{
|
| 74 |
+
"episode_seed": 171006,
|
| 75 |
+
"success": false,
|
| 76 |
+
"steps": 4,
|
| 77 |
+
"first_reveal_step": 1,
|
| 78 |
+
"first_retrieve_step": null,
|
| 79 |
+
"episode_disturbance": 0.0
|
| 80 |
+
},
|
| 81 |
+
{
|
| 82 |
+
"episode_seed": 171007,
|
| 83 |
+
"success": false,
|
| 84 |
+
"steps": 4,
|
| 85 |
+
"first_reveal_step": 1,
|
| 86 |
+
"first_retrieve_step": null,
|
| 87 |
+
"episode_disturbance": 0.0
|
| 88 |
+
}
|
| 89 |
+
],
|
| 90 |
+
"eval_protocol": {
|
| 91 |
+
"track_id": "bag_track",
|
| 92 |
+
"suite": "maniskill3",
|
| 93 |
+
"benchmark_task": "PutEggplantInBasketRetrievalProxy-v1",
|
| 94 |
+
"role": "target",
|
| 95 |
+
"eval_mode": "adapter_noop",
|
| 96 |
+
"seed": 17,
|
| 97 |
+
"episodes": 8,
|
| 98 |
+
"resolution": 224,
|
| 99 |
+
"cameras": [
|
| 100 |
+
"front",
|
| 101 |
+
"left",
|
| 102 |
+
"right"
|
| 103 |
+
],
|
| 104 |
+
"observation_stack": "rgb_triplicate_zero_depth",
|
| 105 |
+
"action_horizon": 8,
|
| 106 |
+
"action_space": "widowx_delta_pose",
|
| 107 |
+
"same_test_episodes": true
|
| 108 |
+
},
|
| 109 |
+
"proxy_notes": "Public ManiSkill bridge scene with custom retrieval initialization. The eggplant is placed inside the basket region and must be pulled back out to a staging zone."
|
| 110 |
+
}
|
reports/maniskill_bag_bridge_val_sweep_seed23/conservative/run.log
ADDED
|
@@ -0,0 +1,76 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
|
| 2 |
+
[1mCLIPModel LOAD REPORT[0m from: openai/clip-vit-base-patch32
|
| 3 |
+
Key | Status | |
|
| 4 |
+
-------------------------------------+------------+--+-
|
| 5 |
+
vision_model.embeddings.position_ids | UNEXPECTED | |
|
| 6 |
+
text_model.embeddings.position_ids | UNEXPECTED | |
|
| 7 |
+
|
| 8 |
+
Notes:
|
| 9 |
+
- UNEXPECTED: can be ignored when loading from different task/architecture; not ok if you expect identical arch.
|
| 10 |
+
CLIPTextTransformer does not expose input embeddings. Gradients cannot flow back to the token embeddings when using adapters or gradient checkpointing. Override `get_input_embeddings` to fully support those features, or set `_input_embed_layer` to the attribute name that holds the embeddings.
|
| 11 |
+
/usr/local/lib/python3.11/dist-packages/torch/nn/modules/transformer.py:307: UserWarning: enable_nested_tensor is True, but self.use_nested_tensor is False because encoder_layer.norm_first was True
|
| 12 |
+
warnings.warn(f"enable_nested_tensor is True, but self.use_nested_tensor is False because {why_not_sparsity_fast_path}")
|
| 13 |
+
[33;1m2026-04-01 11:27:44,182 - mani_skill - WARNING - Mimic targets dictionary is missing for controller config for widowx250s_bridgedataset_sink. Assuming the first joint is the control joint and the second joint is the mimic joint[0m
|
| 14 |
+
[33;1m2026-04-01 11:27:44,237 - mani_skill - WARNING - No initial pose set for actor builder of eggplant, setting to default pose q=[1,0,0,0], p=[0,0,0]. Not setting reasonable initial poses may slow down simulation, see https://github.com/haosulab/ManiSkill/issues/421.[0m
|
| 15 |
+
[33;1m2026-04-01 11:27:44,250 - mani_skill - WARNING - No initial pose set for actor builder of dummy_sink_target_plane, setting to default pose q=[1,0,0,0], p=[0,0,0]. Not setting reasonable initial poses may slow down simulation, see https://github.com/haosulab/ManiSkill/issues/421.[0m
|
| 16 |
+
[33;1m2026-04-01 11:27:44,918 - mani_skill - WARNING - Mimic targets dictionary is missing for controller config for widowx250s_bridgedataset_sink. Assuming the first joint is the control joint and the second joint is the mimic joint[0m
|
| 17 |
+
[33;1m2026-04-01 11:27:44,920 - mani_skill - WARNING - No initial pose set for actor builder of eggplant, setting to default pose q=[1,0,0,0], p=[0,0,0]. Not setting reasonable initial poses may slow down simulation, see https://github.com/haosulab/ManiSkill/issues/421.[0m
|
| 18 |
+
[33;1m2026-04-01 11:27:44,920 - mani_skill - WARNING - No initial pose set for actor builder of dummy_sink_target_plane, setting to default pose q=[1,0,0,0], p=[0,0,0]. Not setting reasonable initial poses may slow down simulation, see https://github.com/haosulab/ManiSkill/issues/421.[0m
|
| 19 |
+
/usr/local/lib/python3.11/dist-packages/gymnasium/core.py:311: UserWarning: [33mWARN: env.get_obs to get variables from other wrappers is deprecated and will be removed in v1.0, to get this variable you can do `env.unwrapped.get_obs` for environment variables or `env.get_wrapper_attr('get_obs')` that will search the reminding wrappers.[0m
|
| 20 |
+
logger.warn(
|
| 21 |
+
/usr/local/lib/python3.11/dist-packages/gymnasium/core.py:311: UserWarning: [33mWARN: env.get_info to get variables from other wrappers is deprecated and will be removed in v1.0, to get this variable you can do `env.unwrapped.get_info` for environment variables or `env.get_wrapper_attr('get_info')` that will search the reminding wrappers.[0m
|
| 22 |
+
logger.warn(
|
| 23 |
+
{"phase": "eval_episode_complete", "task": "bag", "adapter_mode": "trunk_only_ft", "episode_seed": 171000, "success": false, "steps": 4}
|
| 24 |
+
{"phase": "eval_episode_complete", "task": "bag", "adapter_mode": "trunk_only_ft", "episode_seed": 171001, "success": false, "steps": 4}
|
| 25 |
+
{"phase": "eval_episode_complete", "task": "bag", "adapter_mode": "trunk_only_ft", "episode_seed": 171002, "success": false, "steps": 4}
|
| 26 |
+
{"phase": "eval_episode_complete", "task": "bag", "adapter_mode": "trunk_only_ft", "episode_seed": 171003, "success": false, "steps": 4}
|
| 27 |
+
{"phase": "eval_episode_complete", "task": "bag", "adapter_mode": "trunk_only_ft", "episode_seed": 171004, "success": false, "steps": 4}
|
| 28 |
+
{"phase": "eval_episode_complete", "task": "bag", "adapter_mode": "trunk_only_ft", "episode_seed": 171005, "success": false, "steps": 4}
|
| 29 |
+
{"phase": "eval_episode_complete", "task": "bag", "adapter_mode": "trunk_only_ft", "episode_seed": 171006, "success": false, "steps": 4}
|
| 30 |
+
{"phase": "eval_episode_complete", "task": "bag", "adapter_mode": "trunk_only_ft", "episode_seed": 171007, "success": true, "steps": 1}
|
| 31 |
+
|
| 32 |
+
[1mCLIPModel LOAD REPORT[0m from: openai/clip-vit-base-patch32
|
| 33 |
+
Key | Status | |
|
| 34 |
+
-------------------------------------+------------+--+-
|
| 35 |
+
vision_model.embeddings.position_ids | UNEXPECTED | |
|
| 36 |
+
text_model.embeddings.position_ids | UNEXPECTED | |
|
| 37 |
+
|
| 38 |
+
Notes:
|
| 39 |
+
- UNEXPECTED: can be ignored when loading from different task/architecture; not ok if you expect identical arch.
|
| 40 |
+
[33;1m2026-04-01 11:28:17,937 - mani_skill - WARNING - Mimic targets dictionary is missing for controller config for widowx250s_bridgedataset_sink. Assuming the first joint is the control joint and the second joint is the mimic joint[0m
|
| 41 |
+
[33;1m2026-04-01 11:28:17,940 - mani_skill - WARNING - No initial pose set for actor builder of eggplant, setting to default pose q=[1,0,0,0], p=[0,0,0]. Not setting reasonable initial poses may slow down simulation, see https://github.com/haosulab/ManiSkill/issues/421.[0m
|
| 42 |
+
[33;1m2026-04-01 11:28:17,940 - mani_skill - WARNING - No initial pose set for actor builder of dummy_sink_target_plane, setting to default pose q=[1,0,0,0], p=[0,0,0]. Not setting reasonable initial poses may slow down simulation, see https://github.com/haosulab/ManiSkill/issues/421.[0m
|
| 43 |
+
[33;1m2026-04-01 11:28:18,161 - mani_skill - WARNING - Mimic targets dictionary is missing for controller config for widowx250s_bridgedataset_sink. Assuming the first joint is the control joint and the second joint is the mimic joint[0m
|
| 44 |
+
[33;1m2026-04-01 11:28:18,164 - mani_skill - WARNING - No initial pose set for actor builder of eggplant, setting to default pose q=[1,0,0,0], p=[0,0,0]. Not setting reasonable initial poses may slow down simulation, see https://github.com/haosulab/ManiSkill/issues/421.[0m
|
| 45 |
+
[33;1m2026-04-01 11:28:18,164 - mani_skill - WARNING - No initial pose set for actor builder of dummy_sink_target_plane, setting to default pose q=[1,0,0,0], p=[0,0,0]. Not setting reasonable initial poses may slow down simulation, see https://github.com/haosulab/ManiSkill/issues/421.[0m
|
| 46 |
+
{"phase": "eval_episode_complete", "task": "bag", "adapter_mode": "adapter_noop", "episode_seed": 171000, "success": false, "steps": 4}
|
| 47 |
+
{"phase": "eval_episode_complete", "task": "bag", "adapter_mode": "adapter_noop", "episode_seed": 171001, "success": false, "steps": 4}
|
| 48 |
+
{"phase": "eval_episode_complete", "task": "bag", "adapter_mode": "adapter_noop", "episode_seed": 171002, "success": false, "steps": 4}
|
| 49 |
+
{"phase": "eval_episode_complete", "task": "bag", "adapter_mode": "adapter_noop", "episode_seed": 171003, "success": true, "steps": 1}
|
| 50 |
+
{"phase": "eval_episode_complete", "task": "bag", "adapter_mode": "adapter_noop", "episode_seed": 171004, "success": false, "steps": 4}
|
| 51 |
+
{"phase": "eval_episode_complete", "task": "bag", "adapter_mode": "adapter_noop", "episode_seed": 171005, "success": false, "steps": 4}
|
| 52 |
+
{"phase": "eval_episode_complete", "task": "bag", "adapter_mode": "adapter_noop", "episode_seed": 171006, "success": false, "steps": 4}
|
| 53 |
+
{"phase": "eval_episode_complete", "task": "bag", "adapter_mode": "adapter_noop", "episode_seed": 171007, "success": false, "steps": 4}
|
| 54 |
+
|
| 55 |
+
[1mCLIPModel LOAD REPORT[0m from: openai/clip-vit-base-patch32
|
| 56 |
+
Key | Status | |
|
| 57 |
+
-------------------------------------+------------+--+-
|
| 58 |
+
vision_model.embeddings.position_ids | UNEXPECTED | |
|
| 59 |
+
text_model.embeddings.position_ids | UNEXPECTED | |
|
| 60 |
+
|
| 61 |
+
Notes:
|
| 62 |
+
- UNEXPECTED: can be ignored when loading from different task/architecture; not ok if you expect identical arch.
|
| 63 |
+
[33;1m2026-04-01 11:28:46,030 - mani_skill - WARNING - Mimic targets dictionary is missing for controller config for widowx250s_bridgedataset_sink. Assuming the first joint is the control joint and the second joint is the mimic joint[0m
|
| 64 |
+
[33;1m2026-04-01 11:28:46,032 - mani_skill - WARNING - No initial pose set for actor builder of eggplant, setting to default pose q=[1,0,0,0], p=[0,0,0]. Not setting reasonable initial poses may slow down simulation, see https://github.com/haosulab/ManiSkill/issues/421.[0m
|
| 65 |
+
[33;1m2026-04-01 11:28:46,033 - mani_skill - WARNING - No initial pose set for actor builder of dummy_sink_target_plane, setting to default pose q=[1,0,0,0], p=[0,0,0]. Not setting reasonable initial poses may slow down simulation, see https://github.com/haosulab/ManiSkill/issues/421.[0m
|
| 66 |
+
[33;1m2026-04-01 11:28:46,254 - mani_skill - WARNING - Mimic targets dictionary is missing for controller config for widowx250s_bridgedataset_sink. Assuming the first joint is the control joint and the second joint is the mimic joint[0m
|
| 67 |
+
[33;1m2026-04-01 11:28:46,257 - mani_skill - WARNING - No initial pose set for actor builder of eggplant, setting to default pose q=[1,0,0,0], p=[0,0,0]. Not setting reasonable initial poses may slow down simulation, see https://github.com/haosulab/ManiSkill/issues/421.[0m
|
| 68 |
+
[33;1m2026-04-01 11:28:46,257 - mani_skill - WARNING - No initial pose set for actor builder of dummy_sink_target_plane, setting to default pose q=[1,0,0,0], p=[0,0,0]. Not setting reasonable initial poses may slow down simulation, see https://github.com/haosulab/ManiSkill/issues/421.[0m
|
| 69 |
+
{"phase": "eval_episode_complete", "task": "bag", "adapter_mode": "adapter_active_ft", "episode_seed": 171000, "success": false, "steps": 4}
|
| 70 |
+
{"phase": "eval_episode_complete", "task": "bag", "adapter_mode": "adapter_active_ft", "episode_seed": 171001, "success": false, "steps": 4}
|
| 71 |
+
{"phase": "eval_episode_complete", "task": "bag", "adapter_mode": "adapter_active_ft", "episode_seed": 171002, "success": false, "steps": 4}
|
| 72 |
+
{"phase": "eval_episode_complete", "task": "bag", "adapter_mode": "adapter_active_ft", "episode_seed": 171003, "success": true, "steps": 1}
|
| 73 |
+
{"phase": "eval_episode_complete", "task": "bag", "adapter_mode": "adapter_active_ft", "episode_seed": 171004, "success": false, "steps": 4}
|
| 74 |
+
{"phase": "eval_episode_complete", "task": "bag", "adapter_mode": "adapter_active_ft", "episode_seed": 171005, "success": false, "steps": 4}
|
| 75 |
+
{"phase": "eval_episode_complete", "task": "bag", "adapter_mode": "adapter_active_ft", "episode_seed": 171006, "success": false, "steps": 4}
|
| 76 |
+
{"phase": "eval_episode_complete", "task": "bag", "adapter_mode": "adapter_active_ft", "episode_seed": 171007, "success": false, "steps": 4}
|
reports/maniskill_bag_bridge_val_sweep_seed23/default/adapter_active_ft_seed23.json
ADDED
|
@@ -0,0 +1,131 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
{
|
| 2 |
+
"track_id": "bag_track",
|
| 3 |
+
"suite": "maniskill3",
|
| 4 |
+
"benchmark_task": "PutEggplantInBasketRetrievalProxy-v1",
|
| 5 |
+
"role": "target",
|
| 6 |
+
"adapter_mode": "adapter_active_ft",
|
| 7 |
+
"episodes": 8,
|
| 8 |
+
"successes": [
|
| 9 |
+
0,
|
| 10 |
+
0,
|
| 11 |
+
0,
|
| 12 |
+
0,
|
| 13 |
+
0,
|
| 14 |
+
0,
|
| 15 |
+
0,
|
| 16 |
+
0
|
| 17 |
+
],
|
| 18 |
+
"success_rate": 0.0,
|
| 19 |
+
"intervention_rate": 1.0,
|
| 20 |
+
"non_base_selection_rate": 1.0,
|
| 21 |
+
"steps_to_first_reveal_or_access": 1.0,
|
| 22 |
+
"steps_to_retrieve": 4.0,
|
| 23 |
+
"disturbance_proxy": 0.0,
|
| 24 |
+
"episode_records": [
|
| 25 |
+
{
|
| 26 |
+
"episode_seed": 171000,
|
| 27 |
+
"success": false,
|
| 28 |
+
"steps": 4,
|
| 29 |
+
"first_reveal_step": 1,
|
| 30 |
+
"first_retrieve_step": null,
|
| 31 |
+
"episode_disturbance": 0.0
|
| 32 |
+
},
|
| 33 |
+
{
|
| 34 |
+
"episode_seed": 171001,
|
| 35 |
+
"success": false,
|
| 36 |
+
"steps": 4,
|
| 37 |
+
"first_reveal_step": 1,
|
| 38 |
+
"first_retrieve_step": null,
|
| 39 |
+
"episode_disturbance": 0.0
|
| 40 |
+
},
|
| 41 |
+
{
|
| 42 |
+
"episode_seed": 171002,
|
| 43 |
+
"success": false,
|
| 44 |
+
"steps": 4,
|
| 45 |
+
"first_reveal_step": 1,
|
| 46 |
+
"first_retrieve_step": null,
|
| 47 |
+
"episode_disturbance": 0.0
|
| 48 |
+
},
|
| 49 |
+
{
|
| 50 |
+
"episode_seed": 171003,
|
| 51 |
+
"success": false,
|
| 52 |
+
"steps": 4,
|
| 53 |
+
"first_reveal_step": 1,
|
| 54 |
+
"first_retrieve_step": null,
|
| 55 |
+
"episode_disturbance": 0.0
|
| 56 |
+
},
|
| 57 |
+
{
|
| 58 |
+
"episode_seed": 171004,
|
| 59 |
+
"success": false,
|
| 60 |
+
"steps": 4,
|
| 61 |
+
"first_reveal_step": 1,
|
| 62 |
+
"first_retrieve_step": null,
|
| 63 |
+
"episode_disturbance": 0.0
|
| 64 |
+
},
|
| 65 |
+
{
|
| 66 |
+
"episode_seed": 171005,
|
| 67 |
+
"success": false,
|
| 68 |
+
"steps": 4,
|
| 69 |
+
"first_reveal_step": 1,
|
| 70 |
+
"first_retrieve_step": null,
|
| 71 |
+
"episode_disturbance": 0.0
|
| 72 |
+
},
|
| 73 |
+
{
|
| 74 |
+
"episode_seed": 171006,
|
| 75 |
+
"success": false,
|
| 76 |
+
"steps": 4,
|
| 77 |
+
"first_reveal_step": 1,
|
| 78 |
+
"first_retrieve_step": null,
|
| 79 |
+
"episode_disturbance": 0.0
|
| 80 |
+
},
|
| 81 |
+
{
|
| 82 |
+
"episode_seed": 171007,
|
| 83 |
+
"success": false,
|
| 84 |
+
"steps": 4,
|
| 85 |
+
"first_reveal_step": 1,
|
| 86 |
+
"first_retrieve_step": null,
|
| 87 |
+
"episode_disturbance": 0.0
|
| 88 |
+
}
|
| 89 |
+
],
|
| 90 |
+
"eval_protocol": {
|
| 91 |
+
"track_id": "bag_track",
|
| 92 |
+
"suite": "maniskill3",
|
| 93 |
+
"benchmark_task": "PutEggplantInBasketRetrievalProxy-v1",
|
| 94 |
+
"role": "target",
|
| 95 |
+
"eval_mode": "adapter_active_ft",
|
| 96 |
+
"seed": 17,
|
| 97 |
+
"episodes": 8,
|
| 98 |
+
"resolution": 224,
|
| 99 |
+
"cameras": [
|
| 100 |
+
"front",
|
| 101 |
+
"left",
|
| 102 |
+
"right"
|
| 103 |
+
],
|
| 104 |
+
"observation_stack": "rgb_triplicate_zero_depth",
|
| 105 |
+
"action_horizon": 8,
|
| 106 |
+
"action_space": "widowx_delta_pose",
|
| 107 |
+
"same_test_episodes": true
|
| 108 |
+
},
|
| 109 |
+
"proxy_notes": "Public ManiSkill bridge scene with custom retrieval initialization. The eggplant is placed inside the basket region and must be pulled back out to a staging zone.",
|
| 110 |
+
"train_spec": {
|
| 111 |
+
"track_id": "bag_track",
|
| 112 |
+
"suite": "maniskill3",
|
| 113 |
+
"benchmark_task": "PutEggplantInBasketRetrievalProxy-v1",
|
| 114 |
+
"model_variant": "adapter_active_ft",
|
| 115 |
+
"seed": 23,
|
| 116 |
+
"train_demos": 32,
|
| 117 |
+
"val_demos": 8,
|
| 118 |
+
"init_checkpoint_group": "/workspace/workspace/VLAarchtests2/VLAarchtests/artifacts/outputs/r3d_handoff_phase/proxy_interaction_r3d_stage3_clip_rgbd_handoff_compact_phase_seed17/checkpoint_best.pt",
|
| 119 |
+
"optimizer": "adamw",
|
| 120 |
+
"learning_rate": 0.0001,
|
| 121 |
+
"lr_schedule": "constant",
|
| 122 |
+
"batch_size": 4,
|
| 123 |
+
"augmentations": "none",
|
| 124 |
+
"early_stopping_metric": "val_total",
|
| 125 |
+
"max_gradient_steps": 114,
|
| 126 |
+
"unfreeze_scope": "fusion_memory_decoder",
|
| 127 |
+
"dataset_split_id": "bag_bridge_smoke_v1_dataset_seed17",
|
| 128 |
+
"same_data_policy": true,
|
| 129 |
+
"same_init_policy": true
|
| 130 |
+
}
|
| 131 |
+
}
|
reports/maniskill_bag_bridge_val_sweep_seed23/default/adapter_noop_seed23.json
ADDED
|
@@ -0,0 +1,110 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
{
|
| 2 |
+
"track_id": "bag_track",
|
| 3 |
+
"suite": "maniskill3",
|
| 4 |
+
"benchmark_task": "PutEggplantInBasketRetrievalProxy-v1",
|
| 5 |
+
"role": "target",
|
| 6 |
+
"adapter_mode": "adapter_noop",
|
| 7 |
+
"episodes": 8,
|
| 8 |
+
"successes": [
|
| 9 |
+
0,
|
| 10 |
+
0,
|
| 11 |
+
0,
|
| 12 |
+
1,
|
| 13 |
+
0,
|
| 14 |
+
0,
|
| 15 |
+
0,
|
| 16 |
+
0
|
| 17 |
+
],
|
| 18 |
+
"success_rate": 0.125,
|
| 19 |
+
"intervention_rate": 0.0,
|
| 20 |
+
"non_base_selection_rate": 0.0,
|
| 21 |
+
"steps_to_first_reveal_or_access": 1.0,
|
| 22 |
+
"steps_to_retrieve": 4.0,
|
| 23 |
+
"disturbance_proxy": 0.0,
|
| 24 |
+
"episode_records": [
|
| 25 |
+
{
|
| 26 |
+
"episode_seed": 171000,
|
| 27 |
+
"success": false,
|
| 28 |
+
"steps": 4,
|
| 29 |
+
"first_reveal_step": 1,
|
| 30 |
+
"first_retrieve_step": null,
|
| 31 |
+
"episode_disturbance": 0.0
|
| 32 |
+
},
|
| 33 |
+
{
|
| 34 |
+
"episode_seed": 171001,
|
| 35 |
+
"success": false,
|
| 36 |
+
"steps": 4,
|
| 37 |
+
"first_reveal_step": 1,
|
| 38 |
+
"first_retrieve_step": null,
|
| 39 |
+
"episode_disturbance": 0.0
|
| 40 |
+
},
|
| 41 |
+
{
|
| 42 |
+
"episode_seed": 171002,
|
| 43 |
+
"success": false,
|
| 44 |
+
"steps": 4,
|
| 45 |
+
"first_reveal_step": 1,
|
| 46 |
+
"first_retrieve_step": null,
|
| 47 |
+
"episode_disturbance": 0.0
|
| 48 |
+
},
|
| 49 |
+
{
|
| 50 |
+
"episode_seed": 171003,
|
| 51 |
+
"success": true,
|
| 52 |
+
"steps": 1,
|
| 53 |
+
"first_reveal_step": 1,
|
| 54 |
+
"first_retrieve_step": null,
|
| 55 |
+
"episode_disturbance": 0.0
|
| 56 |
+
},
|
| 57 |
+
{
|
| 58 |
+
"episode_seed": 171004,
|
| 59 |
+
"success": false,
|
| 60 |
+
"steps": 4,
|
| 61 |
+
"first_reveal_step": 1,
|
| 62 |
+
"first_retrieve_step": null,
|
| 63 |
+
"episode_disturbance": 0.0
|
| 64 |
+
},
|
| 65 |
+
{
|
| 66 |
+
"episode_seed": 171005,
|
| 67 |
+
"success": false,
|
| 68 |
+
"steps": 4,
|
| 69 |
+
"first_reveal_step": 1,
|
| 70 |
+
"first_retrieve_step": null,
|
| 71 |
+
"episode_disturbance": 0.0
|
| 72 |
+
},
|
| 73 |
+
{
|
| 74 |
+
"episode_seed": 171006,
|
| 75 |
+
"success": false,
|
| 76 |
+
"steps": 4,
|
| 77 |
+
"first_reveal_step": 1,
|
| 78 |
+
"first_retrieve_step": null,
|
| 79 |
+
"episode_disturbance": 0.0
|
| 80 |
+
},
|
| 81 |
+
{
|
| 82 |
+
"episode_seed": 171007,
|
| 83 |
+
"success": false,
|
| 84 |
+
"steps": 4,
|
| 85 |
+
"first_reveal_step": 1,
|
| 86 |
+
"first_retrieve_step": null,
|
| 87 |
+
"episode_disturbance": 0.0
|
| 88 |
+
}
|
| 89 |
+
],
|
| 90 |
+
"eval_protocol": {
|
| 91 |
+
"track_id": "bag_track",
|
| 92 |
+
"suite": "maniskill3",
|
| 93 |
+
"benchmark_task": "PutEggplantInBasketRetrievalProxy-v1",
|
| 94 |
+
"role": "target",
|
| 95 |
+
"eval_mode": "adapter_noop",
|
| 96 |
+
"seed": 17,
|
| 97 |
+
"episodes": 8,
|
| 98 |
+
"resolution": 224,
|
| 99 |
+
"cameras": [
|
| 100 |
+
"front",
|
| 101 |
+
"left",
|
| 102 |
+
"right"
|
| 103 |
+
],
|
| 104 |
+
"observation_stack": "rgb_triplicate_zero_depth",
|
| 105 |
+
"action_horizon": 8,
|
| 106 |
+
"action_space": "widowx_delta_pose",
|
| 107 |
+
"same_test_episodes": true
|
| 108 |
+
},
|
| 109 |
+
"proxy_notes": "Public ManiSkill bridge scene with custom retrieval initialization. The eggplant is placed inside the basket region and must be pulled back out to a staging zone."
|
| 110 |
+
}
|
reports/maniskill_bag_bridge_val_sweep_seed23/default/public_benchmark_package_summary.json
ADDED
|
@@ -0,0 +1,60 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
{
|
| 2 |
+
"anchor_pass": true,
|
| 3 |
+
"available_tracks": [
|
| 4 |
+
"bag_track"
|
| 5 |
+
],
|
| 6 |
+
"ci_above_zero_tracks": [],
|
| 7 |
+
"headline_pass": false,
|
| 8 |
+
"package_name": "public_reveal_retrieve_package_v1",
|
| 9 |
+
"sign_of_life_pass": false,
|
| 10 |
+
"sign_of_life_track_count": 0,
|
| 11 |
+
"sign_of_life_tracks": [],
|
| 12 |
+
"target_macro_average_delta": -0.125,
|
| 13 |
+
"tracks": {
|
| 14 |
+
"bag_track": {
|
| 15 |
+
"benchmark_task": "PutEggplantInBasketRetrievalProxy-v1",
|
| 16 |
+
"delta_active_vs_trunk": -0.125,
|
| 17 |
+
"delta_active_vs_trunk_ci95": [
|
| 18 |
+
-0.375,
|
| 19 |
+
0.0
|
| 20 |
+
],
|
| 21 |
+
"delta_noop_vs_trunk": 0.0,
|
| 22 |
+
"modes": {
|
| 23 |
+
"adapter_active_ft": {
|
| 24 |
+
"disturbance_proxy": 0.0,
|
| 25 |
+
"intervention_rate": 1.0,
|
| 26 |
+
"mean_success": 0.0,
|
| 27 |
+
"non_base_selection_rate": 1.0,
|
| 28 |
+
"num_runs": 1,
|
| 29 |
+
"steps_to_first_reveal_or_access": 1.0,
|
| 30 |
+
"steps_to_retrieve": 4.0
|
| 31 |
+
},
|
| 32 |
+
"adapter_noop": {
|
| 33 |
+
"disturbance_proxy": 0.0,
|
| 34 |
+
"intervention_rate": 0.0,
|
| 35 |
+
"mean_success": 0.125,
|
| 36 |
+
"non_base_selection_rate": 0.0,
|
| 37 |
+
"num_runs": 1,
|
| 38 |
+
"steps_to_first_reveal_or_access": 1.0,
|
| 39 |
+
"steps_to_retrieve": 4.0
|
| 40 |
+
},
|
| 41 |
+
"trunk_only_ft": {
|
| 42 |
+
"disturbance_proxy": 0.0,
|
| 43 |
+
"intervention_rate": 0.0,
|
| 44 |
+
"mean_success": 0.125,
|
| 45 |
+
"non_base_selection_rate": 0.0,
|
| 46 |
+
"num_runs": 1,
|
| 47 |
+
"steps_to_first_reveal_or_access": 1.0,
|
| 48 |
+
"steps_to_retrieve": 4.0
|
| 49 |
+
}
|
| 50 |
+
},
|
| 51 |
+
"notes": "Public ManiSkill bridge scene with custom retrieval initialization. The eggplant is placed inside the basket region and must be pulled back out to a staging zone.",
|
| 52 |
+
"public_source": "ManiSkill public scene proxy: PutEggplantInBasketScene-v1",
|
| 53 |
+
"role": "target",
|
| 54 |
+
"signs_of_life": false,
|
| 55 |
+
"suite": "maniskill3",
|
| 56 |
+
"target_behavior": "retrieve the target object from inside the basket and stage it outside the basket",
|
| 57 |
+
"task_family": "bag_retrieval_proxy"
|
| 58 |
+
}
|
| 59 |
+
}
|
| 60 |
+
}
|
reports/maniskill_bag_bridge_val_sweep_seed23/default/public_benchmark_package_summary.md
ADDED
|
@@ -0,0 +1,15 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
# ManiSkill Bag Retrieval Smoke Summary
|
| 2 |
+
|
| 3 |
+
- benchmark_task: PutEggplantInBasketRetrievalProxy-v1
|
| 4 |
+
- target_macro_average_delta: -0.125
|
| 5 |
+
- headline_pass: False
|
| 6 |
+
- sign_of_life_pass: False
|
| 7 |
+
|
| 8 |
+
## bag_track
|
| 9 |
+
- delta_active_vs_trunk: -0.125
|
| 10 |
+
- delta_noop_vs_trunk: 0.000
|
| 11 |
+
- signs_of_life: False
|
| 12 |
+
- delta_active_vs_trunk_ci95: [-0.375, 0.000]
|
| 13 |
+
- trunk_only_ft: mean_success=0.125
|
| 14 |
+
- adapter_noop: mean_success=0.125
|
| 15 |
+
- adapter_active_ft: mean_success=0.000
|
reports/maniskill_bag_bridge_val_sweep_seed23/default/run.log
ADDED
|
@@ -0,0 +1,76 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
|
| 2 |
+
[1mCLIPModel LOAD REPORT[0m from: openai/clip-vit-base-patch32
|
| 3 |
+
Key | Status | |
|
| 4 |
+
-------------------------------------+------------+--+-
|
| 5 |
+
vision_model.embeddings.position_ids | UNEXPECTED | |
|
| 6 |
+
text_model.embeddings.position_ids | UNEXPECTED | |
|
| 7 |
+
|
| 8 |
+
Notes:
|
| 9 |
+
- UNEXPECTED: can be ignored when loading from different task/architecture; not ok if you expect identical arch.
|
| 10 |
+
CLIPTextTransformer does not expose input embeddings. Gradients cannot flow back to the token embeddings when using adapters or gradient checkpointing. Override `get_input_embeddings` to fully support those features, or set `_input_embed_layer` to the attribute name that holds the embeddings.
|
| 11 |
+
/usr/local/lib/python3.11/dist-packages/torch/nn/modules/transformer.py:307: UserWarning: enable_nested_tensor is True, but self.use_nested_tensor is False because encoder_layer.norm_first was True
|
| 12 |
+
warnings.warn(f"enable_nested_tensor is True, but self.use_nested_tensor is False because {why_not_sparsity_fast_path}")
|
| 13 |
+
[33;1m2026-04-01 11:24:45,511 - mani_skill - WARNING - Mimic targets dictionary is missing for controller config for widowx250s_bridgedataset_sink. Assuming the first joint is the control joint and the second joint is the mimic joint[0m
|
| 14 |
+
[33;1m2026-04-01 11:24:45,572 - mani_skill - WARNING - No initial pose set for actor builder of eggplant, setting to default pose q=[1,0,0,0], p=[0,0,0]. Not setting reasonable initial poses may slow down simulation, see https://github.com/haosulab/ManiSkill/issues/421.[0m
|
| 15 |
+
[33;1m2026-04-01 11:24:45,576 - mani_skill - WARNING - No initial pose set for actor builder of dummy_sink_target_plane, setting to default pose q=[1,0,0,0], p=[0,0,0]. Not setting reasonable initial poses may slow down simulation, see https://github.com/haosulab/ManiSkill/issues/421.[0m
|
| 16 |
+
[33;1m2026-04-01 11:24:46,297 - mani_skill - WARNING - Mimic targets dictionary is missing for controller config for widowx250s_bridgedataset_sink. Assuming the first joint is the control joint and the second joint is the mimic joint[0m
|
| 17 |
+
[33;1m2026-04-01 11:24:46,300 - mani_skill - WARNING - No initial pose set for actor builder of eggplant, setting to default pose q=[1,0,0,0], p=[0,0,0]. Not setting reasonable initial poses may slow down simulation, see https://github.com/haosulab/ManiSkill/issues/421.[0m
|
| 18 |
+
[33;1m2026-04-01 11:24:46,300 - mani_skill - WARNING - No initial pose set for actor builder of dummy_sink_target_plane, setting to default pose q=[1,0,0,0], p=[0,0,0]. Not setting reasonable initial poses may slow down simulation, see https://github.com/haosulab/ManiSkill/issues/421.[0m
|
| 19 |
+
/usr/local/lib/python3.11/dist-packages/gymnasium/core.py:311: UserWarning: [33mWARN: env.get_obs to get variables from other wrappers is deprecated and will be removed in v1.0, to get this variable you can do `env.unwrapped.get_obs` for environment variables or `env.get_wrapper_attr('get_obs')` that will search the reminding wrappers.[0m
|
| 20 |
+
logger.warn(
|
| 21 |
+
/usr/local/lib/python3.11/dist-packages/gymnasium/core.py:311: UserWarning: [33mWARN: env.get_info to get variables from other wrappers is deprecated and will be removed in v1.0, to get this variable you can do `env.unwrapped.get_info` for environment variables or `env.get_wrapper_attr('get_info')` that will search the reminding wrappers.[0m
|
| 22 |
+
logger.warn(
|
| 23 |
+
{"phase": "eval_episode_complete", "task": "bag", "adapter_mode": "trunk_only_ft", "episode_seed": 171000, "success": false, "steps": 4}
|
| 24 |
+
{"phase": "eval_episode_complete", "task": "bag", "adapter_mode": "trunk_only_ft", "episode_seed": 171001, "success": false, "steps": 4}
|
| 25 |
+
{"phase": "eval_episode_complete", "task": "bag", "adapter_mode": "trunk_only_ft", "episode_seed": 171002, "success": false, "steps": 4}
|
| 26 |
+
{"phase": "eval_episode_complete", "task": "bag", "adapter_mode": "trunk_only_ft", "episode_seed": 171003, "success": false, "steps": 4}
|
| 27 |
+
{"phase": "eval_episode_complete", "task": "bag", "adapter_mode": "trunk_only_ft", "episode_seed": 171004, "success": false, "steps": 4}
|
| 28 |
+
{"phase": "eval_episode_complete", "task": "bag", "adapter_mode": "trunk_only_ft", "episode_seed": 171005, "success": false, "steps": 4}
|
| 29 |
+
{"phase": "eval_episode_complete", "task": "bag", "adapter_mode": "trunk_only_ft", "episode_seed": 171006, "success": false, "steps": 4}
|
| 30 |
+
{"phase": "eval_episode_complete", "task": "bag", "adapter_mode": "trunk_only_ft", "episode_seed": 171007, "success": true, "steps": 1}
|
| 31 |
+
|
| 32 |
+
[1mCLIPModel LOAD REPORT[0m from: openai/clip-vit-base-patch32
|
| 33 |
+
Key | Status | |
|
| 34 |
+
-------------------------------------+------------+--+-
|
| 35 |
+
vision_model.embeddings.position_ids | UNEXPECTED | |
|
| 36 |
+
text_model.embeddings.position_ids | UNEXPECTED | |
|
| 37 |
+
|
| 38 |
+
Notes:
|
| 39 |
+
- UNEXPECTED: can be ignored when loading from different task/architecture; not ok if you expect identical arch.
|
| 40 |
+
[33;1m2026-04-01 11:25:18,652 - mani_skill - WARNING - Mimic targets dictionary is missing for controller config for widowx250s_bridgedataset_sink. Assuming the first joint is the control joint and the second joint is the mimic joint[0m
|
| 41 |
+
[33;1m2026-04-01 11:25:18,655 - mani_skill - WARNING - No initial pose set for actor builder of eggplant, setting to default pose q=[1,0,0,0], p=[0,0,0]. Not setting reasonable initial poses may slow down simulation, see https://github.com/haosulab/ManiSkill/issues/421.[0m
|
| 42 |
+
[33;1m2026-04-01 11:25:18,655 - mani_skill - WARNING - No initial pose set for actor builder of dummy_sink_target_plane, setting to default pose q=[1,0,0,0], p=[0,0,0]. Not setting reasonable initial poses may slow down simulation, see https://github.com/haosulab/ManiSkill/issues/421.[0m
|
| 43 |
+
[33;1m2026-04-01 11:25:18,873 - mani_skill - WARNING - Mimic targets dictionary is missing for controller config for widowx250s_bridgedataset_sink. Assuming the first joint is the control joint and the second joint is the mimic joint[0m
|
| 44 |
+
[33;1m2026-04-01 11:25:18,875 - mani_skill - WARNING - No initial pose set for actor builder of eggplant, setting to default pose q=[1,0,0,0], p=[0,0,0]. Not setting reasonable initial poses may slow down simulation, see https://github.com/haosulab/ManiSkill/issues/421.[0m
|
| 45 |
+
[33;1m2026-04-01 11:25:18,875 - mani_skill - WARNING - No initial pose set for actor builder of dummy_sink_target_plane, setting to default pose q=[1,0,0,0], p=[0,0,0]. Not setting reasonable initial poses may slow down simulation, see https://github.com/haosulab/ManiSkill/issues/421.[0m
|
| 46 |
+
{"phase": "eval_episode_complete", "task": "bag", "adapter_mode": "adapter_noop", "episode_seed": 171000, "success": false, "steps": 4}
|
| 47 |
+
{"phase": "eval_episode_complete", "task": "bag", "adapter_mode": "adapter_noop", "episode_seed": 171001, "success": false, "steps": 4}
|
| 48 |
+
{"phase": "eval_episode_complete", "task": "bag", "adapter_mode": "adapter_noop", "episode_seed": 171002, "success": false, "steps": 4}
|
| 49 |
+
{"phase": "eval_episode_complete", "task": "bag", "adapter_mode": "adapter_noop", "episode_seed": 171003, "success": true, "steps": 1}
|
| 50 |
+
{"phase": "eval_episode_complete", "task": "bag", "adapter_mode": "adapter_noop", "episode_seed": 171004, "success": false, "steps": 4}
|
| 51 |
+
{"phase": "eval_episode_complete", "task": "bag", "adapter_mode": "adapter_noop", "episode_seed": 171005, "success": false, "steps": 4}
|
| 52 |
+
{"phase": "eval_episode_complete", "task": "bag", "adapter_mode": "adapter_noop", "episode_seed": 171006, "success": false, "steps": 4}
|
| 53 |
+
{"phase": "eval_episode_complete", "task": "bag", "adapter_mode": "adapter_noop", "episode_seed": 171007, "success": false, "steps": 4}
|
| 54 |
+
|
| 55 |
+
[1mCLIPModel LOAD REPORT[0m from: openai/clip-vit-base-patch32
|
| 56 |
+
Key | Status | |
|
| 57 |
+
-------------------------------------+------------+--+-
|
| 58 |
+
vision_model.embeddings.position_ids | UNEXPECTED | |
|
| 59 |
+
text_model.embeddings.position_ids | UNEXPECTED | |
|
| 60 |
+
|
| 61 |
+
Notes:
|
| 62 |
+
- UNEXPECTED: can be ignored when loading from different task/architecture; not ok if you expect identical arch.
|
| 63 |
+
[33;1m2026-04-01 11:25:46,337 - mani_skill - WARNING - Mimic targets dictionary is missing for controller config for widowx250s_bridgedataset_sink. Assuming the first joint is the control joint and the second joint is the mimic joint[0m
|
| 64 |
+
[33;1m2026-04-01 11:25:46,339 - mani_skill - WARNING - No initial pose set for actor builder of eggplant, setting to default pose q=[1,0,0,0], p=[0,0,0]. Not setting reasonable initial poses may slow down simulation, see https://github.com/haosulab/ManiSkill/issues/421.[0m
|
| 65 |
+
[33;1m2026-04-01 11:25:46,339 - mani_skill - WARNING - No initial pose set for actor builder of dummy_sink_target_plane, setting to default pose q=[1,0,0,0], p=[0,0,0]. Not setting reasonable initial poses may slow down simulation, see https://github.com/haosulab/ManiSkill/issues/421.[0m
|
| 66 |
+
[33;1m2026-04-01 11:25:46,556 - mani_skill - WARNING - Mimic targets dictionary is missing for controller config for widowx250s_bridgedataset_sink. Assuming the first joint is the control joint and the second joint is the mimic joint[0m
|
| 67 |
+
[33;1m2026-04-01 11:25:46,558 - mani_skill - WARNING - No initial pose set for actor builder of eggplant, setting to default pose q=[1,0,0,0], p=[0,0,0]. Not setting reasonable initial poses may slow down simulation, see https://github.com/haosulab/ManiSkill/issues/421.[0m
|
| 68 |
+
[33;1m2026-04-01 11:25:46,559 - mani_skill - WARNING - No initial pose set for actor builder of dummy_sink_target_plane, setting to default pose q=[1,0,0,0], p=[0,0,0]. Not setting reasonable initial poses may slow down simulation, see https://github.com/haosulab/ManiSkill/issues/421.[0m
|
| 69 |
+
{"phase": "eval_episode_complete", "task": "bag", "adapter_mode": "adapter_active_ft", "episode_seed": 171000, "success": false, "steps": 4}
|
| 70 |
+
{"phase": "eval_episode_complete", "task": "bag", "adapter_mode": "adapter_active_ft", "episode_seed": 171001, "success": false, "steps": 4}
|
| 71 |
+
{"phase": "eval_episode_complete", "task": "bag", "adapter_mode": "adapter_active_ft", "episode_seed": 171002, "success": false, "steps": 4}
|
| 72 |
+
{"phase": "eval_episode_complete", "task": "bag", "adapter_mode": "adapter_active_ft", "episode_seed": 171003, "success": false, "steps": 4}
|
| 73 |
+
{"phase": "eval_episode_complete", "task": "bag", "adapter_mode": "adapter_active_ft", "episode_seed": 171004, "success": false, "steps": 4}
|
| 74 |
+
{"phase": "eval_episode_complete", "task": "bag", "adapter_mode": "adapter_active_ft", "episode_seed": 171005, "success": false, "steps": 4}
|
| 75 |
+
{"phase": "eval_episode_complete", "task": "bag", "adapter_mode": "adapter_active_ft", "episode_seed": 171006, "success": false, "steps": 4}
|
| 76 |
+
{"phase": "eval_episode_complete", "task": "bag", "adapter_mode": "adapter_active_ft", "episode_seed": 171007, "success": false, "steps": 4}
|
reports/maniskill_bag_bridge_val_sweep_seed23/default/trunk_only_ft_seed23.json
ADDED
|
@@ -0,0 +1,131 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
{
|
| 2 |
+
"track_id": "bag_track",
|
| 3 |
+
"suite": "maniskill3",
|
| 4 |
+
"benchmark_task": "PutEggplantInBasketRetrievalProxy-v1",
|
| 5 |
+
"role": "target",
|
| 6 |
+
"adapter_mode": "trunk_only_ft",
|
| 7 |
+
"episodes": 8,
|
| 8 |
+
"successes": [
|
| 9 |
+
0,
|
| 10 |
+
0,
|
| 11 |
+
0,
|
| 12 |
+
0,
|
| 13 |
+
0,
|
| 14 |
+
0,
|
| 15 |
+
0,
|
| 16 |
+
1
|
| 17 |
+
],
|
| 18 |
+
"success_rate": 0.125,
|
| 19 |
+
"intervention_rate": 0.0,
|
| 20 |
+
"non_base_selection_rate": 0.0,
|
| 21 |
+
"steps_to_first_reveal_or_access": 1.0,
|
| 22 |
+
"steps_to_retrieve": 4.0,
|
| 23 |
+
"disturbance_proxy": 0.0,
|
| 24 |
+
"episode_records": [
|
| 25 |
+
{
|
| 26 |
+
"episode_seed": 171000,
|
| 27 |
+
"success": false,
|
| 28 |
+
"steps": 4,
|
| 29 |
+
"first_reveal_step": 1,
|
| 30 |
+
"first_retrieve_step": null,
|
| 31 |
+
"episode_disturbance": 0.0
|
| 32 |
+
},
|
| 33 |
+
{
|
| 34 |
+
"episode_seed": 171001,
|
| 35 |
+
"success": false,
|
| 36 |
+
"steps": 4,
|
| 37 |
+
"first_reveal_step": 1,
|
| 38 |
+
"first_retrieve_step": null,
|
| 39 |
+
"episode_disturbance": 0.0
|
| 40 |
+
},
|
| 41 |
+
{
|
| 42 |
+
"episode_seed": 171002,
|
| 43 |
+
"success": false,
|
| 44 |
+
"steps": 4,
|
| 45 |
+
"first_reveal_step": 1,
|
| 46 |
+
"first_retrieve_step": null,
|
| 47 |
+
"episode_disturbance": 0.0
|
| 48 |
+
},
|
| 49 |
+
{
|
| 50 |
+
"episode_seed": 171003,
|
| 51 |
+
"success": false,
|
| 52 |
+
"steps": 4,
|
| 53 |
+
"first_reveal_step": 1,
|
| 54 |
+
"first_retrieve_step": null,
|
| 55 |
+
"episode_disturbance": 0.0
|
| 56 |
+
},
|
| 57 |
+
{
|
| 58 |
+
"episode_seed": 171004,
|
| 59 |
+
"success": false,
|
| 60 |
+
"steps": 4,
|
| 61 |
+
"first_reveal_step": 1,
|
| 62 |
+
"first_retrieve_step": null,
|
| 63 |
+
"episode_disturbance": 0.0
|
| 64 |
+
},
|
| 65 |
+
{
|
| 66 |
+
"episode_seed": 171005,
|
| 67 |
+
"success": false,
|
| 68 |
+
"steps": 4,
|
| 69 |
+
"first_reveal_step": 1,
|
| 70 |
+
"first_retrieve_step": null,
|
| 71 |
+
"episode_disturbance": 0.0
|
| 72 |
+
},
|
| 73 |
+
{
|
| 74 |
+
"episode_seed": 171006,
|
| 75 |
+
"success": false,
|
| 76 |
+
"steps": 4,
|
| 77 |
+
"first_reveal_step": 1,
|
| 78 |
+
"first_retrieve_step": null,
|
| 79 |
+
"episode_disturbance": 0.0
|
| 80 |
+
},
|
| 81 |
+
{
|
| 82 |
+
"episode_seed": 171007,
|
| 83 |
+
"success": true,
|
| 84 |
+
"steps": 1,
|
| 85 |
+
"first_reveal_step": 1,
|
| 86 |
+
"first_retrieve_step": null,
|
| 87 |
+
"episode_disturbance": 0.0
|
| 88 |
+
}
|
| 89 |
+
],
|
| 90 |
+
"eval_protocol": {
|
| 91 |
+
"track_id": "bag_track",
|
| 92 |
+
"suite": "maniskill3",
|
| 93 |
+
"benchmark_task": "PutEggplantInBasketRetrievalProxy-v1",
|
| 94 |
+
"role": "target",
|
| 95 |
+
"eval_mode": "trunk_only_ft",
|
| 96 |
+
"seed": 17,
|
| 97 |
+
"episodes": 8,
|
| 98 |
+
"resolution": 224,
|
| 99 |
+
"cameras": [
|
| 100 |
+
"front",
|
| 101 |
+
"left",
|
| 102 |
+
"right"
|
| 103 |
+
],
|
| 104 |
+
"observation_stack": "rgb_triplicate_zero_depth",
|
| 105 |
+
"action_horizon": 8,
|
| 106 |
+
"action_space": "widowx_delta_pose",
|
| 107 |
+
"same_test_episodes": true
|
| 108 |
+
},
|
| 109 |
+
"proxy_notes": "Public ManiSkill bridge scene with custom retrieval initialization. The eggplant is placed inside the basket region and must be pulled back out to a staging zone.",
|
| 110 |
+
"train_spec": {
|
| 111 |
+
"track_id": "bag_track",
|
| 112 |
+
"suite": "maniskill3",
|
| 113 |
+
"benchmark_task": "PutEggplantInBasketRetrievalProxy-v1",
|
| 114 |
+
"model_variant": "trunk_only_ft",
|
| 115 |
+
"seed": 23,
|
| 116 |
+
"train_demos": 32,
|
| 117 |
+
"val_demos": 8,
|
| 118 |
+
"init_checkpoint_group": "/workspace/workspace/VLAarchtests2/VLAarchtests/artifacts/outputs/r3d_handoff_phase/proxy_interaction_r3d_stage3_clip_rgbd_handoff_compact_phase_seed17/checkpoint_best.pt",
|
| 119 |
+
"optimizer": "adamw",
|
| 120 |
+
"learning_rate": 0.0001,
|
| 121 |
+
"lr_schedule": "constant",
|
| 122 |
+
"batch_size": 4,
|
| 123 |
+
"augmentations": "none",
|
| 124 |
+
"early_stopping_metric": "val_total",
|
| 125 |
+
"max_gradient_steps": 114,
|
| 126 |
+
"unfreeze_scope": "fusion_memory_decoder",
|
| 127 |
+
"dataset_split_id": "bag_bridge_smoke_v1_dataset_seed17",
|
| 128 |
+
"same_data_policy": true,
|
| 129 |
+
"same_init_policy": true
|
| 130 |
+
}
|
| 131 |
+
}
|
reports/maniskill_bag_bridge_val_sweep_seed23/less_bonus/public_benchmark_package_summary.md
ADDED
|
@@ -0,0 +1,15 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
# ManiSkill Bag Retrieval Smoke Summary
|
| 2 |
+
|
| 3 |
+
- benchmark_task: PutEggplantInBasketRetrievalProxy-v1
|
| 4 |
+
- target_macro_average_delta: 0.000
|
| 5 |
+
- headline_pass: False
|
| 6 |
+
- sign_of_life_pass: False
|
| 7 |
+
|
| 8 |
+
## bag_track
|
| 9 |
+
- delta_active_vs_trunk: 0.000
|
| 10 |
+
- delta_noop_vs_trunk: 0.000
|
| 11 |
+
- signs_of_life: False
|
| 12 |
+
- delta_active_vs_trunk_ci95: [-0.375, 0.375]
|
| 13 |
+
- trunk_only_ft: mean_success=0.125
|
| 14 |
+
- adapter_noop: mean_success=0.125
|
| 15 |
+
- adapter_active_ft: mean_success=0.125
|
reports/maniskill_bag_bridge_val_sweep_seed23/less_bonus/trunk_only_ft_seed23.json
ADDED
|
@@ -0,0 +1,131 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
{
|
| 2 |
+
"track_id": "bag_track",
|
| 3 |
+
"suite": "maniskill3",
|
| 4 |
+
"benchmark_task": "PutEggplantInBasketRetrievalProxy-v1",
|
| 5 |
+
"role": "target",
|
| 6 |
+
"adapter_mode": "trunk_only_ft",
|
| 7 |
+
"episodes": 8,
|
| 8 |
+
"successes": [
|
| 9 |
+
0,
|
| 10 |
+
0,
|
| 11 |
+
0,
|
| 12 |
+
0,
|
| 13 |
+
0,
|
| 14 |
+
0,
|
| 15 |
+
0,
|
| 16 |
+
1
|
| 17 |
+
],
|
| 18 |
+
"success_rate": 0.125,
|
| 19 |
+
"intervention_rate": 0.0,
|
| 20 |
+
"non_base_selection_rate": 0.0,
|
| 21 |
+
"steps_to_first_reveal_or_access": 1.0,
|
| 22 |
+
"steps_to_retrieve": 4.0,
|
| 23 |
+
"disturbance_proxy": 0.0,
|
| 24 |
+
"episode_records": [
|
| 25 |
+
{
|
| 26 |
+
"episode_seed": 171000,
|
| 27 |
+
"success": false,
|
| 28 |
+
"steps": 4,
|
| 29 |
+
"first_reveal_step": 1,
|
| 30 |
+
"first_retrieve_step": null,
|
| 31 |
+
"episode_disturbance": 0.0
|
| 32 |
+
},
|
| 33 |
+
{
|
| 34 |
+
"episode_seed": 171001,
|
| 35 |
+
"success": false,
|
| 36 |
+
"steps": 4,
|
| 37 |
+
"first_reveal_step": 1,
|
| 38 |
+
"first_retrieve_step": null,
|
| 39 |
+
"episode_disturbance": 0.0
|
| 40 |
+
},
|
| 41 |
+
{
|
| 42 |
+
"episode_seed": 171002,
|
| 43 |
+
"success": false,
|
| 44 |
+
"steps": 4,
|
| 45 |
+
"first_reveal_step": 1,
|
| 46 |
+
"first_retrieve_step": null,
|
| 47 |
+
"episode_disturbance": 0.0
|
| 48 |
+
},
|
| 49 |
+
{
|
| 50 |
+
"episode_seed": 171003,
|
| 51 |
+
"success": false,
|
| 52 |
+
"steps": 4,
|
| 53 |
+
"first_reveal_step": 1,
|
| 54 |
+
"first_retrieve_step": null,
|
| 55 |
+
"episode_disturbance": 0.0
|
| 56 |
+
},
|
| 57 |
+
{
|
| 58 |
+
"episode_seed": 171004,
|
| 59 |
+
"success": false,
|
| 60 |
+
"steps": 4,
|
| 61 |
+
"first_reveal_step": 1,
|
| 62 |
+
"first_retrieve_step": null,
|
| 63 |
+
"episode_disturbance": 0.0
|
| 64 |
+
},
|
| 65 |
+
{
|
| 66 |
+
"episode_seed": 171005,
|
| 67 |
+
"success": false,
|
| 68 |
+
"steps": 4,
|
| 69 |
+
"first_reveal_step": 1,
|
| 70 |
+
"first_retrieve_step": null,
|
| 71 |
+
"episode_disturbance": 0.0
|
| 72 |
+
},
|
| 73 |
+
{
|
| 74 |
+
"episode_seed": 171006,
|
| 75 |
+
"success": false,
|
| 76 |
+
"steps": 4,
|
| 77 |
+
"first_reveal_step": 1,
|
| 78 |
+
"first_retrieve_step": null,
|
| 79 |
+
"episode_disturbance": 0.0
|
| 80 |
+
},
|
| 81 |
+
{
|
| 82 |
+
"episode_seed": 171007,
|
| 83 |
+
"success": true,
|
| 84 |
+
"steps": 1,
|
| 85 |
+
"first_reveal_step": 1,
|
| 86 |
+
"first_retrieve_step": null,
|
| 87 |
+
"episode_disturbance": 0.0
|
| 88 |
+
}
|
| 89 |
+
],
|
| 90 |
+
"eval_protocol": {
|
| 91 |
+
"track_id": "bag_track",
|
| 92 |
+
"suite": "maniskill3",
|
| 93 |
+
"benchmark_task": "PutEggplantInBasketRetrievalProxy-v1",
|
| 94 |
+
"role": "target",
|
| 95 |
+
"eval_mode": "trunk_only_ft",
|
| 96 |
+
"seed": 17,
|
| 97 |
+
"episodes": 8,
|
| 98 |
+
"resolution": 224,
|
| 99 |
+
"cameras": [
|
| 100 |
+
"front",
|
| 101 |
+
"left",
|
| 102 |
+
"right"
|
| 103 |
+
],
|
| 104 |
+
"observation_stack": "rgb_triplicate_zero_depth",
|
| 105 |
+
"action_horizon": 8,
|
| 106 |
+
"action_space": "widowx_delta_pose",
|
| 107 |
+
"same_test_episodes": true
|
| 108 |
+
},
|
| 109 |
+
"proxy_notes": "Public ManiSkill bridge scene with custom retrieval initialization. The eggplant is placed inside the basket region and must be pulled back out to a staging zone.",
|
| 110 |
+
"train_spec": {
|
| 111 |
+
"track_id": "bag_track",
|
| 112 |
+
"suite": "maniskill3",
|
| 113 |
+
"benchmark_task": "PutEggplantInBasketRetrievalProxy-v1",
|
| 114 |
+
"model_variant": "trunk_only_ft",
|
| 115 |
+
"seed": 23,
|
| 116 |
+
"train_demos": 32,
|
| 117 |
+
"val_demos": 8,
|
| 118 |
+
"init_checkpoint_group": "/workspace/workspace/VLAarchtests2/VLAarchtests/artifacts/outputs/r3d_handoff_phase/proxy_interaction_r3d_stage3_clip_rgbd_handoff_compact_phase_seed17/checkpoint_best.pt",
|
| 119 |
+
"optimizer": "adamw",
|
| 120 |
+
"learning_rate": 0.0001,
|
| 121 |
+
"lr_schedule": "constant",
|
| 122 |
+
"batch_size": 4,
|
| 123 |
+
"augmentations": "none",
|
| 124 |
+
"early_stopping_metric": "val_total",
|
| 125 |
+
"max_gradient_steps": 114,
|
| 126 |
+
"unfreeze_scope": "fusion_memory_decoder",
|
| 127 |
+
"dataset_split_id": "bag_bridge_smoke_v1_dataset_seed17",
|
| 128 |
+
"same_data_policy": true,
|
| 129 |
+
"same_init_policy": true
|
| 130 |
+
}
|
| 131 |
+
}
|
reports/maniskill_bag_bridge_val_sweep_seed23/low_bonus_high_thresh/adapter_noop_seed23.json
ADDED
|
@@ -0,0 +1,110 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
{
|
| 2 |
+
"track_id": "bag_track",
|
| 3 |
+
"suite": "maniskill3",
|
| 4 |
+
"benchmark_task": "PutEggplantInBasketRetrievalProxy-v1",
|
| 5 |
+
"role": "target",
|
| 6 |
+
"adapter_mode": "adapter_noop",
|
| 7 |
+
"episodes": 8,
|
| 8 |
+
"successes": [
|
| 9 |
+
0,
|
| 10 |
+
0,
|
| 11 |
+
0,
|
| 12 |
+
1,
|
| 13 |
+
0,
|
| 14 |
+
0,
|
| 15 |
+
0,
|
| 16 |
+
0
|
| 17 |
+
],
|
| 18 |
+
"success_rate": 0.125,
|
| 19 |
+
"intervention_rate": 0.0,
|
| 20 |
+
"non_base_selection_rate": 0.0,
|
| 21 |
+
"steps_to_first_reveal_or_access": 1.0,
|
| 22 |
+
"steps_to_retrieve": 4.0,
|
| 23 |
+
"disturbance_proxy": 0.0,
|
| 24 |
+
"episode_records": [
|
| 25 |
+
{
|
| 26 |
+
"episode_seed": 171000,
|
| 27 |
+
"success": false,
|
| 28 |
+
"steps": 4,
|
| 29 |
+
"first_reveal_step": 1,
|
| 30 |
+
"first_retrieve_step": null,
|
| 31 |
+
"episode_disturbance": 0.0
|
| 32 |
+
},
|
| 33 |
+
{
|
| 34 |
+
"episode_seed": 171001,
|
| 35 |
+
"success": false,
|
| 36 |
+
"steps": 4,
|
| 37 |
+
"first_reveal_step": 1,
|
| 38 |
+
"first_retrieve_step": null,
|
| 39 |
+
"episode_disturbance": 0.0
|
| 40 |
+
},
|
| 41 |
+
{
|
| 42 |
+
"episode_seed": 171002,
|
| 43 |
+
"success": false,
|
| 44 |
+
"steps": 4,
|
| 45 |
+
"first_reveal_step": 1,
|
| 46 |
+
"first_retrieve_step": null,
|
| 47 |
+
"episode_disturbance": 0.0
|
| 48 |
+
},
|
| 49 |
+
{
|
| 50 |
+
"episode_seed": 171003,
|
| 51 |
+
"success": true,
|
| 52 |
+
"steps": 1,
|
| 53 |
+
"first_reveal_step": 1,
|
| 54 |
+
"first_retrieve_step": null,
|
| 55 |
+
"episode_disturbance": 0.0
|
| 56 |
+
},
|
| 57 |
+
{
|
| 58 |
+
"episode_seed": 171004,
|
| 59 |
+
"success": false,
|
| 60 |
+
"steps": 4,
|
| 61 |
+
"first_reveal_step": 1,
|
| 62 |
+
"first_retrieve_step": null,
|
| 63 |
+
"episode_disturbance": 0.0
|
| 64 |
+
},
|
| 65 |
+
{
|
| 66 |
+
"episode_seed": 171005,
|
| 67 |
+
"success": false,
|
| 68 |
+
"steps": 4,
|
| 69 |
+
"first_reveal_step": 1,
|
| 70 |
+
"first_retrieve_step": null,
|
| 71 |
+
"episode_disturbance": 0.0
|
| 72 |
+
},
|
| 73 |
+
{
|
| 74 |
+
"episode_seed": 171006,
|
| 75 |
+
"success": false,
|
| 76 |
+
"steps": 4,
|
| 77 |
+
"first_reveal_step": 1,
|
| 78 |
+
"first_retrieve_step": null,
|
| 79 |
+
"episode_disturbance": 0.0
|
| 80 |
+
},
|
| 81 |
+
{
|
| 82 |
+
"episode_seed": 171007,
|
| 83 |
+
"success": false,
|
| 84 |
+
"steps": 4,
|
| 85 |
+
"first_reveal_step": 1,
|
| 86 |
+
"first_retrieve_step": null,
|
| 87 |
+
"episode_disturbance": 0.0
|
| 88 |
+
}
|
| 89 |
+
],
|
| 90 |
+
"eval_protocol": {
|
| 91 |
+
"track_id": "bag_track",
|
| 92 |
+
"suite": "maniskill3",
|
| 93 |
+
"benchmark_task": "PutEggplantInBasketRetrievalProxy-v1",
|
| 94 |
+
"role": "target",
|
| 95 |
+
"eval_mode": "adapter_noop",
|
| 96 |
+
"seed": 17,
|
| 97 |
+
"episodes": 8,
|
| 98 |
+
"resolution": 224,
|
| 99 |
+
"cameras": [
|
| 100 |
+
"front",
|
| 101 |
+
"left",
|
| 102 |
+
"right"
|
| 103 |
+
],
|
| 104 |
+
"observation_stack": "rgb_triplicate_zero_depth",
|
| 105 |
+
"action_horizon": 8,
|
| 106 |
+
"action_space": "widowx_delta_pose",
|
| 107 |
+
"same_test_episodes": true
|
| 108 |
+
},
|
| 109 |
+
"proxy_notes": "Public ManiSkill bridge scene with custom retrieval initialization. The eggplant is placed inside the basket region and must be pulled back out to a staging zone."
|
| 110 |
+
}
|
reports/maniskill_bag_bridge_val_sweep_seed23/low_bonus_high_thresh/public_benchmark_package_summary.json
ADDED
|
@@ -0,0 +1,60 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
{
|
| 2 |
+
"anchor_pass": true,
|
| 3 |
+
"available_tracks": [
|
| 4 |
+
"bag_track"
|
| 5 |
+
],
|
| 6 |
+
"ci_above_zero_tracks": [],
|
| 7 |
+
"headline_pass": false,
|
| 8 |
+
"package_name": "public_reveal_retrieve_package_v1",
|
| 9 |
+
"sign_of_life_pass": false,
|
| 10 |
+
"sign_of_life_track_count": 0,
|
| 11 |
+
"sign_of_life_tracks": [],
|
| 12 |
+
"target_macro_average_delta": 0.0,
|
| 13 |
+
"tracks": {
|
| 14 |
+
"bag_track": {
|
| 15 |
+
"benchmark_task": "PutEggplantInBasketRetrievalProxy-v1",
|
| 16 |
+
"delta_active_vs_trunk": 0.0,
|
| 17 |
+
"delta_active_vs_trunk_ci95": [
|
| 18 |
+
-0.375,
|
| 19 |
+
0.375
|
| 20 |
+
],
|
| 21 |
+
"delta_noop_vs_trunk": 0.0,
|
| 22 |
+
"modes": {
|
| 23 |
+
"adapter_active_ft": {
|
| 24 |
+
"disturbance_proxy": 0.0,
|
| 25 |
+
"intervention_rate": 0.0,
|
| 26 |
+
"mean_success": 0.125,
|
| 27 |
+
"non_base_selection_rate": 0.0,
|
| 28 |
+
"num_runs": 1,
|
| 29 |
+
"steps_to_first_reveal_or_access": 1.0,
|
| 30 |
+
"steps_to_retrieve": 4.0
|
| 31 |
+
},
|
| 32 |
+
"adapter_noop": {
|
| 33 |
+
"disturbance_proxy": 0.0,
|
| 34 |
+
"intervention_rate": 0.0,
|
| 35 |
+
"mean_success": 0.125,
|
| 36 |
+
"non_base_selection_rate": 0.0,
|
| 37 |
+
"num_runs": 1,
|
| 38 |
+
"steps_to_first_reveal_or_access": 1.0,
|
| 39 |
+
"steps_to_retrieve": 4.0
|
| 40 |
+
},
|
| 41 |
+
"trunk_only_ft": {
|
| 42 |
+
"disturbance_proxy": 0.0,
|
| 43 |
+
"intervention_rate": 0.0,
|
| 44 |
+
"mean_success": 0.125,
|
| 45 |
+
"non_base_selection_rate": 0.0,
|
| 46 |
+
"num_runs": 1,
|
| 47 |
+
"steps_to_first_reveal_or_access": 1.0,
|
| 48 |
+
"steps_to_retrieve": 4.0
|
| 49 |
+
}
|
| 50 |
+
},
|
| 51 |
+
"notes": "Public ManiSkill bridge scene with custom retrieval initialization. The eggplant is placed inside the basket region and must be pulled back out to a staging zone.",
|
| 52 |
+
"public_source": "ManiSkill public scene proxy: PutEggplantInBasketScene-v1",
|
| 53 |
+
"role": "target",
|
| 54 |
+
"signs_of_life": false,
|
| 55 |
+
"suite": "maniskill3",
|
| 56 |
+
"target_behavior": "retrieve the target object from inside the basket and stage it outside the basket",
|
| 57 |
+
"task_family": "bag_retrieval_proxy"
|
| 58 |
+
}
|
| 59 |
+
}
|
| 60 |
+
}
|
reports/maniskill_bag_bridge_val_sweep_seed23/low_bonus_high_thresh/public_benchmark_package_summary.md
ADDED
|
@@ -0,0 +1,15 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
# ManiSkill Bag Retrieval Smoke Summary
|
| 2 |
+
|
| 3 |
+
- benchmark_task: PutEggplantInBasketRetrievalProxy-v1
|
| 4 |
+
- target_macro_average_delta: 0.000
|
| 5 |
+
- headline_pass: False
|
| 6 |
+
- sign_of_life_pass: False
|
| 7 |
+
|
| 8 |
+
## bag_track
|
| 9 |
+
- delta_active_vs_trunk: 0.000
|
| 10 |
+
- delta_noop_vs_trunk: 0.000
|
| 11 |
+
- signs_of_life: False
|
| 12 |
+
- delta_active_vs_trunk_ci95: [-0.375, 0.375]
|
| 13 |
+
- trunk_only_ft: mean_success=0.125
|
| 14 |
+
- adapter_noop: mean_success=0.125
|
| 15 |
+
- adapter_active_ft: mean_success=0.125
|
reports/maniskill_bag_bridge_val_sweep_seed23/low_bonus_high_thresh/run.log
ADDED
|
@@ -0,0 +1,76 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
|
| 2 |
+
[1mCLIPModel LOAD REPORT[0m from: openai/clip-vit-base-patch32
|
| 3 |
+
Key | Status | |
|
| 4 |
+
-------------------------------------+------------+--+-
|
| 5 |
+
vision_model.embeddings.position_ids | UNEXPECTED | |
|
| 6 |
+
text_model.embeddings.position_ids | UNEXPECTED | |
|
| 7 |
+
|
| 8 |
+
Notes:
|
| 9 |
+
- UNEXPECTED: can be ignored when loading from different task/architecture; not ok if you expect identical arch.
|
| 10 |
+
CLIPTextTransformer does not expose input embeddings. Gradients cannot flow back to the token embeddings when using adapters or gradient checkpointing. Override `get_input_embeddings` to fully support those features, or set `_input_embed_layer` to the attribute name that holds the embeddings.
|
| 11 |
+
/usr/local/lib/python3.11/dist-packages/torch/nn/modules/transformer.py:307: UserWarning: enable_nested_tensor is True, but self.use_nested_tensor is False because encoder_layer.norm_first was True
|
| 12 |
+
warnings.warn(f"enable_nested_tensor is True, but self.use_nested_tensor is False because {why_not_sparsity_fast_path}")
|
| 13 |
+
[33;1m2026-04-01 11:29:21,719 - mani_skill - WARNING - Mimic targets dictionary is missing for controller config for widowx250s_bridgedataset_sink. Assuming the first joint is the control joint and the second joint is the mimic joint[0m
|
| 14 |
+
[33;1m2026-04-01 11:29:21,764 - mani_skill - WARNING - No initial pose set for actor builder of eggplant, setting to default pose q=[1,0,0,0], p=[0,0,0]. Not setting reasonable initial poses may slow down simulation, see https://github.com/haosulab/ManiSkill/issues/421.[0m
|
| 15 |
+
[33;1m2026-04-01 11:29:21,777 - mani_skill - WARNING - No initial pose set for actor builder of dummy_sink_target_plane, setting to default pose q=[1,0,0,0], p=[0,0,0]. Not setting reasonable initial poses may slow down simulation, see https://github.com/haosulab/ManiSkill/issues/421.[0m
|
| 16 |
+
[33;1m2026-04-01 11:29:22,382 - mani_skill - WARNING - Mimic targets dictionary is missing for controller config for widowx250s_bridgedataset_sink. Assuming the first joint is the control joint and the second joint is the mimic joint[0m
|
| 17 |
+
[33;1m2026-04-01 11:29:22,384 - mani_skill - WARNING - No initial pose set for actor builder of eggplant, setting to default pose q=[1,0,0,0], p=[0,0,0]. Not setting reasonable initial poses may slow down simulation, see https://github.com/haosulab/ManiSkill/issues/421.[0m
|
| 18 |
+
[33;1m2026-04-01 11:29:22,384 - mani_skill - WARNING - No initial pose set for actor builder of dummy_sink_target_plane, setting to default pose q=[1,0,0,0], p=[0,0,0]. Not setting reasonable initial poses may slow down simulation, see https://github.com/haosulab/ManiSkill/issues/421.[0m
|
| 19 |
+
/usr/local/lib/python3.11/dist-packages/gymnasium/core.py:311: UserWarning: [33mWARN: env.get_obs to get variables from other wrappers is deprecated and will be removed in v1.0, to get this variable you can do `env.unwrapped.get_obs` for environment variables or `env.get_wrapper_attr('get_obs')` that will search the reminding wrappers.[0m
|
| 20 |
+
logger.warn(
|
| 21 |
+
/usr/local/lib/python3.11/dist-packages/gymnasium/core.py:311: UserWarning: [33mWARN: env.get_info to get variables from other wrappers is deprecated and will be removed in v1.0, to get this variable you can do `env.unwrapped.get_info` for environment variables or `env.get_wrapper_attr('get_info')` that will search the reminding wrappers.[0m
|
| 22 |
+
logger.warn(
|
| 23 |
+
{"phase": "eval_episode_complete", "task": "bag", "adapter_mode": "trunk_only_ft", "episode_seed": 171000, "success": false, "steps": 4}
|
| 24 |
+
{"phase": "eval_episode_complete", "task": "bag", "adapter_mode": "trunk_only_ft", "episode_seed": 171001, "success": false, "steps": 4}
|
| 25 |
+
{"phase": "eval_episode_complete", "task": "bag", "adapter_mode": "trunk_only_ft", "episode_seed": 171002, "success": false, "steps": 4}
|
| 26 |
+
{"phase": "eval_episode_complete", "task": "bag", "adapter_mode": "trunk_only_ft", "episode_seed": 171003, "success": false, "steps": 4}
|
| 27 |
+
{"phase": "eval_episode_complete", "task": "bag", "adapter_mode": "trunk_only_ft", "episode_seed": 171004, "success": false, "steps": 4}
|
| 28 |
+
{"phase": "eval_episode_complete", "task": "bag", "adapter_mode": "trunk_only_ft", "episode_seed": 171005, "success": false, "steps": 4}
|
| 29 |
+
{"phase": "eval_episode_complete", "task": "bag", "adapter_mode": "trunk_only_ft", "episode_seed": 171006, "success": false, "steps": 4}
|
| 30 |
+
{"phase": "eval_episode_complete", "task": "bag", "adapter_mode": "trunk_only_ft", "episode_seed": 171007, "success": true, "steps": 1}
|
| 31 |
+
|
| 32 |
+
[1mCLIPModel LOAD REPORT[0m from: openai/clip-vit-base-patch32
|
| 33 |
+
Key | Status | |
|
| 34 |
+
-------------------------------------+------------+--+-
|
| 35 |
+
vision_model.embeddings.position_ids | UNEXPECTED | |
|
| 36 |
+
text_model.embeddings.position_ids | UNEXPECTED | |
|
| 37 |
+
|
| 38 |
+
Notes:
|
| 39 |
+
- UNEXPECTED: can be ignored when loading from different task/architecture; not ok if you expect identical arch.
|
| 40 |
+
[33;1m2026-04-01 11:29:55,476 - mani_skill - WARNING - Mimic targets dictionary is missing for controller config for widowx250s_bridgedataset_sink. Assuming the first joint is the control joint and the second joint is the mimic joint[0m
|
| 41 |
+
[33;1m2026-04-01 11:29:55,480 - mani_skill - WARNING - No initial pose set for actor builder of eggplant, setting to default pose q=[1,0,0,0], p=[0,0,0]. Not setting reasonable initial poses may slow down simulation, see https://github.com/haosulab/ManiSkill/issues/421.[0m
|
| 42 |
+
[33;1m2026-04-01 11:29:55,480 - mani_skill - WARNING - No initial pose set for actor builder of dummy_sink_target_plane, setting to default pose q=[1,0,0,0], p=[0,0,0]. Not setting reasonable initial poses may slow down simulation, see https://github.com/haosulab/ManiSkill/issues/421.[0m
|
| 43 |
+
[33;1m2026-04-01 11:29:55,702 - mani_skill - WARNING - Mimic targets dictionary is missing for controller config for widowx250s_bridgedataset_sink. Assuming the first joint is the control joint and the second joint is the mimic joint[0m
|
| 44 |
+
[33;1m2026-04-01 11:29:55,705 - mani_skill - WARNING - No initial pose set for actor builder of eggplant, setting to default pose q=[1,0,0,0], p=[0,0,0]. Not setting reasonable initial poses may slow down simulation, see https://github.com/haosulab/ManiSkill/issues/421.[0m
|
| 45 |
+
[33;1m2026-04-01 11:29:55,705 - mani_skill - WARNING - No initial pose set for actor builder of dummy_sink_target_plane, setting to default pose q=[1,0,0,0], p=[0,0,0]. Not setting reasonable initial poses may slow down simulation, see https://github.com/haosulab/ManiSkill/issues/421.[0m
|
| 46 |
+
{"phase": "eval_episode_complete", "task": "bag", "adapter_mode": "adapter_noop", "episode_seed": 171000, "success": false, "steps": 4}
|
| 47 |
+
{"phase": "eval_episode_complete", "task": "bag", "adapter_mode": "adapter_noop", "episode_seed": 171001, "success": false, "steps": 4}
|
| 48 |
+
{"phase": "eval_episode_complete", "task": "bag", "adapter_mode": "adapter_noop", "episode_seed": 171002, "success": false, "steps": 4}
|
| 49 |
+
{"phase": "eval_episode_complete", "task": "bag", "adapter_mode": "adapter_noop", "episode_seed": 171003, "success": true, "steps": 1}
|
| 50 |
+
{"phase": "eval_episode_complete", "task": "bag", "adapter_mode": "adapter_noop", "episode_seed": 171004, "success": false, "steps": 4}
|
| 51 |
+
{"phase": "eval_episode_complete", "task": "bag", "adapter_mode": "adapter_noop", "episode_seed": 171005, "success": false, "steps": 4}
|
| 52 |
+
{"phase": "eval_episode_complete", "task": "bag", "adapter_mode": "adapter_noop", "episode_seed": 171006, "success": false, "steps": 4}
|
| 53 |
+
{"phase": "eval_episode_complete", "task": "bag", "adapter_mode": "adapter_noop", "episode_seed": 171007, "success": false, "steps": 4}
|
| 54 |
+
|
| 55 |
+
[1mCLIPModel LOAD REPORT[0m from: openai/clip-vit-base-patch32
|
| 56 |
+
Key | Status | |
|
| 57 |
+
-------------------------------------+------------+--+-
|
| 58 |
+
vision_model.embeddings.position_ids | UNEXPECTED | |
|
| 59 |
+
text_model.embeddings.position_ids | UNEXPECTED | |
|
| 60 |
+
|
| 61 |
+
Notes:
|
| 62 |
+
- UNEXPECTED: can be ignored when loading from different task/architecture; not ok if you expect identical arch.
|
| 63 |
+
[33;1m2026-04-01 11:30:24,855 - mani_skill - WARNING - Mimic targets dictionary is missing for controller config for widowx250s_bridgedataset_sink. Assuming the first joint is the control joint and the second joint is the mimic joint[0m
|
| 64 |
+
[33;1m2026-04-01 11:30:24,857 - mani_skill - WARNING - No initial pose set for actor builder of eggplant, setting to default pose q=[1,0,0,0], p=[0,0,0]. Not setting reasonable initial poses may slow down simulation, see https://github.com/haosulab/ManiSkill/issues/421.[0m
|
| 65 |
+
[33;1m2026-04-01 11:30:24,857 - mani_skill - WARNING - No initial pose set for actor builder of dummy_sink_target_plane, setting to default pose q=[1,0,0,0], p=[0,0,0]. Not setting reasonable initial poses may slow down simulation, see https://github.com/haosulab/ManiSkill/issues/421.[0m
|
| 66 |
+
[33;1m2026-04-01 11:30:25,079 - mani_skill - WARNING - Mimic targets dictionary is missing for controller config for widowx250s_bridgedataset_sink. Assuming the first joint is the control joint and the second joint is the mimic joint[0m
|
| 67 |
+
[33;1m2026-04-01 11:30:25,081 - mani_skill - WARNING - No initial pose set for actor builder of eggplant, setting to default pose q=[1,0,0,0], p=[0,0,0]. Not setting reasonable initial poses may slow down simulation, see https://github.com/haosulab/ManiSkill/issues/421.[0m
|
| 68 |
+
[33;1m2026-04-01 11:30:25,082 - mani_skill - WARNING - No initial pose set for actor builder of dummy_sink_target_plane, setting to default pose q=[1,0,0,0], p=[0,0,0]. Not setting reasonable initial poses may slow down simulation, see https://github.com/haosulab/ManiSkill/issues/421.[0m
|
| 69 |
+
{"phase": "eval_episode_complete", "task": "bag", "adapter_mode": "adapter_active_ft", "episode_seed": 171000, "success": false, "steps": 4}
|
| 70 |
+
{"phase": "eval_episode_complete", "task": "bag", "adapter_mode": "adapter_active_ft", "episode_seed": 171001, "success": false, "steps": 4}
|
| 71 |
+
{"phase": "eval_episode_complete", "task": "bag", "adapter_mode": "adapter_active_ft", "episode_seed": 171002, "success": false, "steps": 4}
|
| 72 |
+
{"phase": "eval_episode_complete", "task": "bag", "adapter_mode": "adapter_active_ft", "episode_seed": 171003, "success": true, "steps": 1}
|
| 73 |
+
{"phase": "eval_episode_complete", "task": "bag", "adapter_mode": "adapter_active_ft", "episode_seed": 171004, "success": false, "steps": 4}
|
| 74 |
+
{"phase": "eval_episode_complete", "task": "bag", "adapter_mode": "adapter_active_ft", "episode_seed": 171005, "success": false, "steps": 4}
|
| 75 |
+
{"phase": "eval_episode_complete", "task": "bag", "adapter_mode": "adapter_active_ft", "episode_seed": 171006, "success": false, "steps": 4}
|
| 76 |
+
{"phase": "eval_episode_complete", "task": "bag", "adapter_mode": "adapter_active_ft", "episode_seed": 171007, "success": false, "steps": 4}
|
reports/maniskill_bag_bridge_val_sweep_seed23/low_bonus_high_thresh/trunk_only_ft_seed23.json
ADDED
|
@@ -0,0 +1,131 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
{
|
| 2 |
+
"track_id": "bag_track",
|
| 3 |
+
"suite": "maniskill3",
|
| 4 |
+
"benchmark_task": "PutEggplantInBasketRetrievalProxy-v1",
|
| 5 |
+
"role": "target",
|
| 6 |
+
"adapter_mode": "trunk_only_ft",
|
| 7 |
+
"episodes": 8,
|
| 8 |
+
"successes": [
|
| 9 |
+
0,
|
| 10 |
+
0,
|
| 11 |
+
0,
|
| 12 |
+
0,
|
| 13 |
+
0,
|
| 14 |
+
0,
|
| 15 |
+
0,
|
| 16 |
+
1
|
| 17 |
+
],
|
| 18 |
+
"success_rate": 0.125,
|
| 19 |
+
"intervention_rate": 0.0,
|
| 20 |
+
"non_base_selection_rate": 0.0,
|
| 21 |
+
"steps_to_first_reveal_or_access": 1.0,
|
| 22 |
+
"steps_to_retrieve": 4.0,
|
| 23 |
+
"disturbance_proxy": 0.0,
|
| 24 |
+
"episode_records": [
|
| 25 |
+
{
|
| 26 |
+
"episode_seed": 171000,
|
| 27 |
+
"success": false,
|
| 28 |
+
"steps": 4,
|
| 29 |
+
"first_reveal_step": 1,
|
| 30 |
+
"first_retrieve_step": null,
|
| 31 |
+
"episode_disturbance": 0.0
|
| 32 |
+
},
|
| 33 |
+
{
|
| 34 |
+
"episode_seed": 171001,
|
| 35 |
+
"success": false,
|
| 36 |
+
"steps": 4,
|
| 37 |
+
"first_reveal_step": 1,
|
| 38 |
+
"first_retrieve_step": null,
|
| 39 |
+
"episode_disturbance": 0.0
|
| 40 |
+
},
|
| 41 |
+
{
|
| 42 |
+
"episode_seed": 171002,
|
| 43 |
+
"success": false,
|
| 44 |
+
"steps": 4,
|
| 45 |
+
"first_reveal_step": 1,
|
| 46 |
+
"first_retrieve_step": null,
|
| 47 |
+
"episode_disturbance": 0.0
|
| 48 |
+
},
|
| 49 |
+
{
|
| 50 |
+
"episode_seed": 171003,
|
| 51 |
+
"success": false,
|
| 52 |
+
"steps": 4,
|
| 53 |
+
"first_reveal_step": 1,
|
| 54 |
+
"first_retrieve_step": null,
|
| 55 |
+
"episode_disturbance": 0.0
|
| 56 |
+
},
|
| 57 |
+
{
|
| 58 |
+
"episode_seed": 171004,
|
| 59 |
+
"success": false,
|
| 60 |
+
"steps": 4,
|
| 61 |
+
"first_reveal_step": 1,
|
| 62 |
+
"first_retrieve_step": null,
|
| 63 |
+
"episode_disturbance": 0.0
|
| 64 |
+
},
|
| 65 |
+
{
|
| 66 |
+
"episode_seed": 171005,
|
| 67 |
+
"success": false,
|
| 68 |
+
"steps": 4,
|
| 69 |
+
"first_reveal_step": 1,
|
| 70 |
+
"first_retrieve_step": null,
|
| 71 |
+
"episode_disturbance": 0.0
|
| 72 |
+
},
|
| 73 |
+
{
|
| 74 |
+
"episode_seed": 171006,
|
| 75 |
+
"success": false,
|
| 76 |
+
"steps": 4,
|
| 77 |
+
"first_reveal_step": 1,
|
| 78 |
+
"first_retrieve_step": null,
|
| 79 |
+
"episode_disturbance": 0.0
|
| 80 |
+
},
|
| 81 |
+
{
|
| 82 |
+
"episode_seed": 171007,
|
| 83 |
+
"success": true,
|
| 84 |
+
"steps": 1,
|
| 85 |
+
"first_reveal_step": 1,
|
| 86 |
+
"first_retrieve_step": null,
|
| 87 |
+
"episode_disturbance": 0.0
|
| 88 |
+
}
|
| 89 |
+
],
|
| 90 |
+
"eval_protocol": {
|
| 91 |
+
"track_id": "bag_track",
|
| 92 |
+
"suite": "maniskill3",
|
| 93 |
+
"benchmark_task": "PutEggplantInBasketRetrievalProxy-v1",
|
| 94 |
+
"role": "target",
|
| 95 |
+
"eval_mode": "trunk_only_ft",
|
| 96 |
+
"seed": 17,
|
| 97 |
+
"episodes": 8,
|
| 98 |
+
"resolution": 224,
|
| 99 |
+
"cameras": [
|
| 100 |
+
"front",
|
| 101 |
+
"left",
|
| 102 |
+
"right"
|
| 103 |
+
],
|
| 104 |
+
"observation_stack": "rgb_triplicate_zero_depth",
|
| 105 |
+
"action_horizon": 8,
|
| 106 |
+
"action_space": "widowx_delta_pose",
|
| 107 |
+
"same_test_episodes": true
|
| 108 |
+
},
|
| 109 |
+
"proxy_notes": "Public ManiSkill bridge scene with custom retrieval initialization. The eggplant is placed inside the basket region and must be pulled back out to a staging zone.",
|
| 110 |
+
"train_spec": {
|
| 111 |
+
"track_id": "bag_track",
|
| 112 |
+
"suite": "maniskill3",
|
| 113 |
+
"benchmark_task": "PutEggplantInBasketRetrievalProxy-v1",
|
| 114 |
+
"model_variant": "trunk_only_ft",
|
| 115 |
+
"seed": 23,
|
| 116 |
+
"train_demos": 32,
|
| 117 |
+
"val_demos": 8,
|
| 118 |
+
"init_checkpoint_group": "/workspace/workspace/VLAarchtests2/VLAarchtests/artifacts/outputs/r3d_handoff_phase/proxy_interaction_r3d_stage3_clip_rgbd_handoff_compact_phase_seed17/checkpoint_best.pt",
|
| 119 |
+
"optimizer": "adamw",
|
| 120 |
+
"learning_rate": 0.0001,
|
| 121 |
+
"lr_schedule": "constant",
|
| 122 |
+
"batch_size": 4,
|
| 123 |
+
"augmentations": "none",
|
| 124 |
+
"early_stopping_metric": "val_total",
|
| 125 |
+
"max_gradient_steps": 114,
|
| 126 |
+
"unfreeze_scope": "fusion_memory_decoder",
|
| 127 |
+
"dataset_split_id": "bag_bridge_smoke_v1_dataset_seed17",
|
| 128 |
+
"same_data_policy": true,
|
| 129 |
+
"same_init_policy": true
|
| 130 |
+
}
|
| 131 |
+
}
|
reports/maniskill_cloth_bridge_smoke_v1/adapter_active_ft_seed17.json
ADDED
|
@@ -0,0 +1,509 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
{
|
| 2 |
+
"track_id": "cloth_track",
|
| 3 |
+
"suite": "maniskill3",
|
| 4 |
+
"benchmark_task": "PutSpoonUnderClothRetrievalProxy-v1",
|
| 5 |
+
"role": "target",
|
| 6 |
+
"adapter_mode": "adapter_active_ft",
|
| 7 |
+
"episodes": 50,
|
| 8 |
+
"successes": [
|
| 9 |
+
0,
|
| 10 |
+
1,
|
| 11 |
+
0,
|
| 12 |
+
0,
|
| 13 |
+
0,
|
| 14 |
+
0,
|
| 15 |
+
0,
|
| 16 |
+
0,
|
| 17 |
+
0,
|
| 18 |
+
0,
|
| 19 |
+
0,
|
| 20 |
+
0,
|
| 21 |
+
0,
|
| 22 |
+
0,
|
| 23 |
+
0,
|
| 24 |
+
0,
|
| 25 |
+
1,
|
| 26 |
+
0,
|
| 27 |
+
0,
|
| 28 |
+
0,
|
| 29 |
+
0,
|
| 30 |
+
1,
|
| 31 |
+
0,
|
| 32 |
+
0,
|
| 33 |
+
0,
|
| 34 |
+
0,
|
| 35 |
+
0,
|
| 36 |
+
0,
|
| 37 |
+
0,
|
| 38 |
+
0,
|
| 39 |
+
0,
|
| 40 |
+
0,
|
| 41 |
+
0,
|
| 42 |
+
0,
|
| 43 |
+
0,
|
| 44 |
+
0,
|
| 45 |
+
0,
|
| 46 |
+
0,
|
| 47 |
+
0,
|
| 48 |
+
1,
|
| 49 |
+
0,
|
| 50 |
+
0,
|
| 51 |
+
0,
|
| 52 |
+
0,
|
| 53 |
+
0,
|
| 54 |
+
0,
|
| 55 |
+
0,
|
| 56 |
+
0,
|
| 57 |
+
1,
|
| 58 |
+
0
|
| 59 |
+
],
|
| 60 |
+
"success_rate": 0.1,
|
| 61 |
+
"intervention_rate": 0.33689839572192515,
|
| 62 |
+
"non_base_selection_rate": 0.26737967914438504,
|
| 63 |
+
"steps_to_first_reveal_or_access": 1.0,
|
| 64 |
+
"steps_to_retrieve": 4.0,
|
| 65 |
+
"disturbance_proxy": 0.1649820935726166,
|
| 66 |
+
"episode_records": [
|
| 67 |
+
{
|
| 68 |
+
"episode_seed": 170104,
|
| 69 |
+
"success": false,
|
| 70 |
+
"steps": 4,
|
| 71 |
+
"first_reveal_step": 1,
|
| 72 |
+
"first_retrieve_step": null,
|
| 73 |
+
"episode_disturbance": 0.0
|
| 74 |
+
},
|
| 75 |
+
{
|
| 76 |
+
"episode_seed": 170105,
|
| 77 |
+
"success": true,
|
| 78 |
+
"steps": 1,
|
| 79 |
+
"first_reveal_step": 1,
|
| 80 |
+
"first_retrieve_step": null,
|
| 81 |
+
"episode_disturbance": 1.0
|
| 82 |
+
},
|
| 83 |
+
{
|
| 84 |
+
"episode_seed": 170106,
|
| 85 |
+
"success": false,
|
| 86 |
+
"steps": 4,
|
| 87 |
+
"first_reveal_step": 1,
|
| 88 |
+
"first_retrieve_step": null,
|
| 89 |
+
"episode_disturbance": 0.25
|
| 90 |
+
},
|
| 91 |
+
{
|
| 92 |
+
"episode_seed": 170107,
|
| 93 |
+
"success": false,
|
| 94 |
+
"steps": 4,
|
| 95 |
+
"first_reveal_step": 1,
|
| 96 |
+
"first_retrieve_step": null,
|
| 97 |
+
"episode_disturbance": 0.0
|
| 98 |
+
},
|
| 99 |
+
{
|
| 100 |
+
"episode_seed": 170109,
|
| 101 |
+
"success": false,
|
| 102 |
+
"steps": 4,
|
| 103 |
+
"first_reveal_step": 1,
|
| 104 |
+
"first_retrieve_step": null,
|
| 105 |
+
"episode_disturbance": 0.25
|
| 106 |
+
},
|
| 107 |
+
{
|
| 108 |
+
"episode_seed": 170113,
|
| 109 |
+
"success": false,
|
| 110 |
+
"steps": 4,
|
| 111 |
+
"first_reveal_step": 1,
|
| 112 |
+
"first_retrieve_step": null,
|
| 113 |
+
"episode_disturbance": 0.0
|
| 114 |
+
},
|
| 115 |
+
{
|
| 116 |
+
"episode_seed": 170117,
|
| 117 |
+
"success": false,
|
| 118 |
+
"steps": 4,
|
| 119 |
+
"first_reveal_step": 1,
|
| 120 |
+
"first_retrieve_step": null,
|
| 121 |
+
"episode_disturbance": 0.25
|
| 122 |
+
},
|
| 123 |
+
{
|
| 124 |
+
"episode_seed": 170121,
|
| 125 |
+
"success": false,
|
| 126 |
+
"steps": 4,
|
| 127 |
+
"first_reveal_step": 1,
|
| 128 |
+
"first_retrieve_step": null,
|
| 129 |
+
"episode_disturbance": 0.25
|
| 130 |
+
},
|
| 131 |
+
{
|
| 132 |
+
"episode_seed": 170124,
|
| 133 |
+
"success": false,
|
| 134 |
+
"steps": 4,
|
| 135 |
+
"first_reveal_step": 1,
|
| 136 |
+
"first_retrieve_step": null,
|
| 137 |
+
"episode_disturbance": 0.25
|
| 138 |
+
},
|
| 139 |
+
{
|
| 140 |
+
"episode_seed": 170125,
|
| 141 |
+
"success": false,
|
| 142 |
+
"steps": 4,
|
| 143 |
+
"first_reveal_step": 1,
|
| 144 |
+
"first_retrieve_step": null,
|
| 145 |
+
"episode_disturbance": 0.0
|
| 146 |
+
},
|
| 147 |
+
{
|
| 148 |
+
"episode_seed": 170129,
|
| 149 |
+
"success": false,
|
| 150 |
+
"steps": 4,
|
| 151 |
+
"first_reveal_step": 1,
|
| 152 |
+
"first_retrieve_step": null,
|
| 153 |
+
"episode_disturbance": 0.0
|
| 154 |
+
},
|
| 155 |
+
{
|
| 156 |
+
"episode_seed": 170131,
|
| 157 |
+
"success": false,
|
| 158 |
+
"steps": 4,
|
| 159 |
+
"first_reveal_step": 1,
|
| 160 |
+
"first_retrieve_step": null,
|
| 161 |
+
"episode_disturbance": 0.0
|
| 162 |
+
},
|
| 163 |
+
{
|
| 164 |
+
"episode_seed": 170137,
|
| 165 |
+
"success": false,
|
| 166 |
+
"steps": 4,
|
| 167 |
+
"first_reveal_step": 1,
|
| 168 |
+
"first_retrieve_step": null,
|
| 169 |
+
"episode_disturbance": 0.25
|
| 170 |
+
},
|
| 171 |
+
{
|
| 172 |
+
"episode_seed": 170138,
|
| 173 |
+
"success": false,
|
| 174 |
+
"steps": 4,
|
| 175 |
+
"first_reveal_step": 1,
|
| 176 |
+
"first_retrieve_step": null,
|
| 177 |
+
"episode_disturbance": 0.25
|
| 178 |
+
},
|
| 179 |
+
{
|
| 180 |
+
"episode_seed": 170139,
|
| 181 |
+
"success": false,
|
| 182 |
+
"steps": 4,
|
| 183 |
+
"first_reveal_step": 1,
|
| 184 |
+
"first_retrieve_step": null,
|
| 185 |
+
"episode_disturbance": 0.0
|
| 186 |
+
},
|
| 187 |
+
{
|
| 188 |
+
"episode_seed": 170140,
|
| 189 |
+
"success": false,
|
| 190 |
+
"steps": 4,
|
| 191 |
+
"first_reveal_step": 1,
|
| 192 |
+
"first_retrieve_step": null,
|
| 193 |
+
"episode_disturbance": 0.25
|
| 194 |
+
},
|
| 195 |
+
{
|
| 196 |
+
"episode_seed": 170145,
|
| 197 |
+
"success": true,
|
| 198 |
+
"steps": 1,
|
| 199 |
+
"first_reveal_step": 1,
|
| 200 |
+
"first_retrieve_step": null,
|
| 201 |
+
"episode_disturbance": 1.0
|
| 202 |
+
},
|
| 203 |
+
{
|
| 204 |
+
"episode_seed": 170150,
|
| 205 |
+
"success": false,
|
| 206 |
+
"steps": 4,
|
| 207 |
+
"first_reveal_step": 1,
|
| 208 |
+
"first_retrieve_step": null,
|
| 209 |
+
"episode_disturbance": 0.0
|
| 210 |
+
},
|
| 211 |
+
{
|
| 212 |
+
"episode_seed": 170151,
|
| 213 |
+
"success": false,
|
| 214 |
+
"steps": 4,
|
| 215 |
+
"first_reveal_step": 1,
|
| 216 |
+
"first_retrieve_step": null,
|
| 217 |
+
"episode_disturbance": 0.0
|
| 218 |
+
},
|
| 219 |
+
{
|
| 220 |
+
"episode_seed": 170153,
|
| 221 |
+
"success": false,
|
| 222 |
+
"steps": 4,
|
| 223 |
+
"first_reveal_step": 1,
|
| 224 |
+
"first_retrieve_step": null,
|
| 225 |
+
"episode_disturbance": 0.0
|
| 226 |
+
},
|
| 227 |
+
{
|
| 228 |
+
"episode_seed": 170154,
|
| 229 |
+
"success": false,
|
| 230 |
+
"steps": 4,
|
| 231 |
+
"first_reveal_step": 1,
|
| 232 |
+
"first_retrieve_step": null,
|
| 233 |
+
"episode_disturbance": 0.0
|
| 234 |
+
},
|
| 235 |
+
{
|
| 236 |
+
"episode_seed": 170155,
|
| 237 |
+
"success": true,
|
| 238 |
+
"steps": 2,
|
| 239 |
+
"first_reveal_step": 1,
|
| 240 |
+
"first_retrieve_step": null,
|
| 241 |
+
"episode_disturbance": 0.3782343992165157
|
| 242 |
+
},
|
| 243 |
+
{
|
| 244 |
+
"episode_seed": 170166,
|
| 245 |
+
"success": false,
|
| 246 |
+
"steps": 4,
|
| 247 |
+
"first_reveal_step": 1,
|
| 248 |
+
"first_retrieve_step": null,
|
| 249 |
+
"episode_disturbance": 0.0
|
| 250 |
+
},
|
| 251 |
+
{
|
| 252 |
+
"episode_seed": 170171,
|
| 253 |
+
"success": false,
|
| 254 |
+
"steps": 4,
|
| 255 |
+
"first_reveal_step": 1,
|
| 256 |
+
"first_retrieve_step": null,
|
| 257 |
+
"episode_disturbance": 0.25
|
| 258 |
+
},
|
| 259 |
+
{
|
| 260 |
+
"episode_seed": 170173,
|
| 261 |
+
"success": false,
|
| 262 |
+
"steps": 4,
|
| 263 |
+
"first_reveal_step": 1,
|
| 264 |
+
"first_retrieve_step": null,
|
| 265 |
+
"episode_disturbance": 0.25
|
| 266 |
+
},
|
| 267 |
+
{
|
| 268 |
+
"episode_seed": 170175,
|
| 269 |
+
"success": false,
|
| 270 |
+
"steps": 4,
|
| 271 |
+
"first_reveal_step": 1,
|
| 272 |
+
"first_retrieve_step": null,
|
| 273 |
+
"episode_disturbance": 0.0
|
| 274 |
+
},
|
| 275 |
+
{
|
| 276 |
+
"episode_seed": 170177,
|
| 277 |
+
"success": false,
|
| 278 |
+
"steps": 4,
|
| 279 |
+
"first_reveal_step": 1,
|
| 280 |
+
"first_retrieve_step": null,
|
| 281 |
+
"episode_disturbance": 0.25
|
| 282 |
+
},
|
| 283 |
+
{
|
| 284 |
+
"episode_seed": 170180,
|
| 285 |
+
"success": false,
|
| 286 |
+
"steps": 4,
|
| 287 |
+
"first_reveal_step": 1,
|
| 288 |
+
"first_retrieve_step": null,
|
| 289 |
+
"episode_disturbance": 0.25
|
| 290 |
+
},
|
| 291 |
+
{
|
| 292 |
+
"episode_seed": 170181,
|
| 293 |
+
"success": false,
|
| 294 |
+
"steps": 4,
|
| 295 |
+
"first_reveal_step": 1,
|
| 296 |
+
"first_retrieve_step": null,
|
| 297 |
+
"episode_disturbance": 0.16025998336928232
|
| 298 |
+
},
|
| 299 |
+
{
|
| 300 |
+
"episode_seed": 170184,
|
| 301 |
+
"success": false,
|
| 302 |
+
"steps": 4,
|
| 303 |
+
"first_reveal_step": 1,
|
| 304 |
+
"first_retrieve_step": null,
|
| 305 |
+
"episode_disturbance": 0.0
|
| 306 |
+
},
|
| 307 |
+
{
|
| 308 |
+
"episode_seed": 170185,
|
| 309 |
+
"success": false,
|
| 310 |
+
"steps": 4,
|
| 311 |
+
"first_reveal_step": 1,
|
| 312 |
+
"first_retrieve_step": null,
|
| 313 |
+
"episode_disturbance": 0.25
|
| 314 |
+
},
|
| 315 |
+
{
|
| 316 |
+
"episode_seed": 170186,
|
| 317 |
+
"success": false,
|
| 318 |
+
"steps": 4,
|
| 319 |
+
"first_reveal_step": 1,
|
| 320 |
+
"first_retrieve_step": null,
|
| 321 |
+
"episode_disturbance": 0.0
|
| 322 |
+
},
|
| 323 |
+
{
|
| 324 |
+
"episode_seed": 170198,
|
| 325 |
+
"success": false,
|
| 326 |
+
"steps": 4,
|
| 327 |
+
"first_reveal_step": 1,
|
| 328 |
+
"first_retrieve_step": null,
|
| 329 |
+
"episode_disturbance": 0.0
|
| 330 |
+
},
|
| 331 |
+
{
|
| 332 |
+
"episode_seed": 170200,
|
| 333 |
+
"success": false,
|
| 334 |
+
"steps": 4,
|
| 335 |
+
"first_reveal_step": 1,
|
| 336 |
+
"first_retrieve_step": null,
|
| 337 |
+
"episode_disturbance": 0.0
|
| 338 |
+
},
|
| 339 |
+
{
|
| 340 |
+
"episode_seed": 170205,
|
| 341 |
+
"success": false,
|
| 342 |
+
"steps": 4,
|
| 343 |
+
"first_reveal_step": 1,
|
| 344 |
+
"first_retrieve_step": null,
|
| 345 |
+
"episode_disturbance": 0.25
|
| 346 |
+
},
|
| 347 |
+
{
|
| 348 |
+
"episode_seed": 170207,
|
| 349 |
+
"success": false,
|
| 350 |
+
"steps": 4,
|
| 351 |
+
"first_reveal_step": 1,
|
| 352 |
+
"first_retrieve_step": null,
|
| 353 |
+
"episode_disturbance": 0.008142942828791497
|
| 354 |
+
},
|
| 355 |
+
{
|
| 356 |
+
"episode_seed": 170208,
|
| 357 |
+
"success": false,
|
| 358 |
+
"steps": 4,
|
| 359 |
+
"first_reveal_step": 1,
|
| 360 |
+
"first_retrieve_step": null,
|
| 361 |
+
"episode_disturbance": 0.25
|
| 362 |
+
},
|
| 363 |
+
{
|
| 364 |
+
"episode_seed": 170212,
|
| 365 |
+
"success": false,
|
| 366 |
+
"steps": 4,
|
| 367 |
+
"first_reveal_step": 1,
|
| 368 |
+
"first_retrieve_step": null,
|
| 369 |
+
"episode_disturbance": 0.0
|
| 370 |
+
},
|
| 371 |
+
{
|
| 372 |
+
"episode_seed": 170214,
|
| 373 |
+
"success": false,
|
| 374 |
+
"steps": 4,
|
| 375 |
+
"first_reveal_step": 1,
|
| 376 |
+
"first_retrieve_step": null,
|
| 377 |
+
"episode_disturbance": 0.0
|
| 378 |
+
},
|
| 379 |
+
{
|
| 380 |
+
"episode_seed": 170217,
|
| 381 |
+
"success": true,
|
| 382 |
+
"steps": 1,
|
| 383 |
+
"first_reveal_step": 1,
|
| 384 |
+
"first_retrieve_step": null,
|
| 385 |
+
"episode_disturbance": 1.0
|
| 386 |
+
},
|
| 387 |
+
{
|
| 388 |
+
"episode_seed": 170223,
|
| 389 |
+
"success": false,
|
| 390 |
+
"steps": 4,
|
| 391 |
+
"first_reveal_step": 1,
|
| 392 |
+
"first_retrieve_step": null,
|
| 393 |
+
"episode_disturbance": 0.0
|
| 394 |
+
},
|
| 395 |
+
{
|
| 396 |
+
"episode_seed": 170226,
|
| 397 |
+
"success": false,
|
| 398 |
+
"steps": 4,
|
| 399 |
+
"first_reveal_step": 1,
|
| 400 |
+
"first_retrieve_step": null,
|
| 401 |
+
"episode_disturbance": 0.10258094114916666
|
| 402 |
+
},
|
| 403 |
+
{
|
| 404 |
+
"episode_seed": 170228,
|
| 405 |
+
"success": false,
|
| 406 |
+
"steps": 4,
|
| 407 |
+
"first_reveal_step": 1,
|
| 408 |
+
"first_retrieve_step": null,
|
| 409 |
+
"episode_disturbance": 0.23011721244880132
|
| 410 |
+
},
|
| 411 |
+
{
|
| 412 |
+
"episode_seed": 170229,
|
| 413 |
+
"success": false,
|
| 414 |
+
"steps": 4,
|
| 415 |
+
"first_reveal_step": 1,
|
| 416 |
+
"first_retrieve_step": null,
|
| 417 |
+
"episode_disturbance": 0.18159967022282736
|
| 418 |
+
},
|
| 419 |
+
{
|
| 420 |
+
"episode_seed": 170234,
|
| 421 |
+
"success": false,
|
| 422 |
+
"steps": 4,
|
| 423 |
+
"first_reveal_step": 1,
|
| 424 |
+
"first_retrieve_step": null,
|
| 425 |
+
"episode_disturbance": 0.01112700679472516
|
| 426 |
+
},
|
| 427 |
+
{
|
| 428 |
+
"episode_seed": 170237,
|
| 429 |
+
"success": false,
|
| 430 |
+
"steps": 4,
|
| 431 |
+
"first_reveal_step": 1,
|
| 432 |
+
"first_retrieve_step": null,
|
| 433 |
+
"episode_disturbance": 0.1770425226007189
|
| 434 |
+
},
|
| 435 |
+
{
|
| 436 |
+
"episode_seed": 170239,
|
| 437 |
+
"success": false,
|
| 438 |
+
"steps": 4,
|
| 439 |
+
"first_reveal_step": 1,
|
| 440 |
+
"first_retrieve_step": null,
|
| 441 |
+
"episode_disturbance": 0.0
|
| 442 |
+
},
|
| 443 |
+
{
|
| 444 |
+
"episode_seed": 170241,
|
| 445 |
+
"success": false,
|
| 446 |
+
"steps": 4,
|
| 447 |
+
"first_reveal_step": 1,
|
| 448 |
+
"first_retrieve_step": null,
|
| 449 |
+
"episode_disturbance": 0.25
|
| 450 |
+
},
|
| 451 |
+
{
|
| 452 |
+
"episode_seed": 170242,
|
| 453 |
+
"success": true,
|
| 454 |
+
"steps": 2,
|
| 455 |
+
"first_reveal_step": 1,
|
| 456 |
+
"first_retrieve_step": null,
|
| 457 |
+
"episode_disturbance": 0.0
|
| 458 |
+
},
|
| 459 |
+
{
|
| 460 |
+
"episode_seed": 170243,
|
| 461 |
+
"success": false,
|
| 462 |
+
"steps": 4,
|
| 463 |
+
"first_reveal_step": 1,
|
| 464 |
+
"first_retrieve_step": null,
|
| 465 |
+
"episode_disturbance": 0.0
|
| 466 |
+
}
|
| 467 |
+
],
|
| 468 |
+
"eval_protocol": {
|
| 469 |
+
"track_id": "cloth_track",
|
| 470 |
+
"suite": "maniskill3",
|
| 471 |
+
"benchmark_task": "PutSpoonUnderClothRetrievalProxy-v1",
|
| 472 |
+
"role": "target",
|
| 473 |
+
"eval_mode": "adapter_active_ft",
|
| 474 |
+
"seed": 17,
|
| 475 |
+
"episodes": 50,
|
| 476 |
+
"resolution": 224,
|
| 477 |
+
"cameras": [
|
| 478 |
+
"front",
|
| 479 |
+
"left",
|
| 480 |
+
"right"
|
| 481 |
+
],
|
| 482 |
+
"observation_stack": "rgb_triplicate_zero_depth",
|
| 483 |
+
"action_horizon": 8,
|
| 484 |
+
"action_space": "widowx_delta_pose",
|
| 485 |
+
"same_test_episodes": true
|
| 486 |
+
},
|
| 487 |
+
"proxy_notes": "Public ManiSkill bridge scene with custom retrieval initialization. The spoon is placed under the cloth region and must be revealed and extracted to the open side of the table.",
|
| 488 |
+
"train_spec": {
|
| 489 |
+
"track_id": "cloth_track",
|
| 490 |
+
"suite": "maniskill3",
|
| 491 |
+
"benchmark_task": "PutSpoonUnderClothRetrievalProxy-v1",
|
| 492 |
+
"model_variant": "adapter_active_ft",
|
| 493 |
+
"seed": 17,
|
| 494 |
+
"train_demos": 32,
|
| 495 |
+
"val_demos": 8,
|
| 496 |
+
"init_checkpoint_group": "/workspace/workspace/VLAarchtests2/VLAarchtests/artifacts/outputs/r3d_handoff_phase/proxy_interaction_r3d_stage3_clip_rgbd_handoff_compact_phase_seed17/checkpoint_best.pt",
|
| 497 |
+
"optimizer": "adamw",
|
| 498 |
+
"learning_rate": 0.0001,
|
| 499 |
+
"lr_schedule": "constant",
|
| 500 |
+
"batch_size": 4,
|
| 501 |
+
"augmentations": "none",
|
| 502 |
+
"early_stopping_metric": "val_total",
|
| 503 |
+
"max_gradient_steps": 174,
|
| 504 |
+
"unfreeze_scope": "fusion_memory_decoder",
|
| 505 |
+
"dataset_split_id": "cloth_bridge_smoke_v1_seed17",
|
| 506 |
+
"same_data_policy": true,
|
| 507 |
+
"same_init_policy": true
|
| 508 |
+
}
|
| 509 |
+
}
|
reports/maniskill_cloth_bridge_smoke_v1/adapter_active_ft_seed23.json
ADDED
|
@@ -0,0 +1,509 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
{
|
| 2 |
+
"track_id": "cloth_track",
|
| 3 |
+
"suite": "maniskill3",
|
| 4 |
+
"benchmark_task": "PutSpoonUnderClothRetrievalProxy-v1",
|
| 5 |
+
"role": "target",
|
| 6 |
+
"adapter_mode": "adapter_active_ft",
|
| 7 |
+
"episodes": 50,
|
| 8 |
+
"successes": [
|
| 9 |
+
0,
|
| 10 |
+
0,
|
| 11 |
+
0,
|
| 12 |
+
0,
|
| 13 |
+
0,
|
| 14 |
+
0,
|
| 15 |
+
0,
|
| 16 |
+
0,
|
| 17 |
+
0,
|
| 18 |
+
0,
|
| 19 |
+
0,
|
| 20 |
+
0,
|
| 21 |
+
0,
|
| 22 |
+
0,
|
| 23 |
+
0,
|
| 24 |
+
0,
|
| 25 |
+
0,
|
| 26 |
+
0,
|
| 27 |
+
0,
|
| 28 |
+
0,
|
| 29 |
+
0,
|
| 30 |
+
1,
|
| 31 |
+
0,
|
| 32 |
+
0,
|
| 33 |
+
0,
|
| 34 |
+
0,
|
| 35 |
+
0,
|
| 36 |
+
0,
|
| 37 |
+
0,
|
| 38 |
+
0,
|
| 39 |
+
0,
|
| 40 |
+
0,
|
| 41 |
+
0,
|
| 42 |
+
0,
|
| 43 |
+
0,
|
| 44 |
+
0,
|
| 45 |
+
0,
|
| 46 |
+
0,
|
| 47 |
+
0,
|
| 48 |
+
0,
|
| 49 |
+
0,
|
| 50 |
+
0,
|
| 51 |
+
0,
|
| 52 |
+
0,
|
| 53 |
+
0,
|
| 54 |
+
0,
|
| 55 |
+
0,
|
| 56 |
+
0,
|
| 57 |
+
0,
|
| 58 |
+
0
|
| 59 |
+
],
|
| 60 |
+
"success_rate": 0.02,
|
| 61 |
+
"intervention_rate": 0.0,
|
| 62 |
+
"non_base_selection_rate": 0.0,
|
| 63 |
+
"steps_to_first_reveal_or_access": 1.0,
|
| 64 |
+
"steps_to_retrieve": 4.0,
|
| 65 |
+
"disturbance_proxy": 0.12309578397444318,
|
| 66 |
+
"episode_records": [
|
| 67 |
+
{
|
| 68 |
+
"episode_seed": 170104,
|
| 69 |
+
"success": false,
|
| 70 |
+
"steps": 4,
|
| 71 |
+
"first_reveal_step": 1,
|
| 72 |
+
"first_retrieve_step": null,
|
| 73 |
+
"episode_disturbance": 0.25
|
| 74 |
+
},
|
| 75 |
+
{
|
| 76 |
+
"episode_seed": 170105,
|
| 77 |
+
"success": false,
|
| 78 |
+
"steps": 4,
|
| 79 |
+
"first_reveal_step": 1,
|
| 80 |
+
"first_retrieve_step": null,
|
| 81 |
+
"episode_disturbance": 0.0
|
| 82 |
+
},
|
| 83 |
+
{
|
| 84 |
+
"episode_seed": 170106,
|
| 85 |
+
"success": false,
|
| 86 |
+
"steps": 4,
|
| 87 |
+
"first_reveal_step": 1,
|
| 88 |
+
"first_retrieve_step": null,
|
| 89 |
+
"episode_disturbance": 0.25
|
| 90 |
+
},
|
| 91 |
+
{
|
| 92 |
+
"episode_seed": 170107,
|
| 93 |
+
"success": false,
|
| 94 |
+
"steps": 4,
|
| 95 |
+
"first_reveal_step": 1,
|
| 96 |
+
"first_retrieve_step": null,
|
| 97 |
+
"episode_disturbance": 0.12488718117986407
|
| 98 |
+
},
|
| 99 |
+
{
|
| 100 |
+
"episode_seed": 170109,
|
| 101 |
+
"success": false,
|
| 102 |
+
"steps": 4,
|
| 103 |
+
"first_reveal_step": 1,
|
| 104 |
+
"first_retrieve_step": null,
|
| 105 |
+
"episode_disturbance": 0.25
|
| 106 |
+
},
|
| 107 |
+
{
|
| 108 |
+
"episode_seed": 170113,
|
| 109 |
+
"success": false,
|
| 110 |
+
"steps": 4,
|
| 111 |
+
"first_reveal_step": 1,
|
| 112 |
+
"first_retrieve_step": null,
|
| 113 |
+
"episode_disturbance": 0.25
|
| 114 |
+
},
|
| 115 |
+
{
|
| 116 |
+
"episode_seed": 170117,
|
| 117 |
+
"success": false,
|
| 118 |
+
"steps": 4,
|
| 119 |
+
"first_reveal_step": 1,
|
| 120 |
+
"first_retrieve_step": null,
|
| 121 |
+
"episode_disturbance": 0.25
|
| 122 |
+
},
|
| 123 |
+
{
|
| 124 |
+
"episode_seed": 170121,
|
| 125 |
+
"success": false,
|
| 126 |
+
"steps": 4,
|
| 127 |
+
"first_reveal_step": 1,
|
| 128 |
+
"first_retrieve_step": null,
|
| 129 |
+
"episode_disturbance": 0.0
|
| 130 |
+
},
|
| 131 |
+
{
|
| 132 |
+
"episode_seed": 170124,
|
| 133 |
+
"success": false,
|
| 134 |
+
"steps": 4,
|
| 135 |
+
"first_reveal_step": 1,
|
| 136 |
+
"first_retrieve_step": null,
|
| 137 |
+
"episode_disturbance": 0.0
|
| 138 |
+
},
|
| 139 |
+
{
|
| 140 |
+
"episode_seed": 170125,
|
| 141 |
+
"success": false,
|
| 142 |
+
"steps": 4,
|
| 143 |
+
"first_reveal_step": 1,
|
| 144 |
+
"first_retrieve_step": null,
|
| 145 |
+
"episode_disturbance": 0.0
|
| 146 |
+
},
|
| 147 |
+
{
|
| 148 |
+
"episode_seed": 170129,
|
| 149 |
+
"success": false,
|
| 150 |
+
"steps": 4,
|
| 151 |
+
"first_reveal_step": 1,
|
| 152 |
+
"first_retrieve_step": null,
|
| 153 |
+
"episode_disturbance": 0.0
|
| 154 |
+
},
|
| 155 |
+
{
|
| 156 |
+
"episode_seed": 170131,
|
| 157 |
+
"success": false,
|
| 158 |
+
"steps": 4,
|
| 159 |
+
"first_reveal_step": 1,
|
| 160 |
+
"first_retrieve_step": null,
|
| 161 |
+
"episode_disturbance": 0.0
|
| 162 |
+
},
|
| 163 |
+
{
|
| 164 |
+
"episode_seed": 170137,
|
| 165 |
+
"success": false,
|
| 166 |
+
"steps": 4,
|
| 167 |
+
"first_reveal_step": 1,
|
| 168 |
+
"first_retrieve_step": null,
|
| 169 |
+
"episode_disturbance": 0.0
|
| 170 |
+
},
|
| 171 |
+
{
|
| 172 |
+
"episode_seed": 170138,
|
| 173 |
+
"success": false,
|
| 174 |
+
"steps": 4,
|
| 175 |
+
"first_reveal_step": 1,
|
| 176 |
+
"first_retrieve_step": null,
|
| 177 |
+
"episode_disturbance": 0.25
|
| 178 |
+
},
|
| 179 |
+
{
|
| 180 |
+
"episode_seed": 170139,
|
| 181 |
+
"success": false,
|
| 182 |
+
"steps": 4,
|
| 183 |
+
"first_reveal_step": 1,
|
| 184 |
+
"first_retrieve_step": null,
|
| 185 |
+
"episode_disturbance": 0.0
|
| 186 |
+
},
|
| 187 |
+
{
|
| 188 |
+
"episode_seed": 170140,
|
| 189 |
+
"success": false,
|
| 190 |
+
"steps": 4,
|
| 191 |
+
"first_reveal_step": 1,
|
| 192 |
+
"first_retrieve_step": null,
|
| 193 |
+
"episode_disturbance": 0.0
|
| 194 |
+
},
|
| 195 |
+
{
|
| 196 |
+
"episode_seed": 170145,
|
| 197 |
+
"success": false,
|
| 198 |
+
"steps": 4,
|
| 199 |
+
"first_reveal_step": 1,
|
| 200 |
+
"first_retrieve_step": null,
|
| 201 |
+
"episode_disturbance": 0.25
|
| 202 |
+
},
|
| 203 |
+
{
|
| 204 |
+
"episode_seed": 170150,
|
| 205 |
+
"success": false,
|
| 206 |
+
"steps": 4,
|
| 207 |
+
"first_reveal_step": 1,
|
| 208 |
+
"first_retrieve_step": null,
|
| 209 |
+
"episode_disturbance": 0.0
|
| 210 |
+
},
|
| 211 |
+
{
|
| 212 |
+
"episode_seed": 170151,
|
| 213 |
+
"success": false,
|
| 214 |
+
"steps": 4,
|
| 215 |
+
"first_reveal_step": 1,
|
| 216 |
+
"first_retrieve_step": null,
|
| 217 |
+
"episode_disturbance": 0.0
|
| 218 |
+
},
|
| 219 |
+
{
|
| 220 |
+
"episode_seed": 170153,
|
| 221 |
+
"success": false,
|
| 222 |
+
"steps": 4,
|
| 223 |
+
"first_reveal_step": 1,
|
| 224 |
+
"first_retrieve_step": null,
|
| 225 |
+
"episode_disturbance": 0.0
|
| 226 |
+
},
|
| 227 |
+
{
|
| 228 |
+
"episode_seed": 170154,
|
| 229 |
+
"success": false,
|
| 230 |
+
"steps": 4,
|
| 231 |
+
"first_reveal_step": 1,
|
| 232 |
+
"first_retrieve_step": null,
|
| 233 |
+
"episode_disturbance": 0.0
|
| 234 |
+
},
|
| 235 |
+
{
|
| 236 |
+
"episode_seed": 170155,
|
| 237 |
+
"success": true,
|
| 238 |
+
"steps": 2,
|
| 239 |
+
"first_reveal_step": 1,
|
| 240 |
+
"first_retrieve_step": null,
|
| 241 |
+
"episode_disturbance": 0.3782343992165157
|
| 242 |
+
},
|
| 243 |
+
{
|
| 244 |
+
"episode_seed": 170166,
|
| 245 |
+
"success": false,
|
| 246 |
+
"steps": 4,
|
| 247 |
+
"first_reveal_step": 1,
|
| 248 |
+
"first_retrieve_step": null,
|
| 249 |
+
"episode_disturbance": 0.0
|
| 250 |
+
},
|
| 251 |
+
{
|
| 252 |
+
"episode_seed": 170171,
|
| 253 |
+
"success": false,
|
| 254 |
+
"steps": 4,
|
| 255 |
+
"first_reveal_step": 1,
|
| 256 |
+
"first_retrieve_step": null,
|
| 257 |
+
"episode_disturbance": 0.25
|
| 258 |
+
},
|
| 259 |
+
{
|
| 260 |
+
"episode_seed": 170173,
|
| 261 |
+
"success": false,
|
| 262 |
+
"steps": 4,
|
| 263 |
+
"first_reveal_step": 1,
|
| 264 |
+
"first_retrieve_step": null,
|
| 265 |
+
"episode_disturbance": 0.25
|
| 266 |
+
},
|
| 267 |
+
{
|
| 268 |
+
"episode_seed": 170175,
|
| 269 |
+
"success": false,
|
| 270 |
+
"steps": 4,
|
| 271 |
+
"first_reveal_step": 1,
|
| 272 |
+
"first_retrieve_step": null,
|
| 273 |
+
"episode_disturbance": 0.0
|
| 274 |
+
},
|
| 275 |
+
{
|
| 276 |
+
"episode_seed": 170177,
|
| 277 |
+
"success": false,
|
| 278 |
+
"steps": 4,
|
| 279 |
+
"first_reveal_step": 1,
|
| 280 |
+
"first_retrieve_step": null,
|
| 281 |
+
"episode_disturbance": 0.25
|
| 282 |
+
},
|
| 283 |
+
{
|
| 284 |
+
"episode_seed": 170180,
|
| 285 |
+
"success": false,
|
| 286 |
+
"steps": 4,
|
| 287 |
+
"first_reveal_step": 1,
|
| 288 |
+
"first_retrieve_step": null,
|
| 289 |
+
"episode_disturbance": 0.25
|
| 290 |
+
},
|
| 291 |
+
{
|
| 292 |
+
"episode_seed": 170181,
|
| 293 |
+
"success": false,
|
| 294 |
+
"steps": 4,
|
| 295 |
+
"first_reveal_step": 1,
|
| 296 |
+
"first_retrieve_step": null,
|
| 297 |
+
"episode_disturbance": 0.25
|
| 298 |
+
},
|
| 299 |
+
{
|
| 300 |
+
"episode_seed": 170184,
|
| 301 |
+
"success": false,
|
| 302 |
+
"steps": 4,
|
| 303 |
+
"first_reveal_step": 1,
|
| 304 |
+
"first_retrieve_step": null,
|
| 305 |
+
"episode_disturbance": 0.25
|
| 306 |
+
},
|
| 307 |
+
{
|
| 308 |
+
"episode_seed": 170185,
|
| 309 |
+
"success": false,
|
| 310 |
+
"steps": 4,
|
| 311 |
+
"first_reveal_step": 1,
|
| 312 |
+
"first_retrieve_step": null,
|
| 313 |
+
"episode_disturbance": 0.25
|
| 314 |
+
},
|
| 315 |
+
{
|
| 316 |
+
"episode_seed": 170186,
|
| 317 |
+
"success": false,
|
| 318 |
+
"steps": 4,
|
| 319 |
+
"first_reveal_step": 1,
|
| 320 |
+
"first_retrieve_step": null,
|
| 321 |
+
"episode_disturbance": 0.0
|
| 322 |
+
},
|
| 323 |
+
{
|
| 324 |
+
"episode_seed": 170198,
|
| 325 |
+
"success": false,
|
| 326 |
+
"steps": 4,
|
| 327 |
+
"first_reveal_step": 1,
|
| 328 |
+
"first_retrieve_step": null,
|
| 329 |
+
"episode_disturbance": 0.0
|
| 330 |
+
},
|
| 331 |
+
{
|
| 332 |
+
"episode_seed": 170200,
|
| 333 |
+
"success": false,
|
| 334 |
+
"steps": 4,
|
| 335 |
+
"first_reveal_step": 1,
|
| 336 |
+
"first_retrieve_step": null,
|
| 337 |
+
"episode_disturbance": 0.25
|
| 338 |
+
},
|
| 339 |
+
{
|
| 340 |
+
"episode_seed": 170205,
|
| 341 |
+
"success": false,
|
| 342 |
+
"steps": 4,
|
| 343 |
+
"first_reveal_step": 1,
|
| 344 |
+
"first_retrieve_step": null,
|
| 345 |
+
"episode_disturbance": 0.25
|
| 346 |
+
},
|
| 347 |
+
{
|
| 348 |
+
"episode_seed": 170207,
|
| 349 |
+
"success": false,
|
| 350 |
+
"steps": 4,
|
| 351 |
+
"first_reveal_step": 1,
|
| 352 |
+
"first_retrieve_step": null,
|
| 353 |
+
"episode_disturbance": 0.25
|
| 354 |
+
},
|
| 355 |
+
{
|
| 356 |
+
"episode_seed": 170208,
|
| 357 |
+
"success": false,
|
| 358 |
+
"steps": 4,
|
| 359 |
+
"first_reveal_step": 1,
|
| 360 |
+
"first_retrieve_step": null,
|
| 361 |
+
"episode_disturbance": 0.25
|
| 362 |
+
},
|
| 363 |
+
{
|
| 364 |
+
"episode_seed": 170212,
|
| 365 |
+
"success": false,
|
| 366 |
+
"steps": 4,
|
| 367 |
+
"first_reveal_step": 1,
|
| 368 |
+
"first_retrieve_step": null,
|
| 369 |
+
"episode_disturbance": 0.046899239931787774
|
| 370 |
+
},
|
| 371 |
+
{
|
| 372 |
+
"episode_seed": 170214,
|
| 373 |
+
"success": false,
|
| 374 |
+
"steps": 4,
|
| 375 |
+
"first_reveal_step": 1,
|
| 376 |
+
"first_retrieve_step": null,
|
| 377 |
+
"episode_disturbance": 0.0
|
| 378 |
+
},
|
| 379 |
+
{
|
| 380 |
+
"episode_seed": 170217,
|
| 381 |
+
"success": false,
|
| 382 |
+
"steps": 4,
|
| 383 |
+
"first_reveal_step": 1,
|
| 384 |
+
"first_retrieve_step": null,
|
| 385 |
+
"episode_disturbance": 0.10476837839399065
|
| 386 |
+
},
|
| 387 |
+
{
|
| 388 |
+
"episode_seed": 170223,
|
| 389 |
+
"success": false,
|
| 390 |
+
"steps": 4,
|
| 391 |
+
"first_reveal_step": 1,
|
| 392 |
+
"first_retrieve_step": null,
|
| 393 |
+
"episode_disturbance": 0.0
|
| 394 |
+
},
|
| 395 |
+
{
|
| 396 |
+
"episode_seed": 170226,
|
| 397 |
+
"success": false,
|
| 398 |
+
"steps": 4,
|
| 399 |
+
"first_reveal_step": 1,
|
| 400 |
+
"first_retrieve_step": null,
|
| 401 |
+
"episode_disturbance": 0.0
|
| 402 |
+
},
|
| 403 |
+
{
|
| 404 |
+
"episode_seed": 170228,
|
| 405 |
+
"success": false,
|
| 406 |
+
"steps": 4,
|
| 407 |
+
"first_reveal_step": 1,
|
| 408 |
+
"first_retrieve_step": null,
|
| 409 |
+
"episode_disturbance": 0.0
|
| 410 |
+
},
|
| 411 |
+
{
|
| 412 |
+
"episode_seed": 170229,
|
| 413 |
+
"success": false,
|
| 414 |
+
"steps": 4,
|
| 415 |
+
"first_reveal_step": 1,
|
| 416 |
+
"first_retrieve_step": null,
|
| 417 |
+
"episode_disturbance": 0.0
|
| 418 |
+
},
|
| 419 |
+
{
|
| 420 |
+
"episode_seed": 170234,
|
| 421 |
+
"success": false,
|
| 422 |
+
"steps": 4,
|
| 423 |
+
"first_reveal_step": 1,
|
| 424 |
+
"first_retrieve_step": null,
|
| 425 |
+
"episode_disturbance": 0.0
|
| 426 |
+
},
|
| 427 |
+
{
|
| 428 |
+
"episode_seed": 170237,
|
| 429 |
+
"success": false,
|
| 430 |
+
"steps": 4,
|
| 431 |
+
"first_reveal_step": 1,
|
| 432 |
+
"first_retrieve_step": null,
|
| 433 |
+
"episode_disturbance": 0.25
|
| 434 |
+
},
|
| 435 |
+
{
|
| 436 |
+
"episode_seed": 170239,
|
| 437 |
+
"success": false,
|
| 438 |
+
"steps": 4,
|
| 439 |
+
"first_reveal_step": 1,
|
| 440 |
+
"first_retrieve_step": null,
|
| 441 |
+
"episode_disturbance": 0.0
|
| 442 |
+
},
|
| 443 |
+
{
|
| 444 |
+
"episode_seed": 170241,
|
| 445 |
+
"success": false,
|
| 446 |
+
"steps": 4,
|
| 447 |
+
"first_reveal_step": 1,
|
| 448 |
+
"first_retrieve_step": null,
|
| 449 |
+
"episode_disturbance": 0.25
|
| 450 |
+
},
|
| 451 |
+
{
|
| 452 |
+
"episode_seed": 170242,
|
| 453 |
+
"success": false,
|
| 454 |
+
"steps": 4,
|
| 455 |
+
"first_reveal_step": 1,
|
| 456 |
+
"first_retrieve_step": null,
|
| 457 |
+
"episode_disturbance": 0.25
|
| 458 |
+
},
|
| 459 |
+
{
|
| 460 |
+
"episode_seed": 170243,
|
| 461 |
+
"success": false,
|
| 462 |
+
"steps": 4,
|
| 463 |
+
"first_reveal_step": 1,
|
| 464 |
+
"first_retrieve_step": null,
|
| 465 |
+
"episode_disturbance": 0.25
|
| 466 |
+
}
|
| 467 |
+
],
|
| 468 |
+
"eval_protocol": {
|
| 469 |
+
"track_id": "cloth_track",
|
| 470 |
+
"suite": "maniskill3",
|
| 471 |
+
"benchmark_task": "PutSpoonUnderClothRetrievalProxy-v1",
|
| 472 |
+
"role": "target",
|
| 473 |
+
"eval_mode": "adapter_active_ft",
|
| 474 |
+
"seed": 17,
|
| 475 |
+
"episodes": 50,
|
| 476 |
+
"resolution": 224,
|
| 477 |
+
"cameras": [
|
| 478 |
+
"front",
|
| 479 |
+
"left",
|
| 480 |
+
"right"
|
| 481 |
+
],
|
| 482 |
+
"observation_stack": "rgb_triplicate_zero_depth",
|
| 483 |
+
"action_horizon": 8,
|
| 484 |
+
"action_space": "widowx_delta_pose",
|
| 485 |
+
"same_test_episodes": true
|
| 486 |
+
},
|
| 487 |
+
"proxy_notes": "Public ManiSkill bridge scene with custom retrieval initialization. The spoon is placed under the cloth region and must be revealed and extracted to the open side of the table.",
|
| 488 |
+
"train_spec": {
|
| 489 |
+
"track_id": "cloth_track",
|
| 490 |
+
"suite": "maniskill3",
|
| 491 |
+
"benchmark_task": "PutSpoonUnderClothRetrievalProxy-v1",
|
| 492 |
+
"model_variant": "adapter_active_ft",
|
| 493 |
+
"seed": 23,
|
| 494 |
+
"train_demos": 32,
|
| 495 |
+
"val_demos": 8,
|
| 496 |
+
"init_checkpoint_group": "/workspace/workspace/VLAarchtests2/VLAarchtests/artifacts/outputs/r3d_handoff_phase/proxy_interaction_r3d_stage3_clip_rgbd_handoff_compact_phase_seed17/checkpoint_best.pt",
|
| 497 |
+
"optimizer": "adamw",
|
| 498 |
+
"learning_rate": 0.0001,
|
| 499 |
+
"lr_schedule": "constant",
|
| 500 |
+
"batch_size": 4,
|
| 501 |
+
"augmentations": "none",
|
| 502 |
+
"early_stopping_metric": "val_total",
|
| 503 |
+
"max_gradient_steps": 174,
|
| 504 |
+
"unfreeze_scope": "fusion_memory_decoder",
|
| 505 |
+
"dataset_split_id": "cloth_bridge_smoke_v1_seed17",
|
| 506 |
+
"same_data_policy": true,
|
| 507 |
+
"same_init_policy": true
|
| 508 |
+
}
|
| 509 |
+
}
|
reports/maniskill_cloth_bridge_smoke_v1/adapter_active_ft_seed29.json
ADDED
|
@@ -0,0 +1,509 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
{
|
| 2 |
+
"track_id": "cloth_track",
|
| 3 |
+
"suite": "maniskill3",
|
| 4 |
+
"benchmark_task": "PutSpoonUnderClothRetrievalProxy-v1",
|
| 5 |
+
"role": "target",
|
| 6 |
+
"adapter_mode": "adapter_active_ft",
|
| 7 |
+
"episodes": 50,
|
| 8 |
+
"successes": [
|
| 9 |
+
0,
|
| 10 |
+
1,
|
| 11 |
+
0,
|
| 12 |
+
0,
|
| 13 |
+
0,
|
| 14 |
+
0,
|
| 15 |
+
0,
|
| 16 |
+
0,
|
| 17 |
+
0,
|
| 18 |
+
0,
|
| 19 |
+
0,
|
| 20 |
+
0,
|
| 21 |
+
0,
|
| 22 |
+
0,
|
| 23 |
+
0,
|
| 24 |
+
0,
|
| 25 |
+
0,
|
| 26 |
+
0,
|
| 27 |
+
0,
|
| 28 |
+
0,
|
| 29 |
+
0,
|
| 30 |
+
0,
|
| 31 |
+
0,
|
| 32 |
+
0,
|
| 33 |
+
0,
|
| 34 |
+
0,
|
| 35 |
+
0,
|
| 36 |
+
0,
|
| 37 |
+
0,
|
| 38 |
+
1,
|
| 39 |
+
0,
|
| 40 |
+
0,
|
| 41 |
+
0,
|
| 42 |
+
0,
|
| 43 |
+
0,
|
| 44 |
+
0,
|
| 45 |
+
0,
|
| 46 |
+
0,
|
| 47 |
+
0,
|
| 48 |
+
0,
|
| 49 |
+
0,
|
| 50 |
+
0,
|
| 51 |
+
0,
|
| 52 |
+
0,
|
| 53 |
+
0,
|
| 54 |
+
0,
|
| 55 |
+
0,
|
| 56 |
+
0,
|
| 57 |
+
0,
|
| 58 |
+
0
|
| 59 |
+
],
|
| 60 |
+
"success_rate": 0.04,
|
| 61 |
+
"intervention_rate": 0.0,
|
| 62 |
+
"non_base_selection_rate": 0.0,
|
| 63 |
+
"steps_to_first_reveal_or_access": 1.0,
|
| 64 |
+
"steps_to_retrieve": 4.0,
|
| 65 |
+
"disturbance_proxy": 0.1478596130013466,
|
| 66 |
+
"episode_records": [
|
| 67 |
+
{
|
| 68 |
+
"episode_seed": 170104,
|
| 69 |
+
"success": false,
|
| 70 |
+
"steps": 4,
|
| 71 |
+
"first_reveal_step": 1,
|
| 72 |
+
"first_retrieve_step": null,
|
| 73 |
+
"episode_disturbance": 0.0
|
| 74 |
+
},
|
| 75 |
+
{
|
| 76 |
+
"episode_seed": 170105,
|
| 77 |
+
"success": true,
|
| 78 |
+
"steps": 1,
|
| 79 |
+
"first_reveal_step": 1,
|
| 80 |
+
"first_retrieve_step": null,
|
| 81 |
+
"episode_disturbance": 1.0
|
| 82 |
+
},
|
| 83 |
+
{
|
| 84 |
+
"episode_seed": 170106,
|
| 85 |
+
"success": false,
|
| 86 |
+
"steps": 4,
|
| 87 |
+
"first_reveal_step": 1,
|
| 88 |
+
"first_retrieve_step": null,
|
| 89 |
+
"episode_disturbance": 0.25
|
| 90 |
+
},
|
| 91 |
+
{
|
| 92 |
+
"episode_seed": 170107,
|
| 93 |
+
"success": false,
|
| 94 |
+
"steps": 4,
|
| 95 |
+
"first_reveal_step": 1,
|
| 96 |
+
"first_retrieve_step": null,
|
| 97 |
+
"episode_disturbance": 0.0
|
| 98 |
+
},
|
| 99 |
+
{
|
| 100 |
+
"episode_seed": 170109,
|
| 101 |
+
"success": false,
|
| 102 |
+
"steps": 4,
|
| 103 |
+
"first_reveal_step": 1,
|
| 104 |
+
"first_retrieve_step": null,
|
| 105 |
+
"episode_disturbance": 0.25
|
| 106 |
+
},
|
| 107 |
+
{
|
| 108 |
+
"episode_seed": 170113,
|
| 109 |
+
"success": false,
|
| 110 |
+
"steps": 4,
|
| 111 |
+
"first_reveal_step": 1,
|
| 112 |
+
"first_retrieve_step": null,
|
| 113 |
+
"episode_disturbance": 0.0
|
| 114 |
+
},
|
| 115 |
+
{
|
| 116 |
+
"episode_seed": 170117,
|
| 117 |
+
"success": false,
|
| 118 |
+
"steps": 4,
|
| 119 |
+
"first_reveal_step": 1,
|
| 120 |
+
"first_retrieve_step": null,
|
| 121 |
+
"episode_disturbance": 0.25
|
| 122 |
+
},
|
| 123 |
+
{
|
| 124 |
+
"episode_seed": 170121,
|
| 125 |
+
"success": false,
|
| 126 |
+
"steps": 4,
|
| 127 |
+
"first_reveal_step": 1,
|
| 128 |
+
"first_retrieve_step": null,
|
| 129 |
+
"episode_disturbance": 0.25
|
| 130 |
+
},
|
| 131 |
+
{
|
| 132 |
+
"episode_seed": 170124,
|
| 133 |
+
"success": false,
|
| 134 |
+
"steps": 4,
|
| 135 |
+
"first_reveal_step": 1,
|
| 136 |
+
"first_retrieve_step": null,
|
| 137 |
+
"episode_disturbance": 0.25
|
| 138 |
+
},
|
| 139 |
+
{
|
| 140 |
+
"episode_seed": 170125,
|
| 141 |
+
"success": false,
|
| 142 |
+
"steps": 4,
|
| 143 |
+
"first_reveal_step": 1,
|
| 144 |
+
"first_retrieve_step": null,
|
| 145 |
+
"episode_disturbance": 0.0
|
| 146 |
+
},
|
| 147 |
+
{
|
| 148 |
+
"episode_seed": 170129,
|
| 149 |
+
"success": false,
|
| 150 |
+
"steps": 4,
|
| 151 |
+
"first_reveal_step": 1,
|
| 152 |
+
"first_retrieve_step": null,
|
| 153 |
+
"episode_disturbance": 0.0
|
| 154 |
+
},
|
| 155 |
+
{
|
| 156 |
+
"episode_seed": 170131,
|
| 157 |
+
"success": false,
|
| 158 |
+
"steps": 4,
|
| 159 |
+
"first_reveal_step": 1,
|
| 160 |
+
"first_retrieve_step": null,
|
| 161 |
+
"episode_disturbance": 0.0
|
| 162 |
+
},
|
| 163 |
+
{
|
| 164 |
+
"episode_seed": 170137,
|
| 165 |
+
"success": false,
|
| 166 |
+
"steps": 4,
|
| 167 |
+
"first_reveal_step": 1,
|
| 168 |
+
"first_retrieve_step": null,
|
| 169 |
+
"episode_disturbance": 0.25
|
| 170 |
+
},
|
| 171 |
+
{
|
| 172 |
+
"episode_seed": 170138,
|
| 173 |
+
"success": false,
|
| 174 |
+
"steps": 4,
|
| 175 |
+
"first_reveal_step": 1,
|
| 176 |
+
"first_retrieve_step": null,
|
| 177 |
+
"episode_disturbance": 0.25
|
| 178 |
+
},
|
| 179 |
+
{
|
| 180 |
+
"episode_seed": 170139,
|
| 181 |
+
"success": false,
|
| 182 |
+
"steps": 4,
|
| 183 |
+
"first_reveal_step": 1,
|
| 184 |
+
"first_retrieve_step": null,
|
| 185 |
+
"episode_disturbance": 0.25
|
| 186 |
+
},
|
| 187 |
+
{
|
| 188 |
+
"episode_seed": 170140,
|
| 189 |
+
"success": false,
|
| 190 |
+
"steps": 4,
|
| 191 |
+
"first_reveal_step": 1,
|
| 192 |
+
"first_retrieve_step": null,
|
| 193 |
+
"episode_disturbance": 0.25
|
| 194 |
+
},
|
| 195 |
+
{
|
| 196 |
+
"episode_seed": 170145,
|
| 197 |
+
"success": false,
|
| 198 |
+
"steps": 4,
|
| 199 |
+
"first_reveal_step": 1,
|
| 200 |
+
"first_retrieve_step": null,
|
| 201 |
+
"episode_disturbance": 0.0
|
| 202 |
+
},
|
| 203 |
+
{
|
| 204 |
+
"episode_seed": 170150,
|
| 205 |
+
"success": false,
|
| 206 |
+
"steps": 4,
|
| 207 |
+
"first_reveal_step": 1,
|
| 208 |
+
"first_retrieve_step": null,
|
| 209 |
+
"episode_disturbance": 0.25
|
| 210 |
+
},
|
| 211 |
+
{
|
| 212 |
+
"episode_seed": 170151,
|
| 213 |
+
"success": false,
|
| 214 |
+
"steps": 4,
|
| 215 |
+
"first_reveal_step": 1,
|
| 216 |
+
"first_retrieve_step": null,
|
| 217 |
+
"episode_disturbance": 0.0
|
| 218 |
+
},
|
| 219 |
+
{
|
| 220 |
+
"episode_seed": 170153,
|
| 221 |
+
"success": false,
|
| 222 |
+
"steps": 4,
|
| 223 |
+
"first_reveal_step": 1,
|
| 224 |
+
"first_retrieve_step": null,
|
| 225 |
+
"episode_disturbance": 0.25
|
| 226 |
+
},
|
| 227 |
+
{
|
| 228 |
+
"episode_seed": 170154,
|
| 229 |
+
"success": false,
|
| 230 |
+
"steps": 4,
|
| 231 |
+
"first_reveal_step": 1,
|
| 232 |
+
"first_retrieve_step": null,
|
| 233 |
+
"episode_disturbance": 0.25
|
| 234 |
+
},
|
| 235 |
+
{
|
| 236 |
+
"episode_seed": 170155,
|
| 237 |
+
"success": false,
|
| 238 |
+
"steps": 4,
|
| 239 |
+
"first_reveal_step": 1,
|
| 240 |
+
"first_retrieve_step": null,
|
| 241 |
+
"episode_disturbance": 0.25
|
| 242 |
+
},
|
| 243 |
+
{
|
| 244 |
+
"episode_seed": 170166,
|
| 245 |
+
"success": false,
|
| 246 |
+
"steps": 4,
|
| 247 |
+
"first_reveal_step": 1,
|
| 248 |
+
"first_retrieve_step": null,
|
| 249 |
+
"episode_disturbance": 0.0
|
| 250 |
+
},
|
| 251 |
+
{
|
| 252 |
+
"episode_seed": 170171,
|
| 253 |
+
"success": false,
|
| 254 |
+
"steps": 4,
|
| 255 |
+
"first_reveal_step": 1,
|
| 256 |
+
"first_retrieve_step": null,
|
| 257 |
+
"episode_disturbance": 0.25
|
| 258 |
+
},
|
| 259 |
+
{
|
| 260 |
+
"episode_seed": 170173,
|
| 261 |
+
"success": false,
|
| 262 |
+
"steps": 4,
|
| 263 |
+
"first_reveal_step": 1,
|
| 264 |
+
"first_retrieve_step": null,
|
| 265 |
+
"episode_disturbance": 0.0
|
| 266 |
+
},
|
| 267 |
+
{
|
| 268 |
+
"episode_seed": 170175,
|
| 269 |
+
"success": false,
|
| 270 |
+
"steps": 4,
|
| 271 |
+
"first_reveal_step": 1,
|
| 272 |
+
"first_retrieve_step": null,
|
| 273 |
+
"episode_disturbance": 0.0
|
| 274 |
+
},
|
| 275 |
+
{
|
| 276 |
+
"episode_seed": 170177,
|
| 277 |
+
"success": false,
|
| 278 |
+
"steps": 4,
|
| 279 |
+
"first_reveal_step": 1,
|
| 280 |
+
"first_retrieve_step": null,
|
| 281 |
+
"episode_disturbance": 0.0
|
| 282 |
+
},
|
| 283 |
+
{
|
| 284 |
+
"episode_seed": 170180,
|
| 285 |
+
"success": false,
|
| 286 |
+
"steps": 4,
|
| 287 |
+
"first_reveal_step": 1,
|
| 288 |
+
"first_retrieve_step": null,
|
| 289 |
+
"episode_disturbance": 0.25
|
| 290 |
+
},
|
| 291 |
+
{
|
| 292 |
+
"episode_seed": 170181,
|
| 293 |
+
"success": false,
|
| 294 |
+
"steps": 4,
|
| 295 |
+
"first_reveal_step": 1,
|
| 296 |
+
"first_retrieve_step": null,
|
| 297 |
+
"episode_disturbance": 0.25
|
| 298 |
+
},
|
| 299 |
+
{
|
| 300 |
+
"episode_seed": 170184,
|
| 301 |
+
"success": true,
|
| 302 |
+
"steps": 2,
|
| 303 |
+
"first_reveal_step": 1,
|
| 304 |
+
"first_retrieve_step": null,
|
| 305 |
+
"episode_disturbance": 0.5
|
| 306 |
+
},
|
| 307 |
+
{
|
| 308 |
+
"episode_seed": 170185,
|
| 309 |
+
"success": false,
|
| 310 |
+
"steps": 4,
|
| 311 |
+
"first_reveal_step": 1,
|
| 312 |
+
"first_retrieve_step": null,
|
| 313 |
+
"episode_disturbance": 0.25
|
| 314 |
+
},
|
| 315 |
+
{
|
| 316 |
+
"episode_seed": 170186,
|
| 317 |
+
"success": false,
|
| 318 |
+
"steps": 4,
|
| 319 |
+
"first_reveal_step": 1,
|
| 320 |
+
"first_retrieve_step": null,
|
| 321 |
+
"episode_disturbance": 0.0
|
| 322 |
+
},
|
| 323 |
+
{
|
| 324 |
+
"episode_seed": 170198,
|
| 325 |
+
"success": false,
|
| 326 |
+
"steps": 4,
|
| 327 |
+
"first_reveal_step": 1,
|
| 328 |
+
"first_retrieve_step": null,
|
| 329 |
+
"episode_disturbance": 0.0
|
| 330 |
+
},
|
| 331 |
+
{
|
| 332 |
+
"episode_seed": 170200,
|
| 333 |
+
"success": false,
|
| 334 |
+
"steps": 4,
|
| 335 |
+
"first_reveal_step": 1,
|
| 336 |
+
"first_retrieve_step": null,
|
| 337 |
+
"episode_disturbance": 0.0
|
| 338 |
+
},
|
| 339 |
+
{
|
| 340 |
+
"episode_seed": 170205,
|
| 341 |
+
"success": false,
|
| 342 |
+
"steps": 4,
|
| 343 |
+
"first_reveal_step": 1,
|
| 344 |
+
"first_retrieve_step": null,
|
| 345 |
+
"episode_disturbance": 0.0
|
| 346 |
+
},
|
| 347 |
+
{
|
| 348 |
+
"episode_seed": 170207,
|
| 349 |
+
"success": false,
|
| 350 |
+
"steps": 4,
|
| 351 |
+
"first_reveal_step": 1,
|
| 352 |
+
"first_retrieve_step": null,
|
| 353 |
+
"episode_disturbance": 0.25
|
| 354 |
+
},
|
| 355 |
+
{
|
| 356 |
+
"episode_seed": 170208,
|
| 357 |
+
"success": false,
|
| 358 |
+
"steps": 4,
|
| 359 |
+
"first_reveal_step": 1,
|
| 360 |
+
"first_retrieve_step": null,
|
| 361 |
+
"episode_disturbance": 0.25
|
| 362 |
+
},
|
| 363 |
+
{
|
| 364 |
+
"episode_seed": 170212,
|
| 365 |
+
"success": false,
|
| 366 |
+
"steps": 4,
|
| 367 |
+
"first_reveal_step": 1,
|
| 368 |
+
"first_retrieve_step": null,
|
| 369 |
+
"episode_disturbance": 0.25
|
| 370 |
+
},
|
| 371 |
+
{
|
| 372 |
+
"episode_seed": 170214,
|
| 373 |
+
"success": false,
|
| 374 |
+
"steps": 4,
|
| 375 |
+
"first_reveal_step": 1,
|
| 376 |
+
"first_retrieve_step": null,
|
| 377 |
+
"episode_disturbance": 0.0
|
| 378 |
+
},
|
| 379 |
+
{
|
| 380 |
+
"episode_seed": 170217,
|
| 381 |
+
"success": false,
|
| 382 |
+
"steps": 4,
|
| 383 |
+
"first_reveal_step": 1,
|
| 384 |
+
"first_retrieve_step": null,
|
| 385 |
+
"episode_disturbance": 0.0
|
| 386 |
+
},
|
| 387 |
+
{
|
| 388 |
+
"episode_seed": 170223,
|
| 389 |
+
"success": false,
|
| 390 |
+
"steps": 4,
|
| 391 |
+
"first_reveal_step": 1,
|
| 392 |
+
"first_retrieve_step": null,
|
| 393 |
+
"episode_disturbance": 0.1429806500673294
|
| 394 |
+
},
|
| 395 |
+
{
|
| 396 |
+
"episode_seed": 170226,
|
| 397 |
+
"success": false,
|
| 398 |
+
"steps": 4,
|
| 399 |
+
"first_reveal_step": 1,
|
| 400 |
+
"first_retrieve_step": null,
|
| 401 |
+
"episode_disturbance": 0.25
|
| 402 |
+
},
|
| 403 |
+
{
|
| 404 |
+
"episode_seed": 170228,
|
| 405 |
+
"success": false,
|
| 406 |
+
"steps": 4,
|
| 407 |
+
"first_reveal_step": 1,
|
| 408 |
+
"first_retrieve_step": null,
|
| 409 |
+
"episode_disturbance": 0.0
|
| 410 |
+
},
|
| 411 |
+
{
|
| 412 |
+
"episode_seed": 170229,
|
| 413 |
+
"success": false,
|
| 414 |
+
"steps": 4,
|
| 415 |
+
"first_reveal_step": 1,
|
| 416 |
+
"first_retrieve_step": null,
|
| 417 |
+
"episode_disturbance": 0.0
|
| 418 |
+
},
|
| 419 |
+
{
|
| 420 |
+
"episode_seed": 170234,
|
| 421 |
+
"success": false,
|
| 422 |
+
"steps": 4,
|
| 423 |
+
"first_reveal_step": 1,
|
| 424 |
+
"first_retrieve_step": null,
|
| 425 |
+
"episode_disturbance": 0.0
|
| 426 |
+
},
|
| 427 |
+
{
|
| 428 |
+
"episode_seed": 170237,
|
| 429 |
+
"success": false,
|
| 430 |
+
"steps": 4,
|
| 431 |
+
"first_reveal_step": 1,
|
| 432 |
+
"first_retrieve_step": null,
|
| 433 |
+
"episode_disturbance": 0.0
|
| 434 |
+
},
|
| 435 |
+
{
|
| 436 |
+
"episode_seed": 170239,
|
| 437 |
+
"success": false,
|
| 438 |
+
"steps": 4,
|
| 439 |
+
"first_reveal_step": 1,
|
| 440 |
+
"first_retrieve_step": null,
|
| 441 |
+
"episode_disturbance": 0.25
|
| 442 |
+
},
|
| 443 |
+
{
|
| 444 |
+
"episode_seed": 170241,
|
| 445 |
+
"success": false,
|
| 446 |
+
"steps": 4,
|
| 447 |
+
"first_reveal_step": 1,
|
| 448 |
+
"first_retrieve_step": null,
|
| 449 |
+
"episode_disturbance": 0.0
|
| 450 |
+
},
|
| 451 |
+
{
|
| 452 |
+
"episode_seed": 170242,
|
| 453 |
+
"success": false,
|
| 454 |
+
"steps": 4,
|
| 455 |
+
"first_reveal_step": 1,
|
| 456 |
+
"first_retrieve_step": null,
|
| 457 |
+
"episode_disturbance": 0.0
|
| 458 |
+
},
|
| 459 |
+
{
|
| 460 |
+
"episode_seed": 170243,
|
| 461 |
+
"success": false,
|
| 462 |
+
"steps": 4,
|
| 463 |
+
"first_reveal_step": 1,
|
| 464 |
+
"first_retrieve_step": null,
|
| 465 |
+
"episode_disturbance": 0.25
|
| 466 |
+
}
|
| 467 |
+
],
|
| 468 |
+
"eval_protocol": {
|
| 469 |
+
"track_id": "cloth_track",
|
| 470 |
+
"suite": "maniskill3",
|
| 471 |
+
"benchmark_task": "PutSpoonUnderClothRetrievalProxy-v1",
|
| 472 |
+
"role": "target",
|
| 473 |
+
"eval_mode": "adapter_active_ft",
|
| 474 |
+
"seed": 17,
|
| 475 |
+
"episodes": 50,
|
| 476 |
+
"resolution": 224,
|
| 477 |
+
"cameras": [
|
| 478 |
+
"front",
|
| 479 |
+
"left",
|
| 480 |
+
"right"
|
| 481 |
+
],
|
| 482 |
+
"observation_stack": "rgb_triplicate_zero_depth",
|
| 483 |
+
"action_horizon": 8,
|
| 484 |
+
"action_space": "widowx_delta_pose",
|
| 485 |
+
"same_test_episodes": true
|
| 486 |
+
},
|
| 487 |
+
"proxy_notes": "Public ManiSkill bridge scene with custom retrieval initialization. The spoon is placed under the cloth region and must be revealed and extracted to the open side of the table.",
|
| 488 |
+
"train_spec": {
|
| 489 |
+
"track_id": "cloth_track",
|
| 490 |
+
"suite": "maniskill3",
|
| 491 |
+
"benchmark_task": "PutSpoonUnderClothRetrievalProxy-v1",
|
| 492 |
+
"model_variant": "adapter_active_ft",
|
| 493 |
+
"seed": 29,
|
| 494 |
+
"train_demos": 32,
|
| 495 |
+
"val_demos": 8,
|
| 496 |
+
"init_checkpoint_group": "/workspace/workspace/VLAarchtests2/VLAarchtests/artifacts/outputs/r3d_handoff_phase/proxy_interaction_r3d_stage3_clip_rgbd_handoff_compact_phase_seed17/checkpoint_best.pt",
|
| 497 |
+
"optimizer": "adamw",
|
| 498 |
+
"learning_rate": 0.0001,
|
| 499 |
+
"lr_schedule": "constant",
|
| 500 |
+
"batch_size": 4,
|
| 501 |
+
"augmentations": "none",
|
| 502 |
+
"early_stopping_metric": "val_total",
|
| 503 |
+
"max_gradient_steps": 174,
|
| 504 |
+
"unfreeze_scope": "fusion_memory_decoder",
|
| 505 |
+
"dataset_split_id": "cloth_bridge_smoke_v1_seed17",
|
| 506 |
+
"same_data_policy": true,
|
| 507 |
+
"same_init_policy": true
|
| 508 |
+
}
|
| 509 |
+
}
|
reports/maniskill_cloth_bridge_smoke_v1/adapter_noop_seed17.json
ADDED
|
@@ -0,0 +1,488 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
{
|
| 2 |
+
"track_id": "cloth_track",
|
| 3 |
+
"suite": "maniskill3",
|
| 4 |
+
"benchmark_task": "PutSpoonUnderClothRetrievalProxy-v1",
|
| 5 |
+
"role": "target",
|
| 6 |
+
"adapter_mode": "adapter_noop",
|
| 7 |
+
"episodes": 50,
|
| 8 |
+
"successes": [
|
| 9 |
+
0,
|
| 10 |
+
1,
|
| 11 |
+
0,
|
| 12 |
+
0,
|
| 13 |
+
0,
|
| 14 |
+
0,
|
| 15 |
+
0,
|
| 16 |
+
0,
|
| 17 |
+
0,
|
| 18 |
+
0,
|
| 19 |
+
0,
|
| 20 |
+
0,
|
| 21 |
+
0,
|
| 22 |
+
0,
|
| 23 |
+
0,
|
| 24 |
+
0,
|
| 25 |
+
0,
|
| 26 |
+
0,
|
| 27 |
+
0,
|
| 28 |
+
0,
|
| 29 |
+
0,
|
| 30 |
+
0,
|
| 31 |
+
0,
|
| 32 |
+
0,
|
| 33 |
+
0,
|
| 34 |
+
0,
|
| 35 |
+
0,
|
| 36 |
+
0,
|
| 37 |
+
0,
|
| 38 |
+
1,
|
| 39 |
+
0,
|
| 40 |
+
0,
|
| 41 |
+
0,
|
| 42 |
+
0,
|
| 43 |
+
0,
|
| 44 |
+
0,
|
| 45 |
+
0,
|
| 46 |
+
0,
|
| 47 |
+
0,
|
| 48 |
+
0,
|
| 49 |
+
0,
|
| 50 |
+
0,
|
| 51 |
+
0,
|
| 52 |
+
0,
|
| 53 |
+
0,
|
| 54 |
+
0,
|
| 55 |
+
0,
|
| 56 |
+
0,
|
| 57 |
+
0,
|
| 58 |
+
0
|
| 59 |
+
],
|
| 60 |
+
"success_rate": 0.04,
|
| 61 |
+
"intervention_rate": 0.0,
|
| 62 |
+
"non_base_selection_rate": 0.0,
|
| 63 |
+
"steps_to_first_reveal_or_access": 1.0,
|
| 64 |
+
"steps_to_retrieve": 4.0,
|
| 65 |
+
"disturbance_proxy": 0.1478596130013466,
|
| 66 |
+
"episode_records": [
|
| 67 |
+
{
|
| 68 |
+
"episode_seed": 170104,
|
| 69 |
+
"success": false,
|
| 70 |
+
"steps": 4,
|
| 71 |
+
"first_reveal_step": 1,
|
| 72 |
+
"first_retrieve_step": null,
|
| 73 |
+
"episode_disturbance": 0.0
|
| 74 |
+
},
|
| 75 |
+
{
|
| 76 |
+
"episode_seed": 170105,
|
| 77 |
+
"success": true,
|
| 78 |
+
"steps": 1,
|
| 79 |
+
"first_reveal_step": 1,
|
| 80 |
+
"first_retrieve_step": null,
|
| 81 |
+
"episode_disturbance": 1.0
|
| 82 |
+
},
|
| 83 |
+
{
|
| 84 |
+
"episode_seed": 170106,
|
| 85 |
+
"success": false,
|
| 86 |
+
"steps": 4,
|
| 87 |
+
"first_reveal_step": 1,
|
| 88 |
+
"first_retrieve_step": null,
|
| 89 |
+
"episode_disturbance": 0.25
|
| 90 |
+
},
|
| 91 |
+
{
|
| 92 |
+
"episode_seed": 170107,
|
| 93 |
+
"success": false,
|
| 94 |
+
"steps": 4,
|
| 95 |
+
"first_reveal_step": 1,
|
| 96 |
+
"first_retrieve_step": null,
|
| 97 |
+
"episode_disturbance": 0.0
|
| 98 |
+
},
|
| 99 |
+
{
|
| 100 |
+
"episode_seed": 170109,
|
| 101 |
+
"success": false,
|
| 102 |
+
"steps": 4,
|
| 103 |
+
"first_reveal_step": 1,
|
| 104 |
+
"first_retrieve_step": null,
|
| 105 |
+
"episode_disturbance": 0.25
|
| 106 |
+
},
|
| 107 |
+
{
|
| 108 |
+
"episode_seed": 170113,
|
| 109 |
+
"success": false,
|
| 110 |
+
"steps": 4,
|
| 111 |
+
"first_reveal_step": 1,
|
| 112 |
+
"first_retrieve_step": null,
|
| 113 |
+
"episode_disturbance": 0.0
|
| 114 |
+
},
|
| 115 |
+
{
|
| 116 |
+
"episode_seed": 170117,
|
| 117 |
+
"success": false,
|
| 118 |
+
"steps": 4,
|
| 119 |
+
"first_reveal_step": 1,
|
| 120 |
+
"first_retrieve_step": null,
|
| 121 |
+
"episode_disturbance": 0.25
|
| 122 |
+
},
|
| 123 |
+
{
|
| 124 |
+
"episode_seed": 170121,
|
| 125 |
+
"success": false,
|
| 126 |
+
"steps": 4,
|
| 127 |
+
"first_reveal_step": 1,
|
| 128 |
+
"first_retrieve_step": null,
|
| 129 |
+
"episode_disturbance": 0.25
|
| 130 |
+
},
|
| 131 |
+
{
|
| 132 |
+
"episode_seed": 170124,
|
| 133 |
+
"success": false,
|
| 134 |
+
"steps": 4,
|
| 135 |
+
"first_reveal_step": 1,
|
| 136 |
+
"first_retrieve_step": null,
|
| 137 |
+
"episode_disturbance": 0.25
|
| 138 |
+
},
|
| 139 |
+
{
|
| 140 |
+
"episode_seed": 170125,
|
| 141 |
+
"success": false,
|
| 142 |
+
"steps": 4,
|
| 143 |
+
"first_reveal_step": 1,
|
| 144 |
+
"first_retrieve_step": null,
|
| 145 |
+
"episode_disturbance": 0.0
|
| 146 |
+
},
|
| 147 |
+
{
|
| 148 |
+
"episode_seed": 170129,
|
| 149 |
+
"success": false,
|
| 150 |
+
"steps": 4,
|
| 151 |
+
"first_reveal_step": 1,
|
| 152 |
+
"first_retrieve_step": null,
|
| 153 |
+
"episode_disturbance": 0.0
|
| 154 |
+
},
|
| 155 |
+
{
|
| 156 |
+
"episode_seed": 170131,
|
| 157 |
+
"success": false,
|
| 158 |
+
"steps": 4,
|
| 159 |
+
"first_reveal_step": 1,
|
| 160 |
+
"first_retrieve_step": null,
|
| 161 |
+
"episode_disturbance": 0.0
|
| 162 |
+
},
|
| 163 |
+
{
|
| 164 |
+
"episode_seed": 170137,
|
| 165 |
+
"success": false,
|
| 166 |
+
"steps": 4,
|
| 167 |
+
"first_reveal_step": 1,
|
| 168 |
+
"first_retrieve_step": null,
|
| 169 |
+
"episode_disturbance": 0.25
|
| 170 |
+
},
|
| 171 |
+
{
|
| 172 |
+
"episode_seed": 170138,
|
| 173 |
+
"success": false,
|
| 174 |
+
"steps": 4,
|
| 175 |
+
"first_reveal_step": 1,
|
| 176 |
+
"first_retrieve_step": null,
|
| 177 |
+
"episode_disturbance": 0.25
|
| 178 |
+
},
|
| 179 |
+
{
|
| 180 |
+
"episode_seed": 170139,
|
| 181 |
+
"success": false,
|
| 182 |
+
"steps": 4,
|
| 183 |
+
"first_reveal_step": 1,
|
| 184 |
+
"first_retrieve_step": null,
|
| 185 |
+
"episode_disturbance": 0.25
|
| 186 |
+
},
|
| 187 |
+
{
|
| 188 |
+
"episode_seed": 170140,
|
| 189 |
+
"success": false,
|
| 190 |
+
"steps": 4,
|
| 191 |
+
"first_reveal_step": 1,
|
| 192 |
+
"first_retrieve_step": null,
|
| 193 |
+
"episode_disturbance": 0.25
|
| 194 |
+
},
|
| 195 |
+
{
|
| 196 |
+
"episode_seed": 170145,
|
| 197 |
+
"success": false,
|
| 198 |
+
"steps": 4,
|
| 199 |
+
"first_reveal_step": 1,
|
| 200 |
+
"first_retrieve_step": null,
|
| 201 |
+
"episode_disturbance": 0.0
|
| 202 |
+
},
|
| 203 |
+
{
|
| 204 |
+
"episode_seed": 170150,
|
| 205 |
+
"success": false,
|
| 206 |
+
"steps": 4,
|
| 207 |
+
"first_reveal_step": 1,
|
| 208 |
+
"first_retrieve_step": null,
|
| 209 |
+
"episode_disturbance": 0.25
|
| 210 |
+
},
|
| 211 |
+
{
|
| 212 |
+
"episode_seed": 170151,
|
| 213 |
+
"success": false,
|
| 214 |
+
"steps": 4,
|
| 215 |
+
"first_reveal_step": 1,
|
| 216 |
+
"first_retrieve_step": null,
|
| 217 |
+
"episode_disturbance": 0.0
|
| 218 |
+
},
|
| 219 |
+
{
|
| 220 |
+
"episode_seed": 170153,
|
| 221 |
+
"success": false,
|
| 222 |
+
"steps": 4,
|
| 223 |
+
"first_reveal_step": 1,
|
| 224 |
+
"first_retrieve_step": null,
|
| 225 |
+
"episode_disturbance": 0.25
|
| 226 |
+
},
|
| 227 |
+
{
|
| 228 |
+
"episode_seed": 170154,
|
| 229 |
+
"success": false,
|
| 230 |
+
"steps": 4,
|
| 231 |
+
"first_reveal_step": 1,
|
| 232 |
+
"first_retrieve_step": null,
|
| 233 |
+
"episode_disturbance": 0.25
|
| 234 |
+
},
|
| 235 |
+
{
|
| 236 |
+
"episode_seed": 170155,
|
| 237 |
+
"success": false,
|
| 238 |
+
"steps": 4,
|
| 239 |
+
"first_reveal_step": 1,
|
| 240 |
+
"first_retrieve_step": null,
|
| 241 |
+
"episode_disturbance": 0.25
|
| 242 |
+
},
|
| 243 |
+
{
|
| 244 |
+
"episode_seed": 170166,
|
| 245 |
+
"success": false,
|
| 246 |
+
"steps": 4,
|
| 247 |
+
"first_reveal_step": 1,
|
| 248 |
+
"first_retrieve_step": null,
|
| 249 |
+
"episode_disturbance": 0.0
|
| 250 |
+
},
|
| 251 |
+
{
|
| 252 |
+
"episode_seed": 170171,
|
| 253 |
+
"success": false,
|
| 254 |
+
"steps": 4,
|
| 255 |
+
"first_reveal_step": 1,
|
| 256 |
+
"first_retrieve_step": null,
|
| 257 |
+
"episode_disturbance": 0.25
|
| 258 |
+
},
|
| 259 |
+
{
|
| 260 |
+
"episode_seed": 170173,
|
| 261 |
+
"success": false,
|
| 262 |
+
"steps": 4,
|
| 263 |
+
"first_reveal_step": 1,
|
| 264 |
+
"first_retrieve_step": null,
|
| 265 |
+
"episode_disturbance": 0.0
|
| 266 |
+
},
|
| 267 |
+
{
|
| 268 |
+
"episode_seed": 170175,
|
| 269 |
+
"success": false,
|
| 270 |
+
"steps": 4,
|
| 271 |
+
"first_reveal_step": 1,
|
| 272 |
+
"first_retrieve_step": null,
|
| 273 |
+
"episode_disturbance": 0.0
|
| 274 |
+
},
|
| 275 |
+
{
|
| 276 |
+
"episode_seed": 170177,
|
| 277 |
+
"success": false,
|
| 278 |
+
"steps": 4,
|
| 279 |
+
"first_reveal_step": 1,
|
| 280 |
+
"first_retrieve_step": null,
|
| 281 |
+
"episode_disturbance": 0.0
|
| 282 |
+
},
|
| 283 |
+
{
|
| 284 |
+
"episode_seed": 170180,
|
| 285 |
+
"success": false,
|
| 286 |
+
"steps": 4,
|
| 287 |
+
"first_reveal_step": 1,
|
| 288 |
+
"first_retrieve_step": null,
|
| 289 |
+
"episode_disturbance": 0.25
|
| 290 |
+
},
|
| 291 |
+
{
|
| 292 |
+
"episode_seed": 170181,
|
| 293 |
+
"success": false,
|
| 294 |
+
"steps": 4,
|
| 295 |
+
"first_reveal_step": 1,
|
| 296 |
+
"first_retrieve_step": null,
|
| 297 |
+
"episode_disturbance": 0.25
|
| 298 |
+
},
|
| 299 |
+
{
|
| 300 |
+
"episode_seed": 170184,
|
| 301 |
+
"success": true,
|
| 302 |
+
"steps": 2,
|
| 303 |
+
"first_reveal_step": 1,
|
| 304 |
+
"first_retrieve_step": null,
|
| 305 |
+
"episode_disturbance": 0.5
|
| 306 |
+
},
|
| 307 |
+
{
|
| 308 |
+
"episode_seed": 170185,
|
| 309 |
+
"success": false,
|
| 310 |
+
"steps": 4,
|
| 311 |
+
"first_reveal_step": 1,
|
| 312 |
+
"first_retrieve_step": null,
|
| 313 |
+
"episode_disturbance": 0.25
|
| 314 |
+
},
|
| 315 |
+
{
|
| 316 |
+
"episode_seed": 170186,
|
| 317 |
+
"success": false,
|
| 318 |
+
"steps": 4,
|
| 319 |
+
"first_reveal_step": 1,
|
| 320 |
+
"first_retrieve_step": null,
|
| 321 |
+
"episode_disturbance": 0.0
|
| 322 |
+
},
|
| 323 |
+
{
|
| 324 |
+
"episode_seed": 170198,
|
| 325 |
+
"success": false,
|
| 326 |
+
"steps": 4,
|
| 327 |
+
"first_reveal_step": 1,
|
| 328 |
+
"first_retrieve_step": null,
|
| 329 |
+
"episode_disturbance": 0.0
|
| 330 |
+
},
|
| 331 |
+
{
|
| 332 |
+
"episode_seed": 170200,
|
| 333 |
+
"success": false,
|
| 334 |
+
"steps": 4,
|
| 335 |
+
"first_reveal_step": 1,
|
| 336 |
+
"first_retrieve_step": null,
|
| 337 |
+
"episode_disturbance": 0.0
|
| 338 |
+
},
|
| 339 |
+
{
|
| 340 |
+
"episode_seed": 170205,
|
| 341 |
+
"success": false,
|
| 342 |
+
"steps": 4,
|
| 343 |
+
"first_reveal_step": 1,
|
| 344 |
+
"first_retrieve_step": null,
|
| 345 |
+
"episode_disturbance": 0.0
|
| 346 |
+
},
|
| 347 |
+
{
|
| 348 |
+
"episode_seed": 170207,
|
| 349 |
+
"success": false,
|
| 350 |
+
"steps": 4,
|
| 351 |
+
"first_reveal_step": 1,
|
| 352 |
+
"first_retrieve_step": null,
|
| 353 |
+
"episode_disturbance": 0.25
|
| 354 |
+
},
|
| 355 |
+
{
|
| 356 |
+
"episode_seed": 170208,
|
| 357 |
+
"success": false,
|
| 358 |
+
"steps": 4,
|
| 359 |
+
"first_reveal_step": 1,
|
| 360 |
+
"first_retrieve_step": null,
|
| 361 |
+
"episode_disturbance": 0.25
|
| 362 |
+
},
|
| 363 |
+
{
|
| 364 |
+
"episode_seed": 170212,
|
| 365 |
+
"success": false,
|
| 366 |
+
"steps": 4,
|
| 367 |
+
"first_reveal_step": 1,
|
| 368 |
+
"first_retrieve_step": null,
|
| 369 |
+
"episode_disturbance": 0.25
|
| 370 |
+
},
|
| 371 |
+
{
|
| 372 |
+
"episode_seed": 170214,
|
| 373 |
+
"success": false,
|
| 374 |
+
"steps": 4,
|
| 375 |
+
"first_reveal_step": 1,
|
| 376 |
+
"first_retrieve_step": null,
|
| 377 |
+
"episode_disturbance": 0.0
|
| 378 |
+
},
|
| 379 |
+
{
|
| 380 |
+
"episode_seed": 170217,
|
| 381 |
+
"success": false,
|
| 382 |
+
"steps": 4,
|
| 383 |
+
"first_reveal_step": 1,
|
| 384 |
+
"first_retrieve_step": null,
|
| 385 |
+
"episode_disturbance": 0.0
|
| 386 |
+
},
|
| 387 |
+
{
|
| 388 |
+
"episode_seed": 170223,
|
| 389 |
+
"success": false,
|
| 390 |
+
"steps": 4,
|
| 391 |
+
"first_reveal_step": 1,
|
| 392 |
+
"first_retrieve_step": null,
|
| 393 |
+
"episode_disturbance": 0.1429806500673294
|
| 394 |
+
},
|
| 395 |
+
{
|
| 396 |
+
"episode_seed": 170226,
|
| 397 |
+
"success": false,
|
| 398 |
+
"steps": 4,
|
| 399 |
+
"first_reveal_step": 1,
|
| 400 |
+
"first_retrieve_step": null,
|
| 401 |
+
"episode_disturbance": 0.25
|
| 402 |
+
},
|
| 403 |
+
{
|
| 404 |
+
"episode_seed": 170228,
|
| 405 |
+
"success": false,
|
| 406 |
+
"steps": 4,
|
| 407 |
+
"first_reveal_step": 1,
|
| 408 |
+
"first_retrieve_step": null,
|
| 409 |
+
"episode_disturbance": 0.0
|
| 410 |
+
},
|
| 411 |
+
{
|
| 412 |
+
"episode_seed": 170229,
|
| 413 |
+
"success": false,
|
| 414 |
+
"steps": 4,
|
| 415 |
+
"first_reveal_step": 1,
|
| 416 |
+
"first_retrieve_step": null,
|
| 417 |
+
"episode_disturbance": 0.0
|
| 418 |
+
},
|
| 419 |
+
{
|
| 420 |
+
"episode_seed": 170234,
|
| 421 |
+
"success": false,
|
| 422 |
+
"steps": 4,
|
| 423 |
+
"first_reveal_step": 1,
|
| 424 |
+
"first_retrieve_step": null,
|
| 425 |
+
"episode_disturbance": 0.0
|
| 426 |
+
},
|
| 427 |
+
{
|
| 428 |
+
"episode_seed": 170237,
|
| 429 |
+
"success": false,
|
| 430 |
+
"steps": 4,
|
| 431 |
+
"first_reveal_step": 1,
|
| 432 |
+
"first_retrieve_step": null,
|
| 433 |
+
"episode_disturbance": 0.0
|
| 434 |
+
},
|
| 435 |
+
{
|
| 436 |
+
"episode_seed": 170239,
|
| 437 |
+
"success": false,
|
| 438 |
+
"steps": 4,
|
| 439 |
+
"first_reveal_step": 1,
|
| 440 |
+
"first_retrieve_step": null,
|
| 441 |
+
"episode_disturbance": 0.25
|
| 442 |
+
},
|
| 443 |
+
{
|
| 444 |
+
"episode_seed": 170241,
|
| 445 |
+
"success": false,
|
| 446 |
+
"steps": 4,
|
| 447 |
+
"first_reveal_step": 1,
|
| 448 |
+
"first_retrieve_step": null,
|
| 449 |
+
"episode_disturbance": 0.0
|
| 450 |
+
},
|
| 451 |
+
{
|
| 452 |
+
"episode_seed": 170242,
|
| 453 |
+
"success": false,
|
| 454 |
+
"steps": 4,
|
| 455 |
+
"first_reveal_step": 1,
|
| 456 |
+
"first_retrieve_step": null,
|
| 457 |
+
"episode_disturbance": 0.0
|
| 458 |
+
},
|
| 459 |
+
{
|
| 460 |
+
"episode_seed": 170243,
|
| 461 |
+
"success": false,
|
| 462 |
+
"steps": 4,
|
| 463 |
+
"first_reveal_step": 1,
|
| 464 |
+
"first_retrieve_step": null,
|
| 465 |
+
"episode_disturbance": 0.25
|
| 466 |
+
}
|
| 467 |
+
],
|
| 468 |
+
"eval_protocol": {
|
| 469 |
+
"track_id": "cloth_track",
|
| 470 |
+
"suite": "maniskill3",
|
| 471 |
+
"benchmark_task": "PutSpoonUnderClothRetrievalProxy-v1",
|
| 472 |
+
"role": "target",
|
| 473 |
+
"eval_mode": "adapter_noop",
|
| 474 |
+
"seed": 17,
|
| 475 |
+
"episodes": 50,
|
| 476 |
+
"resolution": 224,
|
| 477 |
+
"cameras": [
|
| 478 |
+
"front",
|
| 479 |
+
"left",
|
| 480 |
+
"right"
|
| 481 |
+
],
|
| 482 |
+
"observation_stack": "rgb_triplicate_zero_depth",
|
| 483 |
+
"action_horizon": 8,
|
| 484 |
+
"action_space": "widowx_delta_pose",
|
| 485 |
+
"same_test_episodes": true
|
| 486 |
+
},
|
| 487 |
+
"proxy_notes": "Public ManiSkill bridge scene with custom retrieval initialization. The spoon is placed under the cloth region and must be revealed and extracted to the open side of the table."
|
| 488 |
+
}
|
reports/maniskill_cloth_bridge_smoke_v1/adapter_noop_seed23.json
ADDED
|
@@ -0,0 +1,488 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
{
|
| 2 |
+
"track_id": "cloth_track",
|
| 3 |
+
"suite": "maniskill3",
|
| 4 |
+
"benchmark_task": "PutSpoonUnderClothRetrievalProxy-v1",
|
| 5 |
+
"role": "target",
|
| 6 |
+
"adapter_mode": "adapter_noop",
|
| 7 |
+
"episodes": 50,
|
| 8 |
+
"successes": [
|
| 9 |
+
0,
|
| 10 |
+
0,
|
| 11 |
+
0,
|
| 12 |
+
0,
|
| 13 |
+
0,
|
| 14 |
+
0,
|
| 15 |
+
0,
|
| 16 |
+
0,
|
| 17 |
+
0,
|
| 18 |
+
0,
|
| 19 |
+
0,
|
| 20 |
+
0,
|
| 21 |
+
0,
|
| 22 |
+
0,
|
| 23 |
+
0,
|
| 24 |
+
0,
|
| 25 |
+
0,
|
| 26 |
+
0,
|
| 27 |
+
0,
|
| 28 |
+
0,
|
| 29 |
+
0,
|
| 30 |
+
1,
|
| 31 |
+
0,
|
| 32 |
+
0,
|
| 33 |
+
0,
|
| 34 |
+
0,
|
| 35 |
+
0,
|
| 36 |
+
0,
|
| 37 |
+
0,
|
| 38 |
+
0,
|
| 39 |
+
0,
|
| 40 |
+
0,
|
| 41 |
+
0,
|
| 42 |
+
0,
|
| 43 |
+
0,
|
| 44 |
+
0,
|
| 45 |
+
0,
|
| 46 |
+
0,
|
| 47 |
+
0,
|
| 48 |
+
0,
|
| 49 |
+
0,
|
| 50 |
+
0,
|
| 51 |
+
0,
|
| 52 |
+
0,
|
| 53 |
+
0,
|
| 54 |
+
0,
|
| 55 |
+
0,
|
| 56 |
+
0,
|
| 57 |
+
0,
|
| 58 |
+
0
|
| 59 |
+
],
|
| 60 |
+
"success_rate": 0.02,
|
| 61 |
+
"intervention_rate": 0.0,
|
| 62 |
+
"non_base_selection_rate": 0.0,
|
| 63 |
+
"steps_to_first_reveal_or_access": 1.0,
|
| 64 |
+
"steps_to_retrieve": 4.0,
|
| 65 |
+
"disturbance_proxy": 0.12309578397444318,
|
| 66 |
+
"episode_records": [
|
| 67 |
+
{
|
| 68 |
+
"episode_seed": 170104,
|
| 69 |
+
"success": false,
|
| 70 |
+
"steps": 4,
|
| 71 |
+
"first_reveal_step": 1,
|
| 72 |
+
"first_retrieve_step": null,
|
| 73 |
+
"episode_disturbance": 0.25
|
| 74 |
+
},
|
| 75 |
+
{
|
| 76 |
+
"episode_seed": 170105,
|
| 77 |
+
"success": false,
|
| 78 |
+
"steps": 4,
|
| 79 |
+
"first_reveal_step": 1,
|
| 80 |
+
"first_retrieve_step": null,
|
| 81 |
+
"episode_disturbance": 0.0
|
| 82 |
+
},
|
| 83 |
+
{
|
| 84 |
+
"episode_seed": 170106,
|
| 85 |
+
"success": false,
|
| 86 |
+
"steps": 4,
|
| 87 |
+
"first_reveal_step": 1,
|
| 88 |
+
"first_retrieve_step": null,
|
| 89 |
+
"episode_disturbance": 0.25
|
| 90 |
+
},
|
| 91 |
+
{
|
| 92 |
+
"episode_seed": 170107,
|
| 93 |
+
"success": false,
|
| 94 |
+
"steps": 4,
|
| 95 |
+
"first_reveal_step": 1,
|
| 96 |
+
"first_retrieve_step": null,
|
| 97 |
+
"episode_disturbance": 0.12488718117986407
|
| 98 |
+
},
|
| 99 |
+
{
|
| 100 |
+
"episode_seed": 170109,
|
| 101 |
+
"success": false,
|
| 102 |
+
"steps": 4,
|
| 103 |
+
"first_reveal_step": 1,
|
| 104 |
+
"first_retrieve_step": null,
|
| 105 |
+
"episode_disturbance": 0.25
|
| 106 |
+
},
|
| 107 |
+
{
|
| 108 |
+
"episode_seed": 170113,
|
| 109 |
+
"success": false,
|
| 110 |
+
"steps": 4,
|
| 111 |
+
"first_reveal_step": 1,
|
| 112 |
+
"first_retrieve_step": null,
|
| 113 |
+
"episode_disturbance": 0.25
|
| 114 |
+
},
|
| 115 |
+
{
|
| 116 |
+
"episode_seed": 170117,
|
| 117 |
+
"success": false,
|
| 118 |
+
"steps": 4,
|
| 119 |
+
"first_reveal_step": 1,
|
| 120 |
+
"first_retrieve_step": null,
|
| 121 |
+
"episode_disturbance": 0.25
|
| 122 |
+
},
|
| 123 |
+
{
|
| 124 |
+
"episode_seed": 170121,
|
| 125 |
+
"success": false,
|
| 126 |
+
"steps": 4,
|
| 127 |
+
"first_reveal_step": 1,
|
| 128 |
+
"first_retrieve_step": null,
|
| 129 |
+
"episode_disturbance": 0.0
|
| 130 |
+
},
|
| 131 |
+
{
|
| 132 |
+
"episode_seed": 170124,
|
| 133 |
+
"success": false,
|
| 134 |
+
"steps": 4,
|
| 135 |
+
"first_reveal_step": 1,
|
| 136 |
+
"first_retrieve_step": null,
|
| 137 |
+
"episode_disturbance": 0.0
|
| 138 |
+
},
|
| 139 |
+
{
|
| 140 |
+
"episode_seed": 170125,
|
| 141 |
+
"success": false,
|
| 142 |
+
"steps": 4,
|
| 143 |
+
"first_reveal_step": 1,
|
| 144 |
+
"first_retrieve_step": null,
|
| 145 |
+
"episode_disturbance": 0.0
|
| 146 |
+
},
|
| 147 |
+
{
|
| 148 |
+
"episode_seed": 170129,
|
| 149 |
+
"success": false,
|
| 150 |
+
"steps": 4,
|
| 151 |
+
"first_reveal_step": 1,
|
| 152 |
+
"first_retrieve_step": null,
|
| 153 |
+
"episode_disturbance": 0.0
|
| 154 |
+
},
|
| 155 |
+
{
|
| 156 |
+
"episode_seed": 170131,
|
| 157 |
+
"success": false,
|
| 158 |
+
"steps": 4,
|
| 159 |
+
"first_reveal_step": 1,
|
| 160 |
+
"first_retrieve_step": null,
|
| 161 |
+
"episode_disturbance": 0.0
|
| 162 |
+
},
|
| 163 |
+
{
|
| 164 |
+
"episode_seed": 170137,
|
| 165 |
+
"success": false,
|
| 166 |
+
"steps": 4,
|
| 167 |
+
"first_reveal_step": 1,
|
| 168 |
+
"first_retrieve_step": null,
|
| 169 |
+
"episode_disturbance": 0.0
|
| 170 |
+
},
|
| 171 |
+
{
|
| 172 |
+
"episode_seed": 170138,
|
| 173 |
+
"success": false,
|
| 174 |
+
"steps": 4,
|
| 175 |
+
"first_reveal_step": 1,
|
| 176 |
+
"first_retrieve_step": null,
|
| 177 |
+
"episode_disturbance": 0.25
|
| 178 |
+
},
|
| 179 |
+
{
|
| 180 |
+
"episode_seed": 170139,
|
| 181 |
+
"success": false,
|
| 182 |
+
"steps": 4,
|
| 183 |
+
"first_reveal_step": 1,
|
| 184 |
+
"first_retrieve_step": null,
|
| 185 |
+
"episode_disturbance": 0.0
|
| 186 |
+
},
|
| 187 |
+
{
|
| 188 |
+
"episode_seed": 170140,
|
| 189 |
+
"success": false,
|
| 190 |
+
"steps": 4,
|
| 191 |
+
"first_reveal_step": 1,
|
| 192 |
+
"first_retrieve_step": null,
|
| 193 |
+
"episode_disturbance": 0.0
|
| 194 |
+
},
|
| 195 |
+
{
|
| 196 |
+
"episode_seed": 170145,
|
| 197 |
+
"success": false,
|
| 198 |
+
"steps": 4,
|
| 199 |
+
"first_reveal_step": 1,
|
| 200 |
+
"first_retrieve_step": null,
|
| 201 |
+
"episode_disturbance": 0.25
|
| 202 |
+
},
|
| 203 |
+
{
|
| 204 |
+
"episode_seed": 170150,
|
| 205 |
+
"success": false,
|
| 206 |
+
"steps": 4,
|
| 207 |
+
"first_reveal_step": 1,
|
| 208 |
+
"first_retrieve_step": null,
|
| 209 |
+
"episode_disturbance": 0.0
|
| 210 |
+
},
|
| 211 |
+
{
|
| 212 |
+
"episode_seed": 170151,
|
| 213 |
+
"success": false,
|
| 214 |
+
"steps": 4,
|
| 215 |
+
"first_reveal_step": 1,
|
| 216 |
+
"first_retrieve_step": null,
|
| 217 |
+
"episode_disturbance": 0.0
|
| 218 |
+
},
|
| 219 |
+
{
|
| 220 |
+
"episode_seed": 170153,
|
| 221 |
+
"success": false,
|
| 222 |
+
"steps": 4,
|
| 223 |
+
"first_reveal_step": 1,
|
| 224 |
+
"first_retrieve_step": null,
|
| 225 |
+
"episode_disturbance": 0.0
|
| 226 |
+
},
|
| 227 |
+
{
|
| 228 |
+
"episode_seed": 170154,
|
| 229 |
+
"success": false,
|
| 230 |
+
"steps": 4,
|
| 231 |
+
"first_reveal_step": 1,
|
| 232 |
+
"first_retrieve_step": null,
|
| 233 |
+
"episode_disturbance": 0.0
|
| 234 |
+
},
|
| 235 |
+
{
|
| 236 |
+
"episode_seed": 170155,
|
| 237 |
+
"success": true,
|
| 238 |
+
"steps": 2,
|
| 239 |
+
"first_reveal_step": 1,
|
| 240 |
+
"first_retrieve_step": null,
|
| 241 |
+
"episode_disturbance": 0.3782343992165157
|
| 242 |
+
},
|
| 243 |
+
{
|
| 244 |
+
"episode_seed": 170166,
|
| 245 |
+
"success": false,
|
| 246 |
+
"steps": 4,
|
| 247 |
+
"first_reveal_step": 1,
|
| 248 |
+
"first_retrieve_step": null,
|
| 249 |
+
"episode_disturbance": 0.0
|
| 250 |
+
},
|
| 251 |
+
{
|
| 252 |
+
"episode_seed": 170171,
|
| 253 |
+
"success": false,
|
| 254 |
+
"steps": 4,
|
| 255 |
+
"first_reveal_step": 1,
|
| 256 |
+
"first_retrieve_step": null,
|
| 257 |
+
"episode_disturbance": 0.25
|
| 258 |
+
},
|
| 259 |
+
{
|
| 260 |
+
"episode_seed": 170173,
|
| 261 |
+
"success": false,
|
| 262 |
+
"steps": 4,
|
| 263 |
+
"first_reveal_step": 1,
|
| 264 |
+
"first_retrieve_step": null,
|
| 265 |
+
"episode_disturbance": 0.25
|
| 266 |
+
},
|
| 267 |
+
{
|
| 268 |
+
"episode_seed": 170175,
|
| 269 |
+
"success": false,
|
| 270 |
+
"steps": 4,
|
| 271 |
+
"first_reveal_step": 1,
|
| 272 |
+
"first_retrieve_step": null,
|
| 273 |
+
"episode_disturbance": 0.0
|
| 274 |
+
},
|
| 275 |
+
{
|
| 276 |
+
"episode_seed": 170177,
|
| 277 |
+
"success": false,
|
| 278 |
+
"steps": 4,
|
| 279 |
+
"first_reveal_step": 1,
|
| 280 |
+
"first_retrieve_step": null,
|
| 281 |
+
"episode_disturbance": 0.25
|
| 282 |
+
},
|
| 283 |
+
{
|
| 284 |
+
"episode_seed": 170180,
|
| 285 |
+
"success": false,
|
| 286 |
+
"steps": 4,
|
| 287 |
+
"first_reveal_step": 1,
|
| 288 |
+
"first_retrieve_step": null,
|
| 289 |
+
"episode_disturbance": 0.25
|
| 290 |
+
},
|
| 291 |
+
{
|
| 292 |
+
"episode_seed": 170181,
|
| 293 |
+
"success": false,
|
| 294 |
+
"steps": 4,
|
| 295 |
+
"first_reveal_step": 1,
|
| 296 |
+
"first_retrieve_step": null,
|
| 297 |
+
"episode_disturbance": 0.25
|
| 298 |
+
},
|
| 299 |
+
{
|
| 300 |
+
"episode_seed": 170184,
|
| 301 |
+
"success": false,
|
| 302 |
+
"steps": 4,
|
| 303 |
+
"first_reveal_step": 1,
|
| 304 |
+
"first_retrieve_step": null,
|
| 305 |
+
"episode_disturbance": 0.25
|
| 306 |
+
},
|
| 307 |
+
{
|
| 308 |
+
"episode_seed": 170185,
|
| 309 |
+
"success": false,
|
| 310 |
+
"steps": 4,
|
| 311 |
+
"first_reveal_step": 1,
|
| 312 |
+
"first_retrieve_step": null,
|
| 313 |
+
"episode_disturbance": 0.25
|
| 314 |
+
},
|
| 315 |
+
{
|
| 316 |
+
"episode_seed": 170186,
|
| 317 |
+
"success": false,
|
| 318 |
+
"steps": 4,
|
| 319 |
+
"first_reveal_step": 1,
|
| 320 |
+
"first_retrieve_step": null,
|
| 321 |
+
"episode_disturbance": 0.0
|
| 322 |
+
},
|
| 323 |
+
{
|
| 324 |
+
"episode_seed": 170198,
|
| 325 |
+
"success": false,
|
| 326 |
+
"steps": 4,
|
| 327 |
+
"first_reveal_step": 1,
|
| 328 |
+
"first_retrieve_step": null,
|
| 329 |
+
"episode_disturbance": 0.0
|
| 330 |
+
},
|
| 331 |
+
{
|
| 332 |
+
"episode_seed": 170200,
|
| 333 |
+
"success": false,
|
| 334 |
+
"steps": 4,
|
| 335 |
+
"first_reveal_step": 1,
|
| 336 |
+
"first_retrieve_step": null,
|
| 337 |
+
"episode_disturbance": 0.25
|
| 338 |
+
},
|
| 339 |
+
{
|
| 340 |
+
"episode_seed": 170205,
|
| 341 |
+
"success": false,
|
| 342 |
+
"steps": 4,
|
| 343 |
+
"first_reveal_step": 1,
|
| 344 |
+
"first_retrieve_step": null,
|
| 345 |
+
"episode_disturbance": 0.25
|
| 346 |
+
},
|
| 347 |
+
{
|
| 348 |
+
"episode_seed": 170207,
|
| 349 |
+
"success": false,
|
| 350 |
+
"steps": 4,
|
| 351 |
+
"first_reveal_step": 1,
|
| 352 |
+
"first_retrieve_step": null,
|
| 353 |
+
"episode_disturbance": 0.25
|
| 354 |
+
},
|
| 355 |
+
{
|
| 356 |
+
"episode_seed": 170208,
|
| 357 |
+
"success": false,
|
| 358 |
+
"steps": 4,
|
| 359 |
+
"first_reveal_step": 1,
|
| 360 |
+
"first_retrieve_step": null,
|
| 361 |
+
"episode_disturbance": 0.25
|
| 362 |
+
},
|
| 363 |
+
{
|
| 364 |
+
"episode_seed": 170212,
|
| 365 |
+
"success": false,
|
| 366 |
+
"steps": 4,
|
| 367 |
+
"first_reveal_step": 1,
|
| 368 |
+
"first_retrieve_step": null,
|
| 369 |
+
"episode_disturbance": 0.046899239931787774
|
| 370 |
+
},
|
| 371 |
+
{
|
| 372 |
+
"episode_seed": 170214,
|
| 373 |
+
"success": false,
|
| 374 |
+
"steps": 4,
|
| 375 |
+
"first_reveal_step": 1,
|
| 376 |
+
"first_retrieve_step": null,
|
| 377 |
+
"episode_disturbance": 0.0
|
| 378 |
+
},
|
| 379 |
+
{
|
| 380 |
+
"episode_seed": 170217,
|
| 381 |
+
"success": false,
|
| 382 |
+
"steps": 4,
|
| 383 |
+
"first_reveal_step": 1,
|
| 384 |
+
"first_retrieve_step": null,
|
| 385 |
+
"episode_disturbance": 0.10476837839399065
|
| 386 |
+
},
|
| 387 |
+
{
|
| 388 |
+
"episode_seed": 170223,
|
| 389 |
+
"success": false,
|
| 390 |
+
"steps": 4,
|
| 391 |
+
"first_reveal_step": 1,
|
| 392 |
+
"first_retrieve_step": null,
|
| 393 |
+
"episode_disturbance": 0.0
|
| 394 |
+
},
|
| 395 |
+
{
|
| 396 |
+
"episode_seed": 170226,
|
| 397 |
+
"success": false,
|
| 398 |
+
"steps": 4,
|
| 399 |
+
"first_reveal_step": 1,
|
| 400 |
+
"first_retrieve_step": null,
|
| 401 |
+
"episode_disturbance": 0.0
|
| 402 |
+
},
|
| 403 |
+
{
|
| 404 |
+
"episode_seed": 170228,
|
| 405 |
+
"success": false,
|
| 406 |
+
"steps": 4,
|
| 407 |
+
"first_reveal_step": 1,
|
| 408 |
+
"first_retrieve_step": null,
|
| 409 |
+
"episode_disturbance": 0.0
|
| 410 |
+
},
|
| 411 |
+
{
|
| 412 |
+
"episode_seed": 170229,
|
| 413 |
+
"success": false,
|
| 414 |
+
"steps": 4,
|
| 415 |
+
"first_reveal_step": 1,
|
| 416 |
+
"first_retrieve_step": null,
|
| 417 |
+
"episode_disturbance": 0.0
|
| 418 |
+
},
|
| 419 |
+
{
|
| 420 |
+
"episode_seed": 170234,
|
| 421 |
+
"success": false,
|
| 422 |
+
"steps": 4,
|
| 423 |
+
"first_reveal_step": 1,
|
| 424 |
+
"first_retrieve_step": null,
|
| 425 |
+
"episode_disturbance": 0.0
|
| 426 |
+
},
|
| 427 |
+
{
|
| 428 |
+
"episode_seed": 170237,
|
| 429 |
+
"success": false,
|
| 430 |
+
"steps": 4,
|
| 431 |
+
"first_reveal_step": 1,
|
| 432 |
+
"first_retrieve_step": null,
|
| 433 |
+
"episode_disturbance": 0.25
|
| 434 |
+
},
|
| 435 |
+
{
|
| 436 |
+
"episode_seed": 170239,
|
| 437 |
+
"success": false,
|
| 438 |
+
"steps": 4,
|
| 439 |
+
"first_reveal_step": 1,
|
| 440 |
+
"first_retrieve_step": null,
|
| 441 |
+
"episode_disturbance": 0.0
|
| 442 |
+
},
|
| 443 |
+
{
|
| 444 |
+
"episode_seed": 170241,
|
| 445 |
+
"success": false,
|
| 446 |
+
"steps": 4,
|
| 447 |
+
"first_reveal_step": 1,
|
| 448 |
+
"first_retrieve_step": null,
|
| 449 |
+
"episode_disturbance": 0.25
|
| 450 |
+
},
|
| 451 |
+
{
|
| 452 |
+
"episode_seed": 170242,
|
| 453 |
+
"success": false,
|
| 454 |
+
"steps": 4,
|
| 455 |
+
"first_reveal_step": 1,
|
| 456 |
+
"first_retrieve_step": null,
|
| 457 |
+
"episode_disturbance": 0.25
|
| 458 |
+
},
|
| 459 |
+
{
|
| 460 |
+
"episode_seed": 170243,
|
| 461 |
+
"success": false,
|
| 462 |
+
"steps": 4,
|
| 463 |
+
"first_reveal_step": 1,
|
| 464 |
+
"first_retrieve_step": null,
|
| 465 |
+
"episode_disturbance": 0.25
|
| 466 |
+
}
|
| 467 |
+
],
|
| 468 |
+
"eval_protocol": {
|
| 469 |
+
"track_id": "cloth_track",
|
| 470 |
+
"suite": "maniskill3",
|
| 471 |
+
"benchmark_task": "PutSpoonUnderClothRetrievalProxy-v1",
|
| 472 |
+
"role": "target",
|
| 473 |
+
"eval_mode": "adapter_noop",
|
| 474 |
+
"seed": 17,
|
| 475 |
+
"episodes": 50,
|
| 476 |
+
"resolution": 224,
|
| 477 |
+
"cameras": [
|
| 478 |
+
"front",
|
| 479 |
+
"left",
|
| 480 |
+
"right"
|
| 481 |
+
],
|
| 482 |
+
"observation_stack": "rgb_triplicate_zero_depth",
|
| 483 |
+
"action_horizon": 8,
|
| 484 |
+
"action_space": "widowx_delta_pose",
|
| 485 |
+
"same_test_episodes": true
|
| 486 |
+
},
|
| 487 |
+
"proxy_notes": "Public ManiSkill bridge scene with custom retrieval initialization. The spoon is placed under the cloth region and must be revealed and extracted to the open side of the table."
|
| 488 |
+
}
|
reports/maniskill_cloth_bridge_smoke_v1/adapter_noop_seed29.json
ADDED
|
@@ -0,0 +1,488 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
{
|
| 2 |
+
"track_id": "cloth_track",
|
| 3 |
+
"suite": "maniskill3",
|
| 4 |
+
"benchmark_task": "PutSpoonUnderClothRetrievalProxy-v1",
|
| 5 |
+
"role": "target",
|
| 6 |
+
"adapter_mode": "adapter_noop",
|
| 7 |
+
"episodes": 50,
|
| 8 |
+
"successes": [
|
| 9 |
+
0,
|
| 10 |
+
1,
|
| 11 |
+
0,
|
| 12 |
+
0,
|
| 13 |
+
0,
|
| 14 |
+
0,
|
| 15 |
+
0,
|
| 16 |
+
0,
|
| 17 |
+
0,
|
| 18 |
+
0,
|
| 19 |
+
0,
|
| 20 |
+
0,
|
| 21 |
+
0,
|
| 22 |
+
0,
|
| 23 |
+
0,
|
| 24 |
+
0,
|
| 25 |
+
0,
|
| 26 |
+
0,
|
| 27 |
+
0,
|
| 28 |
+
0,
|
| 29 |
+
0,
|
| 30 |
+
0,
|
| 31 |
+
0,
|
| 32 |
+
0,
|
| 33 |
+
0,
|
| 34 |
+
0,
|
| 35 |
+
0,
|
| 36 |
+
0,
|
| 37 |
+
0,
|
| 38 |
+
1,
|
| 39 |
+
0,
|
| 40 |
+
0,
|
| 41 |
+
0,
|
| 42 |
+
0,
|
| 43 |
+
0,
|
| 44 |
+
0,
|
| 45 |
+
0,
|
| 46 |
+
0,
|
| 47 |
+
0,
|
| 48 |
+
0,
|
| 49 |
+
0,
|
| 50 |
+
0,
|
| 51 |
+
0,
|
| 52 |
+
0,
|
| 53 |
+
0,
|
| 54 |
+
0,
|
| 55 |
+
0,
|
| 56 |
+
0,
|
| 57 |
+
0,
|
| 58 |
+
0
|
| 59 |
+
],
|
| 60 |
+
"success_rate": 0.04,
|
| 61 |
+
"intervention_rate": 0.0,
|
| 62 |
+
"non_base_selection_rate": 0.0,
|
| 63 |
+
"steps_to_first_reveal_or_access": 1.0,
|
| 64 |
+
"steps_to_retrieve": 4.0,
|
| 65 |
+
"disturbance_proxy": 0.1478596130013466,
|
| 66 |
+
"episode_records": [
|
| 67 |
+
{
|
| 68 |
+
"episode_seed": 170104,
|
| 69 |
+
"success": false,
|
| 70 |
+
"steps": 4,
|
| 71 |
+
"first_reveal_step": 1,
|
| 72 |
+
"first_retrieve_step": null,
|
| 73 |
+
"episode_disturbance": 0.0
|
| 74 |
+
},
|
| 75 |
+
{
|
| 76 |
+
"episode_seed": 170105,
|
| 77 |
+
"success": true,
|
| 78 |
+
"steps": 1,
|
| 79 |
+
"first_reveal_step": 1,
|
| 80 |
+
"first_retrieve_step": null,
|
| 81 |
+
"episode_disturbance": 1.0
|
| 82 |
+
},
|
| 83 |
+
{
|
| 84 |
+
"episode_seed": 170106,
|
| 85 |
+
"success": false,
|
| 86 |
+
"steps": 4,
|
| 87 |
+
"first_reveal_step": 1,
|
| 88 |
+
"first_retrieve_step": null,
|
| 89 |
+
"episode_disturbance": 0.25
|
| 90 |
+
},
|
| 91 |
+
{
|
| 92 |
+
"episode_seed": 170107,
|
| 93 |
+
"success": false,
|
| 94 |
+
"steps": 4,
|
| 95 |
+
"first_reveal_step": 1,
|
| 96 |
+
"first_retrieve_step": null,
|
| 97 |
+
"episode_disturbance": 0.0
|
| 98 |
+
},
|
| 99 |
+
{
|
| 100 |
+
"episode_seed": 170109,
|
| 101 |
+
"success": false,
|
| 102 |
+
"steps": 4,
|
| 103 |
+
"first_reveal_step": 1,
|
| 104 |
+
"first_retrieve_step": null,
|
| 105 |
+
"episode_disturbance": 0.25
|
| 106 |
+
},
|
| 107 |
+
{
|
| 108 |
+
"episode_seed": 170113,
|
| 109 |
+
"success": false,
|
| 110 |
+
"steps": 4,
|
| 111 |
+
"first_reveal_step": 1,
|
| 112 |
+
"first_retrieve_step": null,
|
| 113 |
+
"episode_disturbance": 0.0
|
| 114 |
+
},
|
| 115 |
+
{
|
| 116 |
+
"episode_seed": 170117,
|
| 117 |
+
"success": false,
|
| 118 |
+
"steps": 4,
|
| 119 |
+
"first_reveal_step": 1,
|
| 120 |
+
"first_retrieve_step": null,
|
| 121 |
+
"episode_disturbance": 0.25
|
| 122 |
+
},
|
| 123 |
+
{
|
| 124 |
+
"episode_seed": 170121,
|
| 125 |
+
"success": false,
|
| 126 |
+
"steps": 4,
|
| 127 |
+
"first_reveal_step": 1,
|
| 128 |
+
"first_retrieve_step": null,
|
| 129 |
+
"episode_disturbance": 0.25
|
| 130 |
+
},
|
| 131 |
+
{
|
| 132 |
+
"episode_seed": 170124,
|
| 133 |
+
"success": false,
|
| 134 |
+
"steps": 4,
|
| 135 |
+
"first_reveal_step": 1,
|
| 136 |
+
"first_retrieve_step": null,
|
| 137 |
+
"episode_disturbance": 0.25
|
| 138 |
+
},
|
| 139 |
+
{
|
| 140 |
+
"episode_seed": 170125,
|
| 141 |
+
"success": false,
|
| 142 |
+
"steps": 4,
|
| 143 |
+
"first_reveal_step": 1,
|
| 144 |
+
"first_retrieve_step": null,
|
| 145 |
+
"episode_disturbance": 0.0
|
| 146 |
+
},
|
| 147 |
+
{
|
| 148 |
+
"episode_seed": 170129,
|
| 149 |
+
"success": false,
|
| 150 |
+
"steps": 4,
|
| 151 |
+
"first_reveal_step": 1,
|
| 152 |
+
"first_retrieve_step": null,
|
| 153 |
+
"episode_disturbance": 0.0
|
| 154 |
+
},
|
| 155 |
+
{
|
| 156 |
+
"episode_seed": 170131,
|
| 157 |
+
"success": false,
|
| 158 |
+
"steps": 4,
|
| 159 |
+
"first_reveal_step": 1,
|
| 160 |
+
"first_retrieve_step": null,
|
| 161 |
+
"episode_disturbance": 0.0
|
| 162 |
+
},
|
| 163 |
+
{
|
| 164 |
+
"episode_seed": 170137,
|
| 165 |
+
"success": false,
|
| 166 |
+
"steps": 4,
|
| 167 |
+
"first_reveal_step": 1,
|
| 168 |
+
"first_retrieve_step": null,
|
| 169 |
+
"episode_disturbance": 0.25
|
| 170 |
+
},
|
| 171 |
+
{
|
| 172 |
+
"episode_seed": 170138,
|
| 173 |
+
"success": false,
|
| 174 |
+
"steps": 4,
|
| 175 |
+
"first_reveal_step": 1,
|
| 176 |
+
"first_retrieve_step": null,
|
| 177 |
+
"episode_disturbance": 0.25
|
| 178 |
+
},
|
| 179 |
+
{
|
| 180 |
+
"episode_seed": 170139,
|
| 181 |
+
"success": false,
|
| 182 |
+
"steps": 4,
|
| 183 |
+
"first_reveal_step": 1,
|
| 184 |
+
"first_retrieve_step": null,
|
| 185 |
+
"episode_disturbance": 0.25
|
| 186 |
+
},
|
| 187 |
+
{
|
| 188 |
+
"episode_seed": 170140,
|
| 189 |
+
"success": false,
|
| 190 |
+
"steps": 4,
|
| 191 |
+
"first_reveal_step": 1,
|
| 192 |
+
"first_retrieve_step": null,
|
| 193 |
+
"episode_disturbance": 0.25
|
| 194 |
+
},
|
| 195 |
+
{
|
| 196 |
+
"episode_seed": 170145,
|
| 197 |
+
"success": false,
|
| 198 |
+
"steps": 4,
|
| 199 |
+
"first_reveal_step": 1,
|
| 200 |
+
"first_retrieve_step": null,
|
| 201 |
+
"episode_disturbance": 0.0
|
| 202 |
+
},
|
| 203 |
+
{
|
| 204 |
+
"episode_seed": 170150,
|
| 205 |
+
"success": false,
|
| 206 |
+
"steps": 4,
|
| 207 |
+
"first_reveal_step": 1,
|
| 208 |
+
"first_retrieve_step": null,
|
| 209 |
+
"episode_disturbance": 0.25
|
| 210 |
+
},
|
| 211 |
+
{
|
| 212 |
+
"episode_seed": 170151,
|
| 213 |
+
"success": false,
|
| 214 |
+
"steps": 4,
|
| 215 |
+
"first_reveal_step": 1,
|
| 216 |
+
"first_retrieve_step": null,
|
| 217 |
+
"episode_disturbance": 0.0
|
| 218 |
+
},
|
| 219 |
+
{
|
| 220 |
+
"episode_seed": 170153,
|
| 221 |
+
"success": false,
|
| 222 |
+
"steps": 4,
|
| 223 |
+
"first_reveal_step": 1,
|
| 224 |
+
"first_retrieve_step": null,
|
| 225 |
+
"episode_disturbance": 0.25
|
| 226 |
+
},
|
| 227 |
+
{
|
| 228 |
+
"episode_seed": 170154,
|
| 229 |
+
"success": false,
|
| 230 |
+
"steps": 4,
|
| 231 |
+
"first_reveal_step": 1,
|
| 232 |
+
"first_retrieve_step": null,
|
| 233 |
+
"episode_disturbance": 0.25
|
| 234 |
+
},
|
| 235 |
+
{
|
| 236 |
+
"episode_seed": 170155,
|
| 237 |
+
"success": false,
|
| 238 |
+
"steps": 4,
|
| 239 |
+
"first_reveal_step": 1,
|
| 240 |
+
"first_retrieve_step": null,
|
| 241 |
+
"episode_disturbance": 0.25
|
| 242 |
+
},
|
| 243 |
+
{
|
| 244 |
+
"episode_seed": 170166,
|
| 245 |
+
"success": false,
|
| 246 |
+
"steps": 4,
|
| 247 |
+
"first_reveal_step": 1,
|
| 248 |
+
"first_retrieve_step": null,
|
| 249 |
+
"episode_disturbance": 0.0
|
| 250 |
+
},
|
| 251 |
+
{
|
| 252 |
+
"episode_seed": 170171,
|
| 253 |
+
"success": false,
|
| 254 |
+
"steps": 4,
|
| 255 |
+
"first_reveal_step": 1,
|
| 256 |
+
"first_retrieve_step": null,
|
| 257 |
+
"episode_disturbance": 0.25
|
| 258 |
+
},
|
| 259 |
+
{
|
| 260 |
+
"episode_seed": 170173,
|
| 261 |
+
"success": false,
|
| 262 |
+
"steps": 4,
|
| 263 |
+
"first_reveal_step": 1,
|
| 264 |
+
"first_retrieve_step": null,
|
| 265 |
+
"episode_disturbance": 0.0
|
| 266 |
+
},
|
| 267 |
+
{
|
| 268 |
+
"episode_seed": 170175,
|
| 269 |
+
"success": false,
|
| 270 |
+
"steps": 4,
|
| 271 |
+
"first_reveal_step": 1,
|
| 272 |
+
"first_retrieve_step": null,
|
| 273 |
+
"episode_disturbance": 0.0
|
| 274 |
+
},
|
| 275 |
+
{
|
| 276 |
+
"episode_seed": 170177,
|
| 277 |
+
"success": false,
|
| 278 |
+
"steps": 4,
|
| 279 |
+
"first_reveal_step": 1,
|
| 280 |
+
"first_retrieve_step": null,
|
| 281 |
+
"episode_disturbance": 0.0
|
| 282 |
+
},
|
| 283 |
+
{
|
| 284 |
+
"episode_seed": 170180,
|
| 285 |
+
"success": false,
|
| 286 |
+
"steps": 4,
|
| 287 |
+
"first_reveal_step": 1,
|
| 288 |
+
"first_retrieve_step": null,
|
| 289 |
+
"episode_disturbance": 0.25
|
| 290 |
+
},
|
| 291 |
+
{
|
| 292 |
+
"episode_seed": 170181,
|
| 293 |
+
"success": false,
|
| 294 |
+
"steps": 4,
|
| 295 |
+
"first_reveal_step": 1,
|
| 296 |
+
"first_retrieve_step": null,
|
| 297 |
+
"episode_disturbance": 0.25
|
| 298 |
+
},
|
| 299 |
+
{
|
| 300 |
+
"episode_seed": 170184,
|
| 301 |
+
"success": true,
|
| 302 |
+
"steps": 2,
|
| 303 |
+
"first_reveal_step": 1,
|
| 304 |
+
"first_retrieve_step": null,
|
| 305 |
+
"episode_disturbance": 0.5
|
| 306 |
+
},
|
| 307 |
+
{
|
| 308 |
+
"episode_seed": 170185,
|
| 309 |
+
"success": false,
|
| 310 |
+
"steps": 4,
|
| 311 |
+
"first_reveal_step": 1,
|
| 312 |
+
"first_retrieve_step": null,
|
| 313 |
+
"episode_disturbance": 0.25
|
| 314 |
+
},
|
| 315 |
+
{
|
| 316 |
+
"episode_seed": 170186,
|
| 317 |
+
"success": false,
|
| 318 |
+
"steps": 4,
|
| 319 |
+
"first_reveal_step": 1,
|
| 320 |
+
"first_retrieve_step": null,
|
| 321 |
+
"episode_disturbance": 0.0
|
| 322 |
+
},
|
| 323 |
+
{
|
| 324 |
+
"episode_seed": 170198,
|
| 325 |
+
"success": false,
|
| 326 |
+
"steps": 4,
|
| 327 |
+
"first_reveal_step": 1,
|
| 328 |
+
"first_retrieve_step": null,
|
| 329 |
+
"episode_disturbance": 0.0
|
| 330 |
+
},
|
| 331 |
+
{
|
| 332 |
+
"episode_seed": 170200,
|
| 333 |
+
"success": false,
|
| 334 |
+
"steps": 4,
|
| 335 |
+
"first_reveal_step": 1,
|
| 336 |
+
"first_retrieve_step": null,
|
| 337 |
+
"episode_disturbance": 0.0
|
| 338 |
+
},
|
| 339 |
+
{
|
| 340 |
+
"episode_seed": 170205,
|
| 341 |
+
"success": false,
|
| 342 |
+
"steps": 4,
|
| 343 |
+
"first_reveal_step": 1,
|
| 344 |
+
"first_retrieve_step": null,
|
| 345 |
+
"episode_disturbance": 0.0
|
| 346 |
+
},
|
| 347 |
+
{
|
| 348 |
+
"episode_seed": 170207,
|
| 349 |
+
"success": false,
|
| 350 |
+
"steps": 4,
|
| 351 |
+
"first_reveal_step": 1,
|
| 352 |
+
"first_retrieve_step": null,
|
| 353 |
+
"episode_disturbance": 0.25
|
| 354 |
+
},
|
| 355 |
+
{
|
| 356 |
+
"episode_seed": 170208,
|
| 357 |
+
"success": false,
|
| 358 |
+
"steps": 4,
|
| 359 |
+
"first_reveal_step": 1,
|
| 360 |
+
"first_retrieve_step": null,
|
| 361 |
+
"episode_disturbance": 0.25
|
| 362 |
+
},
|
| 363 |
+
{
|
| 364 |
+
"episode_seed": 170212,
|
| 365 |
+
"success": false,
|
| 366 |
+
"steps": 4,
|
| 367 |
+
"first_reveal_step": 1,
|
| 368 |
+
"first_retrieve_step": null,
|
| 369 |
+
"episode_disturbance": 0.25
|
| 370 |
+
},
|
| 371 |
+
{
|
| 372 |
+
"episode_seed": 170214,
|
| 373 |
+
"success": false,
|
| 374 |
+
"steps": 4,
|
| 375 |
+
"first_reveal_step": 1,
|
| 376 |
+
"first_retrieve_step": null,
|
| 377 |
+
"episode_disturbance": 0.0
|
| 378 |
+
},
|
| 379 |
+
{
|
| 380 |
+
"episode_seed": 170217,
|
| 381 |
+
"success": false,
|
| 382 |
+
"steps": 4,
|
| 383 |
+
"first_reveal_step": 1,
|
| 384 |
+
"first_retrieve_step": null,
|
| 385 |
+
"episode_disturbance": 0.0
|
| 386 |
+
},
|
| 387 |
+
{
|
| 388 |
+
"episode_seed": 170223,
|
| 389 |
+
"success": false,
|
| 390 |
+
"steps": 4,
|
| 391 |
+
"first_reveal_step": 1,
|
| 392 |
+
"first_retrieve_step": null,
|
| 393 |
+
"episode_disturbance": 0.1429806500673294
|
| 394 |
+
},
|
| 395 |
+
{
|
| 396 |
+
"episode_seed": 170226,
|
| 397 |
+
"success": false,
|
| 398 |
+
"steps": 4,
|
| 399 |
+
"first_reveal_step": 1,
|
| 400 |
+
"first_retrieve_step": null,
|
| 401 |
+
"episode_disturbance": 0.25
|
| 402 |
+
},
|
| 403 |
+
{
|
| 404 |
+
"episode_seed": 170228,
|
| 405 |
+
"success": false,
|
| 406 |
+
"steps": 4,
|
| 407 |
+
"first_reveal_step": 1,
|
| 408 |
+
"first_retrieve_step": null,
|
| 409 |
+
"episode_disturbance": 0.0
|
| 410 |
+
},
|
| 411 |
+
{
|
| 412 |
+
"episode_seed": 170229,
|
| 413 |
+
"success": false,
|
| 414 |
+
"steps": 4,
|
| 415 |
+
"first_reveal_step": 1,
|
| 416 |
+
"first_retrieve_step": null,
|
| 417 |
+
"episode_disturbance": 0.0
|
| 418 |
+
},
|
| 419 |
+
{
|
| 420 |
+
"episode_seed": 170234,
|
| 421 |
+
"success": false,
|
| 422 |
+
"steps": 4,
|
| 423 |
+
"first_reveal_step": 1,
|
| 424 |
+
"first_retrieve_step": null,
|
| 425 |
+
"episode_disturbance": 0.0
|
| 426 |
+
},
|
| 427 |
+
{
|
| 428 |
+
"episode_seed": 170237,
|
| 429 |
+
"success": false,
|
| 430 |
+
"steps": 4,
|
| 431 |
+
"first_reveal_step": 1,
|
| 432 |
+
"first_retrieve_step": null,
|
| 433 |
+
"episode_disturbance": 0.0
|
| 434 |
+
},
|
| 435 |
+
{
|
| 436 |
+
"episode_seed": 170239,
|
| 437 |
+
"success": false,
|
| 438 |
+
"steps": 4,
|
| 439 |
+
"first_reveal_step": 1,
|
| 440 |
+
"first_retrieve_step": null,
|
| 441 |
+
"episode_disturbance": 0.25
|
| 442 |
+
},
|
| 443 |
+
{
|
| 444 |
+
"episode_seed": 170241,
|
| 445 |
+
"success": false,
|
| 446 |
+
"steps": 4,
|
| 447 |
+
"first_reveal_step": 1,
|
| 448 |
+
"first_retrieve_step": null,
|
| 449 |
+
"episode_disturbance": 0.0
|
| 450 |
+
},
|
| 451 |
+
{
|
| 452 |
+
"episode_seed": 170242,
|
| 453 |
+
"success": false,
|
| 454 |
+
"steps": 4,
|
| 455 |
+
"first_reveal_step": 1,
|
| 456 |
+
"first_retrieve_step": null,
|
| 457 |
+
"episode_disturbance": 0.0
|
| 458 |
+
},
|
| 459 |
+
{
|
| 460 |
+
"episode_seed": 170243,
|
| 461 |
+
"success": false,
|
| 462 |
+
"steps": 4,
|
| 463 |
+
"first_reveal_step": 1,
|
| 464 |
+
"first_retrieve_step": null,
|
| 465 |
+
"episode_disturbance": 0.25
|
| 466 |
+
}
|
| 467 |
+
],
|
| 468 |
+
"eval_protocol": {
|
| 469 |
+
"track_id": "cloth_track",
|
| 470 |
+
"suite": "maniskill3",
|
| 471 |
+
"benchmark_task": "PutSpoonUnderClothRetrievalProxy-v1",
|
| 472 |
+
"role": "target",
|
| 473 |
+
"eval_mode": "adapter_noop",
|
| 474 |
+
"seed": 17,
|
| 475 |
+
"episodes": 50,
|
| 476 |
+
"resolution": 224,
|
| 477 |
+
"cameras": [
|
| 478 |
+
"front",
|
| 479 |
+
"left",
|
| 480 |
+
"right"
|
| 481 |
+
],
|
| 482 |
+
"observation_stack": "rgb_triplicate_zero_depth",
|
| 483 |
+
"action_horizon": 8,
|
| 484 |
+
"action_space": "widowx_delta_pose",
|
| 485 |
+
"same_test_episodes": true
|
| 486 |
+
},
|
| 487 |
+
"proxy_notes": "Public ManiSkill bridge scene with custom retrieval initialization. The spoon is placed under the cloth region and must be revealed and extracted to the open side of the table."
|
| 488 |
+
}
|
reports/maniskill_cloth_bridge_smoke_v1/public_benchmark_package_summary.json
ADDED
|
@@ -0,0 +1,60 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
{
|
| 2 |
+
"anchor_pass": true,
|
| 3 |
+
"available_tracks": [
|
| 4 |
+
"cloth_track"
|
| 5 |
+
],
|
| 6 |
+
"ci_above_zero_tracks": [],
|
| 7 |
+
"headline_pass": false,
|
| 8 |
+
"package_name": "public_reveal_retrieve_package_v1",
|
| 9 |
+
"sign_of_life_pass": false,
|
| 10 |
+
"sign_of_life_track_count": 0,
|
| 11 |
+
"sign_of_life_tracks": [],
|
| 12 |
+
"target_macro_average_delta": 0.0,
|
| 13 |
+
"tracks": {
|
| 14 |
+
"cloth_track": {
|
| 15 |
+
"benchmark_task": "PutSpoonUnderClothRetrievalProxy-v1",
|
| 16 |
+
"delta_active_vs_trunk": 0.0,
|
| 17 |
+
"delta_active_vs_trunk_ci95": [
|
| 18 |
+
-0.07999999821186066,
|
| 19 |
+
0.07999999821186066
|
| 20 |
+
],
|
| 21 |
+
"delta_noop_vs_trunk": 0.0,
|
| 22 |
+
"modes": {
|
| 23 |
+
"adapter_active_ft": {
|
| 24 |
+
"disturbance_proxy": 0.1478596130013466,
|
| 25 |
+
"intervention_rate": 0.0,
|
| 26 |
+
"mean_success": 0.03999999910593033,
|
| 27 |
+
"non_base_selection_rate": 0.0,
|
| 28 |
+
"num_runs": 1,
|
| 29 |
+
"steps_to_first_reveal_or_access": 1.0,
|
| 30 |
+
"steps_to_retrieve": 4.0
|
| 31 |
+
},
|
| 32 |
+
"adapter_noop": {
|
| 33 |
+
"disturbance_proxy": 0.1478596130013466,
|
| 34 |
+
"intervention_rate": 0.0,
|
| 35 |
+
"mean_success": 0.03999999910593033,
|
| 36 |
+
"non_base_selection_rate": 0.0,
|
| 37 |
+
"num_runs": 1,
|
| 38 |
+
"steps_to_first_reveal_or_access": 1.0,
|
| 39 |
+
"steps_to_retrieve": 4.0
|
| 40 |
+
},
|
| 41 |
+
"trunk_only_ft": {
|
| 42 |
+
"disturbance_proxy": 0.1478596130013466,
|
| 43 |
+
"intervention_rate": 0.0,
|
| 44 |
+
"mean_success": 0.03999999910593033,
|
| 45 |
+
"non_base_selection_rate": 0.0,
|
| 46 |
+
"num_runs": 1,
|
| 47 |
+
"steps_to_first_reveal_or_access": 1.0,
|
| 48 |
+
"steps_to_retrieve": 4.0
|
| 49 |
+
}
|
| 50 |
+
},
|
| 51 |
+
"notes": "Public ManiSkill bridge scene with custom retrieval initialization. The spoon is placed under the cloth region and must be revealed and extracted to the open side of the table.",
|
| 52 |
+
"public_source": "ManiSkill public scene proxy: PutSpoonOnTableClothInScene-v1",
|
| 53 |
+
"role": "target",
|
| 54 |
+
"signs_of_life": false,
|
| 55 |
+
"suite": "maniskill3",
|
| 56 |
+
"target_behavior": "reveal the spoon from under the cloth and retrieve it to the open area",
|
| 57 |
+
"task_family": "cloth_retrieval_proxy"
|
| 58 |
+
}
|
| 59 |
+
}
|
| 60 |
+
}
|
reports/maniskill_cloth_bridge_smoke_v1/public_benchmark_package_summary.md
ADDED
|
@@ -0,0 +1,15 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
# ManiSkill Cloth Retrieval Smoke Summary
|
| 2 |
+
|
| 3 |
+
- benchmark_task: PutSpoonUnderClothRetrievalProxy-v1
|
| 4 |
+
- target_macro_average_delta: 0.000
|
| 5 |
+
- headline_pass: False
|
| 6 |
+
- sign_of_life_pass: False
|
| 7 |
+
|
| 8 |
+
## cloth_track
|
| 9 |
+
- delta_active_vs_trunk: 0.000
|
| 10 |
+
- delta_noop_vs_trunk: 0.000
|
| 11 |
+
- signs_of_life: False
|
| 12 |
+
- delta_active_vs_trunk_ci95: [-0.080, 0.080]
|
| 13 |
+
- trunk_only_ft: mean_success=0.040
|
| 14 |
+
- adapter_noop: mean_success=0.040
|
| 15 |
+
- adapter_active_ft: mean_success=0.040
|
reports/maniskill_cloth_bridge_smoke_v1/trunk_only_ft_seed17.json
ADDED
|
@@ -0,0 +1,509 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
{
|
| 2 |
+
"track_id": "cloth_track",
|
| 3 |
+
"suite": "maniskill3",
|
| 4 |
+
"benchmark_task": "PutSpoonUnderClothRetrievalProxy-v1",
|
| 5 |
+
"role": "target",
|
| 6 |
+
"adapter_mode": "trunk_only_ft",
|
| 7 |
+
"episodes": 50,
|
| 8 |
+
"successes": [
|
| 9 |
+
0,
|
| 10 |
+
1,
|
| 11 |
+
0,
|
| 12 |
+
0,
|
| 13 |
+
0,
|
| 14 |
+
0,
|
| 15 |
+
0,
|
| 16 |
+
0,
|
| 17 |
+
0,
|
| 18 |
+
0,
|
| 19 |
+
0,
|
| 20 |
+
0,
|
| 21 |
+
0,
|
| 22 |
+
0,
|
| 23 |
+
0,
|
| 24 |
+
0,
|
| 25 |
+
0,
|
| 26 |
+
0,
|
| 27 |
+
0,
|
| 28 |
+
0,
|
| 29 |
+
0,
|
| 30 |
+
0,
|
| 31 |
+
0,
|
| 32 |
+
0,
|
| 33 |
+
0,
|
| 34 |
+
0,
|
| 35 |
+
0,
|
| 36 |
+
0,
|
| 37 |
+
0,
|
| 38 |
+
1,
|
| 39 |
+
0,
|
| 40 |
+
0,
|
| 41 |
+
0,
|
| 42 |
+
0,
|
| 43 |
+
0,
|
| 44 |
+
0,
|
| 45 |
+
0,
|
| 46 |
+
0,
|
| 47 |
+
0,
|
| 48 |
+
0,
|
| 49 |
+
0,
|
| 50 |
+
0,
|
| 51 |
+
0,
|
| 52 |
+
0,
|
| 53 |
+
0,
|
| 54 |
+
0,
|
| 55 |
+
0,
|
| 56 |
+
0,
|
| 57 |
+
0,
|
| 58 |
+
0
|
| 59 |
+
],
|
| 60 |
+
"success_rate": 0.04,
|
| 61 |
+
"intervention_rate": 0.0,
|
| 62 |
+
"non_base_selection_rate": 0.0,
|
| 63 |
+
"steps_to_first_reveal_or_access": 1.0,
|
| 64 |
+
"steps_to_retrieve": 4.0,
|
| 65 |
+
"disturbance_proxy": 0.1478596130013466,
|
| 66 |
+
"episode_records": [
|
| 67 |
+
{
|
| 68 |
+
"episode_seed": 170104,
|
| 69 |
+
"success": false,
|
| 70 |
+
"steps": 4,
|
| 71 |
+
"first_reveal_step": 1,
|
| 72 |
+
"first_retrieve_step": null,
|
| 73 |
+
"episode_disturbance": 0.0
|
| 74 |
+
},
|
| 75 |
+
{
|
| 76 |
+
"episode_seed": 170105,
|
| 77 |
+
"success": true,
|
| 78 |
+
"steps": 1,
|
| 79 |
+
"first_reveal_step": 1,
|
| 80 |
+
"first_retrieve_step": null,
|
| 81 |
+
"episode_disturbance": 1.0
|
| 82 |
+
},
|
| 83 |
+
{
|
| 84 |
+
"episode_seed": 170106,
|
| 85 |
+
"success": false,
|
| 86 |
+
"steps": 4,
|
| 87 |
+
"first_reveal_step": 1,
|
| 88 |
+
"first_retrieve_step": null,
|
| 89 |
+
"episode_disturbance": 0.25
|
| 90 |
+
},
|
| 91 |
+
{
|
| 92 |
+
"episode_seed": 170107,
|
| 93 |
+
"success": false,
|
| 94 |
+
"steps": 4,
|
| 95 |
+
"first_reveal_step": 1,
|
| 96 |
+
"first_retrieve_step": null,
|
| 97 |
+
"episode_disturbance": 0.0
|
| 98 |
+
},
|
| 99 |
+
{
|
| 100 |
+
"episode_seed": 170109,
|
| 101 |
+
"success": false,
|
| 102 |
+
"steps": 4,
|
| 103 |
+
"first_reveal_step": 1,
|
| 104 |
+
"first_retrieve_step": null,
|
| 105 |
+
"episode_disturbance": 0.25
|
| 106 |
+
},
|
| 107 |
+
{
|
| 108 |
+
"episode_seed": 170113,
|
| 109 |
+
"success": false,
|
| 110 |
+
"steps": 4,
|
| 111 |
+
"first_reveal_step": 1,
|
| 112 |
+
"first_retrieve_step": null,
|
| 113 |
+
"episode_disturbance": 0.0
|
| 114 |
+
},
|
| 115 |
+
{
|
| 116 |
+
"episode_seed": 170117,
|
| 117 |
+
"success": false,
|
| 118 |
+
"steps": 4,
|
| 119 |
+
"first_reveal_step": 1,
|
| 120 |
+
"first_retrieve_step": null,
|
| 121 |
+
"episode_disturbance": 0.25
|
| 122 |
+
},
|
| 123 |
+
{
|
| 124 |
+
"episode_seed": 170121,
|
| 125 |
+
"success": false,
|
| 126 |
+
"steps": 4,
|
| 127 |
+
"first_reveal_step": 1,
|
| 128 |
+
"first_retrieve_step": null,
|
| 129 |
+
"episode_disturbance": 0.25
|
| 130 |
+
},
|
| 131 |
+
{
|
| 132 |
+
"episode_seed": 170124,
|
| 133 |
+
"success": false,
|
| 134 |
+
"steps": 4,
|
| 135 |
+
"first_reveal_step": 1,
|
| 136 |
+
"first_retrieve_step": null,
|
| 137 |
+
"episode_disturbance": 0.25
|
| 138 |
+
},
|
| 139 |
+
{
|
| 140 |
+
"episode_seed": 170125,
|
| 141 |
+
"success": false,
|
| 142 |
+
"steps": 4,
|
| 143 |
+
"first_reveal_step": 1,
|
| 144 |
+
"first_retrieve_step": null,
|
| 145 |
+
"episode_disturbance": 0.0
|
| 146 |
+
},
|
| 147 |
+
{
|
| 148 |
+
"episode_seed": 170129,
|
| 149 |
+
"success": false,
|
| 150 |
+
"steps": 4,
|
| 151 |
+
"first_reveal_step": 1,
|
| 152 |
+
"first_retrieve_step": null,
|
| 153 |
+
"episode_disturbance": 0.0
|
| 154 |
+
},
|
| 155 |
+
{
|
| 156 |
+
"episode_seed": 170131,
|
| 157 |
+
"success": false,
|
| 158 |
+
"steps": 4,
|
| 159 |
+
"first_reveal_step": 1,
|
| 160 |
+
"first_retrieve_step": null,
|
| 161 |
+
"episode_disturbance": 0.0
|
| 162 |
+
},
|
| 163 |
+
{
|
| 164 |
+
"episode_seed": 170137,
|
| 165 |
+
"success": false,
|
| 166 |
+
"steps": 4,
|
| 167 |
+
"first_reveal_step": 1,
|
| 168 |
+
"first_retrieve_step": null,
|
| 169 |
+
"episode_disturbance": 0.25
|
| 170 |
+
},
|
| 171 |
+
{
|
| 172 |
+
"episode_seed": 170138,
|
| 173 |
+
"success": false,
|
| 174 |
+
"steps": 4,
|
| 175 |
+
"first_reveal_step": 1,
|
| 176 |
+
"first_retrieve_step": null,
|
| 177 |
+
"episode_disturbance": 0.25
|
| 178 |
+
},
|
| 179 |
+
{
|
| 180 |
+
"episode_seed": 170139,
|
| 181 |
+
"success": false,
|
| 182 |
+
"steps": 4,
|
| 183 |
+
"first_reveal_step": 1,
|
| 184 |
+
"first_retrieve_step": null,
|
| 185 |
+
"episode_disturbance": 0.25
|
| 186 |
+
},
|
| 187 |
+
{
|
| 188 |
+
"episode_seed": 170140,
|
| 189 |
+
"success": false,
|
| 190 |
+
"steps": 4,
|
| 191 |
+
"first_reveal_step": 1,
|
| 192 |
+
"first_retrieve_step": null,
|
| 193 |
+
"episode_disturbance": 0.25
|
| 194 |
+
},
|
| 195 |
+
{
|
| 196 |
+
"episode_seed": 170145,
|
| 197 |
+
"success": false,
|
| 198 |
+
"steps": 4,
|
| 199 |
+
"first_reveal_step": 1,
|
| 200 |
+
"first_retrieve_step": null,
|
| 201 |
+
"episode_disturbance": 0.0
|
| 202 |
+
},
|
| 203 |
+
{
|
| 204 |
+
"episode_seed": 170150,
|
| 205 |
+
"success": false,
|
| 206 |
+
"steps": 4,
|
| 207 |
+
"first_reveal_step": 1,
|
| 208 |
+
"first_retrieve_step": null,
|
| 209 |
+
"episode_disturbance": 0.25
|
| 210 |
+
},
|
| 211 |
+
{
|
| 212 |
+
"episode_seed": 170151,
|
| 213 |
+
"success": false,
|
| 214 |
+
"steps": 4,
|
| 215 |
+
"first_reveal_step": 1,
|
| 216 |
+
"first_retrieve_step": null,
|
| 217 |
+
"episode_disturbance": 0.0
|
| 218 |
+
},
|
| 219 |
+
{
|
| 220 |
+
"episode_seed": 170153,
|
| 221 |
+
"success": false,
|
| 222 |
+
"steps": 4,
|
| 223 |
+
"first_reveal_step": 1,
|
| 224 |
+
"first_retrieve_step": null,
|
| 225 |
+
"episode_disturbance": 0.25
|
| 226 |
+
},
|
| 227 |
+
{
|
| 228 |
+
"episode_seed": 170154,
|
| 229 |
+
"success": false,
|
| 230 |
+
"steps": 4,
|
| 231 |
+
"first_reveal_step": 1,
|
| 232 |
+
"first_retrieve_step": null,
|
| 233 |
+
"episode_disturbance": 0.25
|
| 234 |
+
},
|
| 235 |
+
{
|
| 236 |
+
"episode_seed": 170155,
|
| 237 |
+
"success": false,
|
| 238 |
+
"steps": 4,
|
| 239 |
+
"first_reveal_step": 1,
|
| 240 |
+
"first_retrieve_step": null,
|
| 241 |
+
"episode_disturbance": 0.25
|
| 242 |
+
},
|
| 243 |
+
{
|
| 244 |
+
"episode_seed": 170166,
|
| 245 |
+
"success": false,
|
| 246 |
+
"steps": 4,
|
| 247 |
+
"first_reveal_step": 1,
|
| 248 |
+
"first_retrieve_step": null,
|
| 249 |
+
"episode_disturbance": 0.0
|
| 250 |
+
},
|
| 251 |
+
{
|
| 252 |
+
"episode_seed": 170171,
|
| 253 |
+
"success": false,
|
| 254 |
+
"steps": 4,
|
| 255 |
+
"first_reveal_step": 1,
|
| 256 |
+
"first_retrieve_step": null,
|
| 257 |
+
"episode_disturbance": 0.25
|
| 258 |
+
},
|
| 259 |
+
{
|
| 260 |
+
"episode_seed": 170173,
|
| 261 |
+
"success": false,
|
| 262 |
+
"steps": 4,
|
| 263 |
+
"first_reveal_step": 1,
|
| 264 |
+
"first_retrieve_step": null,
|
| 265 |
+
"episode_disturbance": 0.0
|
| 266 |
+
},
|
| 267 |
+
{
|
| 268 |
+
"episode_seed": 170175,
|
| 269 |
+
"success": false,
|
| 270 |
+
"steps": 4,
|
| 271 |
+
"first_reveal_step": 1,
|
| 272 |
+
"first_retrieve_step": null,
|
| 273 |
+
"episode_disturbance": 0.0
|
| 274 |
+
},
|
| 275 |
+
{
|
| 276 |
+
"episode_seed": 170177,
|
| 277 |
+
"success": false,
|
| 278 |
+
"steps": 4,
|
| 279 |
+
"first_reveal_step": 1,
|
| 280 |
+
"first_retrieve_step": null,
|
| 281 |
+
"episode_disturbance": 0.0
|
| 282 |
+
},
|
| 283 |
+
{
|
| 284 |
+
"episode_seed": 170180,
|
| 285 |
+
"success": false,
|
| 286 |
+
"steps": 4,
|
| 287 |
+
"first_reveal_step": 1,
|
| 288 |
+
"first_retrieve_step": null,
|
| 289 |
+
"episode_disturbance": 0.25
|
| 290 |
+
},
|
| 291 |
+
{
|
| 292 |
+
"episode_seed": 170181,
|
| 293 |
+
"success": false,
|
| 294 |
+
"steps": 4,
|
| 295 |
+
"first_reveal_step": 1,
|
| 296 |
+
"first_retrieve_step": null,
|
| 297 |
+
"episode_disturbance": 0.25
|
| 298 |
+
},
|
| 299 |
+
{
|
| 300 |
+
"episode_seed": 170184,
|
| 301 |
+
"success": true,
|
| 302 |
+
"steps": 2,
|
| 303 |
+
"first_reveal_step": 1,
|
| 304 |
+
"first_retrieve_step": null,
|
| 305 |
+
"episode_disturbance": 0.5
|
| 306 |
+
},
|
| 307 |
+
{
|
| 308 |
+
"episode_seed": 170185,
|
| 309 |
+
"success": false,
|
| 310 |
+
"steps": 4,
|
| 311 |
+
"first_reveal_step": 1,
|
| 312 |
+
"first_retrieve_step": null,
|
| 313 |
+
"episode_disturbance": 0.25
|
| 314 |
+
},
|
| 315 |
+
{
|
| 316 |
+
"episode_seed": 170186,
|
| 317 |
+
"success": false,
|
| 318 |
+
"steps": 4,
|
| 319 |
+
"first_reveal_step": 1,
|
| 320 |
+
"first_retrieve_step": null,
|
| 321 |
+
"episode_disturbance": 0.0
|
| 322 |
+
},
|
| 323 |
+
{
|
| 324 |
+
"episode_seed": 170198,
|
| 325 |
+
"success": false,
|
| 326 |
+
"steps": 4,
|
| 327 |
+
"first_reveal_step": 1,
|
| 328 |
+
"first_retrieve_step": null,
|
| 329 |
+
"episode_disturbance": 0.0
|
| 330 |
+
},
|
| 331 |
+
{
|
| 332 |
+
"episode_seed": 170200,
|
| 333 |
+
"success": false,
|
| 334 |
+
"steps": 4,
|
| 335 |
+
"first_reveal_step": 1,
|
| 336 |
+
"first_retrieve_step": null,
|
| 337 |
+
"episode_disturbance": 0.0
|
| 338 |
+
},
|
| 339 |
+
{
|
| 340 |
+
"episode_seed": 170205,
|
| 341 |
+
"success": false,
|
| 342 |
+
"steps": 4,
|
| 343 |
+
"first_reveal_step": 1,
|
| 344 |
+
"first_retrieve_step": null,
|
| 345 |
+
"episode_disturbance": 0.0
|
| 346 |
+
},
|
| 347 |
+
{
|
| 348 |
+
"episode_seed": 170207,
|
| 349 |
+
"success": false,
|
| 350 |
+
"steps": 4,
|
| 351 |
+
"first_reveal_step": 1,
|
| 352 |
+
"first_retrieve_step": null,
|
| 353 |
+
"episode_disturbance": 0.25
|
| 354 |
+
},
|
| 355 |
+
{
|
| 356 |
+
"episode_seed": 170208,
|
| 357 |
+
"success": false,
|
| 358 |
+
"steps": 4,
|
| 359 |
+
"first_reveal_step": 1,
|
| 360 |
+
"first_retrieve_step": null,
|
| 361 |
+
"episode_disturbance": 0.25
|
| 362 |
+
},
|
| 363 |
+
{
|
| 364 |
+
"episode_seed": 170212,
|
| 365 |
+
"success": false,
|
| 366 |
+
"steps": 4,
|
| 367 |
+
"first_reveal_step": 1,
|
| 368 |
+
"first_retrieve_step": null,
|
| 369 |
+
"episode_disturbance": 0.25
|
| 370 |
+
},
|
| 371 |
+
{
|
| 372 |
+
"episode_seed": 170214,
|
| 373 |
+
"success": false,
|
| 374 |
+
"steps": 4,
|
| 375 |
+
"first_reveal_step": 1,
|
| 376 |
+
"first_retrieve_step": null,
|
| 377 |
+
"episode_disturbance": 0.0
|
| 378 |
+
},
|
| 379 |
+
{
|
| 380 |
+
"episode_seed": 170217,
|
| 381 |
+
"success": false,
|
| 382 |
+
"steps": 4,
|
| 383 |
+
"first_reveal_step": 1,
|
| 384 |
+
"first_retrieve_step": null,
|
| 385 |
+
"episode_disturbance": 0.0
|
| 386 |
+
},
|
| 387 |
+
{
|
| 388 |
+
"episode_seed": 170223,
|
| 389 |
+
"success": false,
|
| 390 |
+
"steps": 4,
|
| 391 |
+
"first_reveal_step": 1,
|
| 392 |
+
"first_retrieve_step": null,
|
| 393 |
+
"episode_disturbance": 0.1429806500673294
|
| 394 |
+
},
|
| 395 |
+
{
|
| 396 |
+
"episode_seed": 170226,
|
| 397 |
+
"success": false,
|
| 398 |
+
"steps": 4,
|
| 399 |
+
"first_reveal_step": 1,
|
| 400 |
+
"first_retrieve_step": null,
|
| 401 |
+
"episode_disturbance": 0.25
|
| 402 |
+
},
|
| 403 |
+
{
|
| 404 |
+
"episode_seed": 170228,
|
| 405 |
+
"success": false,
|
| 406 |
+
"steps": 4,
|
| 407 |
+
"first_reveal_step": 1,
|
| 408 |
+
"first_retrieve_step": null,
|
| 409 |
+
"episode_disturbance": 0.0
|
| 410 |
+
},
|
| 411 |
+
{
|
| 412 |
+
"episode_seed": 170229,
|
| 413 |
+
"success": false,
|
| 414 |
+
"steps": 4,
|
| 415 |
+
"first_reveal_step": 1,
|
| 416 |
+
"first_retrieve_step": null,
|
| 417 |
+
"episode_disturbance": 0.0
|
| 418 |
+
},
|
| 419 |
+
{
|
| 420 |
+
"episode_seed": 170234,
|
| 421 |
+
"success": false,
|
| 422 |
+
"steps": 4,
|
| 423 |
+
"first_reveal_step": 1,
|
| 424 |
+
"first_retrieve_step": null,
|
| 425 |
+
"episode_disturbance": 0.0
|
| 426 |
+
},
|
| 427 |
+
{
|
| 428 |
+
"episode_seed": 170237,
|
| 429 |
+
"success": false,
|
| 430 |
+
"steps": 4,
|
| 431 |
+
"first_reveal_step": 1,
|
| 432 |
+
"first_retrieve_step": null,
|
| 433 |
+
"episode_disturbance": 0.0
|
| 434 |
+
},
|
| 435 |
+
{
|
| 436 |
+
"episode_seed": 170239,
|
| 437 |
+
"success": false,
|
| 438 |
+
"steps": 4,
|
| 439 |
+
"first_reveal_step": 1,
|
| 440 |
+
"first_retrieve_step": null,
|
| 441 |
+
"episode_disturbance": 0.25
|
| 442 |
+
},
|
| 443 |
+
{
|
| 444 |
+
"episode_seed": 170241,
|
| 445 |
+
"success": false,
|
| 446 |
+
"steps": 4,
|
| 447 |
+
"first_reveal_step": 1,
|
| 448 |
+
"first_retrieve_step": null,
|
| 449 |
+
"episode_disturbance": 0.0
|
| 450 |
+
},
|
| 451 |
+
{
|
| 452 |
+
"episode_seed": 170242,
|
| 453 |
+
"success": false,
|
| 454 |
+
"steps": 4,
|
| 455 |
+
"first_reveal_step": 1,
|
| 456 |
+
"first_retrieve_step": null,
|
| 457 |
+
"episode_disturbance": 0.0
|
| 458 |
+
},
|
| 459 |
+
{
|
| 460 |
+
"episode_seed": 170243,
|
| 461 |
+
"success": false,
|
| 462 |
+
"steps": 4,
|
| 463 |
+
"first_reveal_step": 1,
|
| 464 |
+
"first_retrieve_step": null,
|
| 465 |
+
"episode_disturbance": 0.25
|
| 466 |
+
}
|
| 467 |
+
],
|
| 468 |
+
"eval_protocol": {
|
| 469 |
+
"track_id": "cloth_track",
|
| 470 |
+
"suite": "maniskill3",
|
| 471 |
+
"benchmark_task": "PutSpoonUnderClothRetrievalProxy-v1",
|
| 472 |
+
"role": "target",
|
| 473 |
+
"eval_mode": "trunk_only_ft",
|
| 474 |
+
"seed": 17,
|
| 475 |
+
"episodes": 50,
|
| 476 |
+
"resolution": 224,
|
| 477 |
+
"cameras": [
|
| 478 |
+
"front",
|
| 479 |
+
"left",
|
| 480 |
+
"right"
|
| 481 |
+
],
|
| 482 |
+
"observation_stack": "rgb_triplicate_zero_depth",
|
| 483 |
+
"action_horizon": 8,
|
| 484 |
+
"action_space": "widowx_delta_pose",
|
| 485 |
+
"same_test_episodes": true
|
| 486 |
+
},
|
| 487 |
+
"proxy_notes": "Public ManiSkill bridge scene with custom retrieval initialization. The spoon is placed under the cloth region and must be revealed and extracted to the open side of the table.",
|
| 488 |
+
"train_spec": {
|
| 489 |
+
"track_id": "cloth_track",
|
| 490 |
+
"suite": "maniskill3",
|
| 491 |
+
"benchmark_task": "PutSpoonUnderClothRetrievalProxy-v1",
|
| 492 |
+
"model_variant": "trunk_only_ft",
|
| 493 |
+
"seed": 17,
|
| 494 |
+
"train_demos": 32,
|
| 495 |
+
"val_demos": 8,
|
| 496 |
+
"init_checkpoint_group": "/workspace/workspace/VLAarchtests2/VLAarchtests/artifacts/outputs/r3d_handoff_phase/proxy_interaction_r3d_stage3_clip_rgbd_handoff_compact_phase_seed17/checkpoint_best.pt",
|
| 497 |
+
"optimizer": "adamw",
|
| 498 |
+
"learning_rate": 0.0001,
|
| 499 |
+
"lr_schedule": "constant",
|
| 500 |
+
"batch_size": 4,
|
| 501 |
+
"augmentations": "none",
|
| 502 |
+
"early_stopping_metric": "val_total",
|
| 503 |
+
"max_gradient_steps": 174,
|
| 504 |
+
"unfreeze_scope": "fusion_memory_decoder",
|
| 505 |
+
"dataset_split_id": "cloth_bridge_smoke_v1_seed17",
|
| 506 |
+
"same_data_policy": true,
|
| 507 |
+
"same_init_policy": true
|
| 508 |
+
}
|
| 509 |
+
}
|
reports/maniskill_cloth_bridge_smoke_v1/trunk_only_ft_seed23.json
ADDED
|
@@ -0,0 +1,509 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
{
|
| 2 |
+
"track_id": "cloth_track",
|
| 3 |
+
"suite": "maniskill3",
|
| 4 |
+
"benchmark_task": "PutSpoonUnderClothRetrievalProxy-v1",
|
| 5 |
+
"role": "target",
|
| 6 |
+
"adapter_mode": "trunk_only_ft",
|
| 7 |
+
"episodes": 50,
|
| 8 |
+
"successes": [
|
| 9 |
+
0,
|
| 10 |
+
1,
|
| 11 |
+
0,
|
| 12 |
+
0,
|
| 13 |
+
0,
|
| 14 |
+
0,
|
| 15 |
+
0,
|
| 16 |
+
0,
|
| 17 |
+
0,
|
| 18 |
+
0,
|
| 19 |
+
0,
|
| 20 |
+
0,
|
| 21 |
+
0,
|
| 22 |
+
0,
|
| 23 |
+
0,
|
| 24 |
+
0,
|
| 25 |
+
0,
|
| 26 |
+
0,
|
| 27 |
+
0,
|
| 28 |
+
0,
|
| 29 |
+
0,
|
| 30 |
+
0,
|
| 31 |
+
0,
|
| 32 |
+
0,
|
| 33 |
+
0,
|
| 34 |
+
0,
|
| 35 |
+
0,
|
| 36 |
+
0,
|
| 37 |
+
0,
|
| 38 |
+
1,
|
| 39 |
+
0,
|
| 40 |
+
0,
|
| 41 |
+
0,
|
| 42 |
+
0,
|
| 43 |
+
0,
|
| 44 |
+
0,
|
| 45 |
+
0,
|
| 46 |
+
0,
|
| 47 |
+
0,
|
| 48 |
+
0,
|
| 49 |
+
0,
|
| 50 |
+
0,
|
| 51 |
+
0,
|
| 52 |
+
0,
|
| 53 |
+
0,
|
| 54 |
+
0,
|
| 55 |
+
0,
|
| 56 |
+
0,
|
| 57 |
+
0,
|
| 58 |
+
0
|
| 59 |
+
],
|
| 60 |
+
"success_rate": 0.04,
|
| 61 |
+
"intervention_rate": 0.0,
|
| 62 |
+
"non_base_selection_rate": 0.0,
|
| 63 |
+
"steps_to_first_reveal_or_access": 1.0,
|
| 64 |
+
"steps_to_retrieve": 4.0,
|
| 65 |
+
"disturbance_proxy": 0.1478596130013466,
|
| 66 |
+
"episode_records": [
|
| 67 |
+
{
|
| 68 |
+
"episode_seed": 170104,
|
| 69 |
+
"success": false,
|
| 70 |
+
"steps": 4,
|
| 71 |
+
"first_reveal_step": 1,
|
| 72 |
+
"first_retrieve_step": null,
|
| 73 |
+
"episode_disturbance": 0.0
|
| 74 |
+
},
|
| 75 |
+
{
|
| 76 |
+
"episode_seed": 170105,
|
| 77 |
+
"success": true,
|
| 78 |
+
"steps": 1,
|
| 79 |
+
"first_reveal_step": 1,
|
| 80 |
+
"first_retrieve_step": null,
|
| 81 |
+
"episode_disturbance": 1.0
|
| 82 |
+
},
|
| 83 |
+
{
|
| 84 |
+
"episode_seed": 170106,
|
| 85 |
+
"success": false,
|
| 86 |
+
"steps": 4,
|
| 87 |
+
"first_reveal_step": 1,
|
| 88 |
+
"first_retrieve_step": null,
|
| 89 |
+
"episode_disturbance": 0.25
|
| 90 |
+
},
|
| 91 |
+
{
|
| 92 |
+
"episode_seed": 170107,
|
| 93 |
+
"success": false,
|
| 94 |
+
"steps": 4,
|
| 95 |
+
"first_reveal_step": 1,
|
| 96 |
+
"first_retrieve_step": null,
|
| 97 |
+
"episode_disturbance": 0.0
|
| 98 |
+
},
|
| 99 |
+
{
|
| 100 |
+
"episode_seed": 170109,
|
| 101 |
+
"success": false,
|
| 102 |
+
"steps": 4,
|
| 103 |
+
"first_reveal_step": 1,
|
| 104 |
+
"first_retrieve_step": null,
|
| 105 |
+
"episode_disturbance": 0.25
|
| 106 |
+
},
|
| 107 |
+
{
|
| 108 |
+
"episode_seed": 170113,
|
| 109 |
+
"success": false,
|
| 110 |
+
"steps": 4,
|
| 111 |
+
"first_reveal_step": 1,
|
| 112 |
+
"first_retrieve_step": null,
|
| 113 |
+
"episode_disturbance": 0.0
|
| 114 |
+
},
|
| 115 |
+
{
|
| 116 |
+
"episode_seed": 170117,
|
| 117 |
+
"success": false,
|
| 118 |
+
"steps": 4,
|
| 119 |
+
"first_reveal_step": 1,
|
| 120 |
+
"first_retrieve_step": null,
|
| 121 |
+
"episode_disturbance": 0.25
|
| 122 |
+
},
|
| 123 |
+
{
|
| 124 |
+
"episode_seed": 170121,
|
| 125 |
+
"success": false,
|
| 126 |
+
"steps": 4,
|
| 127 |
+
"first_reveal_step": 1,
|
| 128 |
+
"first_retrieve_step": null,
|
| 129 |
+
"episode_disturbance": 0.25
|
| 130 |
+
},
|
| 131 |
+
{
|
| 132 |
+
"episode_seed": 170124,
|
| 133 |
+
"success": false,
|
| 134 |
+
"steps": 4,
|
| 135 |
+
"first_reveal_step": 1,
|
| 136 |
+
"first_retrieve_step": null,
|
| 137 |
+
"episode_disturbance": 0.25
|
| 138 |
+
},
|
| 139 |
+
{
|
| 140 |
+
"episode_seed": 170125,
|
| 141 |
+
"success": false,
|
| 142 |
+
"steps": 4,
|
| 143 |
+
"first_reveal_step": 1,
|
| 144 |
+
"first_retrieve_step": null,
|
| 145 |
+
"episode_disturbance": 0.0
|
| 146 |
+
},
|
| 147 |
+
{
|
| 148 |
+
"episode_seed": 170129,
|
| 149 |
+
"success": false,
|
| 150 |
+
"steps": 4,
|
| 151 |
+
"first_reveal_step": 1,
|
| 152 |
+
"first_retrieve_step": null,
|
| 153 |
+
"episode_disturbance": 0.0
|
| 154 |
+
},
|
| 155 |
+
{
|
| 156 |
+
"episode_seed": 170131,
|
| 157 |
+
"success": false,
|
| 158 |
+
"steps": 4,
|
| 159 |
+
"first_reveal_step": 1,
|
| 160 |
+
"first_retrieve_step": null,
|
| 161 |
+
"episode_disturbance": 0.0
|
| 162 |
+
},
|
| 163 |
+
{
|
| 164 |
+
"episode_seed": 170137,
|
| 165 |
+
"success": false,
|
| 166 |
+
"steps": 4,
|
| 167 |
+
"first_reveal_step": 1,
|
| 168 |
+
"first_retrieve_step": null,
|
| 169 |
+
"episode_disturbance": 0.25
|
| 170 |
+
},
|
| 171 |
+
{
|
| 172 |
+
"episode_seed": 170138,
|
| 173 |
+
"success": false,
|
| 174 |
+
"steps": 4,
|
| 175 |
+
"first_reveal_step": 1,
|
| 176 |
+
"first_retrieve_step": null,
|
| 177 |
+
"episode_disturbance": 0.25
|
| 178 |
+
},
|
| 179 |
+
{
|
| 180 |
+
"episode_seed": 170139,
|
| 181 |
+
"success": false,
|
| 182 |
+
"steps": 4,
|
| 183 |
+
"first_reveal_step": 1,
|
| 184 |
+
"first_retrieve_step": null,
|
| 185 |
+
"episode_disturbance": 0.25
|
| 186 |
+
},
|
| 187 |
+
{
|
| 188 |
+
"episode_seed": 170140,
|
| 189 |
+
"success": false,
|
| 190 |
+
"steps": 4,
|
| 191 |
+
"first_reveal_step": 1,
|
| 192 |
+
"first_retrieve_step": null,
|
| 193 |
+
"episode_disturbance": 0.25
|
| 194 |
+
},
|
| 195 |
+
{
|
| 196 |
+
"episode_seed": 170145,
|
| 197 |
+
"success": false,
|
| 198 |
+
"steps": 4,
|
| 199 |
+
"first_reveal_step": 1,
|
| 200 |
+
"first_retrieve_step": null,
|
| 201 |
+
"episode_disturbance": 0.0
|
| 202 |
+
},
|
| 203 |
+
{
|
| 204 |
+
"episode_seed": 170150,
|
| 205 |
+
"success": false,
|
| 206 |
+
"steps": 4,
|
| 207 |
+
"first_reveal_step": 1,
|
| 208 |
+
"first_retrieve_step": null,
|
| 209 |
+
"episode_disturbance": 0.25
|
| 210 |
+
},
|
| 211 |
+
{
|
| 212 |
+
"episode_seed": 170151,
|
| 213 |
+
"success": false,
|
| 214 |
+
"steps": 4,
|
| 215 |
+
"first_reveal_step": 1,
|
| 216 |
+
"first_retrieve_step": null,
|
| 217 |
+
"episode_disturbance": 0.0
|
| 218 |
+
},
|
| 219 |
+
{
|
| 220 |
+
"episode_seed": 170153,
|
| 221 |
+
"success": false,
|
| 222 |
+
"steps": 4,
|
| 223 |
+
"first_reveal_step": 1,
|
| 224 |
+
"first_retrieve_step": null,
|
| 225 |
+
"episode_disturbance": 0.25
|
| 226 |
+
},
|
| 227 |
+
{
|
| 228 |
+
"episode_seed": 170154,
|
| 229 |
+
"success": false,
|
| 230 |
+
"steps": 4,
|
| 231 |
+
"first_reveal_step": 1,
|
| 232 |
+
"first_retrieve_step": null,
|
| 233 |
+
"episode_disturbance": 0.25
|
| 234 |
+
},
|
| 235 |
+
{
|
| 236 |
+
"episode_seed": 170155,
|
| 237 |
+
"success": false,
|
| 238 |
+
"steps": 4,
|
| 239 |
+
"first_reveal_step": 1,
|
| 240 |
+
"first_retrieve_step": null,
|
| 241 |
+
"episode_disturbance": 0.25
|
| 242 |
+
},
|
| 243 |
+
{
|
| 244 |
+
"episode_seed": 170166,
|
| 245 |
+
"success": false,
|
| 246 |
+
"steps": 4,
|
| 247 |
+
"first_reveal_step": 1,
|
| 248 |
+
"first_retrieve_step": null,
|
| 249 |
+
"episode_disturbance": 0.0
|
| 250 |
+
},
|
| 251 |
+
{
|
| 252 |
+
"episode_seed": 170171,
|
| 253 |
+
"success": false,
|
| 254 |
+
"steps": 4,
|
| 255 |
+
"first_reveal_step": 1,
|
| 256 |
+
"first_retrieve_step": null,
|
| 257 |
+
"episode_disturbance": 0.25
|
| 258 |
+
},
|
| 259 |
+
{
|
| 260 |
+
"episode_seed": 170173,
|
| 261 |
+
"success": false,
|
| 262 |
+
"steps": 4,
|
| 263 |
+
"first_reveal_step": 1,
|
| 264 |
+
"first_retrieve_step": null,
|
| 265 |
+
"episode_disturbance": 0.0
|
| 266 |
+
},
|
| 267 |
+
{
|
| 268 |
+
"episode_seed": 170175,
|
| 269 |
+
"success": false,
|
| 270 |
+
"steps": 4,
|
| 271 |
+
"first_reveal_step": 1,
|
| 272 |
+
"first_retrieve_step": null,
|
| 273 |
+
"episode_disturbance": 0.0
|
| 274 |
+
},
|
| 275 |
+
{
|
| 276 |
+
"episode_seed": 170177,
|
| 277 |
+
"success": false,
|
| 278 |
+
"steps": 4,
|
| 279 |
+
"first_reveal_step": 1,
|
| 280 |
+
"first_retrieve_step": null,
|
| 281 |
+
"episode_disturbance": 0.0
|
| 282 |
+
},
|
| 283 |
+
{
|
| 284 |
+
"episode_seed": 170180,
|
| 285 |
+
"success": false,
|
| 286 |
+
"steps": 4,
|
| 287 |
+
"first_reveal_step": 1,
|
| 288 |
+
"first_retrieve_step": null,
|
| 289 |
+
"episode_disturbance": 0.25
|
| 290 |
+
},
|
| 291 |
+
{
|
| 292 |
+
"episode_seed": 170181,
|
| 293 |
+
"success": false,
|
| 294 |
+
"steps": 4,
|
| 295 |
+
"first_reveal_step": 1,
|
| 296 |
+
"first_retrieve_step": null,
|
| 297 |
+
"episode_disturbance": 0.25
|
| 298 |
+
},
|
| 299 |
+
{
|
| 300 |
+
"episode_seed": 170184,
|
| 301 |
+
"success": true,
|
| 302 |
+
"steps": 2,
|
| 303 |
+
"first_reveal_step": 1,
|
| 304 |
+
"first_retrieve_step": null,
|
| 305 |
+
"episode_disturbance": 0.5
|
| 306 |
+
},
|
| 307 |
+
{
|
| 308 |
+
"episode_seed": 170185,
|
| 309 |
+
"success": false,
|
| 310 |
+
"steps": 4,
|
| 311 |
+
"first_reveal_step": 1,
|
| 312 |
+
"first_retrieve_step": null,
|
| 313 |
+
"episode_disturbance": 0.25
|
| 314 |
+
},
|
| 315 |
+
{
|
| 316 |
+
"episode_seed": 170186,
|
| 317 |
+
"success": false,
|
| 318 |
+
"steps": 4,
|
| 319 |
+
"first_reveal_step": 1,
|
| 320 |
+
"first_retrieve_step": null,
|
| 321 |
+
"episode_disturbance": 0.0
|
| 322 |
+
},
|
| 323 |
+
{
|
| 324 |
+
"episode_seed": 170198,
|
| 325 |
+
"success": false,
|
| 326 |
+
"steps": 4,
|
| 327 |
+
"first_reveal_step": 1,
|
| 328 |
+
"first_retrieve_step": null,
|
| 329 |
+
"episode_disturbance": 0.0
|
| 330 |
+
},
|
| 331 |
+
{
|
| 332 |
+
"episode_seed": 170200,
|
| 333 |
+
"success": false,
|
| 334 |
+
"steps": 4,
|
| 335 |
+
"first_reveal_step": 1,
|
| 336 |
+
"first_retrieve_step": null,
|
| 337 |
+
"episode_disturbance": 0.0
|
| 338 |
+
},
|
| 339 |
+
{
|
| 340 |
+
"episode_seed": 170205,
|
| 341 |
+
"success": false,
|
| 342 |
+
"steps": 4,
|
| 343 |
+
"first_reveal_step": 1,
|
| 344 |
+
"first_retrieve_step": null,
|
| 345 |
+
"episode_disturbance": 0.0
|
| 346 |
+
},
|
| 347 |
+
{
|
| 348 |
+
"episode_seed": 170207,
|
| 349 |
+
"success": false,
|
| 350 |
+
"steps": 4,
|
| 351 |
+
"first_reveal_step": 1,
|
| 352 |
+
"first_retrieve_step": null,
|
| 353 |
+
"episode_disturbance": 0.25
|
| 354 |
+
},
|
| 355 |
+
{
|
| 356 |
+
"episode_seed": 170208,
|
| 357 |
+
"success": false,
|
| 358 |
+
"steps": 4,
|
| 359 |
+
"first_reveal_step": 1,
|
| 360 |
+
"first_retrieve_step": null,
|
| 361 |
+
"episode_disturbance": 0.25
|
| 362 |
+
},
|
| 363 |
+
{
|
| 364 |
+
"episode_seed": 170212,
|
| 365 |
+
"success": false,
|
| 366 |
+
"steps": 4,
|
| 367 |
+
"first_reveal_step": 1,
|
| 368 |
+
"first_retrieve_step": null,
|
| 369 |
+
"episode_disturbance": 0.25
|
| 370 |
+
},
|
| 371 |
+
{
|
| 372 |
+
"episode_seed": 170214,
|
| 373 |
+
"success": false,
|
| 374 |
+
"steps": 4,
|
| 375 |
+
"first_reveal_step": 1,
|
| 376 |
+
"first_retrieve_step": null,
|
| 377 |
+
"episode_disturbance": 0.0
|
| 378 |
+
},
|
| 379 |
+
{
|
| 380 |
+
"episode_seed": 170217,
|
| 381 |
+
"success": false,
|
| 382 |
+
"steps": 4,
|
| 383 |
+
"first_reveal_step": 1,
|
| 384 |
+
"first_retrieve_step": null,
|
| 385 |
+
"episode_disturbance": 0.0
|
| 386 |
+
},
|
| 387 |
+
{
|
| 388 |
+
"episode_seed": 170223,
|
| 389 |
+
"success": false,
|
| 390 |
+
"steps": 4,
|
| 391 |
+
"first_reveal_step": 1,
|
| 392 |
+
"first_retrieve_step": null,
|
| 393 |
+
"episode_disturbance": 0.1429806500673294
|
| 394 |
+
},
|
| 395 |
+
{
|
| 396 |
+
"episode_seed": 170226,
|
| 397 |
+
"success": false,
|
| 398 |
+
"steps": 4,
|
| 399 |
+
"first_reveal_step": 1,
|
| 400 |
+
"first_retrieve_step": null,
|
| 401 |
+
"episode_disturbance": 0.25
|
| 402 |
+
},
|
| 403 |
+
{
|
| 404 |
+
"episode_seed": 170228,
|
| 405 |
+
"success": false,
|
| 406 |
+
"steps": 4,
|
| 407 |
+
"first_reveal_step": 1,
|
| 408 |
+
"first_retrieve_step": null,
|
| 409 |
+
"episode_disturbance": 0.0
|
| 410 |
+
},
|
| 411 |
+
{
|
| 412 |
+
"episode_seed": 170229,
|
| 413 |
+
"success": false,
|
| 414 |
+
"steps": 4,
|
| 415 |
+
"first_reveal_step": 1,
|
| 416 |
+
"first_retrieve_step": null,
|
| 417 |
+
"episode_disturbance": 0.0
|
| 418 |
+
},
|
| 419 |
+
{
|
| 420 |
+
"episode_seed": 170234,
|
| 421 |
+
"success": false,
|
| 422 |
+
"steps": 4,
|
| 423 |
+
"first_reveal_step": 1,
|
| 424 |
+
"first_retrieve_step": null,
|
| 425 |
+
"episode_disturbance": 0.0
|
| 426 |
+
},
|
| 427 |
+
{
|
| 428 |
+
"episode_seed": 170237,
|
| 429 |
+
"success": false,
|
| 430 |
+
"steps": 4,
|
| 431 |
+
"first_reveal_step": 1,
|
| 432 |
+
"first_retrieve_step": null,
|
| 433 |
+
"episode_disturbance": 0.0
|
| 434 |
+
},
|
| 435 |
+
{
|
| 436 |
+
"episode_seed": 170239,
|
| 437 |
+
"success": false,
|
| 438 |
+
"steps": 4,
|
| 439 |
+
"first_reveal_step": 1,
|
| 440 |
+
"first_retrieve_step": null,
|
| 441 |
+
"episode_disturbance": 0.25
|
| 442 |
+
},
|
| 443 |
+
{
|
| 444 |
+
"episode_seed": 170241,
|
| 445 |
+
"success": false,
|
| 446 |
+
"steps": 4,
|
| 447 |
+
"first_reveal_step": 1,
|
| 448 |
+
"first_retrieve_step": null,
|
| 449 |
+
"episode_disturbance": 0.0
|
| 450 |
+
},
|
| 451 |
+
{
|
| 452 |
+
"episode_seed": 170242,
|
| 453 |
+
"success": false,
|
| 454 |
+
"steps": 4,
|
| 455 |
+
"first_reveal_step": 1,
|
| 456 |
+
"first_retrieve_step": null,
|
| 457 |
+
"episode_disturbance": 0.0
|
| 458 |
+
},
|
| 459 |
+
{
|
| 460 |
+
"episode_seed": 170243,
|
| 461 |
+
"success": false,
|
| 462 |
+
"steps": 4,
|
| 463 |
+
"first_reveal_step": 1,
|
| 464 |
+
"first_retrieve_step": null,
|
| 465 |
+
"episode_disturbance": 0.25
|
| 466 |
+
}
|
| 467 |
+
],
|
| 468 |
+
"eval_protocol": {
|
| 469 |
+
"track_id": "cloth_track",
|
| 470 |
+
"suite": "maniskill3",
|
| 471 |
+
"benchmark_task": "PutSpoonUnderClothRetrievalProxy-v1",
|
| 472 |
+
"role": "target",
|
| 473 |
+
"eval_mode": "trunk_only_ft",
|
| 474 |
+
"seed": 17,
|
| 475 |
+
"episodes": 50,
|
| 476 |
+
"resolution": 224,
|
| 477 |
+
"cameras": [
|
| 478 |
+
"front",
|
| 479 |
+
"left",
|
| 480 |
+
"right"
|
| 481 |
+
],
|
| 482 |
+
"observation_stack": "rgb_triplicate_zero_depth",
|
| 483 |
+
"action_horizon": 8,
|
| 484 |
+
"action_space": "widowx_delta_pose",
|
| 485 |
+
"same_test_episodes": true
|
| 486 |
+
},
|
| 487 |
+
"proxy_notes": "Public ManiSkill bridge scene with custom retrieval initialization. The spoon is placed under the cloth region and must be revealed and extracted to the open side of the table.",
|
| 488 |
+
"train_spec": {
|
| 489 |
+
"track_id": "cloth_track",
|
| 490 |
+
"suite": "maniskill3",
|
| 491 |
+
"benchmark_task": "PutSpoonUnderClothRetrievalProxy-v1",
|
| 492 |
+
"model_variant": "trunk_only_ft",
|
| 493 |
+
"seed": 23,
|
| 494 |
+
"train_demos": 32,
|
| 495 |
+
"val_demos": 8,
|
| 496 |
+
"init_checkpoint_group": "/workspace/workspace/VLAarchtests2/VLAarchtests/artifacts/outputs/r3d_handoff_phase/proxy_interaction_r3d_stage3_clip_rgbd_handoff_compact_phase_seed17/checkpoint_best.pt",
|
| 497 |
+
"optimizer": "adamw",
|
| 498 |
+
"learning_rate": 0.0001,
|
| 499 |
+
"lr_schedule": "constant",
|
| 500 |
+
"batch_size": 4,
|
| 501 |
+
"augmentations": "none",
|
| 502 |
+
"early_stopping_metric": "val_total",
|
| 503 |
+
"max_gradient_steps": 174,
|
| 504 |
+
"unfreeze_scope": "fusion_memory_decoder",
|
| 505 |
+
"dataset_split_id": "cloth_bridge_smoke_v1_seed17",
|
| 506 |
+
"same_data_policy": true,
|
| 507 |
+
"same_init_policy": true
|
| 508 |
+
}
|
| 509 |
+
}
|
reports/maniskill_cloth_bridge_smoke_v1/trunk_only_ft_seed29.json
ADDED
|
@@ -0,0 +1,509 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
{
|
| 2 |
+
"track_id": "cloth_track",
|
| 3 |
+
"suite": "maniskill3",
|
| 4 |
+
"benchmark_task": "PutSpoonUnderClothRetrievalProxy-v1",
|
| 5 |
+
"role": "target",
|
| 6 |
+
"adapter_mode": "trunk_only_ft",
|
| 7 |
+
"episodes": 50,
|
| 8 |
+
"successes": [
|
| 9 |
+
0,
|
| 10 |
+
1,
|
| 11 |
+
0,
|
| 12 |
+
0,
|
| 13 |
+
0,
|
| 14 |
+
0,
|
| 15 |
+
0,
|
| 16 |
+
0,
|
| 17 |
+
0,
|
| 18 |
+
0,
|
| 19 |
+
0,
|
| 20 |
+
0,
|
| 21 |
+
0,
|
| 22 |
+
0,
|
| 23 |
+
0,
|
| 24 |
+
0,
|
| 25 |
+
0,
|
| 26 |
+
0,
|
| 27 |
+
0,
|
| 28 |
+
0,
|
| 29 |
+
0,
|
| 30 |
+
0,
|
| 31 |
+
0,
|
| 32 |
+
0,
|
| 33 |
+
0,
|
| 34 |
+
0,
|
| 35 |
+
0,
|
| 36 |
+
0,
|
| 37 |
+
0,
|
| 38 |
+
1,
|
| 39 |
+
0,
|
| 40 |
+
0,
|
| 41 |
+
0,
|
| 42 |
+
0,
|
| 43 |
+
0,
|
| 44 |
+
0,
|
| 45 |
+
0,
|
| 46 |
+
0,
|
| 47 |
+
0,
|
| 48 |
+
0,
|
| 49 |
+
0,
|
| 50 |
+
0,
|
| 51 |
+
0,
|
| 52 |
+
0,
|
| 53 |
+
0,
|
| 54 |
+
0,
|
| 55 |
+
0,
|
| 56 |
+
0,
|
| 57 |
+
0,
|
| 58 |
+
0
|
| 59 |
+
],
|
| 60 |
+
"success_rate": 0.04,
|
| 61 |
+
"intervention_rate": 0.0,
|
| 62 |
+
"non_base_selection_rate": 0.0,
|
| 63 |
+
"steps_to_first_reveal_or_access": 1.0,
|
| 64 |
+
"steps_to_retrieve": 4.0,
|
| 65 |
+
"disturbance_proxy": 0.1478596130013466,
|
| 66 |
+
"episode_records": [
|
| 67 |
+
{
|
| 68 |
+
"episode_seed": 170104,
|
| 69 |
+
"success": false,
|
| 70 |
+
"steps": 4,
|
| 71 |
+
"first_reveal_step": 1,
|
| 72 |
+
"first_retrieve_step": null,
|
| 73 |
+
"episode_disturbance": 0.0
|
| 74 |
+
},
|
| 75 |
+
{
|
| 76 |
+
"episode_seed": 170105,
|
| 77 |
+
"success": true,
|
| 78 |
+
"steps": 1,
|
| 79 |
+
"first_reveal_step": 1,
|
| 80 |
+
"first_retrieve_step": null,
|
| 81 |
+
"episode_disturbance": 1.0
|
| 82 |
+
},
|
| 83 |
+
{
|
| 84 |
+
"episode_seed": 170106,
|
| 85 |
+
"success": false,
|
| 86 |
+
"steps": 4,
|
| 87 |
+
"first_reveal_step": 1,
|
| 88 |
+
"first_retrieve_step": null,
|
| 89 |
+
"episode_disturbance": 0.25
|
| 90 |
+
},
|
| 91 |
+
{
|
| 92 |
+
"episode_seed": 170107,
|
| 93 |
+
"success": false,
|
| 94 |
+
"steps": 4,
|
| 95 |
+
"first_reveal_step": 1,
|
| 96 |
+
"first_retrieve_step": null,
|
| 97 |
+
"episode_disturbance": 0.0
|
| 98 |
+
},
|
| 99 |
+
{
|
| 100 |
+
"episode_seed": 170109,
|
| 101 |
+
"success": false,
|
| 102 |
+
"steps": 4,
|
| 103 |
+
"first_reveal_step": 1,
|
| 104 |
+
"first_retrieve_step": null,
|
| 105 |
+
"episode_disturbance": 0.25
|
| 106 |
+
},
|
| 107 |
+
{
|
| 108 |
+
"episode_seed": 170113,
|
| 109 |
+
"success": false,
|
| 110 |
+
"steps": 4,
|
| 111 |
+
"first_reveal_step": 1,
|
| 112 |
+
"first_retrieve_step": null,
|
| 113 |
+
"episode_disturbance": 0.0
|
| 114 |
+
},
|
| 115 |
+
{
|
| 116 |
+
"episode_seed": 170117,
|
| 117 |
+
"success": false,
|
| 118 |
+
"steps": 4,
|
| 119 |
+
"first_reveal_step": 1,
|
| 120 |
+
"first_retrieve_step": null,
|
| 121 |
+
"episode_disturbance": 0.25
|
| 122 |
+
},
|
| 123 |
+
{
|
| 124 |
+
"episode_seed": 170121,
|
| 125 |
+
"success": false,
|
| 126 |
+
"steps": 4,
|
| 127 |
+
"first_reveal_step": 1,
|
| 128 |
+
"first_retrieve_step": null,
|
| 129 |
+
"episode_disturbance": 0.25
|
| 130 |
+
},
|
| 131 |
+
{
|
| 132 |
+
"episode_seed": 170124,
|
| 133 |
+
"success": false,
|
| 134 |
+
"steps": 4,
|
| 135 |
+
"first_reveal_step": 1,
|
| 136 |
+
"first_retrieve_step": null,
|
| 137 |
+
"episode_disturbance": 0.25
|
| 138 |
+
},
|
| 139 |
+
{
|
| 140 |
+
"episode_seed": 170125,
|
| 141 |
+
"success": false,
|
| 142 |
+
"steps": 4,
|
| 143 |
+
"first_reveal_step": 1,
|
| 144 |
+
"first_retrieve_step": null,
|
| 145 |
+
"episode_disturbance": 0.0
|
| 146 |
+
},
|
| 147 |
+
{
|
| 148 |
+
"episode_seed": 170129,
|
| 149 |
+
"success": false,
|
| 150 |
+
"steps": 4,
|
| 151 |
+
"first_reveal_step": 1,
|
| 152 |
+
"first_retrieve_step": null,
|
| 153 |
+
"episode_disturbance": 0.0
|
| 154 |
+
},
|
| 155 |
+
{
|
| 156 |
+
"episode_seed": 170131,
|
| 157 |
+
"success": false,
|
| 158 |
+
"steps": 4,
|
| 159 |
+
"first_reveal_step": 1,
|
| 160 |
+
"first_retrieve_step": null,
|
| 161 |
+
"episode_disturbance": 0.0
|
| 162 |
+
},
|
| 163 |
+
{
|
| 164 |
+
"episode_seed": 170137,
|
| 165 |
+
"success": false,
|
| 166 |
+
"steps": 4,
|
| 167 |
+
"first_reveal_step": 1,
|
| 168 |
+
"first_retrieve_step": null,
|
| 169 |
+
"episode_disturbance": 0.25
|
| 170 |
+
},
|
| 171 |
+
{
|
| 172 |
+
"episode_seed": 170138,
|
| 173 |
+
"success": false,
|
| 174 |
+
"steps": 4,
|
| 175 |
+
"first_reveal_step": 1,
|
| 176 |
+
"first_retrieve_step": null,
|
| 177 |
+
"episode_disturbance": 0.25
|
| 178 |
+
},
|
| 179 |
+
{
|
| 180 |
+
"episode_seed": 170139,
|
| 181 |
+
"success": false,
|
| 182 |
+
"steps": 4,
|
| 183 |
+
"first_reveal_step": 1,
|
| 184 |
+
"first_retrieve_step": null,
|
| 185 |
+
"episode_disturbance": 0.25
|
| 186 |
+
},
|
| 187 |
+
{
|
| 188 |
+
"episode_seed": 170140,
|
| 189 |
+
"success": false,
|
| 190 |
+
"steps": 4,
|
| 191 |
+
"first_reveal_step": 1,
|
| 192 |
+
"first_retrieve_step": null,
|
| 193 |
+
"episode_disturbance": 0.25
|
| 194 |
+
},
|
| 195 |
+
{
|
| 196 |
+
"episode_seed": 170145,
|
| 197 |
+
"success": false,
|
| 198 |
+
"steps": 4,
|
| 199 |
+
"first_reveal_step": 1,
|
| 200 |
+
"first_retrieve_step": null,
|
| 201 |
+
"episode_disturbance": 0.0
|
| 202 |
+
},
|
| 203 |
+
{
|
| 204 |
+
"episode_seed": 170150,
|
| 205 |
+
"success": false,
|
| 206 |
+
"steps": 4,
|
| 207 |
+
"first_reveal_step": 1,
|
| 208 |
+
"first_retrieve_step": null,
|
| 209 |
+
"episode_disturbance": 0.25
|
| 210 |
+
},
|
| 211 |
+
{
|
| 212 |
+
"episode_seed": 170151,
|
| 213 |
+
"success": false,
|
| 214 |
+
"steps": 4,
|
| 215 |
+
"first_reveal_step": 1,
|
| 216 |
+
"first_retrieve_step": null,
|
| 217 |
+
"episode_disturbance": 0.0
|
| 218 |
+
},
|
| 219 |
+
{
|
| 220 |
+
"episode_seed": 170153,
|
| 221 |
+
"success": false,
|
| 222 |
+
"steps": 4,
|
| 223 |
+
"first_reveal_step": 1,
|
| 224 |
+
"first_retrieve_step": null,
|
| 225 |
+
"episode_disturbance": 0.25
|
| 226 |
+
},
|
| 227 |
+
{
|
| 228 |
+
"episode_seed": 170154,
|
| 229 |
+
"success": false,
|
| 230 |
+
"steps": 4,
|
| 231 |
+
"first_reveal_step": 1,
|
| 232 |
+
"first_retrieve_step": null,
|
| 233 |
+
"episode_disturbance": 0.25
|
| 234 |
+
},
|
| 235 |
+
{
|
| 236 |
+
"episode_seed": 170155,
|
| 237 |
+
"success": false,
|
| 238 |
+
"steps": 4,
|
| 239 |
+
"first_reveal_step": 1,
|
| 240 |
+
"first_retrieve_step": null,
|
| 241 |
+
"episode_disturbance": 0.25
|
| 242 |
+
},
|
| 243 |
+
{
|
| 244 |
+
"episode_seed": 170166,
|
| 245 |
+
"success": false,
|
| 246 |
+
"steps": 4,
|
| 247 |
+
"first_reveal_step": 1,
|
| 248 |
+
"first_retrieve_step": null,
|
| 249 |
+
"episode_disturbance": 0.0
|
| 250 |
+
},
|
| 251 |
+
{
|
| 252 |
+
"episode_seed": 170171,
|
| 253 |
+
"success": false,
|
| 254 |
+
"steps": 4,
|
| 255 |
+
"first_reveal_step": 1,
|
| 256 |
+
"first_retrieve_step": null,
|
| 257 |
+
"episode_disturbance": 0.25
|
| 258 |
+
},
|
| 259 |
+
{
|
| 260 |
+
"episode_seed": 170173,
|
| 261 |
+
"success": false,
|
| 262 |
+
"steps": 4,
|
| 263 |
+
"first_reveal_step": 1,
|
| 264 |
+
"first_retrieve_step": null,
|
| 265 |
+
"episode_disturbance": 0.0
|
| 266 |
+
},
|
| 267 |
+
{
|
| 268 |
+
"episode_seed": 170175,
|
| 269 |
+
"success": false,
|
| 270 |
+
"steps": 4,
|
| 271 |
+
"first_reveal_step": 1,
|
| 272 |
+
"first_retrieve_step": null,
|
| 273 |
+
"episode_disturbance": 0.0
|
| 274 |
+
},
|
| 275 |
+
{
|
| 276 |
+
"episode_seed": 170177,
|
| 277 |
+
"success": false,
|
| 278 |
+
"steps": 4,
|
| 279 |
+
"first_reveal_step": 1,
|
| 280 |
+
"first_retrieve_step": null,
|
| 281 |
+
"episode_disturbance": 0.0
|
| 282 |
+
},
|
| 283 |
+
{
|
| 284 |
+
"episode_seed": 170180,
|
| 285 |
+
"success": false,
|
| 286 |
+
"steps": 4,
|
| 287 |
+
"first_reveal_step": 1,
|
| 288 |
+
"first_retrieve_step": null,
|
| 289 |
+
"episode_disturbance": 0.25
|
| 290 |
+
},
|
| 291 |
+
{
|
| 292 |
+
"episode_seed": 170181,
|
| 293 |
+
"success": false,
|
| 294 |
+
"steps": 4,
|
| 295 |
+
"first_reveal_step": 1,
|
| 296 |
+
"first_retrieve_step": null,
|
| 297 |
+
"episode_disturbance": 0.25
|
| 298 |
+
},
|
| 299 |
+
{
|
| 300 |
+
"episode_seed": 170184,
|
| 301 |
+
"success": true,
|
| 302 |
+
"steps": 2,
|
| 303 |
+
"first_reveal_step": 1,
|
| 304 |
+
"first_retrieve_step": null,
|
| 305 |
+
"episode_disturbance": 0.5
|
| 306 |
+
},
|
| 307 |
+
{
|
| 308 |
+
"episode_seed": 170185,
|
| 309 |
+
"success": false,
|
| 310 |
+
"steps": 4,
|
| 311 |
+
"first_reveal_step": 1,
|
| 312 |
+
"first_retrieve_step": null,
|
| 313 |
+
"episode_disturbance": 0.25
|
| 314 |
+
},
|
| 315 |
+
{
|
| 316 |
+
"episode_seed": 170186,
|
| 317 |
+
"success": false,
|
| 318 |
+
"steps": 4,
|
| 319 |
+
"first_reveal_step": 1,
|
| 320 |
+
"first_retrieve_step": null,
|
| 321 |
+
"episode_disturbance": 0.0
|
| 322 |
+
},
|
| 323 |
+
{
|
| 324 |
+
"episode_seed": 170198,
|
| 325 |
+
"success": false,
|
| 326 |
+
"steps": 4,
|
| 327 |
+
"first_reveal_step": 1,
|
| 328 |
+
"first_retrieve_step": null,
|
| 329 |
+
"episode_disturbance": 0.0
|
| 330 |
+
},
|
| 331 |
+
{
|
| 332 |
+
"episode_seed": 170200,
|
| 333 |
+
"success": false,
|
| 334 |
+
"steps": 4,
|
| 335 |
+
"first_reveal_step": 1,
|
| 336 |
+
"first_retrieve_step": null,
|
| 337 |
+
"episode_disturbance": 0.0
|
| 338 |
+
},
|
| 339 |
+
{
|
| 340 |
+
"episode_seed": 170205,
|
| 341 |
+
"success": false,
|
| 342 |
+
"steps": 4,
|
| 343 |
+
"first_reveal_step": 1,
|
| 344 |
+
"first_retrieve_step": null,
|
| 345 |
+
"episode_disturbance": 0.0
|
| 346 |
+
},
|
| 347 |
+
{
|
| 348 |
+
"episode_seed": 170207,
|
| 349 |
+
"success": false,
|
| 350 |
+
"steps": 4,
|
| 351 |
+
"first_reveal_step": 1,
|
| 352 |
+
"first_retrieve_step": null,
|
| 353 |
+
"episode_disturbance": 0.25
|
| 354 |
+
},
|
| 355 |
+
{
|
| 356 |
+
"episode_seed": 170208,
|
| 357 |
+
"success": false,
|
| 358 |
+
"steps": 4,
|
| 359 |
+
"first_reveal_step": 1,
|
| 360 |
+
"first_retrieve_step": null,
|
| 361 |
+
"episode_disturbance": 0.25
|
| 362 |
+
},
|
| 363 |
+
{
|
| 364 |
+
"episode_seed": 170212,
|
| 365 |
+
"success": false,
|
| 366 |
+
"steps": 4,
|
| 367 |
+
"first_reveal_step": 1,
|
| 368 |
+
"first_retrieve_step": null,
|
| 369 |
+
"episode_disturbance": 0.25
|
| 370 |
+
},
|
| 371 |
+
{
|
| 372 |
+
"episode_seed": 170214,
|
| 373 |
+
"success": false,
|
| 374 |
+
"steps": 4,
|
| 375 |
+
"first_reveal_step": 1,
|
| 376 |
+
"first_retrieve_step": null,
|
| 377 |
+
"episode_disturbance": 0.0
|
| 378 |
+
},
|
| 379 |
+
{
|
| 380 |
+
"episode_seed": 170217,
|
| 381 |
+
"success": false,
|
| 382 |
+
"steps": 4,
|
| 383 |
+
"first_reveal_step": 1,
|
| 384 |
+
"first_retrieve_step": null,
|
| 385 |
+
"episode_disturbance": 0.0
|
| 386 |
+
},
|
| 387 |
+
{
|
| 388 |
+
"episode_seed": 170223,
|
| 389 |
+
"success": false,
|
| 390 |
+
"steps": 4,
|
| 391 |
+
"first_reveal_step": 1,
|
| 392 |
+
"first_retrieve_step": null,
|
| 393 |
+
"episode_disturbance": 0.1429806500673294
|
| 394 |
+
},
|
| 395 |
+
{
|
| 396 |
+
"episode_seed": 170226,
|
| 397 |
+
"success": false,
|
| 398 |
+
"steps": 4,
|
| 399 |
+
"first_reveal_step": 1,
|
| 400 |
+
"first_retrieve_step": null,
|
| 401 |
+
"episode_disturbance": 0.25
|
| 402 |
+
},
|
| 403 |
+
{
|
| 404 |
+
"episode_seed": 170228,
|
| 405 |
+
"success": false,
|
| 406 |
+
"steps": 4,
|
| 407 |
+
"first_reveal_step": 1,
|
| 408 |
+
"first_retrieve_step": null,
|
| 409 |
+
"episode_disturbance": 0.0
|
| 410 |
+
},
|
| 411 |
+
{
|
| 412 |
+
"episode_seed": 170229,
|
| 413 |
+
"success": false,
|
| 414 |
+
"steps": 4,
|
| 415 |
+
"first_reveal_step": 1,
|
| 416 |
+
"first_retrieve_step": null,
|
| 417 |
+
"episode_disturbance": 0.0
|
| 418 |
+
},
|
| 419 |
+
{
|
| 420 |
+
"episode_seed": 170234,
|
| 421 |
+
"success": false,
|
| 422 |
+
"steps": 4,
|
| 423 |
+
"first_reveal_step": 1,
|
| 424 |
+
"first_retrieve_step": null,
|
| 425 |
+
"episode_disturbance": 0.0
|
| 426 |
+
},
|
| 427 |
+
{
|
| 428 |
+
"episode_seed": 170237,
|
| 429 |
+
"success": false,
|
| 430 |
+
"steps": 4,
|
| 431 |
+
"first_reveal_step": 1,
|
| 432 |
+
"first_retrieve_step": null,
|
| 433 |
+
"episode_disturbance": 0.0
|
| 434 |
+
},
|
| 435 |
+
{
|
| 436 |
+
"episode_seed": 170239,
|
| 437 |
+
"success": false,
|
| 438 |
+
"steps": 4,
|
| 439 |
+
"first_reveal_step": 1,
|
| 440 |
+
"first_retrieve_step": null,
|
| 441 |
+
"episode_disturbance": 0.25
|
| 442 |
+
},
|
| 443 |
+
{
|
| 444 |
+
"episode_seed": 170241,
|
| 445 |
+
"success": false,
|
| 446 |
+
"steps": 4,
|
| 447 |
+
"first_reveal_step": 1,
|
| 448 |
+
"first_retrieve_step": null,
|
| 449 |
+
"episode_disturbance": 0.0
|
| 450 |
+
},
|
| 451 |
+
{
|
| 452 |
+
"episode_seed": 170242,
|
| 453 |
+
"success": false,
|
| 454 |
+
"steps": 4,
|
| 455 |
+
"first_reveal_step": 1,
|
| 456 |
+
"first_retrieve_step": null,
|
| 457 |
+
"episode_disturbance": 0.0
|
| 458 |
+
},
|
| 459 |
+
{
|
| 460 |
+
"episode_seed": 170243,
|
| 461 |
+
"success": false,
|
| 462 |
+
"steps": 4,
|
| 463 |
+
"first_reveal_step": 1,
|
| 464 |
+
"first_retrieve_step": null,
|
| 465 |
+
"episode_disturbance": 0.25
|
| 466 |
+
}
|
| 467 |
+
],
|
| 468 |
+
"eval_protocol": {
|
| 469 |
+
"track_id": "cloth_track",
|
| 470 |
+
"suite": "maniskill3",
|
| 471 |
+
"benchmark_task": "PutSpoonUnderClothRetrievalProxy-v1",
|
| 472 |
+
"role": "target",
|
| 473 |
+
"eval_mode": "trunk_only_ft",
|
| 474 |
+
"seed": 17,
|
| 475 |
+
"episodes": 50,
|
| 476 |
+
"resolution": 224,
|
| 477 |
+
"cameras": [
|
| 478 |
+
"front",
|
| 479 |
+
"left",
|
| 480 |
+
"right"
|
| 481 |
+
],
|
| 482 |
+
"observation_stack": "rgb_triplicate_zero_depth",
|
| 483 |
+
"action_horizon": 8,
|
| 484 |
+
"action_space": "widowx_delta_pose",
|
| 485 |
+
"same_test_episodes": true
|
| 486 |
+
},
|
| 487 |
+
"proxy_notes": "Public ManiSkill bridge scene with custom retrieval initialization. The spoon is placed under the cloth region and must be revealed and extracted to the open side of the table.",
|
| 488 |
+
"train_spec": {
|
| 489 |
+
"track_id": "cloth_track",
|
| 490 |
+
"suite": "maniskill3",
|
| 491 |
+
"benchmark_task": "PutSpoonUnderClothRetrievalProxy-v1",
|
| 492 |
+
"model_variant": "trunk_only_ft",
|
| 493 |
+
"seed": 29,
|
| 494 |
+
"train_demos": 32,
|
| 495 |
+
"val_demos": 8,
|
| 496 |
+
"init_checkpoint_group": "/workspace/workspace/VLAarchtests2/VLAarchtests/artifacts/outputs/r3d_handoff_phase/proxy_interaction_r3d_stage3_clip_rgbd_handoff_compact_phase_seed17/checkpoint_best.pt",
|
| 497 |
+
"optimizer": "adamw",
|
| 498 |
+
"learning_rate": 0.0001,
|
| 499 |
+
"lr_schedule": "constant",
|
| 500 |
+
"batch_size": 4,
|
| 501 |
+
"augmentations": "none",
|
| 502 |
+
"early_stopping_metric": "val_total",
|
| 503 |
+
"max_gradient_steps": 174,
|
| 504 |
+
"unfreeze_scope": "fusion_memory_decoder",
|
| 505 |
+
"dataset_split_id": "cloth_bridge_smoke_v1_seed17",
|
| 506 |
+
"same_data_policy": true,
|
| 507 |
+
"same_init_policy": true
|
| 508 |
+
}
|
| 509 |
+
}
|
reports/maniskill_pickclutter_smoke_v2/adapter_active_ft_seed17.json
ADDED
|
@@ -0,0 +1,508 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
{
|
| 2 |
+
"track_id": "occlusion_track",
|
| 3 |
+
"suite": "maniskill3",
|
| 4 |
+
"benchmark_task": "PickClutterYCB-v1",
|
| 5 |
+
"role": "target",
|
| 6 |
+
"adapter_mode": "adapter_active_ft",
|
| 7 |
+
"episodes": 50,
|
| 8 |
+
"successes": [
|
| 9 |
+
0,
|
| 10 |
+
0,
|
| 11 |
+
1,
|
| 12 |
+
0,
|
| 13 |
+
0,
|
| 14 |
+
0,
|
| 15 |
+
0,
|
| 16 |
+
0,
|
| 17 |
+
0,
|
| 18 |
+
0,
|
| 19 |
+
0,
|
| 20 |
+
1,
|
| 21 |
+
0,
|
| 22 |
+
0,
|
| 23 |
+
0,
|
| 24 |
+
0,
|
| 25 |
+
1,
|
| 26 |
+
0,
|
| 27 |
+
1,
|
| 28 |
+
0,
|
| 29 |
+
1,
|
| 30 |
+
0,
|
| 31 |
+
0,
|
| 32 |
+
0,
|
| 33 |
+
0,
|
| 34 |
+
1,
|
| 35 |
+
0,
|
| 36 |
+
0,
|
| 37 |
+
0,
|
| 38 |
+
0,
|
| 39 |
+
1,
|
| 40 |
+
1,
|
| 41 |
+
1,
|
| 42 |
+
0,
|
| 43 |
+
1,
|
| 44 |
+
1,
|
| 45 |
+
0,
|
| 46 |
+
0,
|
| 47 |
+
1,
|
| 48 |
+
0,
|
| 49 |
+
1,
|
| 50 |
+
1,
|
| 51 |
+
0,
|
| 52 |
+
0,
|
| 53 |
+
1,
|
| 54 |
+
0,
|
| 55 |
+
0,
|
| 56 |
+
0,
|
| 57 |
+
0,
|
| 58 |
+
1
|
| 59 |
+
],
|
| 60 |
+
"success_rate": 0.32,
|
| 61 |
+
"intervention_rate": 0.0,
|
| 62 |
+
"non_base_selection_rate": 0.0,
|
| 63 |
+
"steps_to_first_reveal_or_access": 1.0,
|
| 64 |
+
"steps_to_retrieve": 4.0,
|
| 65 |
+
"disturbance_proxy": 0.1261227352138143,
|
| 66 |
+
"episode_records": [
|
| 67 |
+
{
|
| 68 |
+
"episode_seed": 172000,
|
| 69 |
+
"success": false,
|
| 70 |
+
"steps": 4,
|
| 71 |
+
"first_reveal_step": 1,
|
| 72 |
+
"first_retrieve_step": null,
|
| 73 |
+
"episode_disturbance": 0.11835007230072728
|
| 74 |
+
},
|
| 75 |
+
{
|
| 76 |
+
"episode_seed": 172001,
|
| 77 |
+
"success": false,
|
| 78 |
+
"steps": 4,
|
| 79 |
+
"first_reveal_step": 1,
|
| 80 |
+
"first_retrieve_step": null,
|
| 81 |
+
"episode_disturbance": 0.16761024718687167
|
| 82 |
+
},
|
| 83 |
+
{
|
| 84 |
+
"episode_seed": 172002,
|
| 85 |
+
"success": true,
|
| 86 |
+
"steps": 1,
|
| 87 |
+
"first_reveal_step": 1,
|
| 88 |
+
"first_retrieve_step": null,
|
| 89 |
+
"episode_disturbance": 0.0019509782725606326
|
| 90 |
+
},
|
| 91 |
+
{
|
| 92 |
+
"episode_seed": 172003,
|
| 93 |
+
"success": false,
|
| 94 |
+
"steps": 4,
|
| 95 |
+
"first_reveal_step": 1,
|
| 96 |
+
"first_retrieve_step": null,
|
| 97 |
+
"episode_disturbance": 7.148081446217702e-05
|
| 98 |
+
},
|
| 99 |
+
{
|
| 100 |
+
"episode_seed": 172004,
|
| 101 |
+
"success": false,
|
| 102 |
+
"steps": 4,
|
| 103 |
+
"first_reveal_step": 1,
|
| 104 |
+
"first_retrieve_step": null,
|
| 105 |
+
"episode_disturbance": 0.1784248970780015
|
| 106 |
+
},
|
| 107 |
+
{
|
| 108 |
+
"episode_seed": 172005,
|
| 109 |
+
"success": false,
|
| 110 |
+
"steps": 4,
|
| 111 |
+
"first_reveal_step": 1,
|
| 112 |
+
"first_retrieve_step": null,
|
| 113 |
+
"episode_disturbance": 0.09801531238412764
|
| 114 |
+
},
|
| 115 |
+
{
|
| 116 |
+
"episode_seed": 172006,
|
| 117 |
+
"success": false,
|
| 118 |
+
"steps": 4,
|
| 119 |
+
"first_reveal_step": 1,
|
| 120 |
+
"first_retrieve_step": null,
|
| 121 |
+
"episode_disturbance": 0.0005962321008468051
|
| 122 |
+
},
|
| 123 |
+
{
|
| 124 |
+
"episode_seed": 172007,
|
| 125 |
+
"success": false,
|
| 126 |
+
"steps": 4,
|
| 127 |
+
"first_reveal_step": 1,
|
| 128 |
+
"first_retrieve_step": null,
|
| 129 |
+
"episode_disturbance": 0.1259510057686978
|
| 130 |
+
},
|
| 131 |
+
{
|
| 132 |
+
"episode_seed": 172008,
|
| 133 |
+
"success": false,
|
| 134 |
+
"steps": 4,
|
| 135 |
+
"first_reveal_step": 1,
|
| 136 |
+
"first_retrieve_step": null,
|
| 137 |
+
"episode_disturbance": 0.11488150802027317
|
| 138 |
+
},
|
| 139 |
+
{
|
| 140 |
+
"episode_seed": 172009,
|
| 141 |
+
"success": false,
|
| 142 |
+
"steps": 4,
|
| 143 |
+
"first_reveal_step": 1,
|
| 144 |
+
"first_retrieve_step": null,
|
| 145 |
+
"episode_disturbance": 0.04447960518379812
|
| 146 |
+
},
|
| 147 |
+
{
|
| 148 |
+
"episode_seed": 172010,
|
| 149 |
+
"success": false,
|
| 150 |
+
"steps": 4,
|
| 151 |
+
"first_reveal_step": 1,
|
| 152 |
+
"first_retrieve_step": null,
|
| 153 |
+
"episode_disturbance": 0.28255011429793786
|
| 154 |
+
},
|
| 155 |
+
{
|
| 156 |
+
"episode_seed": 172011,
|
| 157 |
+
"success": true,
|
| 158 |
+
"steps": 3,
|
| 159 |
+
"first_reveal_step": 1,
|
| 160 |
+
"first_retrieve_step": null,
|
| 161 |
+
"episode_disturbance": 0.04106344052554118
|
| 162 |
+
},
|
| 163 |
+
{
|
| 164 |
+
"episode_seed": 172012,
|
| 165 |
+
"success": false,
|
| 166 |
+
"steps": 4,
|
| 167 |
+
"first_reveal_step": 1,
|
| 168 |
+
"first_retrieve_step": null,
|
| 169 |
+
"episode_disturbance": 0.07076599070619194
|
| 170 |
+
},
|
| 171 |
+
{
|
| 172 |
+
"episode_seed": 172013,
|
| 173 |
+
"success": false,
|
| 174 |
+
"steps": 4,
|
| 175 |
+
"first_reveal_step": 1,
|
| 176 |
+
"first_retrieve_step": null,
|
| 177 |
+
"episode_disturbance": 0.13973692647627903
|
| 178 |
+
},
|
| 179 |
+
{
|
| 180 |
+
"episode_seed": 172014,
|
| 181 |
+
"success": false,
|
| 182 |
+
"steps": 4,
|
| 183 |
+
"first_reveal_step": 1,
|
| 184 |
+
"first_retrieve_step": null,
|
| 185 |
+
"episode_disturbance": 0.004788672381939665
|
| 186 |
+
},
|
| 187 |
+
{
|
| 188 |
+
"episode_seed": 172015,
|
| 189 |
+
"success": false,
|
| 190 |
+
"steps": 4,
|
| 191 |
+
"first_reveal_step": 1,
|
| 192 |
+
"first_retrieve_step": null,
|
| 193 |
+
"episode_disturbance": 0.28083725664289716
|
| 194 |
+
},
|
| 195 |
+
{
|
| 196 |
+
"episode_seed": 172016,
|
| 197 |
+
"success": true,
|
| 198 |
+
"steps": 1,
|
| 199 |
+
"first_reveal_step": 1,
|
| 200 |
+
"first_retrieve_step": null,
|
| 201 |
+
"episode_disturbance": 1.0
|
| 202 |
+
},
|
| 203 |
+
{
|
| 204 |
+
"episode_seed": 172017,
|
| 205 |
+
"success": false,
|
| 206 |
+
"steps": 4,
|
| 207 |
+
"first_reveal_step": 1,
|
| 208 |
+
"first_retrieve_step": null,
|
| 209 |
+
"episode_disturbance": 0.1641496366673234
|
| 210 |
+
},
|
| 211 |
+
{
|
| 212 |
+
"episode_seed": 172018,
|
| 213 |
+
"success": true,
|
| 214 |
+
"steps": 1,
|
| 215 |
+
"first_reveal_step": 1,
|
| 216 |
+
"first_retrieve_step": null,
|
| 217 |
+
"episode_disturbance": 4.383633944371468e-05
|
| 218 |
+
},
|
| 219 |
+
{
|
| 220 |
+
"episode_seed": 172019,
|
| 221 |
+
"success": false,
|
| 222 |
+
"steps": 4,
|
| 223 |
+
"first_reveal_step": 1,
|
| 224 |
+
"first_retrieve_step": null,
|
| 225 |
+
"episode_disturbance": 0.25721585358608956
|
| 226 |
+
},
|
| 227 |
+
{
|
| 228 |
+
"episode_seed": 172020,
|
| 229 |
+
"success": true,
|
| 230 |
+
"steps": 3,
|
| 231 |
+
"first_reveal_step": 1,
|
| 232 |
+
"first_retrieve_step": null,
|
| 233 |
+
"episode_disturbance": 0.17401533717143602
|
| 234 |
+
},
|
| 235 |
+
{
|
| 236 |
+
"episode_seed": 172021,
|
| 237 |
+
"success": false,
|
| 238 |
+
"steps": 4,
|
| 239 |
+
"first_reveal_step": 1,
|
| 240 |
+
"first_retrieve_step": null,
|
| 241 |
+
"episode_disturbance": 0.006582688272562364
|
| 242 |
+
},
|
| 243 |
+
{
|
| 244 |
+
"episode_seed": 172022,
|
| 245 |
+
"success": false,
|
| 246 |
+
"steps": 4,
|
| 247 |
+
"first_reveal_step": 1,
|
| 248 |
+
"first_retrieve_step": null,
|
| 249 |
+
"episode_disturbance": 0.061462426746240105
|
| 250 |
+
},
|
| 251 |
+
{
|
| 252 |
+
"episode_seed": 172023,
|
| 253 |
+
"success": false,
|
| 254 |
+
"steps": 4,
|
| 255 |
+
"first_reveal_step": 1,
|
| 256 |
+
"first_retrieve_step": null,
|
| 257 |
+
"episode_disturbance": 0.26208380581626045
|
| 258 |
+
},
|
| 259 |
+
{
|
| 260 |
+
"episode_seed": 172024,
|
| 261 |
+
"success": false,
|
| 262 |
+
"steps": 4,
|
| 263 |
+
"first_reveal_step": 1,
|
| 264 |
+
"first_retrieve_step": null,
|
| 265 |
+
"episode_disturbance": 0.17481319658276814
|
| 266 |
+
},
|
| 267 |
+
{
|
| 268 |
+
"episode_seed": 172025,
|
| 269 |
+
"success": true,
|
| 270 |
+
"steps": 2,
|
| 271 |
+
"first_reveal_step": 1,
|
| 272 |
+
"first_retrieve_step": null,
|
| 273 |
+
"episode_disturbance": 0.011393342883305735
|
| 274 |
+
},
|
| 275 |
+
{
|
| 276 |
+
"episode_seed": 172026,
|
| 277 |
+
"success": false,
|
| 278 |
+
"steps": 4,
|
| 279 |
+
"first_reveal_step": 1,
|
| 280 |
+
"first_retrieve_step": null,
|
| 281 |
+
"episode_disturbance": 0.040603790066086276
|
| 282 |
+
},
|
| 283 |
+
{
|
| 284 |
+
"episode_seed": 172027,
|
| 285 |
+
"success": false,
|
| 286 |
+
"steps": 4,
|
| 287 |
+
"first_reveal_step": 1,
|
| 288 |
+
"first_retrieve_step": null,
|
| 289 |
+
"episode_disturbance": 0.001898237613124465
|
| 290 |
+
},
|
| 291 |
+
{
|
| 292 |
+
"episode_seed": 172028,
|
| 293 |
+
"success": false,
|
| 294 |
+
"steps": 4,
|
| 295 |
+
"first_reveal_step": 1,
|
| 296 |
+
"first_retrieve_step": null,
|
| 297 |
+
"episode_disturbance": 0.1535773960429528
|
| 298 |
+
},
|
| 299 |
+
{
|
| 300 |
+
"episode_seed": 172029,
|
| 301 |
+
"success": false,
|
| 302 |
+
"steps": 4,
|
| 303 |
+
"first_reveal_step": 1,
|
| 304 |
+
"first_retrieve_step": null,
|
| 305 |
+
"episode_disturbance": 2.6297170183653403e-05
|
| 306 |
+
},
|
| 307 |
+
{
|
| 308 |
+
"episode_seed": 172030,
|
| 309 |
+
"success": true,
|
| 310 |
+
"steps": 3,
|
| 311 |
+
"first_reveal_step": 1,
|
| 312 |
+
"first_retrieve_step": null,
|
| 313 |
+
"episode_disturbance": 0.23568911686727625
|
| 314 |
+
},
|
| 315 |
+
{
|
| 316 |
+
"episode_seed": 172031,
|
| 317 |
+
"success": true,
|
| 318 |
+
"steps": 2,
|
| 319 |
+
"first_reveal_step": 1,
|
| 320 |
+
"first_retrieve_step": null,
|
| 321 |
+
"episode_disturbance": 0.05458565396336822
|
| 322 |
+
},
|
| 323 |
+
{
|
| 324 |
+
"episode_seed": 172032,
|
| 325 |
+
"success": true,
|
| 326 |
+
"steps": 2,
|
| 327 |
+
"first_reveal_step": 1,
|
| 328 |
+
"first_retrieve_step": null,
|
| 329 |
+
"episode_disturbance": 0.23615429148293285
|
| 330 |
+
},
|
| 331 |
+
{
|
| 332 |
+
"episode_seed": 172033,
|
| 333 |
+
"success": false,
|
| 334 |
+
"steps": 4,
|
| 335 |
+
"first_reveal_step": 1,
|
| 336 |
+
"first_retrieve_step": null,
|
| 337 |
+
"episode_disturbance": 0.3794685144275167
|
| 338 |
+
},
|
| 339 |
+
{
|
| 340 |
+
"episode_seed": 172034,
|
| 341 |
+
"success": true,
|
| 342 |
+
"steps": 2,
|
| 343 |
+
"first_reveal_step": 1,
|
| 344 |
+
"first_retrieve_step": null,
|
| 345 |
+
"episode_disturbance": 0.23963101771263
|
| 346 |
+
},
|
| 347 |
+
{
|
| 348 |
+
"episode_seed": 172035,
|
| 349 |
+
"success": true,
|
| 350 |
+
"steps": 3,
|
| 351 |
+
"first_reveal_step": 1,
|
| 352 |
+
"first_retrieve_step": null,
|
| 353 |
+
"episode_disturbance": 0.1458236509853299
|
| 354 |
+
},
|
| 355 |
+
{
|
| 356 |
+
"episode_seed": 172036,
|
| 357 |
+
"success": false,
|
| 358 |
+
"steps": 4,
|
| 359 |
+
"first_reveal_step": 1,
|
| 360 |
+
"first_retrieve_step": null,
|
| 361 |
+
"episode_disturbance": 0.0005504064674610731
|
| 362 |
+
},
|
| 363 |
+
{
|
| 364 |
+
"episode_seed": 172037,
|
| 365 |
+
"success": false,
|
| 366 |
+
"steps": 4,
|
| 367 |
+
"first_reveal_step": 1,
|
| 368 |
+
"first_retrieve_step": null,
|
| 369 |
+
"episode_disturbance": 0.02395525002599186
|
| 370 |
+
},
|
| 371 |
+
{
|
| 372 |
+
"episode_seed": 172038,
|
| 373 |
+
"success": true,
|
| 374 |
+
"steps": 4,
|
| 375 |
+
"first_reveal_step": 1,
|
| 376 |
+
"first_retrieve_step": null,
|
| 377 |
+
"episode_disturbance": 0.002132451383634048
|
| 378 |
+
},
|
| 379 |
+
{
|
| 380 |
+
"episode_seed": 172039,
|
| 381 |
+
"success": false,
|
| 382 |
+
"steps": 4,
|
| 383 |
+
"first_reveal_step": 1,
|
| 384 |
+
"first_retrieve_step": null,
|
| 385 |
+
"episode_disturbance": 0.0008329380843482188
|
| 386 |
+
},
|
| 387 |
+
{
|
| 388 |
+
"episode_seed": 172040,
|
| 389 |
+
"success": true,
|
| 390 |
+
"steps": 2,
|
| 391 |
+
"first_reveal_step": 1,
|
| 392 |
+
"first_retrieve_step": null,
|
| 393 |
+
"episode_disturbance": 0.06136600544187113
|
| 394 |
+
},
|
| 395 |
+
{
|
| 396 |
+
"episode_seed": 172041,
|
| 397 |
+
"success": true,
|
| 398 |
+
"steps": 1,
|
| 399 |
+
"first_reveal_step": 1,
|
| 400 |
+
"first_retrieve_step": null,
|
| 401 |
+
"episode_disturbance": 0.1345306197528089
|
| 402 |
+
},
|
| 403 |
+
{
|
| 404 |
+
"episode_seed": 172042,
|
| 405 |
+
"success": false,
|
| 406 |
+
"steps": 4,
|
| 407 |
+
"first_reveal_step": 1,
|
| 408 |
+
"first_retrieve_step": null,
|
| 409 |
+
"episode_disturbance": 0.15628500139711843
|
| 410 |
+
},
|
| 411 |
+
{
|
| 412 |
+
"episode_seed": 172043,
|
| 413 |
+
"success": false,
|
| 414 |
+
"steps": 4,
|
| 415 |
+
"first_reveal_step": 1,
|
| 416 |
+
"first_retrieve_step": null,
|
| 417 |
+
"episode_disturbance": 0.0589350413731123
|
| 418 |
+
},
|
| 419 |
+
{
|
| 420 |
+
"episode_seed": 172044,
|
| 421 |
+
"success": true,
|
| 422 |
+
"steps": 4,
|
| 423 |
+
"first_reveal_step": 1,
|
| 424 |
+
"first_retrieve_step": null,
|
| 425 |
+
"episode_disturbance": 0.0012772400607863332
|
| 426 |
+
},
|
| 427 |
+
{
|
| 428 |
+
"episode_seed": 172045,
|
| 429 |
+
"success": false,
|
| 430 |
+
"steps": 4,
|
| 431 |
+
"first_reveal_step": 1,
|
| 432 |
+
"first_retrieve_step": null,
|
| 433 |
+
"episode_disturbance": 0.014964900854341323
|
| 434 |
+
},
|
| 435 |
+
{
|
| 436 |
+
"episode_seed": 172046,
|
| 437 |
+
"success": false,
|
| 438 |
+
"steps": 4,
|
| 439 |
+
"first_reveal_step": 1,
|
| 440 |
+
"first_retrieve_step": null,
|
| 441 |
+
"episode_disturbance": 0.00010739007165527781
|
| 442 |
+
},
|
| 443 |
+
{
|
| 444 |
+
"episode_seed": 172047,
|
| 445 |
+
"success": false,
|
| 446 |
+
"steps": 4,
|
| 447 |
+
"first_reveal_step": 1,
|
| 448 |
+
"first_retrieve_step": null,
|
| 449 |
+
"episode_disturbance": 0.3118926811146435
|
| 450 |
+
},
|
| 451 |
+
{
|
| 452 |
+
"episode_seed": 172048,
|
| 453 |
+
"success": false,
|
| 454 |
+
"steps": 4,
|
| 455 |
+
"first_reveal_step": 1,
|
| 456 |
+
"first_retrieve_step": null,
|
| 457 |
+
"episode_disturbance": 0.09965736700647154
|
| 458 |
+
},
|
| 459 |
+
{
|
| 460 |
+
"episode_seed": 172049,
|
| 461 |
+
"success": true,
|
| 462 |
+
"steps": 3,
|
| 463 |
+
"first_reveal_step": 1,
|
| 464 |
+
"first_retrieve_step": null,
|
| 465 |
+
"episode_disturbance": 0.17035763711848637
|
| 466 |
+
}
|
| 467 |
+
],
|
| 468 |
+
"eval_protocol": {
|
| 469 |
+
"track_id": "occlusion_track",
|
| 470 |
+
"suite": "maniskill3",
|
| 471 |
+
"benchmark_task": "PickClutterYCB-v1",
|
| 472 |
+
"role": "target",
|
| 473 |
+
"eval_mode": "adapter_active_ft",
|
| 474 |
+
"seed": 17,
|
| 475 |
+
"episodes": 50,
|
| 476 |
+
"resolution": 224,
|
| 477 |
+
"cameras": [
|
| 478 |
+
"front",
|
| 479 |
+
"left",
|
| 480 |
+
"right"
|
| 481 |
+
],
|
| 482 |
+
"observation_stack": "rgbd_3cam",
|
| 483 |
+
"action_horizon": 8,
|
| 484 |
+
"action_space": "bimanual_delta_pose",
|
| 485 |
+
"same_test_episodes": true
|
| 486 |
+
},
|
| 487 |
+
"train_spec": {
|
| 488 |
+
"track_id": "occlusion_track",
|
| 489 |
+
"suite": "maniskill3",
|
| 490 |
+
"benchmark_task": "PickClutterYCB-v1",
|
| 491 |
+
"model_variant": "adapter_active_ft",
|
| 492 |
+
"seed": 17,
|
| 493 |
+
"train_demos": 32,
|
| 494 |
+
"val_demos": 8,
|
| 495 |
+
"init_checkpoint_group": "/workspace/workspace/VLAarchtests2/VLAarchtests/artifacts/outputs/r3d_handoff_phase/proxy_interaction_r3d_stage3_clip_rgbd_handoff_compact_phase_seed17/checkpoint_best.pt",
|
| 496 |
+
"optimizer": "adamw",
|
| 497 |
+
"learning_rate": 0.0001,
|
| 498 |
+
"lr_schedule": "constant",
|
| 499 |
+
"batch_size": 4,
|
| 500 |
+
"augmentations": "none",
|
| 501 |
+
"early_stopping_metric": "val_total",
|
| 502 |
+
"max_gradient_steps": 144,
|
| 503 |
+
"unfreeze_scope": "fusion_memory_decoder",
|
| 504 |
+
"dataset_split_id": "pickclutter_smoke_v2_seed17",
|
| 505 |
+
"same_data_policy": true,
|
| 506 |
+
"same_init_policy": true
|
| 507 |
+
}
|
| 508 |
+
}
|
reports/maniskill_pickclutter_smoke_v2/adapter_noop_seed17.json
ADDED
|
@@ -0,0 +1,508 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
{
|
| 2 |
+
"track_id": "occlusion_track",
|
| 3 |
+
"suite": "maniskill3",
|
| 4 |
+
"benchmark_task": "PickClutterYCB-v1",
|
| 5 |
+
"role": "target",
|
| 6 |
+
"adapter_mode": "adapter_noop",
|
| 7 |
+
"episodes": 50,
|
| 8 |
+
"successes": [
|
| 9 |
+
0,
|
| 10 |
+
0,
|
| 11 |
+
1,
|
| 12 |
+
0,
|
| 13 |
+
0,
|
| 14 |
+
0,
|
| 15 |
+
0,
|
| 16 |
+
0,
|
| 17 |
+
0,
|
| 18 |
+
0,
|
| 19 |
+
0,
|
| 20 |
+
1,
|
| 21 |
+
0,
|
| 22 |
+
0,
|
| 23 |
+
0,
|
| 24 |
+
0,
|
| 25 |
+
1,
|
| 26 |
+
0,
|
| 27 |
+
1,
|
| 28 |
+
0,
|
| 29 |
+
1,
|
| 30 |
+
0,
|
| 31 |
+
0,
|
| 32 |
+
0,
|
| 33 |
+
0,
|
| 34 |
+
1,
|
| 35 |
+
0,
|
| 36 |
+
0,
|
| 37 |
+
0,
|
| 38 |
+
0,
|
| 39 |
+
1,
|
| 40 |
+
1,
|
| 41 |
+
1,
|
| 42 |
+
0,
|
| 43 |
+
1,
|
| 44 |
+
1,
|
| 45 |
+
0,
|
| 46 |
+
0,
|
| 47 |
+
1,
|
| 48 |
+
0,
|
| 49 |
+
1,
|
| 50 |
+
1,
|
| 51 |
+
0,
|
| 52 |
+
0,
|
| 53 |
+
1,
|
| 54 |
+
0,
|
| 55 |
+
0,
|
| 56 |
+
0,
|
| 57 |
+
0,
|
| 58 |
+
1
|
| 59 |
+
],
|
| 60 |
+
"success_rate": 0.32,
|
| 61 |
+
"intervention_rate": 0.0,
|
| 62 |
+
"non_base_selection_rate": 0.0,
|
| 63 |
+
"steps_to_first_reveal_or_access": 1.0,
|
| 64 |
+
"steps_to_retrieve": 4.0,
|
| 65 |
+
"disturbance_proxy": 0.1261227352138143,
|
| 66 |
+
"episode_records": [
|
| 67 |
+
{
|
| 68 |
+
"episode_seed": 172000,
|
| 69 |
+
"success": false,
|
| 70 |
+
"steps": 4,
|
| 71 |
+
"first_reveal_step": 1,
|
| 72 |
+
"first_retrieve_step": null,
|
| 73 |
+
"episode_disturbance": 0.11835007230072728
|
| 74 |
+
},
|
| 75 |
+
{
|
| 76 |
+
"episode_seed": 172001,
|
| 77 |
+
"success": false,
|
| 78 |
+
"steps": 4,
|
| 79 |
+
"first_reveal_step": 1,
|
| 80 |
+
"first_retrieve_step": null,
|
| 81 |
+
"episode_disturbance": 0.16761024718687167
|
| 82 |
+
},
|
| 83 |
+
{
|
| 84 |
+
"episode_seed": 172002,
|
| 85 |
+
"success": true,
|
| 86 |
+
"steps": 1,
|
| 87 |
+
"first_reveal_step": 1,
|
| 88 |
+
"first_retrieve_step": null,
|
| 89 |
+
"episode_disturbance": 0.0019509782725606326
|
| 90 |
+
},
|
| 91 |
+
{
|
| 92 |
+
"episode_seed": 172003,
|
| 93 |
+
"success": false,
|
| 94 |
+
"steps": 4,
|
| 95 |
+
"first_reveal_step": 1,
|
| 96 |
+
"first_retrieve_step": null,
|
| 97 |
+
"episode_disturbance": 7.148081446217702e-05
|
| 98 |
+
},
|
| 99 |
+
{
|
| 100 |
+
"episode_seed": 172004,
|
| 101 |
+
"success": false,
|
| 102 |
+
"steps": 4,
|
| 103 |
+
"first_reveal_step": 1,
|
| 104 |
+
"first_retrieve_step": null,
|
| 105 |
+
"episode_disturbance": 0.1784248970780015
|
| 106 |
+
},
|
| 107 |
+
{
|
| 108 |
+
"episode_seed": 172005,
|
| 109 |
+
"success": false,
|
| 110 |
+
"steps": 4,
|
| 111 |
+
"first_reveal_step": 1,
|
| 112 |
+
"first_retrieve_step": null,
|
| 113 |
+
"episode_disturbance": 0.09801531238412764
|
| 114 |
+
},
|
| 115 |
+
{
|
| 116 |
+
"episode_seed": 172006,
|
| 117 |
+
"success": false,
|
| 118 |
+
"steps": 4,
|
| 119 |
+
"first_reveal_step": 1,
|
| 120 |
+
"first_retrieve_step": null,
|
| 121 |
+
"episode_disturbance": 0.0005962321008468051
|
| 122 |
+
},
|
| 123 |
+
{
|
| 124 |
+
"episode_seed": 172007,
|
| 125 |
+
"success": false,
|
| 126 |
+
"steps": 4,
|
| 127 |
+
"first_reveal_step": 1,
|
| 128 |
+
"first_retrieve_step": null,
|
| 129 |
+
"episode_disturbance": 0.1259510057686978
|
| 130 |
+
},
|
| 131 |
+
{
|
| 132 |
+
"episode_seed": 172008,
|
| 133 |
+
"success": false,
|
| 134 |
+
"steps": 4,
|
| 135 |
+
"first_reveal_step": 1,
|
| 136 |
+
"first_retrieve_step": null,
|
| 137 |
+
"episode_disturbance": 0.11488150802027317
|
| 138 |
+
},
|
| 139 |
+
{
|
| 140 |
+
"episode_seed": 172009,
|
| 141 |
+
"success": false,
|
| 142 |
+
"steps": 4,
|
| 143 |
+
"first_reveal_step": 1,
|
| 144 |
+
"first_retrieve_step": null,
|
| 145 |
+
"episode_disturbance": 0.04447960518379812
|
| 146 |
+
},
|
| 147 |
+
{
|
| 148 |
+
"episode_seed": 172010,
|
| 149 |
+
"success": false,
|
| 150 |
+
"steps": 4,
|
| 151 |
+
"first_reveal_step": 1,
|
| 152 |
+
"first_retrieve_step": null,
|
| 153 |
+
"episode_disturbance": 0.28255011429793786
|
| 154 |
+
},
|
| 155 |
+
{
|
| 156 |
+
"episode_seed": 172011,
|
| 157 |
+
"success": true,
|
| 158 |
+
"steps": 3,
|
| 159 |
+
"first_reveal_step": 1,
|
| 160 |
+
"first_retrieve_step": null,
|
| 161 |
+
"episode_disturbance": 0.04106344052554118
|
| 162 |
+
},
|
| 163 |
+
{
|
| 164 |
+
"episode_seed": 172012,
|
| 165 |
+
"success": false,
|
| 166 |
+
"steps": 4,
|
| 167 |
+
"first_reveal_step": 1,
|
| 168 |
+
"first_retrieve_step": null,
|
| 169 |
+
"episode_disturbance": 0.07076599070619194
|
| 170 |
+
},
|
| 171 |
+
{
|
| 172 |
+
"episode_seed": 172013,
|
| 173 |
+
"success": false,
|
| 174 |
+
"steps": 4,
|
| 175 |
+
"first_reveal_step": 1,
|
| 176 |
+
"first_retrieve_step": null,
|
| 177 |
+
"episode_disturbance": 0.13973692647627903
|
| 178 |
+
},
|
| 179 |
+
{
|
| 180 |
+
"episode_seed": 172014,
|
| 181 |
+
"success": false,
|
| 182 |
+
"steps": 4,
|
| 183 |
+
"first_reveal_step": 1,
|
| 184 |
+
"first_retrieve_step": null,
|
| 185 |
+
"episode_disturbance": 0.004788672381939665
|
| 186 |
+
},
|
| 187 |
+
{
|
| 188 |
+
"episode_seed": 172015,
|
| 189 |
+
"success": false,
|
| 190 |
+
"steps": 4,
|
| 191 |
+
"first_reveal_step": 1,
|
| 192 |
+
"first_retrieve_step": null,
|
| 193 |
+
"episode_disturbance": 0.28083725664289716
|
| 194 |
+
},
|
| 195 |
+
{
|
| 196 |
+
"episode_seed": 172016,
|
| 197 |
+
"success": true,
|
| 198 |
+
"steps": 1,
|
| 199 |
+
"first_reveal_step": 1,
|
| 200 |
+
"first_retrieve_step": null,
|
| 201 |
+
"episode_disturbance": 1.0
|
| 202 |
+
},
|
| 203 |
+
{
|
| 204 |
+
"episode_seed": 172017,
|
| 205 |
+
"success": false,
|
| 206 |
+
"steps": 4,
|
| 207 |
+
"first_reveal_step": 1,
|
| 208 |
+
"first_retrieve_step": null,
|
| 209 |
+
"episode_disturbance": 0.1641496366673234
|
| 210 |
+
},
|
| 211 |
+
{
|
| 212 |
+
"episode_seed": 172018,
|
| 213 |
+
"success": true,
|
| 214 |
+
"steps": 1,
|
| 215 |
+
"first_reveal_step": 1,
|
| 216 |
+
"first_retrieve_step": null,
|
| 217 |
+
"episode_disturbance": 4.383633944371468e-05
|
| 218 |
+
},
|
| 219 |
+
{
|
| 220 |
+
"episode_seed": 172019,
|
| 221 |
+
"success": false,
|
| 222 |
+
"steps": 4,
|
| 223 |
+
"first_reveal_step": 1,
|
| 224 |
+
"first_retrieve_step": null,
|
| 225 |
+
"episode_disturbance": 0.25721585358608956
|
| 226 |
+
},
|
| 227 |
+
{
|
| 228 |
+
"episode_seed": 172020,
|
| 229 |
+
"success": true,
|
| 230 |
+
"steps": 3,
|
| 231 |
+
"first_reveal_step": 1,
|
| 232 |
+
"first_retrieve_step": null,
|
| 233 |
+
"episode_disturbance": 0.17401533717143602
|
| 234 |
+
},
|
| 235 |
+
{
|
| 236 |
+
"episode_seed": 172021,
|
| 237 |
+
"success": false,
|
| 238 |
+
"steps": 4,
|
| 239 |
+
"first_reveal_step": 1,
|
| 240 |
+
"first_retrieve_step": null,
|
| 241 |
+
"episode_disturbance": 0.006582688272562364
|
| 242 |
+
},
|
| 243 |
+
{
|
| 244 |
+
"episode_seed": 172022,
|
| 245 |
+
"success": false,
|
| 246 |
+
"steps": 4,
|
| 247 |
+
"first_reveal_step": 1,
|
| 248 |
+
"first_retrieve_step": null,
|
| 249 |
+
"episode_disturbance": 0.061462426746240105
|
| 250 |
+
},
|
| 251 |
+
{
|
| 252 |
+
"episode_seed": 172023,
|
| 253 |
+
"success": false,
|
| 254 |
+
"steps": 4,
|
| 255 |
+
"first_reveal_step": 1,
|
| 256 |
+
"first_retrieve_step": null,
|
| 257 |
+
"episode_disturbance": 0.26208380581626045
|
| 258 |
+
},
|
| 259 |
+
{
|
| 260 |
+
"episode_seed": 172024,
|
| 261 |
+
"success": false,
|
| 262 |
+
"steps": 4,
|
| 263 |
+
"first_reveal_step": 1,
|
| 264 |
+
"first_retrieve_step": null,
|
| 265 |
+
"episode_disturbance": 0.17481319658276814
|
| 266 |
+
},
|
| 267 |
+
{
|
| 268 |
+
"episode_seed": 172025,
|
| 269 |
+
"success": true,
|
| 270 |
+
"steps": 2,
|
| 271 |
+
"first_reveal_step": 1,
|
| 272 |
+
"first_retrieve_step": null,
|
| 273 |
+
"episode_disturbance": 0.011393342883305735
|
| 274 |
+
},
|
| 275 |
+
{
|
| 276 |
+
"episode_seed": 172026,
|
| 277 |
+
"success": false,
|
| 278 |
+
"steps": 4,
|
| 279 |
+
"first_reveal_step": 1,
|
| 280 |
+
"first_retrieve_step": null,
|
| 281 |
+
"episode_disturbance": 0.040603790066086276
|
| 282 |
+
},
|
| 283 |
+
{
|
| 284 |
+
"episode_seed": 172027,
|
| 285 |
+
"success": false,
|
| 286 |
+
"steps": 4,
|
| 287 |
+
"first_reveal_step": 1,
|
| 288 |
+
"first_retrieve_step": null,
|
| 289 |
+
"episode_disturbance": 0.001898237613124465
|
| 290 |
+
},
|
| 291 |
+
{
|
| 292 |
+
"episode_seed": 172028,
|
| 293 |
+
"success": false,
|
| 294 |
+
"steps": 4,
|
| 295 |
+
"first_reveal_step": 1,
|
| 296 |
+
"first_retrieve_step": null,
|
| 297 |
+
"episode_disturbance": 0.1535773960429528
|
| 298 |
+
},
|
| 299 |
+
{
|
| 300 |
+
"episode_seed": 172029,
|
| 301 |
+
"success": false,
|
| 302 |
+
"steps": 4,
|
| 303 |
+
"first_reveal_step": 1,
|
| 304 |
+
"first_retrieve_step": null,
|
| 305 |
+
"episode_disturbance": 2.6297170183653403e-05
|
| 306 |
+
},
|
| 307 |
+
{
|
| 308 |
+
"episode_seed": 172030,
|
| 309 |
+
"success": true,
|
| 310 |
+
"steps": 3,
|
| 311 |
+
"first_reveal_step": 1,
|
| 312 |
+
"first_retrieve_step": null,
|
| 313 |
+
"episode_disturbance": 0.23568911686727625
|
| 314 |
+
},
|
| 315 |
+
{
|
| 316 |
+
"episode_seed": 172031,
|
| 317 |
+
"success": true,
|
| 318 |
+
"steps": 2,
|
| 319 |
+
"first_reveal_step": 1,
|
| 320 |
+
"first_retrieve_step": null,
|
| 321 |
+
"episode_disturbance": 0.05458565396336822
|
| 322 |
+
},
|
| 323 |
+
{
|
| 324 |
+
"episode_seed": 172032,
|
| 325 |
+
"success": true,
|
| 326 |
+
"steps": 2,
|
| 327 |
+
"first_reveal_step": 1,
|
| 328 |
+
"first_retrieve_step": null,
|
| 329 |
+
"episode_disturbance": 0.23615429148293285
|
| 330 |
+
},
|
| 331 |
+
{
|
| 332 |
+
"episode_seed": 172033,
|
| 333 |
+
"success": false,
|
| 334 |
+
"steps": 4,
|
| 335 |
+
"first_reveal_step": 1,
|
| 336 |
+
"first_retrieve_step": null,
|
| 337 |
+
"episode_disturbance": 0.3794685144275167
|
| 338 |
+
},
|
| 339 |
+
{
|
| 340 |
+
"episode_seed": 172034,
|
| 341 |
+
"success": true,
|
| 342 |
+
"steps": 2,
|
| 343 |
+
"first_reveal_step": 1,
|
| 344 |
+
"first_retrieve_step": null,
|
| 345 |
+
"episode_disturbance": 0.23963101771263
|
| 346 |
+
},
|
| 347 |
+
{
|
| 348 |
+
"episode_seed": 172035,
|
| 349 |
+
"success": true,
|
| 350 |
+
"steps": 3,
|
| 351 |
+
"first_reveal_step": 1,
|
| 352 |
+
"first_retrieve_step": null,
|
| 353 |
+
"episode_disturbance": 0.1458236509853299
|
| 354 |
+
},
|
| 355 |
+
{
|
| 356 |
+
"episode_seed": 172036,
|
| 357 |
+
"success": false,
|
| 358 |
+
"steps": 4,
|
| 359 |
+
"first_reveal_step": 1,
|
| 360 |
+
"first_retrieve_step": null,
|
| 361 |
+
"episode_disturbance": 0.0005504064674610731
|
| 362 |
+
},
|
| 363 |
+
{
|
| 364 |
+
"episode_seed": 172037,
|
| 365 |
+
"success": false,
|
| 366 |
+
"steps": 4,
|
| 367 |
+
"first_reveal_step": 1,
|
| 368 |
+
"first_retrieve_step": null,
|
| 369 |
+
"episode_disturbance": 0.02395525002599186
|
| 370 |
+
},
|
| 371 |
+
{
|
| 372 |
+
"episode_seed": 172038,
|
| 373 |
+
"success": true,
|
| 374 |
+
"steps": 4,
|
| 375 |
+
"first_reveal_step": 1,
|
| 376 |
+
"first_retrieve_step": null,
|
| 377 |
+
"episode_disturbance": 0.002132451383634048
|
| 378 |
+
},
|
| 379 |
+
{
|
| 380 |
+
"episode_seed": 172039,
|
| 381 |
+
"success": false,
|
| 382 |
+
"steps": 4,
|
| 383 |
+
"first_reveal_step": 1,
|
| 384 |
+
"first_retrieve_step": null,
|
| 385 |
+
"episode_disturbance": 0.0008329380843482188
|
| 386 |
+
},
|
| 387 |
+
{
|
| 388 |
+
"episode_seed": 172040,
|
| 389 |
+
"success": true,
|
| 390 |
+
"steps": 2,
|
| 391 |
+
"first_reveal_step": 1,
|
| 392 |
+
"first_retrieve_step": null,
|
| 393 |
+
"episode_disturbance": 0.06136600544187113
|
| 394 |
+
},
|
| 395 |
+
{
|
| 396 |
+
"episode_seed": 172041,
|
| 397 |
+
"success": true,
|
| 398 |
+
"steps": 1,
|
| 399 |
+
"first_reveal_step": 1,
|
| 400 |
+
"first_retrieve_step": null,
|
| 401 |
+
"episode_disturbance": 0.1345306197528089
|
| 402 |
+
},
|
| 403 |
+
{
|
| 404 |
+
"episode_seed": 172042,
|
| 405 |
+
"success": false,
|
| 406 |
+
"steps": 4,
|
| 407 |
+
"first_reveal_step": 1,
|
| 408 |
+
"first_retrieve_step": null,
|
| 409 |
+
"episode_disturbance": 0.15628500139711843
|
| 410 |
+
},
|
| 411 |
+
{
|
| 412 |
+
"episode_seed": 172043,
|
| 413 |
+
"success": false,
|
| 414 |
+
"steps": 4,
|
| 415 |
+
"first_reveal_step": 1,
|
| 416 |
+
"first_retrieve_step": null,
|
| 417 |
+
"episode_disturbance": 0.0589350413731123
|
| 418 |
+
},
|
| 419 |
+
{
|
| 420 |
+
"episode_seed": 172044,
|
| 421 |
+
"success": true,
|
| 422 |
+
"steps": 4,
|
| 423 |
+
"first_reveal_step": 1,
|
| 424 |
+
"first_retrieve_step": null,
|
| 425 |
+
"episode_disturbance": 0.0012772400607863332
|
| 426 |
+
},
|
| 427 |
+
{
|
| 428 |
+
"episode_seed": 172045,
|
| 429 |
+
"success": false,
|
| 430 |
+
"steps": 4,
|
| 431 |
+
"first_reveal_step": 1,
|
| 432 |
+
"first_retrieve_step": null,
|
| 433 |
+
"episode_disturbance": 0.014964900854341323
|
| 434 |
+
},
|
| 435 |
+
{
|
| 436 |
+
"episode_seed": 172046,
|
| 437 |
+
"success": false,
|
| 438 |
+
"steps": 4,
|
| 439 |
+
"first_reveal_step": 1,
|
| 440 |
+
"first_retrieve_step": null,
|
| 441 |
+
"episode_disturbance": 0.00010739007165527781
|
| 442 |
+
},
|
| 443 |
+
{
|
| 444 |
+
"episode_seed": 172047,
|
| 445 |
+
"success": false,
|
| 446 |
+
"steps": 4,
|
| 447 |
+
"first_reveal_step": 1,
|
| 448 |
+
"first_retrieve_step": null,
|
| 449 |
+
"episode_disturbance": 0.3118926811146435
|
| 450 |
+
},
|
| 451 |
+
{
|
| 452 |
+
"episode_seed": 172048,
|
| 453 |
+
"success": false,
|
| 454 |
+
"steps": 4,
|
| 455 |
+
"first_reveal_step": 1,
|
| 456 |
+
"first_retrieve_step": null,
|
| 457 |
+
"episode_disturbance": 0.09965736700647154
|
| 458 |
+
},
|
| 459 |
+
{
|
| 460 |
+
"episode_seed": 172049,
|
| 461 |
+
"success": true,
|
| 462 |
+
"steps": 3,
|
| 463 |
+
"first_reveal_step": 1,
|
| 464 |
+
"first_retrieve_step": null,
|
| 465 |
+
"episode_disturbance": 0.17035763711848637
|
| 466 |
+
}
|
| 467 |
+
],
|
| 468 |
+
"eval_protocol": {
|
| 469 |
+
"track_id": "occlusion_track",
|
| 470 |
+
"suite": "maniskill3",
|
| 471 |
+
"benchmark_task": "PickClutterYCB-v1",
|
| 472 |
+
"role": "target",
|
| 473 |
+
"eval_mode": "adapter_noop",
|
| 474 |
+
"seed": 17,
|
| 475 |
+
"episodes": 50,
|
| 476 |
+
"resolution": 224,
|
| 477 |
+
"cameras": [
|
| 478 |
+
"front",
|
| 479 |
+
"left",
|
| 480 |
+
"right"
|
| 481 |
+
],
|
| 482 |
+
"observation_stack": "rgbd_3cam",
|
| 483 |
+
"action_horizon": 8,
|
| 484 |
+
"action_space": "bimanual_delta_pose",
|
| 485 |
+
"same_test_episodes": true
|
| 486 |
+
},
|
| 487 |
+
"train_spec": {
|
| 488 |
+
"track_id": "occlusion_track",
|
| 489 |
+
"suite": "maniskill3",
|
| 490 |
+
"benchmark_task": "PickClutterYCB-v1",
|
| 491 |
+
"model_variant": "adapter_active_ft",
|
| 492 |
+
"seed": 17,
|
| 493 |
+
"train_demos": 32,
|
| 494 |
+
"val_demos": 8,
|
| 495 |
+
"init_checkpoint_group": "/workspace/workspace/VLAarchtests2/VLAarchtests/artifacts/outputs/r3d_handoff_phase/proxy_interaction_r3d_stage3_clip_rgbd_handoff_compact_phase_seed17/checkpoint_best.pt",
|
| 496 |
+
"optimizer": "adamw",
|
| 497 |
+
"learning_rate": 0.0001,
|
| 498 |
+
"lr_schedule": "constant",
|
| 499 |
+
"batch_size": 4,
|
| 500 |
+
"augmentations": "none",
|
| 501 |
+
"early_stopping_metric": "val_total",
|
| 502 |
+
"max_gradient_steps": 144,
|
| 503 |
+
"unfreeze_scope": "fusion_memory_decoder",
|
| 504 |
+
"dataset_split_id": "pickclutter_smoke_v2_seed17",
|
| 505 |
+
"same_data_policy": true,
|
| 506 |
+
"same_init_policy": true
|
| 507 |
+
}
|
| 508 |
+
}
|
reports/maniskill_pickclutter_smoke_v2/public_benchmark_package_summary.json
ADDED
|
@@ -0,0 +1,62 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
{
|
| 2 |
+
"anchor_pass": true,
|
| 3 |
+
"available_tracks": [
|
| 4 |
+
"occlusion_track"
|
| 5 |
+
],
|
| 6 |
+
"ci_above_zero_tracks": [
|
| 7 |
+
"occlusion_track"
|
| 8 |
+
],
|
| 9 |
+
"headline_pass": true,
|
| 10 |
+
"package_name": "public_reveal_retrieve_package_v1",
|
| 11 |
+
"sign_of_life_pass": false,
|
| 12 |
+
"sign_of_life_track_count": 0,
|
| 13 |
+
"sign_of_life_tracks": [],
|
| 14 |
+
"target_macro_average_delta": 0.2799999937415123,
|
| 15 |
+
"tracks": {
|
| 16 |
+
"occlusion_track": {
|
| 17 |
+
"benchmark_task": "PickClutterYCB-v1",
|
| 18 |
+
"delta_active_vs_trunk": 0.2799999937415123,
|
| 19 |
+
"delta_active_vs_trunk_ci95": [
|
| 20 |
+
0.14000000059604645,
|
| 21 |
+
0.42050001621246064
|
| 22 |
+
],
|
| 23 |
+
"delta_noop_vs_trunk": 0.2799999937415123,
|
| 24 |
+
"modes": {
|
| 25 |
+
"adapter_active_ft": {
|
| 26 |
+
"disturbance_proxy": 0.1261227352138143,
|
| 27 |
+
"intervention_rate": 0.0,
|
| 28 |
+
"mean_success": 0.3199999928474426,
|
| 29 |
+
"non_base_selection_rate": 0.0,
|
| 30 |
+
"num_runs": 1,
|
| 31 |
+
"steps_to_first_reveal_or_access": 1.0,
|
| 32 |
+
"steps_to_retrieve": 4.0
|
| 33 |
+
},
|
| 34 |
+
"adapter_noop": {
|
| 35 |
+
"disturbance_proxy": 0.1261227352138143,
|
| 36 |
+
"intervention_rate": 0.0,
|
| 37 |
+
"mean_success": 0.3199999928474426,
|
| 38 |
+
"non_base_selection_rate": 0.0,
|
| 39 |
+
"num_runs": 1,
|
| 40 |
+
"steps_to_first_reveal_or_access": 1.0,
|
| 41 |
+
"steps_to_retrieve": 4.0
|
| 42 |
+
},
|
| 43 |
+
"trunk_only_ft": {
|
| 44 |
+
"disturbance_proxy": 0.22772394362117063,
|
| 45 |
+
"intervention_rate": 0.0,
|
| 46 |
+
"mean_success": 0.03999999910593033,
|
| 47 |
+
"non_base_selection_rate": 0.0,
|
| 48 |
+
"num_runs": 1,
|
| 49 |
+
"steps_to_first_reveal_or_access": 1.0,
|
| 50 |
+
"steps_to_retrieve": 4.0
|
| 51 |
+
}
|
| 52 |
+
},
|
| 53 |
+
"notes": "Closest maintained public occluded retrieval task. Treat as the canopy / dense occlusion proxy.",
|
| 54 |
+
"public_source": "https://maniskill.readthedocs.io/en/latest/tasks/table_top_gripper/index.html",
|
| 55 |
+
"role": "target",
|
| 56 |
+
"signs_of_life": false,
|
| 57 |
+
"suite": "maniskill3",
|
| 58 |
+
"target_behavior": "retrieve a target object from dense occluding clutter",
|
| 59 |
+
"task_family": "dense_occluded_retrieval"
|
| 60 |
+
}
|
| 61 |
+
}
|
| 62 |
+
}
|
reports/maniskill_pickclutter_smoke_v2/public_benchmark_package_summary.md
ADDED
|
@@ -0,0 +1,14 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
# ManiSkill PickClutter Smoke Summary
|
| 2 |
+
|
| 3 |
+
- available_tracks: ['occlusion_track']
|
| 4 |
+
- target_macro_average_delta: 0.280
|
| 5 |
+
- headline_pass: True
|
| 6 |
+
- sign_of_life_pass: False
|
| 7 |
+
|
| 8 |
+
## occlusion_track
|
| 9 |
+
- delta_active_vs_trunk: 0.280
|
| 10 |
+
- delta_noop_vs_trunk: 0.280
|
| 11 |
+
- signs_of_life: False
|
| 12 |
+
- trunk_only_ft: mean_success=0.040
|
| 13 |
+
- adapter_noop: mean_success=0.320
|
| 14 |
+
- adapter_active_ft: mean_success=0.320
|