Upload checkpoints_vlm_gym_match_move_fix3_unit_one_image_lr2e_5_mse_only_ins/checkpoints_vlm_gym_match_move_fix3_unit_one_image_lr2e_5_mse_only_ins
Browse files
checkpoints_vlm_gym_match_move_fix3_unit_one_image_lr2e_5_mse_only_ins/checkpoints_vlm_gym_match_move_fix3_unit_one_image_lr2e_5_mse_only_ins/wandb/offline-run-20260128_052914-vlm_gym_match_move_fix3_unit_one_img_lr2e_5_mse_only_ins-run0/files/output.log
CHANGED
|
@@ -184,13 +184,6 @@ Preparing Dataset vlm_gym_match_move_fix3_unit_mse_loss_only_evalonce/vlm_gym_ma
|
|
| 184 |
fp[1]: [{'data_indexes': [8], 'worker_id': 0, 'dataset_name': 'vlm_gym_match_move_fix3_unit_mse_loss_only_evalonce'}]
|
| 185 |
fp[2]: [{'data_indexes': [16], 'worker_id': 0, 'dataset_name': 'vlm_gym_match_move_fix3_unit_mse_loss_only_evalonce'}]
|
| 186 |
ce_avg: 0.0, mse_avg: 0.007629983127117157
|
| 187 |
-
base_dir is /dev/shm/models/checkpoints_vlm_gym_match_move_fix3_unit_one_image_lr2e_5_mse_only_ins/eval_used_rows, step_tag is vlm_gym_match_move_fix3_unit_one_img_lr2e_5_mse_only_ins_step1000
|
| 188 |
-
Preparing Dataset vlm_gym_match_move_fix3_unit_mse_loss_only_evalonce/vlm_gym_match_move_fix3_unit_val
|
| 189 |
-
[eval debug] first 3 batch fingerprints:
|
| 190 |
-
fp[0]: [{'data_indexes': [0], 'worker_id': 0, 'dataset_name': 'vlm_gym_match_move_fix3_unit_mse_loss_only_evalonce'}]
|
| 191 |
-
fp[1]: [{'data_indexes': [8], 'worker_id': 0, 'dataset_name': 'vlm_gym_match_move_fix3_unit_mse_loss_only_evalonce'}]
|
| 192 |
-
fp[2]: [{'data_indexes': [16], 'worker_id': 0, 'dataset_name': 'vlm_gym_match_move_fix3_unit_mse_loss_only_evalonce'}]
|
| 193 |
-
ce_avg: 0.0, mse_avg: 0.007755194790661335
|
| 194 |
wandb: Detected [huggingface_hub.inference] in use.
|
| 195 |
wandb: Use W&B Weave for improved LLM call tracing. Install Weave with `pip install weave` then add `import weave` to the top of your script.
|
| 196 |
wandb: For more information, check out the docs at: https://weave-docs.wandb.ai/
|
|
@@ -1235,20 +1228,6 @@ wandb: For more information, check out the docs at: https://weave-docs.wandb.ai/
|
|
| 1235 |
[[34m2026-01-28 07:27:28[39m] (step=0001031) Train Loss mse: 0.0077, Train Loss ce: 0.0000, Train Steps/Sec: 0.16,
|
| 1236 |
[[34m2026-01-28 07:27:34[39m] (step=0001032) Train Loss mse: 0.0074, Train Loss ce: 0.0000, Train Steps/Sec: 0.16,
|
| 1237 |
[[34m2026-01-28 07:27:40[39m] (step=0001033) Train Loss mse: 0.0070, Train Loss ce: 0.0000, Train Steps/Sec: 0.15,
|
| 1238 |
-
base_dir is /dev/shm/models/checkpoints_vlm_gym_match_move_fix3_unit_one_image_lr2e_5_mse_only_ins/eval_used_rows, step_tag is vlm_gym_match_move_fix3_unit_one_img_lr2e_5_mse_only_ins_step1500
|
| 1239 |
-
Preparing Dataset vlm_gym_match_move_fix3_unit_mse_loss_only_evalonce/vlm_gym_match_move_fix3_unit_val
|
| 1240 |
-
[eval debug] first 3 batch fingerprints:
|
| 1241 |
-
fp[0]: [{'data_indexes': [0], 'worker_id': 0, 'dataset_name': 'vlm_gym_match_move_fix3_unit_mse_loss_only_evalonce'}]
|
| 1242 |
-
fp[1]: [{'data_indexes': [8], 'worker_id': 0, 'dataset_name': 'vlm_gym_match_move_fix3_unit_mse_loss_only_evalonce'}]
|
| 1243 |
-
fp[2]: [{'data_indexes': [16], 'worker_id': 0, 'dataset_name': 'vlm_gym_match_move_fix3_unit_mse_loss_only_evalonce'}]
|
| 1244 |
-
ce_avg: 0.0, mse_avg: 0.00788091029971838
|
| 1245 |
-
base_dir is /dev/shm/models/checkpoints_vlm_gym_match_move_fix3_unit_one_image_lr2e_5_mse_only_ins/eval_used_rows, step_tag is vlm_gym_match_move_fix3_unit_one_img_lr2e_5_mse_only_ins_step2000
|
| 1246 |
-
Preparing Dataset vlm_gym_match_move_fix3_unit_mse_loss_only_evalonce/vlm_gym_match_move_fix3_unit_val
|
| 1247 |
-
[eval debug] first 3 batch fingerprints:
|
| 1248 |
-
fp[0]: [{'data_indexes': [0], 'worker_id': 0, 'dataset_name': 'vlm_gym_match_move_fix3_unit_mse_loss_only_evalonce'}]
|
| 1249 |
-
fp[1]: [{'data_indexes': [8], 'worker_id': 0, 'dataset_name': 'vlm_gym_match_move_fix3_unit_mse_loss_only_evalonce'}]
|
| 1250 |
-
fp[2]: [{'data_indexes': [16], 'worker_id': 0, 'dataset_name': 'vlm_gym_match_move_fix3_unit_mse_loss_only_evalonce'}]
|
| 1251 |
-
ce_avg: 0.0, mse_avg: 0.008042296394705772
|
| 1252 |
[[34m2026-01-28 07:27:47[39m] (step=0001034) Train Loss mse: 0.0078, Train Loss ce: 0.0000, Train Steps/Sec: 0.16,
|
| 1253 |
[[34m2026-01-28 07:27:53[39m] (step=0001035) Train Loss mse: 0.0087, Train Loss ce: 0.0000, Train Steps/Sec: 0.16,
|
| 1254 |
[[34m2026-01-28 07:28:00[39m] (step=0001036) Train Loss mse: 0.0074, Train Loss ce: 0.0000, Train Steps/Sec: 0.16,
|
|
@@ -1268,6 +1247,27 @@ ce_avg: 0.0, mse_avg: 0.008042296394705772
|
|
| 1268 |
[[34m2026-01-28 07:29:29[39m] (step=0001050) Train Loss mse: 0.0083, Train Loss ce: 0.0000, Train Steps/Sec: 0.15,
|
| 1269 |
[[34m2026-01-28 07:29:36[39m] (step=0001051) Train Loss mse: 0.0079, Train Loss ce: 0.0000, Train Steps/Sec: 0.15,
|
| 1270 |
[[34m2026-01-28 07:29:42[39m] (step=0001052) Train Loss mse: 0.0070, Train Loss ce: 0.0000, Train Steps/Sec: 0.16,
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1271 |
[[34m2026-01-28 07:29:49[39m] (step=0001053) Train Loss mse: 0.0081, Train Loss ce: 0.0000, Train Steps/Sec: 0.16,
|
| 1272 |
[[34m2026-01-28 07:29:55[39m] (step=0001054) Train Loss mse: 0.0078, Train Loss ce: 0.0000, Train Steps/Sec: 0.16,
|
| 1273 |
[[34m2026-01-28 07:30:01[39m] (step=0001055) Train Loss mse: 0.0073, Train Loss ce: 0.0000, Train Steps/Sec: 0.16,
|
|
@@ -2645,6 +2645,20 @@ ce_avg: 0.0, mse_avg: 0.008042296394705772
|
|
| 2645 |
[[34m2026-01-28 09:58:23[39m] (step=0002427) Train Loss mse: 0.0073, Train Loss ce: 0.0000, Train Steps/Sec: 0.16,
|
| 2646 |
[[34m2026-01-28 09:58:30[39m] (step=0002428) Train Loss mse: 0.0070, Train Loss ce: 0.0000, Train Steps/Sec: 0.15,
|
| 2647 |
[[34m2026-01-28 09:58:36[39m] (step=0002429) Train Loss mse: 0.0078, Train Loss ce: 0.0000, Train Steps/Sec: 0.16,
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 2648 |
[[34m2026-01-28 09:58:42[39m] (step=0002430) Train Loss mse: 0.0063, Train Loss ce: 0.0000, Train Steps/Sec: 0.16,
|
| 2649 |
[[34m2026-01-28 09:58:49[39m] (step=0002431) Train Loss mse: 0.0073, Train Loss ce: 0.0000, Train Steps/Sec: 0.15,
|
| 2650 |
[[34m2026-01-28 09:58:56[39m] (step=0002432) Train Loss mse: 0.0072, Train Loss ce: 0.0000, Train Steps/Sec: 0.14,
|
|
@@ -2681,27 +2695,6 @@ ce_avg: 0.0, mse_avg: 0.008042296394705772
|
|
| 2681 |
[[34m2026-01-28 10:02:15[39m] (step=0002463) Train Loss mse: 0.0075, Train Loss ce: 0.0000, Train Steps/Sec: 0.16,
|
| 2682 |
[[34m2026-01-28 10:02:22[39m] (step=0002464) Train Loss mse: 0.0084, Train Loss ce: 0.0000, Train Steps/Sec: 0.16,
|
| 2683 |
[[34m2026-01-28 10:02:28[39m] (step=0002465) Train Loss mse: 0.0072, Train Loss ce: 0.0000, Train Steps/Sec: 0.15,
|
| 2684 |
-
base_dir is /dev/shm/models/checkpoints_vlm_gym_match_move_fix3_unit_one_image_lr2e_5_mse_only_ins/eval_used_rows, step_tag is vlm_gym_match_move_fix3_unit_one_img_lr2e_5_mse_only_ins_step2500
|
| 2685 |
-
Preparing Dataset vlm_gym_match_move_fix3_unit_mse_loss_only_evalonce/vlm_gym_match_move_fix3_unit_val
|
| 2686 |
-
[eval debug] first 3 batch fingerprints:
|
| 2687 |
-
fp[0]: [{'data_indexes': [0], 'worker_id': 0, 'dataset_name': 'vlm_gym_match_move_fix3_unit_mse_loss_only_evalonce'}]
|
| 2688 |
-
fp[1]: [{'data_indexes': [8], 'worker_id': 0, 'dataset_name': 'vlm_gym_match_move_fix3_unit_mse_loss_only_evalonce'}]
|
| 2689 |
-
fp[2]: [{'data_indexes': [16], 'worker_id': 0, 'dataset_name': 'vlm_gym_match_move_fix3_unit_mse_loss_only_evalonce'}]
|
| 2690 |
-
ce_avg: 0.0, mse_avg: 0.008206211030483246
|
| 2691 |
-
base_dir is /dev/shm/models/checkpoints_vlm_gym_match_move_fix3_unit_one_image_lr2e_5_mse_only_ins/eval_used_rows, step_tag is vlm_gym_match_move_fix3_unit_one_img_lr2e_5_mse_only_ins_step3000
|
| 2692 |
-
Preparing Dataset vlm_gym_match_move_fix3_unit_mse_loss_only_evalonce/vlm_gym_match_move_fix3_unit_val
|
| 2693 |
-
[eval debug] first 3 batch fingerprints:
|
| 2694 |
-
fp[0]: [{'data_indexes': [0], 'worker_id': 0, 'dataset_name': 'vlm_gym_match_move_fix3_unit_mse_loss_only_evalonce'}]
|
| 2695 |
-
fp[1]: [{'data_indexes': [8], 'worker_id': 0, 'dataset_name': 'vlm_gym_match_move_fix3_unit_mse_loss_only_evalonce'}]
|
| 2696 |
-
fp[2]: [{'data_indexes': [16], 'worker_id': 0, 'dataset_name': 'vlm_gym_match_move_fix3_unit_mse_loss_only_evalonce'}]
|
| 2697 |
-
ce_avg: 0.0, mse_avg: 0.008431533351540565
|
| 2698 |
-
base_dir is /dev/shm/models/checkpoints_vlm_gym_match_move_fix3_unit_one_image_lr2e_5_mse_only_ins/eval_used_rows, step_tag is vlm_gym_match_move_fix3_unit_one_img_lr2e_5_mse_only_ins_step3500
|
| 2699 |
-
Preparing Dataset vlm_gym_match_move_fix3_unit_mse_loss_only_evalonce/vlm_gym_match_move_fix3_unit_val
|
| 2700 |
-
[eval debug] first 3 batch fingerprints:
|
| 2701 |
-
fp[0]: [{'data_indexes': [0], 'worker_id': 0, 'dataset_name': 'vlm_gym_match_move_fix3_unit_mse_loss_only_evalonce'}]
|
| 2702 |
-
fp[1]: [{'data_indexes': [8], 'worker_id': 0, 'dataset_name': 'vlm_gym_match_move_fix3_unit_mse_loss_only_evalonce'}]
|
| 2703 |
-
fp[2]: [{'data_indexes': [16], 'worker_id': 0, 'dataset_name': 'vlm_gym_match_move_fix3_unit_mse_loss_only_evalonce'}]
|
| 2704 |
-
ce_avg: 0.0, mse_avg: 0.0084471320733428
|
| 2705 |
[[34m2026-01-28 10:02:35[39m] (step=0002466) Train Loss mse: 0.0070, Train Loss ce: 0.0000, Train Steps/Sec: 0.15,
|
| 2706 |
[[34m2026-01-28 10:02:42[39m] (step=0002467) Train Loss mse: 0.0078, Train Loss ce: 0.0000, Train Steps/Sec: 0.15,
|
| 2707 |
[[34m2026-01-28 10:02:48[39m] (step=0002468) Train Loss mse: 0.0063, Train Loss ce: 0.0000, Train Steps/Sec: 0.16,
|
|
@@ -3615,6 +3608,27 @@ ce_avg: 0.0, mse_avg: 0.0084471320733428
|
|
| 3615 |
[[34m2026-01-28 11:41:24[39m] (step=0003376) Train Loss mse: 0.0065, Train Loss ce: 0.0000, Train Steps/Sec: 0.15,
|
| 3616 |
[[34m2026-01-28 11:41:31[39m] (step=0003377) Train Loss mse: 0.0067, Train Loss ce: 0.0000, Train Steps/Sec: 0.16,
|
| 3617 |
[[34m2026-01-28 11:41:37[39m] (step=0003378) Train Loss mse: 0.0068, Train Loss ce: 0.0000, Train Steps/Sec: 0.16,
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 3618 |
[[34m2026-01-28 11:41:44[39m] (step=0003379) Train Loss mse: 0.0061, Train Loss ce: 0.0000, Train Steps/Sec: 0.15,
|
| 3619 |
[[34m2026-01-28 11:41:50[39m] (step=0003380) Train Loss mse: 0.0074, Train Loss ce: 0.0000, Train Steps/Sec: 0.16,
|
| 3620 |
[[34m2026-01-28 11:41:57[39m] (step=0003381) Train Loss mse: 0.0073, Train Loss ce: 0.0000, Train Steps/Sec: 0.15,
|
|
@@ -3669,20 +3683,6 @@ ce_avg: 0.0, mse_avg: 0.0084471320733428
|
|
| 3669 |
[[34m2026-01-28 11:47:14[39m] (step=0003430) Train Loss mse: 0.0073, Train Loss ce: 0.0000, Train Steps/Sec: 0.15,
|
| 3670 |
[[34m2026-01-28 11:47:21[39m] (step=0003431) Train Loss mse: 0.0062, Train Loss ce: 0.0000, Train Steps/Sec: 0.15,
|
| 3671 |
[[34m2026-01-28 11:47:27[39m] (step=0003432) Train Loss mse: 0.0065, Train Loss ce: 0.0000, Train Steps/Sec: 0.16,
|
| 3672 |
-
base_dir is /dev/shm/models/checkpoints_vlm_gym_match_move_fix3_unit_one_image_lr2e_5_mse_only_ins/eval_used_rows, step_tag is vlm_gym_match_move_fix3_unit_one_img_lr2e_5_mse_only_ins_step4000
|
| 3673 |
-
Preparing Dataset vlm_gym_match_move_fix3_unit_mse_loss_only_evalonce/vlm_gym_match_move_fix3_unit_val
|
| 3674 |
-
[eval debug] first 3 batch fingerprints:
|
| 3675 |
-
fp[0]: [{'data_indexes': [0], 'worker_id': 0, 'dataset_name': 'vlm_gym_match_move_fix3_unit_mse_loss_only_evalonce'}]
|
| 3676 |
-
fp[1]: [{'data_indexes': [8], 'worker_id': 0, 'dataset_name': 'vlm_gym_match_move_fix3_unit_mse_loss_only_evalonce'}]
|
| 3677 |
-
fp[2]: [{'data_indexes': [16], 'worker_id': 0, 'dataset_name': 'vlm_gym_match_move_fix3_unit_mse_loss_only_evalonce'}]
|
| 3678 |
-
ce_avg: 0.0, mse_avg: 0.008800854906439781
|
| 3679 |
-
base_dir is /dev/shm/models/checkpoints_vlm_gym_match_move_fix3_unit_one_image_lr2e_5_mse_only_ins/eval_used_rows, step_tag is vlm_gym_match_move_fix3_unit_one_img_lr2e_5_mse_only_ins_step4500
|
| 3680 |
-
Preparing Dataset vlm_gym_match_move_fix3_unit_mse_loss_only_evalonce/vlm_gym_match_move_fix3_unit_val
|
| 3681 |
-
[eval debug] first 3 batch fingerprints:
|
| 3682 |
-
fp[0]: [{'data_indexes': [0], 'worker_id': 0, 'dataset_name': 'vlm_gym_match_move_fix3_unit_mse_loss_only_evalonce'}]
|
| 3683 |
-
fp[1]: [{'data_indexes': [8], 'worker_id': 0, 'dataset_name': 'vlm_gym_match_move_fix3_unit_mse_loss_only_evalonce'}]
|
| 3684 |
-
fp[2]: [{'data_indexes': [16], 'worker_id': 0, 'dataset_name': 'vlm_gym_match_move_fix3_unit_mse_loss_only_evalonce'}]
|
| 3685 |
-
ce_avg: 0.0, mse_avg: 0.009047330357134342
|
| 3686 |
[[34m2026-01-28 11:47:34[39m] (step=0003433) Train Loss mse: 0.0069, Train Loss ce: 0.0000, Train Steps/Sec: 0.15,
|
| 3687 |
[[34m2026-01-28 11:47:40[39m] (step=0003434) Train Loss mse: 0.0067, Train Loss ce: 0.0000, Train Steps/Sec: 0.16,
|
| 3688 |
[[34m2026-01-28 11:47:47[39m] (step=0003435) Train Loss mse: 0.0068, Train Loss ce: 0.0000, Train Steps/Sec: 0.16,
|
|
@@ -5084,6 +5084,13 @@ ce_avg: 0.0, mse_avg: 0.009047330357134342
|
|
| 5084 |
[[34m2026-01-28 14:19:22[39m] (step=0004831) Train Loss mse: 0.0069, Train Loss ce: 0.0000, Train Steps/Sec: 0.14,
|
| 5085 |
[[34m2026-01-28 14:19:28[39m] (step=0004832) Train Loss mse: 0.0069, Train Loss ce: 0.0000, Train Steps/Sec: 0.16,
|
| 5086 |
[[34m2026-01-28 14:19:35[39m] (step=0004833) Train Loss mse: 0.0065, Train Loss ce: 0.0000, Train Steps/Sec: 0.15,
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 5087 |
[[34m2026-01-28 14:19:41[39m] (step=0004834) Train Loss mse: 0.0078, Train Loss ce: 0.0000, Train Steps/Sec: 0.15,
|
| 5088 |
[[34m2026-01-28 14:19:48[39m] (step=0004835) Train Loss mse: 0.0075, Train Loss ce: 0.0000, Train Steps/Sec: 0.15,
|
| 5089 |
[[34m2026-01-28 14:19:54[39m] (step=0004836) Train Loss mse: 0.0072, Train Loss ce: 0.0000, Train Steps/Sec: 0.15,
|
|
@@ -5192,13 +5199,6 @@ ce_avg: 0.0, mse_avg: 0.009047330357134342
|
|
| 5192 |
[[34m2026-01-28 14:31:03[39m] (step=0004939) Train Loss mse: 0.0076, Train Loss ce: 0.0000, Train Steps/Sec: 0.16,
|
| 5193 |
[[34m2026-01-28 14:31:09[39m] (step=0004940) Train Loss mse: 0.0101, Train Loss ce: 0.0000, Train Steps/Sec: 0.16,
|
| 5194 |
[[34m2026-01-28 14:31:16[39m] (step=0004941) Train Loss mse: 0.0061, Train Loss ce: 0.0000, Train Steps/Sec: 0.15,
|
| 5195 |
-
base_dir is /dev/shm/models/checkpoints_vlm_gym_match_move_fix3_unit_one_image_lr2e_5_mse_only_ins/eval_used_rows, step_tag is vlm_gym_match_move_fix3_unit_one_img_lr2e_5_mse_only_ins_step5000
|
| 5196 |
-
Preparing Dataset vlm_gym_match_move_fix3_unit_mse_loss_only_evalonce/vlm_gym_match_move_fix3_unit_val
|
| 5197 |
-
[eval debug] first 3 batch fingerprints:
|
| 5198 |
-
fp[0]: [{'data_indexes': [0], 'worker_id': 0, 'dataset_name': 'vlm_gym_match_move_fix3_unit_mse_loss_only_evalonce'}]
|
| 5199 |
-
fp[1]: [{'data_indexes': [8], 'worker_id': 0, 'dataset_name': 'vlm_gym_match_move_fix3_unit_mse_loss_only_evalonce'}]
|
| 5200 |
-
fp[2]: [{'data_indexes': [16], 'worker_id': 0, 'dataset_name': 'vlm_gym_match_move_fix3_unit_mse_loss_only_evalonce'}]
|
| 5201 |
-
ce_avg: 0.0, mse_avg: 0.008728216402232647
|
| 5202 |
[[34m2026-01-28 14:31:22[39m] (step=0004942) Train Loss mse: 0.0067, Train Loss ce: 0.0000, Train Steps/Sec: 0.15,
|
| 5203 |
[[34m2026-01-28 14:31:29[39m] (step=0004943) Train Loss mse: 0.0067, Train Loss ce: 0.0000, Train Steps/Sec: 0.15,
|
| 5204 |
[[34m2026-01-28 14:31:35[39m] (step=0004944) Train Loss mse: 0.0067, Train Loss ce: 0.0000, Train Steps/Sec: 0.16,
|
|
|
|
| 184 |
fp[1]: [{'data_indexes': [8], 'worker_id': 0, 'dataset_name': 'vlm_gym_match_move_fix3_unit_mse_loss_only_evalonce'}]
|
| 185 |
fp[2]: [{'data_indexes': [16], 'worker_id': 0, 'dataset_name': 'vlm_gym_match_move_fix3_unit_mse_loss_only_evalonce'}]
|
| 186 |
ce_avg: 0.0, mse_avg: 0.007629983127117157
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 187 |
wandb: Detected [huggingface_hub.inference] in use.
|
| 188 |
wandb: Use W&B Weave for improved LLM call tracing. Install Weave with `pip install weave` then add `import weave` to the top of your script.
|
| 189 |
wandb: For more information, check out the docs at: https://weave-docs.wandb.ai/
|
|
|
|
| 1228 |
[[34m2026-01-28 07:27:28[39m] (step=0001031) Train Loss mse: 0.0077, Train Loss ce: 0.0000, Train Steps/Sec: 0.16,
|
| 1229 |
[[34m2026-01-28 07:27:34[39m] (step=0001032) Train Loss mse: 0.0074, Train Loss ce: 0.0000, Train Steps/Sec: 0.16,
|
| 1230 |
[[34m2026-01-28 07:27:40[39m] (step=0001033) Train Loss mse: 0.0070, Train Loss ce: 0.0000, Train Steps/Sec: 0.15,
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1231 |
[[34m2026-01-28 07:27:47[39m] (step=0001034) Train Loss mse: 0.0078, Train Loss ce: 0.0000, Train Steps/Sec: 0.16,
|
| 1232 |
[[34m2026-01-28 07:27:53[39m] (step=0001035) Train Loss mse: 0.0087, Train Loss ce: 0.0000, Train Steps/Sec: 0.16,
|
| 1233 |
[[34m2026-01-28 07:28:00[39m] (step=0001036) Train Loss mse: 0.0074, Train Loss ce: 0.0000, Train Steps/Sec: 0.16,
|
|
|
|
| 1247 |
[[34m2026-01-28 07:29:29[39m] (step=0001050) Train Loss mse: 0.0083, Train Loss ce: 0.0000, Train Steps/Sec: 0.15,
|
| 1248 |
[[34m2026-01-28 07:29:36[39m] (step=0001051) Train Loss mse: 0.0079, Train Loss ce: 0.0000, Train Steps/Sec: 0.15,
|
| 1249 |
[[34m2026-01-28 07:29:42[39m] (step=0001052) Train Loss mse: 0.0070, Train Loss ce: 0.0000, Train Steps/Sec: 0.16,
|
| 1250 |
+
base_dir is /dev/shm/models/checkpoints_vlm_gym_match_move_fix3_unit_one_image_lr2e_5_mse_only_ins/eval_used_rows, step_tag is vlm_gym_match_move_fix3_unit_one_img_lr2e_5_mse_only_ins_step1000
|
| 1251 |
+
Preparing Dataset vlm_gym_match_move_fix3_unit_mse_loss_only_evalonce/vlm_gym_match_move_fix3_unit_val
|
| 1252 |
+
[eval debug] first 3 batch fingerprints:
|
| 1253 |
+
fp[0]: [{'data_indexes': [0], 'worker_id': 0, 'dataset_name': 'vlm_gym_match_move_fix3_unit_mse_loss_only_evalonce'}]
|
| 1254 |
+
fp[1]: [{'data_indexes': [8], 'worker_id': 0, 'dataset_name': 'vlm_gym_match_move_fix3_unit_mse_loss_only_evalonce'}]
|
| 1255 |
+
fp[2]: [{'data_indexes': [16], 'worker_id': 0, 'dataset_name': 'vlm_gym_match_move_fix3_unit_mse_loss_only_evalonce'}]
|
| 1256 |
+
ce_avg: 0.0, mse_avg: 0.007755194790661335
|
| 1257 |
+
base_dir is /dev/shm/models/checkpoints_vlm_gym_match_move_fix3_unit_one_image_lr2e_5_mse_only_ins/eval_used_rows, step_tag is vlm_gym_match_move_fix3_unit_one_img_lr2e_5_mse_only_ins_step1500
|
| 1258 |
+
Preparing Dataset vlm_gym_match_move_fix3_unit_mse_loss_only_evalonce/vlm_gym_match_move_fix3_unit_val
|
| 1259 |
+
[eval debug] first 3 batch fingerprints:
|
| 1260 |
+
fp[0]: [{'data_indexes': [0], 'worker_id': 0, 'dataset_name': 'vlm_gym_match_move_fix3_unit_mse_loss_only_evalonce'}]
|
| 1261 |
+
fp[1]: [{'data_indexes': [8], 'worker_id': 0, 'dataset_name': 'vlm_gym_match_move_fix3_unit_mse_loss_only_evalonce'}]
|
| 1262 |
+
fp[2]: [{'data_indexes': [16], 'worker_id': 0, 'dataset_name': 'vlm_gym_match_move_fix3_unit_mse_loss_only_evalonce'}]
|
| 1263 |
+
ce_avg: 0.0, mse_avg: 0.00788091029971838
|
| 1264 |
+
base_dir is /dev/shm/models/checkpoints_vlm_gym_match_move_fix3_unit_one_image_lr2e_5_mse_only_ins/eval_used_rows, step_tag is vlm_gym_match_move_fix3_unit_one_img_lr2e_5_mse_only_ins_step2000
|
| 1265 |
+
Preparing Dataset vlm_gym_match_move_fix3_unit_mse_loss_only_evalonce/vlm_gym_match_move_fix3_unit_val
|
| 1266 |
+
[eval debug] first 3 batch fingerprints:
|
| 1267 |
+
fp[0]: [{'data_indexes': [0], 'worker_id': 0, 'dataset_name': 'vlm_gym_match_move_fix3_unit_mse_loss_only_evalonce'}]
|
| 1268 |
+
fp[1]: [{'data_indexes': [8], 'worker_id': 0, 'dataset_name': 'vlm_gym_match_move_fix3_unit_mse_loss_only_evalonce'}]
|
| 1269 |
+
fp[2]: [{'data_indexes': [16], 'worker_id': 0, 'dataset_name': 'vlm_gym_match_move_fix3_unit_mse_loss_only_evalonce'}]
|
| 1270 |
+
ce_avg: 0.0, mse_avg: 0.008042296394705772
|
| 1271 |
[[34m2026-01-28 07:29:49[39m] (step=0001053) Train Loss mse: 0.0081, Train Loss ce: 0.0000, Train Steps/Sec: 0.16,
|
| 1272 |
[[34m2026-01-28 07:29:55[39m] (step=0001054) Train Loss mse: 0.0078, Train Loss ce: 0.0000, Train Steps/Sec: 0.16,
|
| 1273 |
[[34m2026-01-28 07:30:01[39m] (step=0001055) Train Loss mse: 0.0073, Train Loss ce: 0.0000, Train Steps/Sec: 0.16,
|
|
|
|
| 2645 |
[[34m2026-01-28 09:58:23[39m] (step=0002427) Train Loss mse: 0.0073, Train Loss ce: 0.0000, Train Steps/Sec: 0.16,
|
| 2646 |
[[34m2026-01-28 09:58:30[39m] (step=0002428) Train Loss mse: 0.0070, Train Loss ce: 0.0000, Train Steps/Sec: 0.15,
|
| 2647 |
[[34m2026-01-28 09:58:36[39m] (step=0002429) Train Loss mse: 0.0078, Train Loss ce: 0.0000, Train Steps/Sec: 0.16,
|
| 2648 |
+
base_dir is /dev/shm/models/checkpoints_vlm_gym_match_move_fix3_unit_one_image_lr2e_5_mse_only_ins/eval_used_rows, step_tag is vlm_gym_match_move_fix3_unit_one_img_lr2e_5_mse_only_ins_step2500
|
| 2649 |
+
Preparing Dataset vlm_gym_match_move_fix3_unit_mse_loss_only_evalonce/vlm_gym_match_move_fix3_unit_val
|
| 2650 |
+
[eval debug] first 3 batch fingerprints:
|
| 2651 |
+
fp[0]: [{'data_indexes': [0], 'worker_id': 0, 'dataset_name': 'vlm_gym_match_move_fix3_unit_mse_loss_only_evalonce'}]
|
| 2652 |
+
fp[1]: [{'data_indexes': [8], 'worker_id': 0, 'dataset_name': 'vlm_gym_match_move_fix3_unit_mse_loss_only_evalonce'}]
|
| 2653 |
+
fp[2]: [{'data_indexes': [16], 'worker_id': 0, 'dataset_name': 'vlm_gym_match_move_fix3_unit_mse_loss_only_evalonce'}]
|
| 2654 |
+
ce_avg: 0.0, mse_avg: 0.008206211030483246
|
| 2655 |
+
base_dir is /dev/shm/models/checkpoints_vlm_gym_match_move_fix3_unit_one_image_lr2e_5_mse_only_ins/eval_used_rows, step_tag is vlm_gym_match_move_fix3_unit_one_img_lr2e_5_mse_only_ins_step3000
|
| 2656 |
+
Preparing Dataset vlm_gym_match_move_fix3_unit_mse_loss_only_evalonce/vlm_gym_match_move_fix3_unit_val
|
| 2657 |
+
[eval debug] first 3 batch fingerprints:
|
| 2658 |
+
fp[0]: [{'data_indexes': [0], 'worker_id': 0, 'dataset_name': 'vlm_gym_match_move_fix3_unit_mse_loss_only_evalonce'}]
|
| 2659 |
+
fp[1]: [{'data_indexes': [8], 'worker_id': 0, 'dataset_name': 'vlm_gym_match_move_fix3_unit_mse_loss_only_evalonce'}]
|
| 2660 |
+
fp[2]: [{'data_indexes': [16], 'worker_id': 0, 'dataset_name': 'vlm_gym_match_move_fix3_unit_mse_loss_only_evalonce'}]
|
| 2661 |
+
ce_avg: 0.0, mse_avg: 0.008431533351540565
|
| 2662 |
[[34m2026-01-28 09:58:42[39m] (step=0002430) Train Loss mse: 0.0063, Train Loss ce: 0.0000, Train Steps/Sec: 0.16,
|
| 2663 |
[[34m2026-01-28 09:58:49[39m] (step=0002431) Train Loss mse: 0.0073, Train Loss ce: 0.0000, Train Steps/Sec: 0.15,
|
| 2664 |
[[34m2026-01-28 09:58:56[39m] (step=0002432) Train Loss mse: 0.0072, Train Loss ce: 0.0000, Train Steps/Sec: 0.14,
|
|
|
|
| 2695 |
[[34m2026-01-28 10:02:15[39m] (step=0002463) Train Loss mse: 0.0075, Train Loss ce: 0.0000, Train Steps/Sec: 0.16,
|
| 2696 |
[[34m2026-01-28 10:02:22[39m] (step=0002464) Train Loss mse: 0.0084, Train Loss ce: 0.0000, Train Steps/Sec: 0.16,
|
| 2697 |
[[34m2026-01-28 10:02:28[39m] (step=0002465) Train Loss mse: 0.0072, Train Loss ce: 0.0000, Train Steps/Sec: 0.15,
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 2698 |
[[34m2026-01-28 10:02:35[39m] (step=0002466) Train Loss mse: 0.0070, Train Loss ce: 0.0000, Train Steps/Sec: 0.15,
|
| 2699 |
[[34m2026-01-28 10:02:42[39m] (step=0002467) Train Loss mse: 0.0078, Train Loss ce: 0.0000, Train Steps/Sec: 0.15,
|
| 2700 |
[[34m2026-01-28 10:02:48[39m] (step=0002468) Train Loss mse: 0.0063, Train Loss ce: 0.0000, Train Steps/Sec: 0.16,
|
|
|
|
| 3608 |
[[34m2026-01-28 11:41:24[39m] (step=0003376) Train Loss mse: 0.0065, Train Loss ce: 0.0000, Train Steps/Sec: 0.15,
|
| 3609 |
[[34m2026-01-28 11:41:31[39m] (step=0003377) Train Loss mse: 0.0067, Train Loss ce: 0.0000, Train Steps/Sec: 0.16,
|
| 3610 |
[[34m2026-01-28 11:41:37[39m] (step=0003378) Train Loss mse: 0.0068, Train Loss ce: 0.0000, Train Steps/Sec: 0.16,
|
| 3611 |
+
base_dir is /dev/shm/models/checkpoints_vlm_gym_match_move_fix3_unit_one_image_lr2e_5_mse_only_ins/eval_used_rows, step_tag is vlm_gym_match_move_fix3_unit_one_img_lr2e_5_mse_only_ins_step3500
|
| 3612 |
+
Preparing Dataset vlm_gym_match_move_fix3_unit_mse_loss_only_evalonce/vlm_gym_match_move_fix3_unit_val
|
| 3613 |
+
[eval debug] first 3 batch fingerprints:
|
| 3614 |
+
fp[0]: [{'data_indexes': [0], 'worker_id': 0, 'dataset_name': 'vlm_gym_match_move_fix3_unit_mse_loss_only_evalonce'}]
|
| 3615 |
+
fp[1]: [{'data_indexes': [8], 'worker_id': 0, 'dataset_name': 'vlm_gym_match_move_fix3_unit_mse_loss_only_evalonce'}]
|
| 3616 |
+
fp[2]: [{'data_indexes': [16], 'worker_id': 0, 'dataset_name': 'vlm_gym_match_move_fix3_unit_mse_loss_only_evalonce'}]
|
| 3617 |
+
ce_avg: 0.0, mse_avg: 0.0084471320733428
|
| 3618 |
+
base_dir is /dev/shm/models/checkpoints_vlm_gym_match_move_fix3_unit_one_image_lr2e_5_mse_only_ins/eval_used_rows, step_tag is vlm_gym_match_move_fix3_unit_one_img_lr2e_5_mse_only_ins_step4000
|
| 3619 |
+
Preparing Dataset vlm_gym_match_move_fix3_unit_mse_loss_only_evalonce/vlm_gym_match_move_fix3_unit_val
|
| 3620 |
+
[eval debug] first 3 batch fingerprints:
|
| 3621 |
+
fp[0]: [{'data_indexes': [0], 'worker_id': 0, 'dataset_name': 'vlm_gym_match_move_fix3_unit_mse_loss_only_evalonce'}]
|
| 3622 |
+
fp[1]: [{'data_indexes': [8], 'worker_id': 0, 'dataset_name': 'vlm_gym_match_move_fix3_unit_mse_loss_only_evalonce'}]
|
| 3623 |
+
fp[2]: [{'data_indexes': [16], 'worker_id': 0, 'dataset_name': 'vlm_gym_match_move_fix3_unit_mse_loss_only_evalonce'}]
|
| 3624 |
+
ce_avg: 0.0, mse_avg: 0.008800854906439781
|
| 3625 |
+
base_dir is /dev/shm/models/checkpoints_vlm_gym_match_move_fix3_unit_one_image_lr2e_5_mse_only_ins/eval_used_rows, step_tag is vlm_gym_match_move_fix3_unit_one_img_lr2e_5_mse_only_ins_step4500
|
| 3626 |
+
Preparing Dataset vlm_gym_match_move_fix3_unit_mse_loss_only_evalonce/vlm_gym_match_move_fix3_unit_val
|
| 3627 |
+
[eval debug] first 3 batch fingerprints:
|
| 3628 |
+
fp[0]: [{'data_indexes': [0], 'worker_id': 0, 'dataset_name': 'vlm_gym_match_move_fix3_unit_mse_loss_only_evalonce'}]
|
| 3629 |
+
fp[1]: [{'data_indexes': [8], 'worker_id': 0, 'dataset_name': 'vlm_gym_match_move_fix3_unit_mse_loss_only_evalonce'}]
|
| 3630 |
+
fp[2]: [{'data_indexes': [16], 'worker_id': 0, 'dataset_name': 'vlm_gym_match_move_fix3_unit_mse_loss_only_evalonce'}]
|
| 3631 |
+
ce_avg: 0.0, mse_avg: 0.009047330357134342
|
| 3632 |
[[34m2026-01-28 11:41:44[39m] (step=0003379) Train Loss mse: 0.0061, Train Loss ce: 0.0000, Train Steps/Sec: 0.15,
|
| 3633 |
[[34m2026-01-28 11:41:50[39m] (step=0003380) Train Loss mse: 0.0074, Train Loss ce: 0.0000, Train Steps/Sec: 0.16,
|
| 3634 |
[[34m2026-01-28 11:41:57[39m] (step=0003381) Train Loss mse: 0.0073, Train Loss ce: 0.0000, Train Steps/Sec: 0.15,
|
|
|
|
| 3683 |
[[34m2026-01-28 11:47:14[39m] (step=0003430) Train Loss mse: 0.0073, Train Loss ce: 0.0000, Train Steps/Sec: 0.15,
|
| 3684 |
[[34m2026-01-28 11:47:21[39m] (step=0003431) Train Loss mse: 0.0062, Train Loss ce: 0.0000, Train Steps/Sec: 0.15,
|
| 3685 |
[[34m2026-01-28 11:47:27[39m] (step=0003432) Train Loss mse: 0.0065, Train Loss ce: 0.0000, Train Steps/Sec: 0.16,
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 3686 |
[[34m2026-01-28 11:47:34[39m] (step=0003433) Train Loss mse: 0.0069, Train Loss ce: 0.0000, Train Steps/Sec: 0.15,
|
| 3687 |
[[34m2026-01-28 11:47:40[39m] (step=0003434) Train Loss mse: 0.0067, Train Loss ce: 0.0000, Train Steps/Sec: 0.16,
|
| 3688 |
[[34m2026-01-28 11:47:47[39m] (step=0003435) Train Loss mse: 0.0068, Train Loss ce: 0.0000, Train Steps/Sec: 0.16,
|
|
|
|
| 5084 |
[[34m2026-01-28 14:19:22[39m] (step=0004831) Train Loss mse: 0.0069, Train Loss ce: 0.0000, Train Steps/Sec: 0.14,
|
| 5085 |
[[34m2026-01-28 14:19:28[39m] (step=0004832) Train Loss mse: 0.0069, Train Loss ce: 0.0000, Train Steps/Sec: 0.16,
|
| 5086 |
[[34m2026-01-28 14:19:35[39m] (step=0004833) Train Loss mse: 0.0065, Train Loss ce: 0.0000, Train Steps/Sec: 0.15,
|
| 5087 |
+
base_dir is /dev/shm/models/checkpoints_vlm_gym_match_move_fix3_unit_one_image_lr2e_5_mse_only_ins/eval_used_rows, step_tag is vlm_gym_match_move_fix3_unit_one_img_lr2e_5_mse_only_ins_step5000
|
| 5088 |
+
Preparing Dataset vlm_gym_match_move_fix3_unit_mse_loss_only_evalonce/vlm_gym_match_move_fix3_unit_val
|
| 5089 |
+
[eval debug] first 3 batch fingerprints:
|
| 5090 |
+
fp[0]: [{'data_indexes': [0], 'worker_id': 0, 'dataset_name': 'vlm_gym_match_move_fix3_unit_mse_loss_only_evalonce'}]
|
| 5091 |
+
fp[1]: [{'data_indexes': [8], 'worker_id': 0, 'dataset_name': 'vlm_gym_match_move_fix3_unit_mse_loss_only_evalonce'}]
|
| 5092 |
+
fp[2]: [{'data_indexes': [16], 'worker_id': 0, 'dataset_name': 'vlm_gym_match_move_fix3_unit_mse_loss_only_evalonce'}]
|
| 5093 |
+
ce_avg: 0.0, mse_avg: 0.008728216402232647
|
| 5094 |
[[34m2026-01-28 14:19:41[39m] (step=0004834) Train Loss mse: 0.0078, Train Loss ce: 0.0000, Train Steps/Sec: 0.15,
|
| 5095 |
[[34m2026-01-28 14:19:48[39m] (step=0004835) Train Loss mse: 0.0075, Train Loss ce: 0.0000, Train Steps/Sec: 0.15,
|
| 5096 |
[[34m2026-01-28 14:19:54[39m] (step=0004836) Train Loss mse: 0.0072, Train Loss ce: 0.0000, Train Steps/Sec: 0.15,
|
|
|
|
| 5199 |
[[34m2026-01-28 14:31:03[39m] (step=0004939) Train Loss mse: 0.0076, Train Loss ce: 0.0000, Train Steps/Sec: 0.16,
|
| 5200 |
[[34m2026-01-28 14:31:09[39m] (step=0004940) Train Loss mse: 0.0101, Train Loss ce: 0.0000, Train Steps/Sec: 0.16,
|
| 5201 |
[[34m2026-01-28 14:31:16[39m] (step=0004941) Train Loss mse: 0.0061, Train Loss ce: 0.0000, Train Steps/Sec: 0.15,
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 5202 |
[[34m2026-01-28 14:31:22[39m] (step=0004942) Train Loss mse: 0.0067, Train Loss ce: 0.0000, Train Steps/Sec: 0.15,
|
| 5203 |
[[34m2026-01-28 14:31:29[39m] (step=0004943) Train Loss mse: 0.0067, Train Loss ce: 0.0000, Train Steps/Sec: 0.15,
|
| 5204 |
[[34m2026-01-28 14:31:35[39m] (step=0004944) Train Loss mse: 0.0067, Train Loss ce: 0.0000, Train Steps/Sec: 0.16,
|