diff --git "a/fhn/gridsearch_01-29-1048/logging/train.log" "b/fhn/gridsearch_01-29-1048/logging/train.log" new file mode 100644--- /dev/null +++ "b/fhn/gridsearch_01-29-1048/logging/train.log" @@ -0,0 +1,600 @@ +RANK_0 - 2026-01-29 10:48:34,450 - TRAIN-LOGGER - INFO - Epoch 201 - TRAIN - Minibatch 0: weight_norm_model: 143.882523 loss: 1.125552 grad_norm_before_clip: 11.607695 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 10:48:38,674 - TRAIN-LOGGER - INFO - Epoch 201 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.882523 weight_norm_u: 25.218954 loss: 1.125552 grad_norm_before_clip: 11.607695 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 10:48:38,675 - TRAIN-LOGGER - INFO - Epoch 201 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.882599 weight_norm_u: 25.222990 loss: 1.040020 +RANK_0 - 2026-01-29 10:48:52,986 - TRAIN-LOGGER - INFO - Epoch 202 - TRAIN - Minibatch 0: weight_norm_model: 143.882599 loss: 1.040020 grad_norm_before_clip: 14.621938 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 10:48:57,105 - TRAIN-LOGGER - INFO - Epoch 202 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.882599 weight_norm_u: 25.218954 loss: 1.040020 grad_norm_before_clip: 14.621938 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 10:48:57,105 - TRAIN-LOGGER - INFO - Epoch 202 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.882568 weight_norm_u: 25.222990 loss: 0.963503 +RANK_0 - 2026-01-29 10:49:10,658 - TRAIN-LOGGER - INFO - Epoch 203 - TRAIN - Minibatch 0: weight_norm_model: 143.882568 loss: 0.963503 grad_norm_before_clip: 24.243734 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 10:49:15,077 - TRAIN-LOGGER - INFO - Epoch 203 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.882568 weight_norm_u: 25.218954 loss: 0.963503 grad_norm_before_clip: 24.243734 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 10:49:15,077 - TRAIN-LOGGER - INFO - Epoch 203 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.882599 weight_norm_u: 25.222990 loss: 0.979025 +RANK_0 - 2026-01-29 10:49:27,975 - TRAIN-LOGGER - INFO - Epoch 204 - TRAIN - Minibatch 0: weight_norm_model: 143.882599 loss: 0.979025 grad_norm_before_clip: 15.363961 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 10:49:32,139 - TRAIN-LOGGER - INFO - Epoch 204 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.882599 weight_norm_u: 25.218954 loss: 0.979025 grad_norm_before_clip: 15.363961 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 10:49:32,139 - TRAIN-LOGGER - INFO - Epoch 204 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.882629 weight_norm_u: 25.222990 loss: 1.044125 +RANK_0 - 2026-01-29 10:49:44,980 - TRAIN-LOGGER - INFO - Epoch 205 - TRAIN - Minibatch 0: weight_norm_model: 143.882629 loss: 1.044125 grad_norm_before_clip: 45.537395 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 10:49:49,088 - TRAIN-LOGGER - INFO - Epoch 205 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.882629 weight_norm_u: 25.218954 loss: 1.044125 grad_norm_before_clip: 45.537395 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 10:49:49,089 - TRAIN-LOGGER - INFO - Epoch 205 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.882614 weight_norm_u: 25.222990 loss: 1.027321 +RANK_0 - 2026-01-29 10:50:02,339 - TRAIN-LOGGER - INFO - Epoch 206 - TRAIN - Minibatch 0: weight_norm_model: 143.882614 loss: 1.027321 grad_norm_before_clip: 45.602810 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 10:50:06,470 - TRAIN-LOGGER - INFO - Epoch 206 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.882614 weight_norm_u: 25.218954 loss: 1.027321 grad_norm_before_clip: 45.602810 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 10:50:06,470 - TRAIN-LOGGER - INFO - Epoch 206 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.882553 weight_norm_u: 25.222990 loss: 0.935387 +RANK_0 - 2026-01-29 10:50:19,951 - TRAIN-LOGGER - INFO - Epoch 207 - TRAIN - Minibatch 0: weight_norm_model: 143.882553 loss: 0.935387 grad_norm_before_clip: 16.925451 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 10:50:24,236 - TRAIN-LOGGER - INFO - Epoch 207 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.882553 weight_norm_u: 25.218954 loss: 0.935387 grad_norm_before_clip: 16.925451 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 10:50:24,236 - TRAIN-LOGGER - INFO - Epoch 207 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.882492 weight_norm_u: 25.222990 loss: 0.926938 +RANK_0 - 2026-01-29 10:50:37,658 - TRAIN-LOGGER - INFO - Epoch 208 - TRAIN - Minibatch 0: weight_norm_model: 143.882492 loss: 0.926938 grad_norm_before_clip: 31.694639 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 10:50:41,755 - TRAIN-LOGGER - INFO - Epoch 208 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.882492 weight_norm_u: 25.218954 loss: 0.926938 grad_norm_before_clip: 31.694639 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 10:50:41,755 - TRAIN-LOGGER - INFO - Epoch 208 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.882477 weight_norm_u: 25.222990 loss: 0.901878 +RANK_0 - 2026-01-29 10:51:00,706 - TRAIN-LOGGER - INFO - Epoch 209 - TRAIN - Minibatch 0: weight_norm_model: 143.882477 loss: 0.901878 grad_norm_before_clip: 19.180050 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 10:51:04,792 - TRAIN-LOGGER - INFO - Epoch 209 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.882477 weight_norm_u: 25.218954 loss: 0.901878 grad_norm_before_clip: 19.180050 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 10:51:04,792 - TRAIN-LOGGER - INFO - Epoch 209 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.882446 weight_norm_u: 25.222990 loss: 0.921683 +RANK_0 - 2026-01-29 10:51:17,979 - TRAIN-LOGGER - INFO - Epoch 210 - TRAIN - Minibatch 0: weight_norm_model: 143.882446 loss: 0.921683 grad_norm_before_clip: 48.855667 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 10:51:22,143 - TRAIN-LOGGER - INFO - Epoch 210 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.882446 weight_norm_u: 25.218954 loss: 0.921683 grad_norm_before_clip: 48.855667 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 10:51:22,143 - TRAIN-LOGGER - INFO - Epoch 210 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.882462 weight_norm_u: 25.222990 loss: 0.924406 +RANK_0 - 2026-01-29 10:51:35,506 - TRAIN-LOGGER - INFO - Epoch 211 - TRAIN - Minibatch 0: weight_norm_model: 143.882462 loss: 0.924406 grad_norm_before_clip: 18.627853 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 10:51:39,551 - TRAIN-LOGGER - INFO - Epoch 211 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.882462 weight_norm_u: 25.218954 loss: 0.924406 grad_norm_before_clip: 18.627853 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 10:51:39,551 - TRAIN-LOGGER - INFO - Epoch 211 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.882477 weight_norm_u: 25.222990 loss: 0.911341 +RANK_0 - 2026-01-29 10:51:52,863 - TRAIN-LOGGER - INFO - Epoch 212 - TRAIN - Minibatch 0: weight_norm_model: 143.882477 loss: 0.911341 grad_norm_before_clip: 22.007046 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 10:51:56,998 - TRAIN-LOGGER - INFO - Epoch 212 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.882477 weight_norm_u: 25.218954 loss: 0.911341 grad_norm_before_clip: 22.007046 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 10:51:56,998 - TRAIN-LOGGER - INFO - Epoch 212 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.882477 weight_norm_u: 25.222990 loss: 0.932676 +RANK_0 - 2026-01-29 10:52:09,757 - TRAIN-LOGGER - INFO - Epoch 213 - TRAIN - Minibatch 0: weight_norm_model: 143.882477 loss: 0.932676 grad_norm_before_clip: 57.545856 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 10:52:13,808 - TRAIN-LOGGER - INFO - Epoch 213 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.882477 weight_norm_u: 25.218954 loss: 0.932676 grad_norm_before_clip: 57.545856 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 10:52:13,808 - TRAIN-LOGGER - INFO - Epoch 213 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.882507 weight_norm_u: 25.222990 loss: 0.930281 +RANK_0 - 2026-01-29 10:52:26,557 - TRAIN-LOGGER - INFO - Epoch 214 - TRAIN - Minibatch 0: weight_norm_model: 143.882507 loss: 0.930281 grad_norm_before_clip: 28.967165 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 10:52:30,689 - TRAIN-LOGGER - INFO - Epoch 214 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.882507 weight_norm_u: 25.218954 loss: 0.930281 grad_norm_before_clip: 28.967165 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 10:52:30,689 - TRAIN-LOGGER - INFO - Epoch 214 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.882553 weight_norm_u: 25.222990 loss: 0.912449 +RANK_0 - 2026-01-29 10:52:43,622 - TRAIN-LOGGER - INFO - Epoch 215 - TRAIN - Minibatch 0: weight_norm_model: 143.882553 loss: 0.912449 grad_norm_before_clip: 39.331081 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 10:52:47,786 - TRAIN-LOGGER - INFO - Epoch 215 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.882553 weight_norm_u: 25.218954 loss: 0.912449 grad_norm_before_clip: 39.331081 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 10:52:47,786 - TRAIN-LOGGER - INFO - Epoch 215 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.882568 weight_norm_u: 25.222990 loss: 0.917241 +RANK_0 - 2026-01-29 10:53:00,639 - TRAIN-LOGGER - INFO - Epoch 216 - TRAIN - Minibatch 0: weight_norm_model: 143.882568 loss: 0.917241 grad_norm_before_clip: 20.128529 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 10:53:04,725 - TRAIN-LOGGER - INFO - Epoch 216 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.882568 weight_norm_u: 25.218954 loss: 0.917241 grad_norm_before_clip: 20.128529 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 10:53:04,725 - TRAIN-LOGGER - INFO - Epoch 216 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.882568 weight_norm_u: 25.222990 loss: 0.935518 +RANK_0 - 2026-01-29 10:53:17,936 - TRAIN-LOGGER - INFO - Epoch 217 - TRAIN - Minibatch 0: weight_norm_model: 143.882568 loss: 0.935518 grad_norm_before_clip: 44.704605 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 10:53:22,082 - TRAIN-LOGGER - INFO - Epoch 217 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.882568 weight_norm_u: 25.218954 loss: 0.935518 grad_norm_before_clip: 44.704605 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 10:53:22,082 - TRAIN-LOGGER - INFO - Epoch 217 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.882553 weight_norm_u: 25.222990 loss: 0.907812 +RANK_0 - 2026-01-29 10:53:35,304 - TRAIN-LOGGER - INFO - Epoch 218 - TRAIN - Minibatch 0: weight_norm_model: 143.882553 loss: 0.907812 grad_norm_before_clip: 37.666924 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 10:53:39,411 - TRAIN-LOGGER - INFO - Epoch 218 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.882553 weight_norm_u: 25.218954 loss: 0.907812 grad_norm_before_clip: 37.666924 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 10:53:39,411 - TRAIN-LOGGER - INFO - Epoch 218 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.882507 weight_norm_u: 25.222990 loss: 0.919289 +RANK_0 - 2026-01-29 10:53:52,213 - TRAIN-LOGGER - INFO - Epoch 219 - TRAIN - Minibatch 0: weight_norm_model: 143.882507 loss: 0.919289 grad_norm_before_clip: 30.263775 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 10:53:56,386 - TRAIN-LOGGER - INFO - Epoch 219 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.882507 weight_norm_u: 25.218954 loss: 0.919289 grad_norm_before_clip: 30.263775 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 10:53:56,386 - TRAIN-LOGGER - INFO - Epoch 219 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.882492 weight_norm_u: 25.222990 loss: 0.929701 +RANK_0 - 2026-01-29 10:54:09,206 - TRAIN-LOGGER - INFO - Epoch 220 - TRAIN - Minibatch 0: weight_norm_model: 143.882492 loss: 0.929701 grad_norm_before_clip: 41.672333 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 10:54:13,299 - TRAIN-LOGGER - INFO - Epoch 220 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.882492 weight_norm_u: 25.218954 loss: 0.929701 grad_norm_before_clip: 41.672333 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 10:54:13,299 - TRAIN-LOGGER - INFO - Epoch 220 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.882507 weight_norm_u: 25.222990 loss: 0.899525 +RANK_0 - 2026-01-29 10:54:26,351 - TRAIN-LOGGER - INFO - Epoch 221 - TRAIN - Minibatch 0: weight_norm_model: 143.882507 loss: 0.899525 grad_norm_before_clip: 38.734844 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 10:54:30,364 - TRAIN-LOGGER - INFO - Epoch 221 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.882507 weight_norm_u: 25.218954 loss: 0.899525 grad_norm_before_clip: 38.734844 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 10:54:30,364 - TRAIN-LOGGER - INFO - Epoch 221 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.882538 weight_norm_u: 25.222990 loss: 0.928052 +RANK_0 - 2026-01-29 10:54:43,358 - TRAIN-LOGGER - INFO - Epoch 222 - TRAIN - Minibatch 0: weight_norm_model: 143.882538 loss: 0.928052 grad_norm_before_clip: 25.778116 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 10:54:47,492 - TRAIN-LOGGER - INFO - Epoch 222 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.882538 weight_norm_u: 25.218954 loss: 0.928052 grad_norm_before_clip: 25.778116 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 10:54:47,493 - TRAIN-LOGGER - INFO - Epoch 222 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.882553 weight_norm_u: 25.222990 loss: 0.946282 +RANK_0 - 2026-01-29 10:55:00,427 - TRAIN-LOGGER - INFO - Epoch 223 - TRAIN - Minibatch 0: weight_norm_model: 143.882553 loss: 0.946282 grad_norm_before_clip: 32.167023 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 10:55:04,575 - TRAIN-LOGGER - INFO - Epoch 223 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.882553 weight_norm_u: 25.218954 loss: 0.946282 grad_norm_before_clip: 32.167023 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 10:55:04,575 - TRAIN-LOGGER - INFO - Epoch 223 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.882523 weight_norm_u: 25.222990 loss: 0.928573 +RANK_0 - 2026-01-29 10:55:17,281 - TRAIN-LOGGER - INFO - Epoch 224 - TRAIN - Minibatch 0: weight_norm_model: 143.882523 loss: 0.928573 grad_norm_before_clip: 16.788692 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 10:55:21,393 - TRAIN-LOGGER - INFO - Epoch 224 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.882523 weight_norm_u: 25.218954 loss: 0.928573 grad_norm_before_clip: 16.788692 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 10:55:21,394 - TRAIN-LOGGER - INFO - Epoch 224 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.882507 weight_norm_u: 25.222990 loss: 0.907201 +RANK_0 - 2026-01-29 10:55:34,670 - TRAIN-LOGGER - INFO - Epoch 225 - TRAIN - Minibatch 0: weight_norm_model: 143.882507 loss: 0.907201 grad_norm_before_clip: 17.725723 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 10:55:38,769 - TRAIN-LOGGER - INFO - Epoch 225 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.882507 weight_norm_u: 25.218954 loss: 0.907201 grad_norm_before_clip: 17.725723 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 10:55:38,769 - TRAIN-LOGGER - INFO - Epoch 225 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.882462 weight_norm_u: 25.222990 loss: 0.952927 +RANK_0 - 2026-01-29 10:55:51,864 - TRAIN-LOGGER - INFO - Epoch 226 - TRAIN - Minibatch 0: weight_norm_model: 143.882462 loss: 0.952927 grad_norm_before_clip: 52.117985 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 10:55:56,003 - TRAIN-LOGGER - INFO - Epoch 226 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.882462 weight_norm_u: 25.218954 loss: 0.952927 grad_norm_before_clip: 52.117985 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 10:55:56,004 - TRAIN-LOGGER - INFO - Epoch 226 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.882462 weight_norm_u: 25.222990 loss: 0.988180 +RANK_0 - 2026-01-29 10:56:08,874 - TRAIN-LOGGER - INFO - Epoch 227 - TRAIN - Minibatch 0: weight_norm_model: 143.882462 loss: 0.988180 grad_norm_before_clip: 50.623238 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 10:56:13,014 - TRAIN-LOGGER - INFO - Epoch 227 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.882462 weight_norm_u: 25.218954 loss: 0.988180 grad_norm_before_clip: 50.623238 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 10:56:13,014 - TRAIN-LOGGER - INFO - Epoch 227 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.882477 weight_norm_u: 25.222990 loss: 0.962141 +RANK_0 - 2026-01-29 10:56:25,873 - TRAIN-LOGGER - INFO - Epoch 228 - TRAIN - Minibatch 0: weight_norm_model: 143.882477 loss: 0.962141 grad_norm_before_clip: 50.571884 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 10:56:30,025 - TRAIN-LOGGER - INFO - Epoch 228 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.882477 weight_norm_u: 25.218954 loss: 0.962141 grad_norm_before_clip: 50.571884 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 10:56:30,025 - TRAIN-LOGGER - INFO - Epoch 228 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.882523 weight_norm_u: 25.222990 loss: 0.937215 +RANK_0 - 2026-01-29 10:56:43,348 - TRAIN-LOGGER - INFO - Epoch 229 - TRAIN - Minibatch 0: weight_norm_model: 143.882523 loss: 0.937215 grad_norm_before_clip: 25.280809 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 10:56:47,439 - TRAIN-LOGGER - INFO - Epoch 229 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.882523 weight_norm_u: 25.218954 loss: 0.937215 grad_norm_before_clip: 25.280809 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 10:56:47,439 - TRAIN-LOGGER - INFO - Epoch 229 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.882568 weight_norm_u: 25.222990 loss: 0.937442 +RANK_0 - 2026-01-29 10:57:00,778 - TRAIN-LOGGER - INFO - Epoch 230 - TRAIN - Minibatch 0: weight_norm_model: 143.882568 loss: 0.937442 grad_norm_before_clip: 44.134327 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 10:57:04,878 - TRAIN-LOGGER - INFO - Epoch 230 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.882568 weight_norm_u: 25.218954 loss: 0.937442 grad_norm_before_clip: 44.134327 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 10:57:04,878 - TRAIN-LOGGER - INFO - Epoch 230 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.882584 weight_norm_u: 25.222990 loss: 0.969348 +RANK_0 - 2026-01-29 10:57:17,656 - TRAIN-LOGGER - INFO - Epoch 231 - TRAIN - Minibatch 0: weight_norm_model: 143.882584 loss: 0.969348 grad_norm_before_clip: 49.672195 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 10:57:21,815 - TRAIN-LOGGER - INFO - Epoch 231 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.882584 weight_norm_u: 25.218954 loss: 0.969348 grad_norm_before_clip: 49.672195 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 10:57:21,815 - TRAIN-LOGGER - INFO - Epoch 231 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.882584 weight_norm_u: 25.222990 loss: 0.953721 +RANK_0 - 2026-01-29 10:57:35,100 - TRAIN-LOGGER - INFO - Epoch 232 - TRAIN - Minibatch 0: weight_norm_model: 143.882584 loss: 0.953721 grad_norm_before_clip: 43.711910 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 10:57:39,233 - TRAIN-LOGGER - INFO - Epoch 232 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.882584 weight_norm_u: 25.218954 loss: 0.953721 grad_norm_before_clip: 43.711910 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 10:57:39,233 - TRAIN-LOGGER - INFO - Epoch 232 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.882568 weight_norm_u: 25.222990 loss: 0.914219 +RANK_0 - 2026-01-29 10:57:52,440 - TRAIN-LOGGER - INFO - Epoch 233 - TRAIN - Minibatch 0: weight_norm_model: 143.882568 loss: 0.914219 grad_norm_before_clip: 18.598679 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 10:57:56,576 - TRAIN-LOGGER - INFO - Epoch 233 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.882568 weight_norm_u: 25.218954 loss: 0.914219 grad_norm_before_clip: 18.598679 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 10:57:56,577 - TRAIN-LOGGER - INFO - Epoch 233 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.882538 weight_norm_u: 25.222990 loss: 0.903693 +RANK_0 - 2026-01-29 10:58:09,454 - TRAIN-LOGGER - INFO - Epoch 234 - TRAIN - Minibatch 0: weight_norm_model: 143.882538 loss: 0.903693 grad_norm_before_clip: 19.656500 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 10:58:13,518 - TRAIN-LOGGER - INFO - Epoch 234 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.882538 weight_norm_u: 25.218954 loss: 0.903693 grad_norm_before_clip: 19.656500 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 10:58:13,518 - TRAIN-LOGGER - INFO - Epoch 234 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.882538 weight_norm_u: 25.222990 loss: 0.898336 +RANK_0 - 2026-01-29 10:58:26,760 - TRAIN-LOGGER - INFO - Epoch 235 - TRAIN - Minibatch 0: weight_norm_model: 143.882538 loss: 0.898336 grad_norm_before_clip: 37.744648 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 10:58:30,886 - TRAIN-LOGGER - INFO - Epoch 235 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.882538 weight_norm_u: 25.218954 loss: 0.898336 grad_norm_before_clip: 37.744648 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 10:58:30,886 - TRAIN-LOGGER - INFO - Epoch 235 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.882507 weight_norm_u: 25.222990 loss: 0.896203 +RANK_0 - 2026-01-29 10:58:44,102 - TRAIN-LOGGER - INFO - Epoch 236 - TRAIN - Minibatch 0: weight_norm_model: 143.882507 loss: 0.896203 grad_norm_before_clip: 18.335737 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 10:58:48,242 - TRAIN-LOGGER - INFO - Epoch 236 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.882507 weight_norm_u: 25.218954 loss: 0.896203 grad_norm_before_clip: 18.335737 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 10:58:48,242 - TRAIN-LOGGER - INFO - Epoch 236 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.882477 weight_norm_u: 25.222990 loss: 0.945811 +RANK_0 - 2026-01-29 10:59:01,002 - TRAIN-LOGGER - INFO - Epoch 237 - TRAIN - Minibatch 0: weight_norm_model: 143.882477 loss: 0.945811 grad_norm_before_clip: 53.716652 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 10:59:05,195 - TRAIN-LOGGER - INFO - Epoch 237 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.882477 weight_norm_u: 25.218954 loss: 0.945811 grad_norm_before_clip: 53.716652 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 10:59:05,195 - TRAIN-LOGGER - INFO - Epoch 237 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.882462 weight_norm_u: 25.222990 loss: 0.953438 +RANK_0 - 2026-01-29 10:59:17,774 - TRAIN-LOGGER - INFO - Epoch 238 - TRAIN - Minibatch 0: weight_norm_model: 143.882462 loss: 0.953438 grad_norm_before_clip: 53.497589 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 10:59:21,811 - TRAIN-LOGGER - INFO - Epoch 238 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.882462 weight_norm_u: 25.218954 loss: 0.953438 grad_norm_before_clip: 53.497589 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 10:59:21,812 - TRAIN-LOGGER - INFO - Epoch 238 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.882477 weight_norm_u: 25.222990 loss: 0.923796 +RANK_0 - 2026-01-29 10:59:35,180 - TRAIN-LOGGER - INFO - Epoch 239 - TRAIN - Minibatch 0: weight_norm_model: 143.882477 loss: 0.923796 grad_norm_before_clip: 51.484447 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 10:59:39,278 - TRAIN-LOGGER - INFO - Epoch 239 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.882477 weight_norm_u: 25.218954 loss: 0.923796 grad_norm_before_clip: 51.484447 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 10:59:39,278 - TRAIN-LOGGER - INFO - Epoch 239 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.882523 weight_norm_u: 25.222990 loss: 0.927072 +RANK_0 - 2026-01-29 10:59:52,604 - TRAIN-LOGGER - INFO - Epoch 240 - TRAIN - Minibatch 0: weight_norm_model: 143.882523 loss: 0.927072 grad_norm_before_clip: 17.695969 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 10:59:56,786 - TRAIN-LOGGER - INFO - Epoch 240 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.882523 weight_norm_u: 25.218954 loss: 0.927072 grad_norm_before_clip: 17.695969 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 10:59:56,786 - TRAIN-LOGGER - INFO - Epoch 240 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.882538 weight_norm_u: 25.222990 loss: 0.925678 +RANK_0 - 2026-01-29 11:00:09,593 - TRAIN-LOGGER - INFO - Epoch 241 - TRAIN - Minibatch 0: weight_norm_model: 143.882538 loss: 0.925678 grad_norm_before_clip: 18.177040 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 11:00:13,769 - TRAIN-LOGGER - INFO - Epoch 241 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.882538 weight_norm_u: 25.218954 loss: 0.925678 grad_norm_before_clip: 18.177040 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 11:00:13,769 - TRAIN-LOGGER - INFO - Epoch 241 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.882553 weight_norm_u: 25.222990 loss: 0.920685 +RANK_0 - 2026-01-29 11:00:26,501 - TRAIN-LOGGER - INFO - Epoch 242 - TRAIN - Minibatch 0: weight_norm_model: 143.882553 loss: 0.920685 grad_norm_before_clip: 37.558975 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 11:00:30,667 - TRAIN-LOGGER - INFO - Epoch 242 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.882553 weight_norm_u: 25.218954 loss: 0.920685 grad_norm_before_clip: 37.558975 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 11:00:30,667 - TRAIN-LOGGER - INFO - Epoch 242 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.882523 weight_norm_u: 25.222990 loss: 0.883375 +RANK_0 - 2026-01-29 11:00:43,438 - TRAIN-LOGGER - INFO - Epoch 243 - TRAIN - Minibatch 0: weight_norm_model: 143.882523 loss: 0.883375 grad_norm_before_clip: 7.849490 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 11:00:47,533 - TRAIN-LOGGER - INFO - Epoch 243 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.882523 weight_norm_u: 25.218954 loss: 0.883375 grad_norm_before_clip: 7.849490 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 11:00:47,534 - TRAIN-LOGGER - INFO - Epoch 243 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.882523 weight_norm_u: 25.222990 loss: 0.883055 +RANK_0 - 2026-01-29 11:01:00,923 - TRAIN-LOGGER - INFO - Epoch 244 - TRAIN - Minibatch 0: weight_norm_model: 143.882523 loss: 0.883055 grad_norm_before_clip: 9.833366 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 11:01:05,171 - TRAIN-LOGGER - INFO - Epoch 244 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.882523 weight_norm_u: 25.218954 loss: 0.883055 grad_norm_before_clip: 9.833366 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 11:01:05,171 - TRAIN-LOGGER - INFO - Epoch 244 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.882507 weight_norm_u: 25.222990 loss: 0.888856 +RANK_0 - 2026-01-29 11:01:18,173 - TRAIN-LOGGER - INFO - Epoch 245 - TRAIN - Minibatch 0: weight_norm_model: 143.882507 loss: 0.888856 grad_norm_before_clip: 39.196827 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 11:01:22,241 - TRAIN-LOGGER - INFO - Epoch 245 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.882507 weight_norm_u: 25.218954 loss: 0.888856 grad_norm_before_clip: 39.196827 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 11:01:22,241 - TRAIN-LOGGER - INFO - Epoch 245 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.882507 weight_norm_u: 25.222990 loss: 0.889987 +RANK_0 - 2026-01-29 11:01:35,057 - TRAIN-LOGGER - INFO - Epoch 246 - TRAIN - Minibatch 0: weight_norm_model: 143.882507 loss: 0.889987 grad_norm_before_clip: 17.749525 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 11:01:39,237 - TRAIN-LOGGER - INFO - Epoch 246 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.882507 weight_norm_u: 25.218954 loss: 0.889987 grad_norm_before_clip: 17.749525 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 11:01:39,237 - TRAIN-LOGGER - INFO - Epoch 246 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.882507 weight_norm_u: 25.222990 loss: 0.887329 +RANK_0 - 2026-01-29 11:01:52,017 - TRAIN-LOGGER - INFO - Epoch 247 - TRAIN - Minibatch 0: weight_norm_model: 143.882507 loss: 0.887329 grad_norm_before_clip: 17.427305 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 11:01:56,126 - TRAIN-LOGGER - INFO - Epoch 247 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.882507 weight_norm_u: 25.218954 loss: 0.887329 grad_norm_before_clip: 17.427305 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 11:01:56,126 - TRAIN-LOGGER - INFO - Epoch 247 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.882507 weight_norm_u: 25.222990 loss: 0.892385 +RANK_0 - 2026-01-29 11:02:09,359 - TRAIN-LOGGER - INFO - Epoch 248 - TRAIN - Minibatch 0: weight_norm_model: 143.882507 loss: 0.892385 grad_norm_before_clip: 31.429008 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 11:02:13,519 - TRAIN-LOGGER - INFO - Epoch 248 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.882507 weight_norm_u: 25.218954 loss: 0.892385 grad_norm_before_clip: 31.429008 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 11:02:13,519 - TRAIN-LOGGER - INFO - Epoch 248 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.882538 weight_norm_u: 25.222990 loss: 0.892596 +RANK_0 - 2026-01-29 11:02:26,694 - TRAIN-LOGGER - INFO - Epoch 249 - TRAIN - Minibatch 0: weight_norm_model: 143.882538 loss: 0.892596 grad_norm_before_clip: 20.992163 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 11:02:30,833 - TRAIN-LOGGER - INFO - Epoch 249 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.882538 weight_norm_u: 25.218954 loss: 0.892596 grad_norm_before_clip: 20.992163 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 11:02:30,833 - TRAIN-LOGGER - INFO - Epoch 249 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.882568 weight_norm_u: 25.222990 loss: 0.904964 +RANK_0 - 2026-01-29 11:02:43,585 - TRAIN-LOGGER - INFO - Epoch 250 - TRAIN - Minibatch 0: weight_norm_model: 143.882568 loss: 0.904964 grad_norm_before_clip: 38.743111 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 11:02:47,731 - TRAIN-LOGGER - INFO - Epoch 250 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.882568 weight_norm_u: 25.218954 loss: 0.904964 grad_norm_before_clip: 38.743111 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 11:02:47,731 - TRAIN-LOGGER - INFO - Epoch 250 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.882568 weight_norm_u: 25.222990 loss: 0.902487 +RANK_0 - 2026-01-29 11:03:00,735 - TRAIN-LOGGER - INFO - Epoch 251 - TRAIN - Minibatch 0: weight_norm_model: 143.882568 loss: 0.902487 grad_norm_before_clip: 38.510406 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 11:03:04,860 - TRAIN-LOGGER - INFO - Epoch 251 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.882568 weight_norm_u: 25.218954 loss: 0.902487 grad_norm_before_clip: 38.510406 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 11:03:04,860 - TRAIN-LOGGER - INFO - Epoch 251 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.882553 weight_norm_u: 25.222990 loss: 0.888767 +RANK_0 - 2026-01-29 11:03:17,913 - TRAIN-LOGGER - INFO - Epoch 252 - TRAIN - Minibatch 0: weight_norm_model: 143.882553 loss: 0.888767 grad_norm_before_clip: 27.097958 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 11:03:22,056 - TRAIN-LOGGER - INFO - Epoch 252 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.882553 weight_norm_u: 25.218954 loss: 0.888767 grad_norm_before_clip: 27.097958 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 11:03:22,056 - TRAIN-LOGGER - INFO - Epoch 252 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.882553 weight_norm_u: 25.222990 loss: 0.883357 +RANK_0 - 2026-01-29 11:03:35,170 - TRAIN-LOGGER - INFO - Epoch 253 - TRAIN - Minibatch 0: weight_norm_model: 143.882553 loss: 0.883357 grad_norm_before_clip: 36.567730 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 11:03:39,174 - TRAIN-LOGGER - INFO - Epoch 253 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.882553 weight_norm_u: 25.218954 loss: 0.883357 grad_norm_before_clip: 36.567730 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 11:03:39,174 - TRAIN-LOGGER - INFO - Epoch 253 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.882568 weight_norm_u: 25.222990 loss: 0.894446 +RANK_0 - 2026-01-29 11:03:52,478 - TRAIN-LOGGER - INFO - Epoch 254 - TRAIN - Minibatch 0: weight_norm_model: 143.882568 loss: 0.894446 grad_norm_before_clip: 37.533833 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 11:03:56,585 - TRAIN-LOGGER - INFO - Epoch 254 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.882568 weight_norm_u: 25.218954 loss: 0.894446 grad_norm_before_clip: 37.533833 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 11:03:56,585 - TRAIN-LOGGER - INFO - Epoch 254 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.882568 weight_norm_u: 25.222990 loss: 0.894169 +RANK_0 - 2026-01-29 11:04:09,744 - TRAIN-LOGGER - INFO - Epoch 255 - TRAIN - Minibatch 0: weight_norm_model: 143.882568 loss: 0.894169 grad_norm_before_clip: 24.580585 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 11:04:13,781 - TRAIN-LOGGER - INFO - Epoch 255 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.882568 weight_norm_u: 25.218954 loss: 0.894169 grad_norm_before_clip: 24.580585 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 11:04:13,781 - TRAIN-LOGGER - INFO - Epoch 255 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.882568 weight_norm_u: 25.222990 loss: 0.891068 +RANK_0 - 2026-01-29 11:04:26,967 - TRAIN-LOGGER - INFO - Epoch 256 - TRAIN - Minibatch 0: weight_norm_model: 143.882568 loss: 0.891068 grad_norm_before_clip: 35.976139 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 11:04:31,132 - TRAIN-LOGGER - INFO - Epoch 256 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.882568 weight_norm_u: 25.218954 loss: 0.891068 grad_norm_before_clip: 35.976139 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 11:04:31,133 - TRAIN-LOGGER - INFO - Epoch 256 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.882568 weight_norm_u: 25.222990 loss: 0.889440 +RANK_0 - 2026-01-29 11:04:43,993 - TRAIN-LOGGER - INFO - Epoch 257 - TRAIN - Minibatch 0: weight_norm_model: 143.882568 loss: 0.889440 grad_norm_before_clip: 35.838421 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 11:04:48,146 - TRAIN-LOGGER - INFO - Epoch 257 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.882568 weight_norm_u: 25.218954 loss: 0.889440 grad_norm_before_clip: 35.838421 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 11:04:48,146 - TRAIN-LOGGER - INFO - Epoch 257 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.882584 weight_norm_u: 25.222990 loss: 0.898399 +RANK_0 - 2026-01-29 11:05:01,108 - TRAIN-LOGGER - INFO - Epoch 258 - TRAIN - Minibatch 0: weight_norm_model: 143.882584 loss: 0.898399 grad_norm_before_clip: 24.071814 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 11:05:05,185 - TRAIN-LOGGER - INFO - Epoch 258 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.882584 weight_norm_u: 25.218954 loss: 0.898399 grad_norm_before_clip: 24.071814 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 11:05:05,185 - TRAIN-LOGGER - INFO - Epoch 258 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.882599 weight_norm_u: 25.222990 loss: 0.900347 +RANK_0 - 2026-01-29 11:05:18,446 - TRAIN-LOGGER - INFO - Epoch 259 - TRAIN - Minibatch 0: weight_norm_model: 143.882599 loss: 0.900347 grad_norm_before_clip: 37.856548 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 11:05:22,595 - TRAIN-LOGGER - INFO - Epoch 259 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.882599 weight_norm_u: 25.218954 loss: 0.900347 grad_norm_before_clip: 37.856548 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 11:05:22,596 - TRAIN-LOGGER - INFO - Epoch 259 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.882568 weight_norm_u: 25.222990 loss: 0.884798 +RANK_0 - 2026-01-29 11:05:35,610 - TRAIN-LOGGER - INFO - Epoch 260 - TRAIN - Minibatch 0: weight_norm_model: 143.882568 loss: 0.884798 grad_norm_before_clip: 33.195530 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 11:05:39,749 - TRAIN-LOGGER - INFO - Epoch 260 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.882568 weight_norm_u: 25.218954 loss: 0.884798 grad_norm_before_clip: 33.195530 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 11:05:39,749 - TRAIN-LOGGER - INFO - Epoch 260 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.882584 weight_norm_u: 25.222990 loss: 0.879322 +RANK_0 - 2026-01-29 11:05:52,767 - TRAIN-LOGGER - INFO - Epoch 261 - TRAIN - Minibatch 0: weight_norm_model: 143.882584 loss: 0.879322 grad_norm_before_clip: 25.648233 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 11:05:56,861 - TRAIN-LOGGER - INFO - Epoch 261 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.882584 weight_norm_u: 25.218954 loss: 0.879322 grad_norm_before_clip: 25.648233 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 11:05:56,862 - TRAIN-LOGGER - INFO - Epoch 261 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.882599 weight_norm_u: 25.222990 loss: 0.904234 +RANK_0 - 2026-01-29 11:06:10,005 - TRAIN-LOGGER - INFO - Epoch 262 - TRAIN - Minibatch 0: weight_norm_model: 143.882599 loss: 0.904234 grad_norm_before_clip: 37.897583 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 11:06:14,156 - TRAIN-LOGGER - INFO - Epoch 262 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.882599 weight_norm_u: 25.218954 loss: 0.904234 grad_norm_before_clip: 37.897583 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 11:06:14,156 - TRAIN-LOGGER - INFO - Epoch 262 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.882599 weight_norm_u: 25.222990 loss: 0.905276 +RANK_0 - 2026-01-29 11:06:27,300 - TRAIN-LOGGER - INFO - Epoch 263 - TRAIN - Minibatch 0: weight_norm_model: 143.882599 loss: 0.905276 grad_norm_before_clip: 37.400185 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 11:06:31,320 - TRAIN-LOGGER - INFO - Epoch 263 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.882599 weight_norm_u: 25.218954 loss: 0.905276 grad_norm_before_clip: 37.400185 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 11:06:31,320 - TRAIN-LOGGER - INFO - Epoch 263 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.882584 weight_norm_u: 25.222990 loss: 0.880981 +RANK_0 - 2026-01-29 11:06:44,112 - TRAIN-LOGGER - INFO - Epoch 264 - TRAIN - Minibatch 0: weight_norm_model: 143.882584 loss: 0.880981 grad_norm_before_clip: 33.569633 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 11:06:48,251 - TRAIN-LOGGER - INFO - Epoch 264 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.882584 weight_norm_u: 25.218954 loss: 0.880981 grad_norm_before_clip: 33.569633 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 11:06:48,251 - TRAIN-LOGGER - INFO - Epoch 264 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.882584 weight_norm_u: 25.222990 loss: 0.878644 +RANK_0 - 2026-01-29 11:07:01,169 - TRAIN-LOGGER - INFO - Epoch 265 - TRAIN - Minibatch 0: weight_norm_model: 143.882584 loss: 0.878644 grad_norm_before_clip: 7.290102 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 11:07:05,357 - TRAIN-LOGGER - INFO - Epoch 265 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.882584 weight_norm_u: 25.218954 loss: 0.878644 grad_norm_before_clip: 7.290102 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 11:07:05,358 - TRAIN-LOGGER - INFO - Epoch 265 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.882614 weight_norm_u: 25.222990 loss: 0.890417 +RANK_0 - 2026-01-29 11:07:18,411 - TRAIN-LOGGER - INFO - Epoch 266 - TRAIN - Minibatch 0: weight_norm_model: 143.882614 loss: 0.890417 grad_norm_before_clip: 37.334484 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 11:07:22,599 - TRAIN-LOGGER - INFO - Epoch 266 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.882614 weight_norm_u: 25.218954 loss: 0.890417 grad_norm_before_clip: 37.334484 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 11:07:22,600 - TRAIN-LOGGER - INFO - Epoch 266 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.882599 weight_norm_u: 25.222990 loss: 0.898323 +RANK_0 - 2026-01-29 11:07:35,965 - TRAIN-LOGGER - INFO - Epoch 267 - TRAIN - Minibatch 0: weight_norm_model: 143.882599 loss: 0.898323 grad_norm_before_clip: 19.010094 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 11:07:40,033 - TRAIN-LOGGER - INFO - Epoch 267 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.882599 weight_norm_u: 25.218954 loss: 0.898323 grad_norm_before_clip: 19.010094 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 11:07:40,033 - TRAIN-LOGGER - INFO - Epoch 267 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.882614 weight_norm_u: 25.222990 loss: 0.892073 +RANK_0 - 2026-01-29 11:07:52,893 - TRAIN-LOGGER - INFO - Epoch 268 - TRAIN - Minibatch 0: weight_norm_model: 143.882614 loss: 0.892073 grad_norm_before_clip: 19.065529 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 11:07:57,042 - TRAIN-LOGGER - INFO - Epoch 268 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.882614 weight_norm_u: 25.218954 loss: 0.892073 grad_norm_before_clip: 19.065529 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 11:07:57,042 - TRAIN-LOGGER - INFO - Epoch 268 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.882629 weight_norm_u: 25.222990 loss: 0.911076 +RANK_0 - 2026-01-29 11:08:09,675 - TRAIN-LOGGER - INFO - Epoch 269 - TRAIN - Minibatch 0: weight_norm_model: 143.882629 loss: 0.911076 grad_norm_before_clip: 39.539200 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 11:08:13,815 - TRAIN-LOGGER - INFO - Epoch 269 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.882629 weight_norm_u: 25.218954 loss: 0.911076 grad_norm_before_clip: 39.539200 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 11:08:13,815 - TRAIN-LOGGER - INFO - Epoch 269 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.882614 weight_norm_u: 25.222990 loss: 0.899872 +RANK_0 - 2026-01-29 11:08:27,074 - TRAIN-LOGGER - INFO - Epoch 270 - TRAIN - Minibatch 0: weight_norm_model: 143.882614 loss: 0.899872 grad_norm_before_clip: 25.798616 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 11:08:31,156 - TRAIN-LOGGER - INFO - Epoch 270 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.882614 weight_norm_u: 25.218954 loss: 0.899872 grad_norm_before_clip: 25.798616 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 11:08:31,156 - TRAIN-LOGGER - INFO - Epoch 270 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.882584 weight_norm_u: 25.222990 loss: 0.888945 +RANK_0 - 2026-01-29 11:08:44,544 - TRAIN-LOGGER - INFO - Epoch 271 - TRAIN - Minibatch 0: weight_norm_model: 143.882584 loss: 0.888945 grad_norm_before_clip: 41.521748 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 11:08:48,674 - TRAIN-LOGGER - INFO - Epoch 271 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.882584 weight_norm_u: 25.218954 loss: 0.888945 grad_norm_before_clip: 41.521748 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 11:08:48,674 - TRAIN-LOGGER - INFO - Epoch 271 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.882584 weight_norm_u: 25.222990 loss: 0.890647 +RANK_0 - 2026-01-29 11:09:01,542 - TRAIN-LOGGER - INFO - Epoch 272 - TRAIN - Minibatch 0: weight_norm_model: 143.882584 loss: 0.890647 grad_norm_before_clip: 32.647320 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 11:09:05,718 - TRAIN-LOGGER - INFO - Epoch 272 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.882584 weight_norm_u: 25.218954 loss: 0.890647 grad_norm_before_clip: 32.647320 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 11:09:05,718 - TRAIN-LOGGER - INFO - Epoch 272 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.882599 weight_norm_u: 25.222990 loss: 0.898654 +RANK_0 - 2026-01-29 11:09:18,581 - TRAIN-LOGGER - INFO - Epoch 273 - TRAIN - Minibatch 0: weight_norm_model: 143.882599 loss: 0.898654 grad_norm_before_clip: 18.813227 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 11:09:22,704 - TRAIN-LOGGER - INFO - Epoch 273 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.882599 weight_norm_u: 25.218954 loss: 0.898654 grad_norm_before_clip: 18.813227 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 11:09:22,705 - TRAIN-LOGGER - INFO - Epoch 273 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.882614 weight_norm_u: 25.222990 loss: 0.891411 +RANK_0 - 2026-01-29 11:09:35,988 - TRAIN-LOGGER - INFO - Epoch 274 - TRAIN - Minibatch 0: weight_norm_model: 143.882614 loss: 0.891411 grad_norm_before_clip: 24.708864 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 11:09:40,127 - TRAIN-LOGGER - INFO - Epoch 274 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.882614 weight_norm_u: 25.218954 loss: 0.891411 grad_norm_before_clip: 24.708864 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 11:09:40,127 - TRAIN-LOGGER - INFO - Epoch 274 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.882614 weight_norm_u: 25.222990 loss: 0.891996 +RANK_0 - 2026-01-29 11:09:53,150 - TRAIN-LOGGER - INFO - Epoch 275 - TRAIN - Minibatch 0: weight_norm_model: 143.882614 loss: 0.891996 grad_norm_before_clip: 27.900484 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 11:09:57,298 - TRAIN-LOGGER - INFO - Epoch 275 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.882614 weight_norm_u: 25.218954 loss: 0.891996 grad_norm_before_clip: 27.900484 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 11:09:57,298 - TRAIN-LOGGER - INFO - Epoch 275 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.882629 weight_norm_u: 25.222990 loss: 0.892704 +RANK_0 - 2026-01-29 11:10:09,973 - TRAIN-LOGGER - INFO - Epoch 276 - TRAIN - Minibatch 0: weight_norm_model: 143.882629 loss: 0.892704 grad_norm_before_clip: 28.896227 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 11:10:14,125 - TRAIN-LOGGER - INFO - Epoch 276 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.882629 weight_norm_u: 25.218954 loss: 0.892704 grad_norm_before_clip: 28.896227 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 11:10:14,125 - TRAIN-LOGGER - INFO - Epoch 276 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.882645 weight_norm_u: 25.222990 loss: 0.892356 +RANK_0 - 2026-01-29 11:10:27,316 - TRAIN-LOGGER - INFO - Epoch 277 - TRAIN - Minibatch 0: weight_norm_model: 143.882645 loss: 0.892356 grad_norm_before_clip: 24.356472 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 11:10:31,469 - TRAIN-LOGGER - INFO - Epoch 277 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.882645 weight_norm_u: 25.218954 loss: 0.892356 grad_norm_before_clip: 24.356472 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 11:10:31,469 - TRAIN-LOGGER - INFO - Epoch 277 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.882660 weight_norm_u: 25.222990 loss: 0.893217 +RANK_0 - 2026-01-29 11:10:44,639 - TRAIN-LOGGER - INFO - Epoch 278 - TRAIN - Minibatch 0: weight_norm_model: 143.882660 loss: 0.893217 grad_norm_before_clip: 24.462336 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 11:10:48,746 - TRAIN-LOGGER - INFO - Epoch 278 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.882660 weight_norm_u: 25.218954 loss: 0.893217 grad_norm_before_clip: 24.462336 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 11:10:48,746 - TRAIN-LOGGER - INFO - Epoch 278 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.882629 weight_norm_u: 25.222990 loss: 0.894777 +RANK_0 - 2026-01-29 11:11:01,576 - TRAIN-LOGGER - INFO - Epoch 279 - TRAIN - Minibatch 0: weight_norm_model: 143.882629 loss: 0.894777 grad_norm_before_clip: 20.834442 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 11:11:05,779 - TRAIN-LOGGER - INFO - Epoch 279 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.882629 weight_norm_u: 25.218954 loss: 0.894777 grad_norm_before_clip: 20.834442 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 11:11:05,779 - TRAIN-LOGGER - INFO - Epoch 279 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.882629 weight_norm_u: 25.222990 loss: 0.885822 +RANK_0 - 2026-01-29 11:11:18,554 - TRAIN-LOGGER - INFO - Epoch 280 - TRAIN - Minibatch 0: weight_norm_model: 143.882629 loss: 0.885822 grad_norm_before_clip: 28.364222 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 11:11:22,660 - TRAIN-LOGGER - INFO - Epoch 280 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.882629 weight_norm_u: 25.218954 loss: 0.885822 grad_norm_before_clip: 28.364222 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 11:11:22,660 - TRAIN-LOGGER - INFO - Epoch 280 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.882645 weight_norm_u: 25.222990 loss: 0.890627 +RANK_0 - 2026-01-29 11:11:35,526 - TRAIN-LOGGER - INFO - Epoch 281 - TRAIN - Minibatch 0: weight_norm_model: 143.882645 loss: 0.890627 grad_norm_before_clip: 27.050034 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 11:11:39,600 - TRAIN-LOGGER - INFO - Epoch 281 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.882645 weight_norm_u: 25.218954 loss: 0.890627 grad_norm_before_clip: 27.050034 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 11:11:39,600 - TRAIN-LOGGER - INFO - Epoch 281 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.882645 weight_norm_u: 25.222990 loss: 0.896289 +RANK_0 - 2026-01-29 11:11:52,280 - TRAIN-LOGGER - INFO - Epoch 282 - TRAIN - Minibatch 0: weight_norm_model: 143.882645 loss: 0.896289 grad_norm_before_clip: 19.901567 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 11:11:56,454 - TRAIN-LOGGER - INFO - Epoch 282 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.882645 weight_norm_u: 25.218954 loss: 0.896289 grad_norm_before_clip: 19.901567 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 11:11:56,455 - TRAIN-LOGGER - INFO - Epoch 282 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.882614 weight_norm_u: 25.222990 loss: 0.898331 +RANK_0 - 2026-01-29 11:12:09,728 - TRAIN-LOGGER - INFO - Epoch 283 - TRAIN - Minibatch 0: weight_norm_model: 143.882614 loss: 0.898331 grad_norm_before_clip: 26.636833 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 11:12:13,829 - TRAIN-LOGGER - INFO - Epoch 283 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.882614 weight_norm_u: 25.218954 loss: 0.898331 grad_norm_before_clip: 26.636833 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 11:12:13,829 - TRAIN-LOGGER - INFO - Epoch 283 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.882614 weight_norm_u: 25.222990 loss: 0.893831 +RANK_0 - 2026-01-29 11:12:26,983 - TRAIN-LOGGER - INFO - Epoch 284 - TRAIN - Minibatch 0: weight_norm_model: 143.882614 loss: 0.893831 grad_norm_before_clip: 24.062582 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 11:12:31,114 - TRAIN-LOGGER - INFO - Epoch 284 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.882614 weight_norm_u: 25.218954 loss: 0.893831 grad_norm_before_clip: 24.062582 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 11:12:31,114 - TRAIN-LOGGER - INFO - Epoch 284 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.882645 weight_norm_u: 25.222990 loss: 0.886055 +RANK_0 - 2026-01-29 11:12:44,071 - TRAIN-LOGGER - INFO - Epoch 285 - TRAIN - Minibatch 0: weight_norm_model: 143.882645 loss: 0.886055 grad_norm_before_clip: 26.877256 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 11:12:48,229 - TRAIN-LOGGER - INFO - Epoch 285 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.882645 weight_norm_u: 25.218954 loss: 0.886055 grad_norm_before_clip: 26.877256 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 11:12:48,230 - TRAIN-LOGGER - INFO - Epoch 285 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.882660 weight_norm_u: 25.222990 loss: 0.881726 +RANK_0 - 2026-01-29 11:13:01,489 - TRAIN-LOGGER - INFO - Epoch 286 - TRAIN - Minibatch 0: weight_norm_model: 143.882660 loss: 0.881726 grad_norm_before_clip: 37.045666 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 11:13:05,660 - TRAIN-LOGGER - INFO - Epoch 286 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.882660 weight_norm_u: 25.218954 loss: 0.881726 grad_norm_before_clip: 37.045666 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 11:13:05,660 - TRAIN-LOGGER - INFO - Epoch 286 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.882645 weight_norm_u: 25.222990 loss: 0.896842 +RANK_0 - 2026-01-29 11:13:18,896 - TRAIN-LOGGER - INFO - Epoch 287 - TRAIN - Minibatch 0: weight_norm_model: 143.882645 loss: 0.896842 grad_norm_before_clip: 30.499403 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 11:13:22,996 - TRAIN-LOGGER - INFO - Epoch 287 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.882645 weight_norm_u: 25.218954 loss: 0.896842 grad_norm_before_clip: 30.499403 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 11:13:22,997 - TRAIN-LOGGER - INFO - Epoch 287 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.882645 weight_norm_u: 25.222990 loss: 0.896257 +RANK_0 - 2026-01-29 11:13:35,928 - TRAIN-LOGGER - INFO - Epoch 288 - TRAIN - Minibatch 0: weight_norm_model: 143.882645 loss: 0.896257 grad_norm_before_clip: 30.090874 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 11:13:39,970 - TRAIN-LOGGER - INFO - Epoch 288 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.882645 weight_norm_u: 25.218954 loss: 0.896257 grad_norm_before_clip: 30.090874 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 11:13:39,970 - TRAIN-LOGGER - INFO - Epoch 288 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.882675 weight_norm_u: 25.222990 loss: 0.891386 +RANK_0 - 2026-01-29 11:13:52,846 - TRAIN-LOGGER - INFO - Epoch 289 - TRAIN - Minibatch 0: weight_norm_model: 143.882675 loss: 0.891386 grad_norm_before_clip: 11.163630 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 11:13:56,995 - TRAIN-LOGGER - INFO - Epoch 289 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.882675 weight_norm_u: 25.218954 loss: 0.891386 grad_norm_before_clip: 11.163630 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 11:13:56,996 - TRAIN-LOGGER - INFO - Epoch 289 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.882690 weight_norm_u: 25.222990 loss: 0.898505 +RANK_0 - 2026-01-29 11:14:10,204 - TRAIN-LOGGER - INFO - Epoch 290 - TRAIN - Minibatch 0: weight_norm_model: 143.882690 loss: 0.898505 grad_norm_before_clip: 38.394714 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 11:14:14,330 - TRAIN-LOGGER - INFO - Epoch 290 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.882690 weight_norm_u: 25.218954 loss: 0.898505 grad_norm_before_clip: 38.394714 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 11:14:14,330 - TRAIN-LOGGER - INFO - Epoch 290 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.882675 weight_norm_u: 25.222990 loss: 0.883303 +RANK_0 - 2026-01-29 11:14:27,517 - TRAIN-LOGGER - INFO - Epoch 291 - TRAIN - Minibatch 0: weight_norm_model: 143.882675 loss: 0.883303 grad_norm_before_clip: 25.334377 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 11:14:31,705 - TRAIN-LOGGER - INFO - Epoch 291 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.882675 weight_norm_u: 25.218954 loss: 0.883303 grad_norm_before_clip: 25.334377 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 11:14:31,706 - TRAIN-LOGGER - INFO - Epoch 291 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.882645 weight_norm_u: 25.222990 loss: 0.910684 +RANK_0 - 2026-01-29 11:14:44,482 - TRAIN-LOGGER - INFO - Epoch 292 - TRAIN - Minibatch 0: weight_norm_model: 143.882645 loss: 0.910684 grad_norm_before_clip: 39.450783 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 11:14:48,636 - TRAIN-LOGGER - INFO - Epoch 292 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.882645 weight_norm_u: 25.218954 loss: 0.910684 grad_norm_before_clip: 39.450783 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 11:14:48,636 - TRAIN-LOGGER - INFO - Epoch 292 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.882629 weight_norm_u: 25.222990 loss: 0.930667 +RANK_0 - 2026-01-29 11:15:01,892 - TRAIN-LOGGER - INFO - Epoch 293 - TRAIN - Minibatch 0: weight_norm_model: 143.882629 loss: 0.930667 grad_norm_before_clip: 48.746258 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 11:15:06,046 - TRAIN-LOGGER - INFO - Epoch 293 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.882629 weight_norm_u: 25.218954 loss: 0.930667 grad_norm_before_clip: 48.746258 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 11:15:06,046 - TRAIN-LOGGER - INFO - Epoch 293 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.882660 weight_norm_u: 25.222990 loss: 0.903792 +RANK_0 - 2026-01-29 11:15:19,322 - TRAIN-LOGGER - INFO - Epoch 294 - TRAIN - Minibatch 0: weight_norm_model: 143.882660 loss: 0.903792 grad_norm_before_clip: 39.331814 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 11:15:23,502 - TRAIN-LOGGER - INFO - Epoch 294 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.882660 weight_norm_u: 25.218954 loss: 0.903792 grad_norm_before_clip: 39.331814 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 11:15:23,502 - TRAIN-LOGGER - INFO - Epoch 294 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.882690 weight_norm_u: 25.222990 loss: 0.900593 +RANK_0 - 2026-01-29 11:15:36,274 - TRAIN-LOGGER - INFO - Epoch 295 - TRAIN - Minibatch 0: weight_norm_model: 143.882690 loss: 0.900593 grad_norm_before_clip: 19.155552 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 11:15:40,373 - TRAIN-LOGGER - INFO - Epoch 295 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.882690 weight_norm_u: 25.218954 loss: 0.900593 grad_norm_before_clip: 19.155552 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 11:15:40,373 - TRAIN-LOGGER - INFO - Epoch 295 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.882706 weight_norm_u: 25.222990 loss: 0.907602 +RANK_0 - 2026-01-29 11:15:53,217 - TRAIN-LOGGER - INFO - Epoch 296 - TRAIN - Minibatch 0: weight_norm_model: 143.882706 loss: 0.907602 grad_norm_before_clip: 37.848541 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 11:15:57,319 - TRAIN-LOGGER - INFO - Epoch 296 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.882706 weight_norm_u: 25.218954 loss: 0.907602 grad_norm_before_clip: 37.848541 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 11:15:57,319 - TRAIN-LOGGER - INFO - Epoch 296 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.882706 weight_norm_u: 25.222990 loss: 0.898853 +RANK_0 - 2026-01-29 11:16:10,681 - TRAIN-LOGGER - INFO - Epoch 297 - TRAIN - Minibatch 0: weight_norm_model: 143.882706 loss: 0.898853 grad_norm_before_clip: 38.858055 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 11:16:14,795 - TRAIN-LOGGER - INFO - Epoch 297 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.882706 weight_norm_u: 25.218954 loss: 0.898853 grad_norm_before_clip: 38.858055 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 11:16:14,795 - TRAIN-LOGGER - INFO - Epoch 297 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.882675 weight_norm_u: 25.222990 loss: 0.889080 +RANK_0 - 2026-01-29 11:16:27,939 - TRAIN-LOGGER - INFO - Epoch 298 - TRAIN - Minibatch 0: weight_norm_model: 143.882675 loss: 0.889080 grad_norm_before_clip: 36.970993 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 11:16:32,073 - TRAIN-LOGGER - INFO - Epoch 298 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.882675 weight_norm_u: 25.218954 loss: 0.889080 grad_norm_before_clip: 36.970993 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 11:16:32,073 - TRAIN-LOGGER - INFO - Epoch 298 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.882675 weight_norm_u: 25.222990 loss: 0.896219 +RANK_0 - 2026-01-29 11:16:44,916 - TRAIN-LOGGER - INFO - Epoch 299 - TRAIN - Minibatch 0: weight_norm_model: 143.882675 loss: 0.896219 grad_norm_before_clip: 36.673149 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 11:16:49,065 - TRAIN-LOGGER - INFO - Epoch 299 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.882675 weight_norm_u: 25.218954 loss: 0.896219 grad_norm_before_clip: 36.673149 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 11:16:49,066 - TRAIN-LOGGER - INFO - Epoch 299 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.882690 weight_norm_u: 25.222990 loss: 0.877483 +RANK_0 - 2026-01-29 11:17:02,557 - TRAIN-LOGGER - INFO - Epoch 300 - TRAIN - Minibatch 0: weight_norm_model: 143.882690 loss: 0.877483 grad_norm_before_clip: 12.139236 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 11:17:06,641 - TRAIN-LOGGER - INFO - Epoch 300 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.882690 weight_norm_u: 25.218954 loss: 0.877483 grad_norm_before_clip: 12.139236 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 11:17:06,641 - TRAIN-LOGGER - INFO - Epoch 300 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.882736 weight_norm_u: 25.222990 loss: 0.924792 +RANK_0 - 2026-01-29 11:17:19,646 - TRAIN-LOGGER - INFO - Epoch 301 - TRAIN - Minibatch 0: weight_norm_model: 143.882736 loss: 0.924792 grad_norm_before_clip: 43.219028 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 11:17:23,763 - TRAIN-LOGGER - INFO - Epoch 301 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.882736 weight_norm_u: 25.218954 loss: 0.924792 grad_norm_before_clip: 43.219028 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 11:17:23,763 - TRAIN-LOGGER - INFO - Epoch 301 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.882751 weight_norm_u: 25.222990 loss: 0.946971 +RANK_0 - 2026-01-29 11:17:36,454 - TRAIN-LOGGER - INFO - Epoch 302 - TRAIN - Minibatch 0: weight_norm_model: 143.882751 loss: 0.946971 grad_norm_before_clip: 43.388348 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 11:17:40,597 - TRAIN-LOGGER - INFO - Epoch 302 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.882751 weight_norm_u: 25.218954 loss: 0.946971 grad_norm_before_clip: 43.388348 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 11:17:40,597 - TRAIN-LOGGER - INFO - Epoch 302 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.882751 weight_norm_u: 25.222990 loss: 0.929532 +RANK_0 - 2026-01-29 11:17:53,414 - TRAIN-LOGGER - INFO - Epoch 303 - TRAIN - Minibatch 0: weight_norm_model: 143.882751 loss: 0.929532 grad_norm_before_clip: 42.223404 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 11:17:57,578 - TRAIN-LOGGER - INFO - Epoch 303 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.882751 weight_norm_u: 25.218954 loss: 0.929532 grad_norm_before_clip: 42.223404 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 11:17:57,579 - TRAIN-LOGGER - INFO - Epoch 303 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.882721 weight_norm_u: 25.222990 loss: 0.882351 +RANK_0 - 2026-01-29 11:18:10,761 - TRAIN-LOGGER - INFO - Epoch 304 - TRAIN - Minibatch 0: weight_norm_model: 143.882721 loss: 0.882351 grad_norm_before_clip: 10.849648 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 11:18:14,797 - TRAIN-LOGGER - INFO - Epoch 304 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.882721 weight_norm_u: 25.218954 loss: 0.882351 grad_norm_before_clip: 10.849648 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 11:18:14,797 - TRAIN-LOGGER - INFO - Epoch 304 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.882675 weight_norm_u: 25.222990 loss: 0.920565 +RANK_0 - 2026-01-29 11:18:27,907 - TRAIN-LOGGER - INFO - Epoch 305 - TRAIN - Minibatch 0: weight_norm_model: 143.882675 loss: 0.920565 grad_norm_before_clip: 38.498028 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 11:18:32,050 - TRAIN-LOGGER - INFO - Epoch 305 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.882675 weight_norm_u: 25.218954 loss: 0.920565 grad_norm_before_clip: 38.498028 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 11:18:32,051 - TRAIN-LOGGER - INFO - Epoch 305 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.882660 weight_norm_u: 25.222990 loss: 0.942994 +RANK_0 - 2026-01-29 11:18:45,626 - TRAIN-LOGGER - INFO - Epoch 306 - TRAIN - Minibatch 0: weight_norm_model: 143.882660 loss: 0.942994 grad_norm_before_clip: 48.640091 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 11:18:49,739 - TRAIN-LOGGER - INFO - Epoch 306 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.882660 weight_norm_u: 25.218954 loss: 0.942994 grad_norm_before_clip: 48.640091 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 11:18:49,739 - TRAIN-LOGGER - INFO - Epoch 306 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.882675 weight_norm_u: 25.222990 loss: 0.921877 +RANK_0 - 2026-01-29 11:19:02,920 - TRAIN-LOGGER - INFO - Epoch 307 - TRAIN - Minibatch 0: weight_norm_model: 143.882675 loss: 0.921877 grad_norm_before_clip: 45.588547 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 11:19:07,060 - TRAIN-LOGGER - INFO - Epoch 307 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.882675 weight_norm_u: 25.218954 loss: 0.921877 grad_norm_before_clip: 45.588547 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 11:19:07,060 - TRAIN-LOGGER - INFO - Epoch 307 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.882706 weight_norm_u: 25.222990 loss: 0.899642 +RANK_0 - 2026-01-29 11:19:19,696 - TRAIN-LOGGER - INFO - Epoch 308 - TRAIN - Minibatch 0: weight_norm_model: 143.882706 loss: 0.899642 grad_norm_before_clip: 17.824608 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 11:19:23,849 - TRAIN-LOGGER - INFO - Epoch 308 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.882706 weight_norm_u: 25.218954 loss: 0.899642 grad_norm_before_clip: 17.824608 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 11:19:23,849 - TRAIN-LOGGER - INFO - Epoch 308 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.882721 weight_norm_u: 25.222990 loss: 0.903787 +RANK_0 - 2026-01-29 11:19:37,234 - TRAIN-LOGGER - INFO - Epoch 309 - TRAIN - Minibatch 0: weight_norm_model: 143.882721 loss: 0.903787 grad_norm_before_clip: 18.461882 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 11:19:41,312 - TRAIN-LOGGER - INFO - Epoch 309 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.882721 weight_norm_u: 25.218954 loss: 0.903787 grad_norm_before_clip: 18.461882 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 11:19:41,312 - TRAIN-LOGGER - INFO - Epoch 309 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.882721 weight_norm_u: 25.222990 loss: 0.886300 +RANK_0 - 2026-01-29 11:19:54,477 - TRAIN-LOGGER - INFO - Epoch 310 - TRAIN - Minibatch 0: weight_norm_model: 143.882721 loss: 0.886300 grad_norm_before_clip: 24.797537 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 11:19:58,597 - TRAIN-LOGGER - INFO - Epoch 310 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.882721 weight_norm_u: 25.218954 loss: 0.886300 grad_norm_before_clip: 24.797537 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 11:19:58,598 - TRAIN-LOGGER - INFO - Epoch 310 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.882706 weight_norm_u: 25.222990 loss: 0.895561 +RANK_0 - 2026-01-29 11:20:11,424 - TRAIN-LOGGER - INFO - Epoch 311 - TRAIN - Minibatch 0: weight_norm_model: 143.882706 loss: 0.895561 grad_norm_before_clip: 28.380690 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 11:20:15,582 - TRAIN-LOGGER - INFO - Epoch 311 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.882706 weight_norm_u: 25.218954 loss: 0.895561 grad_norm_before_clip: 28.380690 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 11:20:15,582 - TRAIN-LOGGER - INFO - Epoch 311 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.882706 weight_norm_u: 25.222990 loss: 0.911041 +RANK_0 - 2026-01-29 11:20:28,821 - TRAIN-LOGGER - INFO - Epoch 312 - TRAIN - Minibatch 0: weight_norm_model: 143.882706 loss: 0.911041 grad_norm_before_clip: 22.129141 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 11:20:32,958 - TRAIN-LOGGER - INFO - Epoch 312 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.882706 weight_norm_u: 25.218954 loss: 0.911041 grad_norm_before_clip: 22.129141 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 11:20:32,958 - TRAIN-LOGGER - INFO - Epoch 312 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.882721 weight_norm_u: 25.222990 loss: 0.899735 +RANK_0 - 2026-01-29 11:20:46,058 - TRAIN-LOGGER - INFO - Epoch 313 - TRAIN - Minibatch 0: weight_norm_model: 143.882721 loss: 0.899735 grad_norm_before_clip: 19.853888 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 11:20:50,184 - TRAIN-LOGGER - INFO - Epoch 313 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.882721 weight_norm_u: 25.218954 loss: 0.899735 grad_norm_before_clip: 19.853888 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 11:20:50,185 - TRAIN-LOGGER - INFO - Epoch 313 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.882751 weight_norm_u: 25.222990 loss: 0.901197 +RANK_0 - 2026-01-29 11:21:03,005 - TRAIN-LOGGER - INFO - Epoch 314 - TRAIN - Minibatch 0: weight_norm_model: 143.882751 loss: 0.901197 grad_norm_before_clip: 38.092007 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 11:21:07,150 - TRAIN-LOGGER - INFO - Epoch 314 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.882751 weight_norm_u: 25.218954 loss: 0.901197 grad_norm_before_clip: 38.092007 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 11:21:07,150 - TRAIN-LOGGER - INFO - Epoch 314 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.882751 weight_norm_u: 25.222990 loss: 0.909455 +RANK_0 - 2026-01-29 11:21:19,927 - TRAIN-LOGGER - INFO - Epoch 315 - TRAIN - Minibatch 0: weight_norm_model: 143.882751 loss: 0.909455 grad_norm_before_clip: 37.751541 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 11:21:24,083 - TRAIN-LOGGER - INFO - Epoch 315 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.882751 weight_norm_u: 25.218954 loss: 0.909455 grad_norm_before_clip: 37.751541 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 11:21:24,083 - TRAIN-LOGGER - INFO - Epoch 315 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.882736 weight_norm_u: 25.222990 loss: 0.885361 +RANK_0 - 2026-01-29 11:21:37,298 - TRAIN-LOGGER - INFO - Epoch 316 - TRAIN - Minibatch 0: weight_norm_model: 143.882736 loss: 0.885361 grad_norm_before_clip: 19.842043 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 11:21:41,414 - TRAIN-LOGGER - INFO - Epoch 316 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.882736 weight_norm_u: 25.218954 loss: 0.885361 grad_norm_before_clip: 19.842043 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 11:21:41,415 - TRAIN-LOGGER - INFO - Epoch 316 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.882706 weight_norm_u: 25.222990 loss: 0.914931 +RANK_0 - 2026-01-29 11:21:54,393 - TRAIN-LOGGER - INFO - Epoch 317 - TRAIN - Minibatch 0: weight_norm_model: 143.882706 loss: 0.914931 grad_norm_before_clip: 34.833279 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 11:21:58,543 - TRAIN-LOGGER - INFO - Epoch 317 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.882706 weight_norm_u: 25.218954 loss: 0.914931 grad_norm_before_clip: 34.833279 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 11:21:58,543 - TRAIN-LOGGER - INFO - Epoch 317 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.882706 weight_norm_u: 25.222990 loss: 0.930597 +RANK_0 - 2026-01-29 11:22:11,365 - TRAIN-LOGGER - INFO - Epoch 318 - TRAIN - Minibatch 0: weight_norm_model: 143.882706 loss: 0.930597 grad_norm_before_clip: 41.124821 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 11:22:15,503 - TRAIN-LOGGER - INFO - Epoch 318 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.882706 weight_norm_u: 25.218954 loss: 0.930597 grad_norm_before_clip: 41.124821 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 11:22:15,503 - TRAIN-LOGGER - INFO - Epoch 318 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.882721 weight_norm_u: 25.222990 loss: 0.911914 +RANK_0 - 2026-01-29 11:22:28,594 - TRAIN-LOGGER - INFO - Epoch 319 - TRAIN - Minibatch 0: weight_norm_model: 143.882721 loss: 0.911914 grad_norm_before_clip: 34.504517 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 11:22:32,730 - TRAIN-LOGGER - INFO - Epoch 319 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.882721 weight_norm_u: 25.218954 loss: 0.911914 grad_norm_before_clip: 34.504517 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 11:22:32,731 - TRAIN-LOGGER - INFO - Epoch 319 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.882767 weight_norm_u: 25.222990 loss: 0.881215 +RANK_0 - 2026-01-29 11:22:46,016 - TRAIN-LOGGER - INFO - Epoch 320 - TRAIN - Minibatch 0: weight_norm_model: 143.882767 loss: 0.881215 grad_norm_before_clip: 19.619963 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 11:22:50,086 - TRAIN-LOGGER - INFO - Epoch 320 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.882767 weight_norm_u: 25.218954 loss: 0.881215 grad_norm_before_clip: 19.619963 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 11:22:50,086 - TRAIN-LOGGER - INFO - Epoch 320 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.882782 weight_norm_u: 25.222990 loss: 0.904618 +RANK_0 - 2026-01-29 11:23:02,938 - TRAIN-LOGGER - INFO - Epoch 321 - TRAIN - Minibatch 0: weight_norm_model: 143.882782 loss: 0.904618 grad_norm_before_clip: 37.788063 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 11:23:07,110 - TRAIN-LOGGER - INFO - Epoch 321 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.882782 weight_norm_u: 25.218954 loss: 0.904618 grad_norm_before_clip: 37.788063 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 11:23:07,110 - TRAIN-LOGGER - INFO - Epoch 321 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.882767 weight_norm_u: 25.222990 loss: 0.884132 +RANK_0 - 2026-01-29 11:23:20,603 - TRAIN-LOGGER - INFO - Epoch 322 - TRAIN - Minibatch 0: weight_norm_model: 143.882767 loss: 0.884132 grad_norm_before_clip: 37.328510 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 11:23:24,724 - TRAIN-LOGGER - INFO - Epoch 322 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.882767 weight_norm_u: 25.218954 loss: 0.884132 grad_norm_before_clip: 37.328510 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 11:23:24,724 - TRAIN-LOGGER - INFO - Epoch 322 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.882751 weight_norm_u: 25.222990 loss: 0.907004 +RANK_0 - 2026-01-29 11:23:37,924 - TRAIN-LOGGER - INFO - Epoch 323 - TRAIN - Minibatch 0: weight_norm_model: 143.882751 loss: 0.907004 grad_norm_before_clip: 23.621923 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 11:23:42,079 - TRAIN-LOGGER - INFO - Epoch 323 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.882751 weight_norm_u: 25.218954 loss: 0.907004 grad_norm_before_clip: 23.621923 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 11:23:42,079 - TRAIN-LOGGER - INFO - Epoch 323 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.882751 weight_norm_u: 25.222990 loss: 0.914244 +RANK_0 - 2026-01-29 11:23:55,500 - TRAIN-LOGGER - INFO - Epoch 324 - TRAIN - Minibatch 0: weight_norm_model: 143.882751 loss: 0.914244 grad_norm_before_clip: 29.922211 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 11:23:59,667 - TRAIN-LOGGER - INFO - Epoch 324 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.882751 weight_norm_u: 25.218954 loss: 0.914244 grad_norm_before_clip: 29.922211 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 11:23:59,667 - TRAIN-LOGGER - INFO - Epoch 324 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.882751 weight_norm_u: 25.222990 loss: 0.898342 +RANK_0 - 2026-01-29 11:24:12,595 - TRAIN-LOGGER - INFO - Epoch 325 - TRAIN - Minibatch 0: weight_norm_model: 143.882751 loss: 0.898342 grad_norm_before_clip: 18.067183 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 11:24:16,747 - TRAIN-LOGGER - INFO - Epoch 325 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.882751 weight_norm_u: 25.218954 loss: 0.898342 grad_norm_before_clip: 18.067183 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 11:24:16,748 - TRAIN-LOGGER - INFO - Epoch 325 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.882782 weight_norm_u: 25.222990 loss: 0.892703 +RANK_0 - 2026-01-29 11:24:29,503 - TRAIN-LOGGER - INFO - Epoch 326 - TRAIN - Minibatch 0: weight_norm_model: 143.882782 loss: 0.892703 grad_norm_before_clip: 37.614567 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 11:24:33,673 - TRAIN-LOGGER - INFO - Epoch 326 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.882782 weight_norm_u: 25.218954 loss: 0.892703 grad_norm_before_clip: 37.614567 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 11:24:33,673 - TRAIN-LOGGER - INFO - Epoch 326 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.882782 weight_norm_u: 25.222990 loss: 0.900500 +RANK_0 - 2026-01-29 11:24:46,834 - TRAIN-LOGGER - INFO - Epoch 327 - TRAIN - Minibatch 0: weight_norm_model: 143.882782 loss: 0.900500 grad_norm_before_clip: 37.337502 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 11:24:50,971 - TRAIN-LOGGER - INFO - Epoch 327 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.882782 weight_norm_u: 25.218954 loss: 0.900500 grad_norm_before_clip: 37.337502 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 11:24:50,971 - TRAIN-LOGGER - INFO - Epoch 327 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.882751 weight_norm_u: 25.222990 loss: 0.884730 +RANK_0 - 2026-01-29 11:25:04,292 - TRAIN-LOGGER - INFO - Epoch 328 - TRAIN - Minibatch 0: weight_norm_model: 143.882751 loss: 0.884730 grad_norm_before_clip: 18.692179 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 11:25:08,394 - TRAIN-LOGGER - INFO - Epoch 328 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.882751 weight_norm_u: 25.218954 loss: 0.884730 grad_norm_before_clip: 18.692179 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 11:25:08,395 - TRAIN-LOGGER - INFO - Epoch 328 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.882736 weight_norm_u: 25.222990 loss: 0.916977 +RANK_0 - 2026-01-29 11:25:21,203 - TRAIN-LOGGER - INFO - Epoch 329 - TRAIN - Minibatch 0: weight_norm_model: 143.882736 loss: 0.916977 grad_norm_before_clip: 46.908810 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 11:25:25,222 - TRAIN-LOGGER - INFO - Epoch 329 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.882736 weight_norm_u: 25.218954 loss: 0.916977 grad_norm_before_clip: 46.908810 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 11:25:25,222 - TRAIN-LOGGER - INFO - Epoch 329 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.882721 weight_norm_u: 25.222990 loss: 0.931860 +RANK_0 - 2026-01-29 11:25:40,364 - TRAIN-LOGGER - INFO - Epoch 330 - TRAIN - Minibatch 0: weight_norm_model: 143.882721 loss: 0.931860 grad_norm_before_clip: 49.964176 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 11:25:44,479 - TRAIN-LOGGER - INFO - Epoch 330 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.882721 weight_norm_u: 25.218954 loss: 0.931860 grad_norm_before_clip: 49.964176 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 11:25:44,479 - TRAIN-LOGGER - INFO - Epoch 330 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.882736 weight_norm_u: 25.222990 loss: 0.905575 +RANK_0 - 2026-01-29 11:25:57,327 - TRAIN-LOGGER - INFO - Epoch 331 - TRAIN - Minibatch 0: weight_norm_model: 143.882736 loss: 0.905575 grad_norm_before_clip: 46.299583 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 11:26:01,473 - TRAIN-LOGGER - INFO - Epoch 331 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.882736 weight_norm_u: 25.218954 loss: 0.905575 grad_norm_before_clip: 46.299583 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 11:26:01,474 - TRAIN-LOGGER - INFO - Epoch 331 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.882782 weight_norm_u: 25.222990 loss: 0.881701 +RANK_0 - 2026-01-29 11:26:14,893 - TRAIN-LOGGER - INFO - Epoch 332 - TRAIN - Minibatch 0: weight_norm_model: 143.882782 loss: 0.881701 grad_norm_before_clip: 24.810884 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 11:26:18,998 - TRAIN-LOGGER - INFO - Epoch 332 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.882782 weight_norm_u: 25.218954 loss: 0.881701 grad_norm_before_clip: 24.810884 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 11:26:18,999 - TRAIN-LOGGER - INFO - Epoch 332 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.882797 weight_norm_u: 25.222990 loss: 0.887385 +RANK_0 - 2026-01-29 11:26:32,273 - TRAIN-LOGGER - INFO - Epoch 333 - TRAIN - Minibatch 0: weight_norm_model: 143.882797 loss: 0.887385 grad_norm_before_clip: 37.586781 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 11:26:36,433 - TRAIN-LOGGER - INFO - Epoch 333 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.882797 weight_norm_u: 25.218954 loss: 0.887385 grad_norm_before_clip: 37.586781 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 11:26:36,433 - TRAIN-LOGGER - INFO - Epoch 333 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.882782 weight_norm_u: 25.222990 loss: 0.879023 +RANK_0 - 2026-01-29 11:26:49,222 - TRAIN-LOGGER - INFO - Epoch 334 - TRAIN - Minibatch 0: weight_norm_model: 143.882782 loss: 0.879023 grad_norm_before_clip: 17.558868 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 11:26:53,420 - TRAIN-LOGGER - INFO - Epoch 334 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.882782 weight_norm_u: 25.218954 loss: 0.879023 grad_norm_before_clip: 17.558868 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 11:26:53,420 - TRAIN-LOGGER - INFO - Epoch 334 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.882797 weight_norm_u: 25.222990 loss: 0.876694 +RANK_0 - 2026-01-29 11:27:06,655 - TRAIN-LOGGER - INFO - Epoch 335 - TRAIN - Minibatch 0: weight_norm_model: 143.882797 loss: 0.876694 grad_norm_before_clip: 10.322866 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 11:27:10,805 - TRAIN-LOGGER - INFO - Epoch 335 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.882797 weight_norm_u: 25.218954 loss: 0.876694 grad_norm_before_clip: 10.322866 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 11:27:10,806 - TRAIN-LOGGER - INFO - Epoch 335 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.882812 weight_norm_u: 25.222990 loss: 0.898539 +RANK_0 - 2026-01-29 11:27:24,213 - TRAIN-LOGGER - INFO - Epoch 336 - TRAIN - Minibatch 0: weight_norm_model: 143.882812 loss: 0.898539 grad_norm_before_clip: 37.657276 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 11:27:28,378 - TRAIN-LOGGER - INFO - Epoch 336 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.882812 weight_norm_u: 25.218954 loss: 0.898539 grad_norm_before_clip: 37.657276 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 11:27:28,378 - TRAIN-LOGGER - INFO - Epoch 336 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.882812 weight_norm_u: 25.222990 loss: 0.897767 +RANK_0 - 2026-01-29 11:27:41,127 - TRAIN-LOGGER - INFO - Epoch 337 - TRAIN - Minibatch 0: weight_norm_model: 143.882812 loss: 0.897767 grad_norm_before_clip: 23.684900 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 11:27:45,289 - TRAIN-LOGGER - INFO - Epoch 337 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.882812 weight_norm_u: 25.218954 loss: 0.897767 grad_norm_before_clip: 23.684900 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 11:27:45,290 - TRAIN-LOGGER - INFO - Epoch 337 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.882797 weight_norm_u: 25.222990 loss: 0.876709 +RANK_0 - 2026-01-29 11:27:58,470 - TRAIN-LOGGER - INFO - Epoch 338 - TRAIN - Minibatch 0: weight_norm_model: 143.882797 loss: 0.876709 grad_norm_before_clip: 8.147664 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 11:28:02,622 - TRAIN-LOGGER - INFO - Epoch 338 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.882797 weight_norm_u: 25.218954 loss: 0.876709 grad_norm_before_clip: 8.147664 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 11:28:02,622 - TRAIN-LOGGER - INFO - Epoch 338 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.882797 weight_norm_u: 25.222990 loss: 0.892663 +RANK_0 - 2026-01-29 11:28:15,814 - TRAIN-LOGGER - INFO - Epoch 339 - TRAIN - Minibatch 0: weight_norm_model: 143.882797 loss: 0.892663 grad_norm_before_clip: 35.431343 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 11:28:19,977 - TRAIN-LOGGER - INFO - Epoch 339 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.882797 weight_norm_u: 25.218954 loss: 0.892663 grad_norm_before_clip: 35.431343 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 11:28:19,977 - TRAIN-LOGGER - INFO - Epoch 339 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.882812 weight_norm_u: 25.222990 loss: 0.891990 +RANK_0 - 2026-01-29 11:28:32,675 - TRAIN-LOGGER - INFO - Epoch 340 - TRAIN - Minibatch 0: weight_norm_model: 143.882812 loss: 0.891990 grad_norm_before_clip: 27.085119 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 11:28:36,855 - TRAIN-LOGGER - INFO - Epoch 340 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.882812 weight_norm_u: 25.218954 loss: 0.891990 grad_norm_before_clip: 27.085119 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 11:28:36,856 - TRAIN-LOGGER - INFO - Epoch 340 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.882843 weight_norm_u: 25.222990 loss: 0.888795 +RANK_0 - 2026-01-29 11:28:49,738 - TRAIN-LOGGER - INFO - Epoch 341 - TRAIN - Minibatch 0: weight_norm_model: 143.882843 loss: 0.888795 grad_norm_before_clip: 21.876072 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 11:28:53,924 - TRAIN-LOGGER - INFO - Epoch 341 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.882843 weight_norm_u: 25.218954 loss: 0.888795 grad_norm_before_clip: 21.876072 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 11:28:53,924 - TRAIN-LOGGER - INFO - Epoch 341 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.882858 weight_norm_u: 25.222990 loss: 0.897227 +RANK_0 - 2026-01-29 11:29:07,017 - TRAIN-LOGGER - INFO - Epoch 342 - TRAIN - Minibatch 0: weight_norm_model: 143.882858 loss: 0.897227 grad_norm_before_clip: 37.727242 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 11:29:11,190 - TRAIN-LOGGER - INFO - Epoch 342 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.882858 weight_norm_u: 25.218954 loss: 0.897227 grad_norm_before_clip: 37.727242 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 11:29:11,190 - TRAIN-LOGGER - INFO - Epoch 342 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.882843 weight_norm_u: 25.222990 loss: 0.892289 +RANK_0 - 2026-01-29 11:29:24,216 - TRAIN-LOGGER - INFO - Epoch 343 - TRAIN - Minibatch 0: weight_norm_model: 143.882843 loss: 0.892289 grad_norm_before_clip: 17.594501 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 11:29:28,364 - TRAIN-LOGGER - INFO - Epoch 343 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.882843 weight_norm_u: 25.218954 loss: 0.892289 grad_norm_before_clip: 17.594501 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 11:29:28,364 - TRAIN-LOGGER - INFO - Epoch 343 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.882843 weight_norm_u: 25.222990 loss: 0.883254 +RANK_0 - 2026-01-29 11:29:41,225 - TRAIN-LOGGER - INFO - Epoch 344 - TRAIN - Minibatch 0: weight_norm_model: 143.882843 loss: 0.883254 grad_norm_before_clip: 17.530872 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 11:29:45,297 - TRAIN-LOGGER - INFO - Epoch 344 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.882843 weight_norm_u: 25.218954 loss: 0.883254 grad_norm_before_clip: 17.530872 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 11:29:45,298 - TRAIN-LOGGER - INFO - Epoch 344 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.882843 weight_norm_u: 25.222990 loss: 0.886093 +RANK_0 - 2026-01-29 11:29:58,692 - TRAIN-LOGGER - INFO - Epoch 345 - TRAIN - Minibatch 0: weight_norm_model: 143.882843 loss: 0.886093 grad_norm_before_clip: 24.823948 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 11:30:02,864 - TRAIN-LOGGER - INFO - Epoch 345 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.882843 weight_norm_u: 25.218954 loss: 0.886093 grad_norm_before_clip: 24.823948 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 11:30:02,864 - TRAIN-LOGGER - INFO - Epoch 345 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.882828 weight_norm_u: 25.222990 loss: 0.891260 +RANK_0 - 2026-01-29 11:30:15,961 - TRAIN-LOGGER - INFO - Epoch 346 - TRAIN - Minibatch 0: weight_norm_model: 143.882828 loss: 0.891260 grad_norm_before_clip: 18.193964 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 11:30:19,920 - TRAIN-LOGGER - INFO - Epoch 346 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.882828 weight_norm_u: 25.218954 loss: 0.891260 grad_norm_before_clip: 18.193964 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 11:30:19,920 - TRAIN-LOGGER - INFO - Epoch 346 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.882812 weight_norm_u: 25.222990 loss: 0.905778 +RANK_0 - 2026-01-29 11:30:32,793 - TRAIN-LOGGER - INFO - Epoch 347 - TRAIN - Minibatch 0: weight_norm_model: 143.882812 loss: 0.905778 grad_norm_before_clip: 47.040054 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 11:30:36,973 - TRAIN-LOGGER - INFO - Epoch 347 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.882812 weight_norm_u: 25.218954 loss: 0.905778 grad_norm_before_clip: 47.040054 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 11:30:36,974 - TRAIN-LOGGER - INFO - Epoch 347 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.882812 weight_norm_u: 25.222990 loss: 0.904653 +RANK_0 - 2026-01-29 11:30:49,749 - TRAIN-LOGGER - INFO - Epoch 348 - TRAIN - Minibatch 0: weight_norm_model: 143.882812 loss: 0.904653 grad_norm_before_clip: 46.864666 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 11:30:53,889 - TRAIN-LOGGER - INFO - Epoch 348 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.882812 weight_norm_u: 25.218954 loss: 0.904653 grad_norm_before_clip: 46.864666 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 11:30:53,890 - TRAIN-LOGGER - INFO - Epoch 348 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.882828 weight_norm_u: 25.222990 loss: 0.888911 +RANK_0 - 2026-01-29 11:31:07,147 - TRAIN-LOGGER - INFO - Epoch 349 - TRAIN - Minibatch 0: weight_norm_model: 143.882828 loss: 0.888911 grad_norm_before_clip: 17.777592 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 11:31:11,269 - TRAIN-LOGGER - INFO - Epoch 349 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.882828 weight_norm_u: 25.218954 loss: 0.888911 grad_norm_before_clip: 17.777592 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 11:31:11,269 - TRAIN-LOGGER - INFO - Epoch 349 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.882843 weight_norm_u: 25.222990 loss: 0.878356 +RANK_0 - 2026-01-29 11:31:24,289 - TRAIN-LOGGER - INFO - Epoch 350 - TRAIN - Minibatch 0: weight_norm_model: 143.882843 loss: 0.878356 grad_norm_before_clip: 9.215642 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 11:31:28,428 - TRAIN-LOGGER - INFO - Epoch 350 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.882843 weight_norm_u: 25.218954 loss: 0.878356 grad_norm_before_clip: 9.215642 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 11:31:28,429 - TRAIN-LOGGER - INFO - Epoch 350 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.882843 weight_norm_u: 25.222990 loss: 0.879881 +RANK_0 - 2026-01-29 11:31:41,185 - TRAIN-LOGGER - INFO - Epoch 351 - TRAIN - Minibatch 0: weight_norm_model: 143.882843 loss: 0.879881 grad_norm_before_clip: 17.967514 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 11:31:45,332 - TRAIN-LOGGER - INFO - Epoch 351 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.882843 weight_norm_u: 25.218954 loss: 0.879881 grad_norm_before_clip: 17.967514 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 11:31:45,332 - TRAIN-LOGGER - INFO - Epoch 351 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.882874 weight_norm_u: 25.222990 loss: 0.889949 +RANK_0 - 2026-01-29 11:31:58,212 - TRAIN-LOGGER - INFO - Epoch 352 - TRAIN - Minibatch 0: weight_norm_model: 143.882874 loss: 0.889949 grad_norm_before_clip: 12.097375 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 11:32:02,384 - TRAIN-LOGGER - INFO - Epoch 352 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.882874 weight_norm_u: 25.218954 loss: 0.889949 grad_norm_before_clip: 12.097375 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 11:32:02,384 - TRAIN-LOGGER - INFO - Epoch 352 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.882874 weight_norm_u: 25.222990 loss: 0.887282 +RANK_0 - 2026-01-29 11:32:15,718 - TRAIN-LOGGER - INFO - Epoch 353 - TRAIN - Minibatch 0: weight_norm_model: 143.882874 loss: 0.887282 grad_norm_before_clip: 11.386359 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 11:32:19,860 - TRAIN-LOGGER - INFO - Epoch 353 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.882874 weight_norm_u: 25.218954 loss: 0.887282 grad_norm_before_clip: 11.386359 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 11:32:19,860 - TRAIN-LOGGER - INFO - Epoch 353 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.882874 weight_norm_u: 25.222990 loss: 0.881473 +RANK_0 - 2026-01-29 11:32:32,744 - TRAIN-LOGGER - INFO - Epoch 354 - TRAIN - Minibatch 0: weight_norm_model: 143.882874 loss: 0.881473 grad_norm_before_clip: 27.405949 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 11:32:36,922 - TRAIN-LOGGER - INFO - Epoch 354 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.882874 weight_norm_u: 25.218954 loss: 0.881473 grad_norm_before_clip: 27.405949 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 11:32:36,922 - TRAIN-LOGGER - INFO - Epoch 354 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.882874 weight_norm_u: 25.222990 loss: 0.884431 +RANK_0 - 2026-01-29 11:32:49,647 - TRAIN-LOGGER - INFO - Epoch 355 - TRAIN - Minibatch 0: weight_norm_model: 143.882874 loss: 0.884431 grad_norm_before_clip: 24.307261 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 11:32:53,819 - TRAIN-LOGGER - INFO - Epoch 355 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.882874 weight_norm_u: 25.218954 loss: 0.884431 grad_norm_before_clip: 24.307261 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 11:32:53,819 - TRAIN-LOGGER - INFO - Epoch 355 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.882874 weight_norm_u: 25.222990 loss: 0.884971 +RANK_0 - 2026-01-29 11:33:07,166 - TRAIN-LOGGER - INFO - Epoch 356 - TRAIN - Minibatch 0: weight_norm_model: 143.882874 loss: 0.884971 grad_norm_before_clip: 19.089712 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 11:33:11,265 - TRAIN-LOGGER - INFO - Epoch 356 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.882874 weight_norm_u: 25.218954 loss: 0.884971 grad_norm_before_clip: 19.089712 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 11:33:11,265 - TRAIN-LOGGER - INFO - Epoch 356 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.882858 weight_norm_u: 25.222990 loss: 0.901972 +RANK_0 - 2026-01-29 11:33:24,505 - TRAIN-LOGGER - INFO - Epoch 357 - TRAIN - Minibatch 0: weight_norm_model: 143.882858 loss: 0.901972 grad_norm_before_clip: 42.802097 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 11:33:28,617 - TRAIN-LOGGER - INFO - Epoch 357 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.882858 weight_norm_u: 25.218954 loss: 0.901972 grad_norm_before_clip: 42.802097 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 11:33:28,617 - TRAIN-LOGGER - INFO - Epoch 357 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.882858 weight_norm_u: 25.222990 loss: 0.901336 +RANK_0 - 2026-01-29 11:33:42,160 - TRAIN-LOGGER - INFO - Epoch 358 - TRAIN - Minibatch 0: weight_norm_model: 143.882858 loss: 0.901336 grad_norm_before_clip: 41.569748 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 11:33:46,330 - TRAIN-LOGGER - INFO - Epoch 358 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.882858 weight_norm_u: 25.218954 loss: 0.901336 grad_norm_before_clip: 41.569748 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 11:33:46,330 - TRAIN-LOGGER - INFO - Epoch 358 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.882874 weight_norm_u: 25.222990 loss: 0.876946 +RANK_0 - 2026-01-29 11:33:59,528 - TRAIN-LOGGER - INFO - Epoch 359 - TRAIN - Minibatch 0: weight_norm_model: 143.882874 loss: 0.876946 grad_norm_before_clip: 15.405343 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 11:34:03,687 - TRAIN-LOGGER - INFO - Epoch 359 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.882874 weight_norm_u: 25.218954 loss: 0.876946 grad_norm_before_clip: 15.405343 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 11:34:03,687 - TRAIN-LOGGER - INFO - Epoch 359 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.882935 weight_norm_u: 25.222990 loss: 0.921210 +RANK_0 - 2026-01-29 11:34:16,502 - TRAIN-LOGGER - INFO - Epoch 360 - TRAIN - Minibatch 0: weight_norm_model: 143.882935 loss: 0.921210 grad_norm_before_clip: 40.981743 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 11:34:20,575 - TRAIN-LOGGER - INFO - Epoch 360 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.882935 weight_norm_u: 25.218954 loss: 0.921210 grad_norm_before_clip: 40.981743 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 11:34:20,575 - TRAIN-LOGGER - INFO - Epoch 360 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.882950 weight_norm_u: 25.222990 loss: 0.943264 +RANK_0 - 2026-01-29 11:34:33,493 - TRAIN-LOGGER - INFO - Epoch 361 - TRAIN - Minibatch 0: weight_norm_model: 143.882950 loss: 0.943264 grad_norm_before_clip: 41.297909 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 11:34:37,656 - TRAIN-LOGGER - INFO - Epoch 361 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.882950 weight_norm_u: 25.218954 loss: 0.943264 grad_norm_before_clip: 41.297909 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 11:34:37,657 - TRAIN-LOGGER - INFO - Epoch 361 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.882935 weight_norm_u: 25.222990 loss: 0.925218 +RANK_0 - 2026-01-29 11:34:50,862 - TRAIN-LOGGER - INFO - Epoch 362 - TRAIN - Minibatch 0: weight_norm_model: 143.882935 loss: 0.925218 grad_norm_before_clip: 42.505981 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 11:34:54,811 - TRAIN-LOGGER - INFO - Epoch 362 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.882935 weight_norm_u: 25.218954 loss: 0.925218 grad_norm_before_clip: 42.505981 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 11:34:54,811 - TRAIN-LOGGER - INFO - Epoch 362 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.882919 weight_norm_u: 25.222990 loss: 0.882441 +RANK_0 - 2026-01-29 11:35:07,956 - TRAIN-LOGGER - INFO - Epoch 363 - TRAIN - Minibatch 0: weight_norm_model: 143.882919 loss: 0.882441 grad_norm_before_clip: 16.275089 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 11:35:11,853 - TRAIN-LOGGER - INFO - Epoch 363 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.882919 weight_norm_u: 25.218954 loss: 0.882441 grad_norm_before_clip: 16.275089 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 11:35:11,853 - TRAIN-LOGGER - INFO - Epoch 363 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.882889 weight_norm_u: 25.222990 loss: 0.888975 +RANK_0 - 2026-01-29 11:35:24,711 - TRAIN-LOGGER - INFO - Epoch 364 - TRAIN - Minibatch 0: weight_norm_model: 143.882889 loss: 0.888975 grad_norm_before_clip: 25.596096 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 11:35:28,843 - TRAIN-LOGGER - INFO - Epoch 364 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.882889 weight_norm_u: 25.218954 loss: 0.888975 grad_norm_before_clip: 25.596096 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 11:35:28,843 - TRAIN-LOGGER - INFO - Epoch 364 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.882904 weight_norm_u: 25.222990 loss: 0.876399 +RANK_0 - 2026-01-29 11:35:41,855 - TRAIN-LOGGER - INFO - Epoch 365 - TRAIN - Minibatch 0: weight_norm_model: 143.882904 loss: 0.876399 grad_norm_before_clip: 9.789753 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 11:35:46,052 - TRAIN-LOGGER - INFO - Epoch 365 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.882904 weight_norm_u: 25.218954 loss: 0.876399 grad_norm_before_clip: 9.789753 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 11:35:46,052 - TRAIN-LOGGER - INFO - Epoch 365 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.882935 weight_norm_u: 25.222990 loss: 0.901449 +RANK_0 - 2026-01-29 11:35:59,173 - TRAIN-LOGGER - INFO - Epoch 366 - TRAIN - Minibatch 0: weight_norm_model: 143.882935 loss: 0.901449 grad_norm_before_clip: 22.821161 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 11:36:03,335 - TRAIN-LOGGER - INFO - Epoch 366 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.882935 weight_norm_u: 25.218954 loss: 0.901449 grad_norm_before_clip: 22.821161 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 11:36:03,336 - TRAIN-LOGGER - INFO - Epoch 366 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.882935 weight_norm_u: 25.222990 loss: 0.910689 +RANK_0 - 2026-01-29 11:36:16,479 - TRAIN-LOGGER - INFO - Epoch 367 - TRAIN - Minibatch 0: weight_norm_model: 143.882935 loss: 0.910689 grad_norm_before_clip: 27.528631 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 11:36:20,645 - TRAIN-LOGGER - INFO - Epoch 367 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.882935 weight_norm_u: 25.218954 loss: 0.910689 grad_norm_before_clip: 27.528631 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 11:36:20,645 - TRAIN-LOGGER - INFO - Epoch 367 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.882919 weight_norm_u: 25.222990 loss: 0.892292 +RANK_0 - 2026-01-29 11:36:33,498 - TRAIN-LOGGER - INFO - Epoch 368 - TRAIN - Minibatch 0: weight_norm_model: 143.882919 loss: 0.892292 grad_norm_before_clip: 18.148977 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 11:36:37,647 - TRAIN-LOGGER - INFO - Epoch 368 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.882919 weight_norm_u: 25.218954 loss: 0.892292 grad_norm_before_clip: 18.148977 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 11:36:37,648 - TRAIN-LOGGER - INFO - Epoch 368 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.882889 weight_norm_u: 25.222990 loss: 0.900522 +RANK_0 - 2026-01-29 11:36:51,025 - TRAIN-LOGGER - INFO - Epoch 369 - TRAIN - Minibatch 0: weight_norm_model: 143.882889 loss: 0.900522 grad_norm_before_clip: 40.214905 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 11:36:55,213 - TRAIN-LOGGER - INFO - Epoch 369 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.882889 weight_norm_u: 25.218954 loss: 0.900522 grad_norm_before_clip: 40.214905 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 11:36:55,213 - TRAIN-LOGGER - INFO - Epoch 369 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.882889 weight_norm_u: 25.222990 loss: 0.913310 +RANK_0 - 2026-01-29 11:37:08,278 - TRAIN-LOGGER - INFO - Epoch 370 - TRAIN - Minibatch 0: weight_norm_model: 143.882889 loss: 0.913310 grad_norm_before_clip: 41.299149 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 11:37:12,385 - TRAIN-LOGGER - INFO - Epoch 370 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.882889 weight_norm_u: 25.218954 loss: 0.913310 grad_norm_before_clip: 41.299149 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 11:37:12,386 - TRAIN-LOGGER - INFO - Epoch 370 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.882904 weight_norm_u: 25.222990 loss: 0.891411 +RANK_0 - 2026-01-29 11:37:25,329 - TRAIN-LOGGER - INFO - Epoch 371 - TRAIN - Minibatch 0: weight_norm_model: 143.882904 loss: 0.891411 grad_norm_before_clip: 23.961023 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 11:37:29,469 - TRAIN-LOGGER - INFO - Epoch 371 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.882904 weight_norm_u: 25.218954 loss: 0.891411 grad_norm_before_clip: 23.961023 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 11:37:29,470 - TRAIN-LOGGER - INFO - Epoch 371 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.882950 weight_norm_u: 25.222990 loss: 0.893157 +RANK_0 - 2026-01-29 11:37:42,859 - TRAIN-LOGGER - INFO - Epoch 372 - TRAIN - Minibatch 0: weight_norm_model: 143.882950 loss: 0.893157 grad_norm_before_clip: 35.909389 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 11:37:46,931 - TRAIN-LOGGER - INFO - Epoch 372 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.882950 weight_norm_u: 25.218954 loss: 0.893157 grad_norm_before_clip: 35.909389 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 11:37:46,932 - TRAIN-LOGGER - INFO - Epoch 372 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.882965 weight_norm_u: 25.222990 loss: 0.901087 +RANK_0 - 2026-01-29 11:37:59,935 - TRAIN-LOGGER - INFO - Epoch 373 - TRAIN - Minibatch 0: weight_norm_model: 143.882965 loss: 0.901087 grad_norm_before_clip: 36.233738 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 11:38:04,066 - TRAIN-LOGGER - INFO - Epoch 373 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.882965 weight_norm_u: 25.218954 loss: 0.901087 grad_norm_before_clip: 36.233738 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 11:38:04,066 - TRAIN-LOGGER - INFO - Epoch 373 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.882950 weight_norm_u: 25.222990 loss: 0.887842 +RANK_0 - 2026-01-29 11:38:16,876 - TRAIN-LOGGER - INFO - Epoch 374 - TRAIN - Minibatch 0: weight_norm_model: 143.882950 loss: 0.887842 grad_norm_before_clip: 12.394480 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 11:38:20,988 - TRAIN-LOGGER - INFO - Epoch 374 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.882950 weight_norm_u: 25.218954 loss: 0.887842 grad_norm_before_clip: 12.394480 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 11:38:20,988 - TRAIN-LOGGER - INFO - Epoch 374 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.882935 weight_norm_u: 25.222990 loss: 0.893645 +RANK_0 - 2026-01-29 11:38:33,881 - TRAIN-LOGGER - INFO - Epoch 375 - TRAIN - Minibatch 0: weight_norm_model: 143.882935 loss: 0.893645 grad_norm_before_clip: 23.212797 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 11:38:38,042 - TRAIN-LOGGER - INFO - Epoch 375 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.882935 weight_norm_u: 25.218954 loss: 0.893645 grad_norm_before_clip: 23.212797 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 11:38:38,042 - TRAIN-LOGGER - INFO - Epoch 375 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.882919 weight_norm_u: 25.222990 loss: 0.897806 +RANK_0 - 2026-01-29 11:38:51,291 - TRAIN-LOGGER - INFO - Epoch 376 - TRAIN - Minibatch 0: weight_norm_model: 143.882919 loss: 0.897806 grad_norm_before_clip: 30.332407 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 11:38:55,449 - TRAIN-LOGGER - INFO - Epoch 376 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.882919 weight_norm_u: 25.218954 loss: 0.897806 grad_norm_before_clip: 30.332407 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 11:38:55,450 - TRAIN-LOGGER - INFO - Epoch 376 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.882950 weight_norm_u: 25.222990 loss: 0.872211 +RANK_0 - 2026-01-29 11:39:08,379 - TRAIN-LOGGER - INFO - Epoch 377 - TRAIN - Minibatch 0: weight_norm_model: 143.882950 loss: 0.872211 grad_norm_before_clip: 4.432117 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 11:39:12,467 - TRAIN-LOGGER - INFO - Epoch 377 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.882950 weight_norm_u: 25.218954 loss: 0.872211 grad_norm_before_clip: 4.432117 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 11:39:12,467 - TRAIN-LOGGER - INFO - Epoch 377 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.882950 weight_norm_u: 25.222990 loss: 0.872794 +RANK_0 - 2026-01-29 11:39:25,330 - TRAIN-LOGGER - INFO - Epoch 378 - TRAIN - Minibatch 0: weight_norm_model: 143.882950 loss: 0.872794 grad_norm_before_clip: 7.503301 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 11:39:29,503 - TRAIN-LOGGER - INFO - Epoch 378 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.882950 weight_norm_u: 25.218954 loss: 0.872794 grad_norm_before_clip: 7.503301 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 11:39:29,504 - TRAIN-LOGGER - INFO - Epoch 378 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.882935 weight_norm_u: 25.222990 loss: 0.888704 +RANK_0 - 2026-01-29 11:39:42,293 - TRAIN-LOGGER - INFO - Epoch 379 - TRAIN - Minibatch 0: weight_norm_model: 143.882935 loss: 0.888704 grad_norm_before_clip: 32.293674 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 11:39:46,380 - TRAIN-LOGGER - INFO - Epoch 379 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.882935 weight_norm_u: 25.218954 loss: 0.888704 grad_norm_before_clip: 32.293674 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 11:39:46,380 - TRAIN-LOGGER - INFO - Epoch 379 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.882950 weight_norm_u: 25.222990 loss: 0.882431 +RANK_0 - 2026-01-29 11:39:59,154 - TRAIN-LOGGER - INFO - Epoch 380 - TRAIN - Minibatch 0: weight_norm_model: 143.882950 loss: 0.882431 grad_norm_before_clip: 23.829264 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 11:40:03,292 - TRAIN-LOGGER - INFO - Epoch 380 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.882950 weight_norm_u: 25.218954 loss: 0.882431 grad_norm_before_clip: 23.829264 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 11:40:03,292 - TRAIN-LOGGER - INFO - Epoch 380 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.882980 weight_norm_u: 25.222990 loss: 0.888334 +RANK_0 - 2026-01-29 11:40:16,437 - TRAIN-LOGGER - INFO - Epoch 381 - TRAIN - Minibatch 0: weight_norm_model: 143.882980 loss: 0.888334 grad_norm_before_clip: 38.870995 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 11:40:20,541 - TRAIN-LOGGER - INFO - Epoch 381 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.882980 weight_norm_u: 25.218954 loss: 0.888334 grad_norm_before_clip: 38.870995 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 11:40:20,541 - TRAIN-LOGGER - INFO - Epoch 381 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.882996 weight_norm_u: 25.222990 loss: 0.896537 +RANK_0 - 2026-01-29 11:40:33,839 - TRAIN-LOGGER - INFO - Epoch 382 - TRAIN - Minibatch 0: weight_norm_model: 143.882996 loss: 0.896537 grad_norm_before_clip: 38.582809 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 11:40:37,907 - TRAIN-LOGGER - INFO - Epoch 382 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.882996 weight_norm_u: 25.218954 loss: 0.896537 grad_norm_before_clip: 38.582809 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 11:40:37,908 - TRAIN-LOGGER - INFO - Epoch 382 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.882980 weight_norm_u: 25.222990 loss: 0.877430 +RANK_0 - 2026-01-29 11:40:50,728 - TRAIN-LOGGER - INFO - Epoch 383 - TRAIN - Minibatch 0: weight_norm_model: 143.882980 loss: 0.877430 grad_norm_before_clip: 29.927364 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 11:40:54,867 - TRAIN-LOGGER - INFO - Epoch 383 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.882980 weight_norm_u: 25.218954 loss: 0.877430 grad_norm_before_clip: 29.927364 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 11:40:54,867 - TRAIN-LOGGER - INFO - Epoch 383 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.882996 weight_norm_u: 25.222990 loss: 0.875800 +RANK_0 - 2026-01-29 11:41:07,616 - TRAIN-LOGGER - INFO - Epoch 384 - TRAIN - Minibatch 0: weight_norm_model: 143.882996 loss: 0.875800 grad_norm_before_clip: 4.885437 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 11:41:11,757 - TRAIN-LOGGER - INFO - Epoch 384 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.882996 weight_norm_u: 25.218954 loss: 0.875800 grad_norm_before_clip: 4.885437 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 11:41:11,758 - TRAIN-LOGGER - INFO - Epoch 384 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.882996 weight_norm_u: 25.222990 loss: 0.878220 +RANK_0 - 2026-01-29 11:41:25,048 - TRAIN-LOGGER - INFO - Epoch 385 - TRAIN - Minibatch 0: weight_norm_model: 143.882996 loss: 0.878220 grad_norm_before_clip: 17.702223 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 11:41:29,171 - TRAIN-LOGGER - INFO - Epoch 385 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.882996 weight_norm_u: 25.218954 loss: 0.878220 grad_norm_before_clip: 17.702223 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 11:41:29,171 - TRAIN-LOGGER - INFO - Epoch 385 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.882996 weight_norm_u: 25.222990 loss: 0.874918 +RANK_0 - 2026-01-29 11:41:42,610 - TRAIN-LOGGER - INFO - Epoch 386 - TRAIN - Minibatch 0: weight_norm_model: 143.882996 loss: 0.874918 grad_norm_before_clip: 15.906667 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 11:41:46,706 - TRAIN-LOGGER - INFO - Epoch 386 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.882996 weight_norm_u: 25.218954 loss: 0.874918 grad_norm_before_clip: 15.906667 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 11:41:46,707 - TRAIN-LOGGER - INFO - Epoch 386 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.883026 weight_norm_u: 25.222990 loss: 0.875104 +RANK_0 - 2026-01-29 11:41:59,578 - TRAIN-LOGGER - INFO - Epoch 387 - TRAIN - Minibatch 0: weight_norm_model: 143.883026 loss: 0.875104 grad_norm_before_clip: 23.125250 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 11:42:03,713 - TRAIN-LOGGER - INFO - Epoch 387 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.883026 weight_norm_u: 25.218954 loss: 0.875104 grad_norm_before_clip: 23.125250 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 11:42:03,713 - TRAIN-LOGGER - INFO - Epoch 387 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.883026 weight_norm_u: 25.222990 loss: 0.881109 +RANK_0 - 2026-01-29 11:42:16,940 - TRAIN-LOGGER - INFO - Epoch 388 - TRAIN - Minibatch 0: weight_norm_model: 143.883026 loss: 0.881109 grad_norm_before_clip: 26.639015 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 11:42:21,039 - TRAIN-LOGGER - INFO - Epoch 388 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.883026 weight_norm_u: 25.218954 loss: 0.881109 grad_norm_before_clip: 26.639015 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 11:42:21,040 - TRAIN-LOGGER - INFO - Epoch 388 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.883041 weight_norm_u: 25.222990 loss: 0.875450 +RANK_0 - 2026-01-29 11:42:34,234 - TRAIN-LOGGER - INFO - Epoch 389 - TRAIN - Minibatch 0: weight_norm_model: 143.883041 loss: 0.875450 grad_norm_before_clip: 27.268002 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 11:42:38,328 - TRAIN-LOGGER - INFO - Epoch 389 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.883041 weight_norm_u: 25.218954 loss: 0.875450 grad_norm_before_clip: 27.268002 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 11:42:38,328 - TRAIN-LOGGER - INFO - Epoch 389 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.883087 weight_norm_u: 25.222990 loss: 0.912925 +RANK_0 - 2026-01-29 11:42:51,113 - TRAIN-LOGGER - INFO - Epoch 390 - TRAIN - Minibatch 0: weight_norm_model: 143.883087 loss: 0.912925 grad_norm_before_clip: 37.466087 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 11:42:55,234 - TRAIN-LOGGER - INFO - Epoch 390 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.883087 weight_norm_u: 25.218954 loss: 0.912925 grad_norm_before_clip: 37.466087 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 11:42:55,234 - TRAIN-LOGGER - INFO - Epoch 390 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.883087 weight_norm_u: 25.222990 loss: 0.929986 +RANK_0 - 2026-01-29 11:43:08,070 - TRAIN-LOGGER - INFO - Epoch 391 - TRAIN - Minibatch 0: weight_norm_model: 143.883087 loss: 0.929986 grad_norm_before_clip: 38.473362 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 11:43:12,210 - TRAIN-LOGGER - INFO - Epoch 391 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.883087 weight_norm_u: 25.218954 loss: 0.929986 grad_norm_before_clip: 38.473362 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 11:43:12,210 - TRAIN-LOGGER - INFO - Epoch 391 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.883087 weight_norm_u: 25.222990 loss: 0.903414 +RANK_0 - 2026-01-29 11:43:25,611 - TRAIN-LOGGER - INFO - Epoch 392 - TRAIN - Minibatch 0: weight_norm_model: 143.883087 loss: 0.903414 grad_norm_before_clip: 31.705025 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 11:43:29,769 - TRAIN-LOGGER - INFO - Epoch 392 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.883087 weight_norm_u: 25.218954 loss: 0.903414 grad_norm_before_clip: 31.705025 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 11:43:29,770 - TRAIN-LOGGER - INFO - Epoch 392 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.883057 weight_norm_u: 25.222990 loss: 0.890964 +RANK_0 - 2026-01-29 11:43:42,777 - TRAIN-LOGGER - INFO - Epoch 393 - TRAIN - Minibatch 0: weight_norm_model: 143.883057 loss: 0.890964 grad_norm_before_clip: 25.725634 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 11:43:46,957 - TRAIN-LOGGER - INFO - Epoch 393 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.883057 weight_norm_u: 25.218954 loss: 0.890964 grad_norm_before_clip: 25.725634 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 11:43:46,957 - TRAIN-LOGGER - INFO - Epoch 393 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.883057 weight_norm_u: 25.222990 loss: 0.903074 +RANK_0 - 2026-01-29 11:43:59,912 - TRAIN-LOGGER - INFO - Epoch 394 - TRAIN - Minibatch 0: weight_norm_model: 143.883057 loss: 0.903074 grad_norm_before_clip: 28.373789 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 11:44:03,988 - TRAIN-LOGGER - INFO - Epoch 394 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.883057 weight_norm_u: 25.218954 loss: 0.903074 grad_norm_before_clip: 28.373789 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 11:44:03,989 - TRAIN-LOGGER - INFO - Epoch 394 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.883057 weight_norm_u: 25.222990 loss: 0.879324 +RANK_0 - 2026-01-29 11:44:17,148 - TRAIN-LOGGER - INFO - Epoch 395 - TRAIN - Minibatch 0: weight_norm_model: 143.883057 loss: 0.879324 grad_norm_before_clip: 26.635891 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 11:44:21,318 - TRAIN-LOGGER - INFO - Epoch 395 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.883057 weight_norm_u: 25.218954 loss: 0.879324 grad_norm_before_clip: 26.635891 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 11:44:21,319 - TRAIN-LOGGER - INFO - Epoch 395 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.883087 weight_norm_u: 25.222990 loss: 0.908134 +RANK_0 - 2026-01-29 11:44:34,512 - TRAIN-LOGGER - INFO - Epoch 396 - TRAIN - Minibatch 0: weight_norm_model: 143.883087 loss: 0.908134 grad_norm_before_clip: 36.206577 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 11:44:38,683 - TRAIN-LOGGER - INFO - Epoch 396 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.883087 weight_norm_u: 25.218954 loss: 0.908134 grad_norm_before_clip: 36.206577 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 11:44:38,683 - TRAIN-LOGGER - INFO - Epoch 396 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.883102 weight_norm_u: 25.222990 loss: 0.922456 +RANK_0 - 2026-01-29 11:44:51,467 - TRAIN-LOGGER - INFO - Epoch 397 - TRAIN - Minibatch 0: weight_norm_model: 143.883102 loss: 0.922456 grad_norm_before_clip: 40.329746 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 11:44:55,593 - TRAIN-LOGGER - INFO - Epoch 397 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.883102 weight_norm_u: 25.218954 loss: 0.922456 grad_norm_before_clip: 40.329746 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 11:44:55,593 - TRAIN-LOGGER - INFO - Epoch 397 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.883087 weight_norm_u: 25.222990 loss: 0.898572 +RANK_0 - 2026-01-29 11:45:08,776 - TRAIN-LOGGER - INFO - Epoch 398 - TRAIN - Minibatch 0: weight_norm_model: 143.883087 loss: 0.898572 grad_norm_before_clip: 39.611889 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 11:45:12,960 - TRAIN-LOGGER - INFO - Epoch 398 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.883087 weight_norm_u: 25.218954 loss: 0.898572 grad_norm_before_clip: 39.611889 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 11:45:12,960 - TRAIN-LOGGER - INFO - Epoch 398 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.883057 weight_norm_u: 25.222990 loss: 0.881180 +RANK_0 - 2026-01-29 11:45:26,080 - TRAIN-LOGGER - INFO - Epoch 399 - TRAIN - Minibatch 0: weight_norm_model: 143.883057 loss: 0.881180 grad_norm_before_clip: 37.078320 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 11:45:30,254 - TRAIN-LOGGER - INFO - Epoch 399 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.883057 weight_norm_u: 25.218954 loss: 0.881180 grad_norm_before_clip: 37.078320 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 11:45:30,254 - TRAIN-LOGGER - INFO - Epoch 399 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.883041 weight_norm_u: 25.222990 loss: 0.893162 +RANK_0 - 2026-01-29 11:45:43,071 - TRAIN-LOGGER - INFO - Epoch 400 - TRAIN - Minibatch 0: weight_norm_model: 143.883041 loss: 0.893162 grad_norm_before_clip: 37.950584 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 11:45:47,139 - TRAIN-LOGGER - INFO - Epoch 400 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.883041 weight_norm_u: 25.218954 loss: 0.893162 grad_norm_before_clip: 37.950584 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 11:45:47,139 - TRAIN-LOGGER - INFO - Epoch 400 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.883057 weight_norm_u: 25.222990 loss: 0.877628