diff --git "a/mocap35short/mocap35short_01-29-0614/logging/train.log" "b/mocap35short/mocap35short_01-29-0614/logging/train.log" new file mode 100644--- /dev/null +++ "b/mocap35short/mocap35short_01-29-0614/logging/train.log" @@ -0,0 +1,600 @@ +RANK_0 - 2026-01-29 06:14:49,244 - TRAIN-LOGGER - INFO - Epoch 201 - TRAIN - Minibatch 0: weight_norm_model: 143.882523 loss: 0.086034 grad_norm_before_clip: 8.003169 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 06:14:50,508 - TRAIN-LOGGER - INFO - Epoch 201 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.882523 weight_norm_u: 25.218954 loss: 0.086034 grad_norm_before_clip: 8.003169 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 06:14:50,508 - TRAIN-LOGGER - INFO - Epoch 201 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.882538 weight_norm_u: 25.222990 loss: 0.045459 +RANK_0 - 2026-01-29 06:14:56,893 - TRAIN-LOGGER - INFO - Epoch 202 - TRAIN - Minibatch 0: weight_norm_model: 143.882538 loss: 0.048763 grad_norm_before_clip: 2.188227 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 06:14:58,054 - TRAIN-LOGGER - INFO - Epoch 202 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.882538 weight_norm_u: 25.218954 loss: 0.048763 grad_norm_before_clip: 2.188227 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 06:14:58,054 - TRAIN-LOGGER - INFO - Epoch 202 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.882538 weight_norm_u: 25.222990 loss: 0.039111 +RANK_0 - 2026-01-29 06:15:04,428 - TRAIN-LOGGER - INFO - Epoch 203 - TRAIN - Minibatch 0: weight_norm_model: 143.882538 loss: 0.044838 grad_norm_before_clip: 2.402300 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 06:15:05,659 - TRAIN-LOGGER - INFO - Epoch 203 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.882538 weight_norm_u: 25.218954 loss: 0.044838 grad_norm_before_clip: 2.402300 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 06:15:05,660 - TRAIN-LOGGER - INFO - Epoch 203 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.882568 weight_norm_u: 25.222990 loss: 0.035583 +RANK_0 - 2026-01-29 06:15:11,850 - TRAIN-LOGGER - INFO - Epoch 204 - TRAIN - Minibatch 0: weight_norm_model: 143.882568 loss: 0.055593 grad_norm_before_clip: 2.630228 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 06:15:12,987 - TRAIN-LOGGER - INFO - Epoch 204 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.882568 weight_norm_u: 25.218954 loss: 0.055593 grad_norm_before_clip: 2.630228 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 06:15:12,987 - TRAIN-LOGGER - INFO - Epoch 204 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.882568 weight_norm_u: 25.222990 loss: 0.034420 +RANK_0 - 2026-01-29 06:15:18,917 - TRAIN-LOGGER - INFO - Epoch 205 - TRAIN - Minibatch 0: weight_norm_model: 143.882568 loss: 0.040559 grad_norm_before_clip: 2.294982 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 06:15:20,071 - TRAIN-LOGGER - INFO - Epoch 205 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.882568 weight_norm_u: 25.218954 loss: 0.040559 grad_norm_before_clip: 2.294982 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 06:15:20,072 - TRAIN-LOGGER - INFO - Epoch 205 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.882568 weight_norm_u: 25.222990 loss: 0.035253 +RANK_0 - 2026-01-29 06:15:27,498 - TRAIN-LOGGER - INFO - Epoch 206 - TRAIN - Minibatch 0: weight_norm_model: 143.882568 loss: 0.051445 grad_norm_before_clip: 2.176439 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 06:15:28,719 - TRAIN-LOGGER - INFO - Epoch 206 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.882568 weight_norm_u: 25.218954 loss: 0.051445 grad_norm_before_clip: 2.176439 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 06:15:28,719 - TRAIN-LOGGER - INFO - Epoch 206 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.882553 weight_norm_u: 25.222990 loss: 0.034037 +RANK_0 - 2026-01-29 06:15:34,904 - TRAIN-LOGGER - INFO - Epoch 207 - TRAIN - Minibatch 0: weight_norm_model: 143.882553 loss: 0.045527 grad_norm_before_clip: 2.185840 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 06:15:36,178 - TRAIN-LOGGER - INFO - Epoch 207 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.882553 weight_norm_u: 25.218954 loss: 0.045527 grad_norm_before_clip: 2.185840 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 06:15:36,178 - TRAIN-LOGGER - INFO - Epoch 207 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.882538 weight_norm_u: 25.222990 loss: 0.031931 +RANK_0 - 2026-01-29 06:15:42,522 - TRAIN-LOGGER - INFO - Epoch 208 - TRAIN - Minibatch 0: weight_norm_model: 143.882538 loss: 0.036214 grad_norm_before_clip: 1.455611 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 06:15:43,929 - TRAIN-LOGGER - INFO - Epoch 208 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.882538 weight_norm_u: 25.218954 loss: 0.036214 grad_norm_before_clip: 1.455611 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 06:15:43,929 - TRAIN-LOGGER - INFO - Epoch 208 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.882538 weight_norm_u: 25.222990 loss: 0.031041 +RANK_0 - 2026-01-29 06:15:50,141 - TRAIN-LOGGER - INFO - Epoch 209 - TRAIN - Minibatch 0: weight_norm_model: 143.882538 loss: 0.041449 grad_norm_before_clip: 1.244339 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 06:15:51,376 - TRAIN-LOGGER - INFO - Epoch 209 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.882538 weight_norm_u: 25.218954 loss: 0.041449 grad_norm_before_clip: 1.244339 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 06:15:51,376 - TRAIN-LOGGER - INFO - Epoch 209 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.882553 weight_norm_u: 25.222990 loss: 0.032548 +RANK_0 - 2026-01-29 06:15:57,878 - TRAIN-LOGGER - INFO - Epoch 210 - TRAIN - Minibatch 0: weight_norm_model: 143.882553 loss: 0.043511 grad_norm_before_clip: 1.618099 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 06:15:59,140 - TRAIN-LOGGER - INFO - Epoch 210 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.882553 weight_norm_u: 25.218954 loss: 0.043511 grad_norm_before_clip: 1.618099 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 06:15:59,141 - TRAIN-LOGGER - INFO - Epoch 210 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.882568 weight_norm_u: 25.222990 loss: 0.033921 +RANK_0 - 2026-01-29 06:16:05,156 - TRAIN-LOGGER - INFO - Epoch 211 - TRAIN - Minibatch 0: weight_norm_model: 143.882568 loss: 0.042637 grad_norm_before_clip: 1.715526 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 06:16:06,459 - TRAIN-LOGGER - INFO - Epoch 211 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.882568 weight_norm_u: 25.218954 loss: 0.042637 grad_norm_before_clip: 1.715526 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 06:16:06,460 - TRAIN-LOGGER - INFO - Epoch 211 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.882584 weight_norm_u: 25.222990 loss: 0.032794 +RANK_0 - 2026-01-29 06:16:12,536 - TRAIN-LOGGER - INFO - Epoch 212 - TRAIN - Minibatch 0: weight_norm_model: 143.882584 loss: 0.043695 grad_norm_before_clip: 1.655050 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 06:16:13,744 - TRAIN-LOGGER - INFO - Epoch 212 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.882584 weight_norm_u: 25.218954 loss: 0.043695 grad_norm_before_clip: 1.655050 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 06:16:13,744 - TRAIN-LOGGER - INFO - Epoch 212 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.882584 weight_norm_u: 25.222990 loss: 0.030204 +RANK_0 - 2026-01-29 06:16:20,313 - TRAIN-LOGGER - INFO - Epoch 213 - TRAIN - Minibatch 0: weight_norm_model: 143.882584 loss: 0.046108 grad_norm_before_clip: 2.078931 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 06:16:21,572 - TRAIN-LOGGER - INFO - Epoch 213 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.882584 weight_norm_u: 25.218954 loss: 0.046108 grad_norm_before_clip: 2.078931 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 06:16:21,573 - TRAIN-LOGGER - INFO - Epoch 213 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.882584 weight_norm_u: 25.222990 loss: 0.028451 +RANK_0 - 2026-01-29 06:16:28,212 - TRAIN-LOGGER - INFO - Epoch 214 - TRAIN - Minibatch 0: weight_norm_model: 143.882584 loss: 0.046708 grad_norm_before_clip: 1.178537 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 06:16:29,359 - TRAIN-LOGGER - INFO - Epoch 214 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.882584 weight_norm_u: 25.218954 loss: 0.046708 grad_norm_before_clip: 1.178537 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 06:16:29,359 - TRAIN-LOGGER - INFO - Epoch 214 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.882584 weight_norm_u: 25.222990 loss: 0.029163 +RANK_0 - 2026-01-29 06:16:36,019 - TRAIN-LOGGER - INFO - Epoch 215 - TRAIN - Minibatch 0: weight_norm_model: 143.882584 loss: 0.040793 grad_norm_before_clip: 1.309085 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 06:16:37,217 - TRAIN-LOGGER - INFO - Epoch 215 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.882584 weight_norm_u: 25.218954 loss: 0.040793 grad_norm_before_clip: 1.309085 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 06:16:37,218 - TRAIN-LOGGER - INFO - Epoch 215 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.882568 weight_norm_u: 25.222990 loss: 0.031473 +RANK_0 - 2026-01-29 06:16:43,970 - TRAIN-LOGGER - INFO - Epoch 216 - TRAIN - Minibatch 0: weight_norm_model: 143.882568 loss: 0.038644 grad_norm_before_clip: 1.705190 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 06:16:45,133 - TRAIN-LOGGER - INFO - Epoch 216 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.882568 weight_norm_u: 25.218954 loss: 0.038644 grad_norm_before_clip: 1.705190 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 06:16:45,134 - TRAIN-LOGGER - INFO - Epoch 216 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.882568 weight_norm_u: 25.222990 loss: 0.033015 +RANK_0 - 2026-01-29 06:16:51,338 - TRAIN-LOGGER - INFO - Epoch 217 - TRAIN - Minibatch 0: weight_norm_model: 143.882568 loss: 0.045583 grad_norm_before_clip: 2.523635 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 06:16:52,747 - TRAIN-LOGGER - INFO - Epoch 217 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.882568 weight_norm_u: 25.218954 loss: 0.045583 grad_norm_before_clip: 2.523635 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 06:16:52,747 - TRAIN-LOGGER - INFO - Epoch 217 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.882584 weight_norm_u: 25.222990 loss: 0.032378 +RANK_0 - 2026-01-29 06:16:59,604 - TRAIN-LOGGER - INFO - Epoch 218 - TRAIN - Minibatch 0: weight_norm_model: 143.882584 loss: 0.039175 grad_norm_before_clip: 1.495353 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 06:17:00,810 - TRAIN-LOGGER - INFO - Epoch 218 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.882584 weight_norm_u: 25.218954 loss: 0.039175 grad_norm_before_clip: 1.495353 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 06:17:00,810 - TRAIN-LOGGER - INFO - Epoch 218 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.882599 weight_norm_u: 25.222990 loss: 0.029824 +RANK_0 - 2026-01-29 06:17:06,844 - TRAIN-LOGGER - INFO - Epoch 219 - TRAIN - Minibatch 0: weight_norm_model: 143.882599 loss: 0.039350 grad_norm_before_clip: 0.899392 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 06:17:08,047 - TRAIN-LOGGER - INFO - Epoch 219 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.882599 weight_norm_u: 25.218954 loss: 0.039350 grad_norm_before_clip: 0.899392 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 06:17:08,047 - TRAIN-LOGGER - INFO - Epoch 219 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.882629 weight_norm_u: 25.222990 loss: 0.027723 +RANK_0 - 2026-01-29 06:17:14,687 - TRAIN-LOGGER - INFO - Epoch 220 - TRAIN - Minibatch 0: weight_norm_model: 143.882629 loss: 0.035958 grad_norm_before_clip: 0.973533 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 06:17:15,949 - TRAIN-LOGGER - INFO - Epoch 220 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.882629 weight_norm_u: 25.218954 loss: 0.035958 grad_norm_before_clip: 0.973533 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 06:17:15,950 - TRAIN-LOGGER - INFO - Epoch 220 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.882660 weight_norm_u: 25.222990 loss: 0.026422 +RANK_0 - 2026-01-29 06:17:22,461 - TRAIN-LOGGER - INFO - Epoch 221 - TRAIN - Minibatch 0: weight_norm_model: 143.882660 loss: 0.036456 grad_norm_before_clip: 1.220638 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 06:17:23,596 - TRAIN-LOGGER - INFO - Epoch 221 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.882660 weight_norm_u: 25.218954 loss: 0.036456 grad_norm_before_clip: 1.220638 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 06:17:23,597 - TRAIN-LOGGER - INFO - Epoch 221 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.882690 weight_norm_u: 25.222990 loss: 0.026215 +RANK_0 - 2026-01-29 06:17:30,475 - TRAIN-LOGGER - INFO - Epoch 222 - TRAIN - Minibatch 0: weight_norm_model: 143.882690 loss: 0.034640 grad_norm_before_clip: 0.782201 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 06:17:31,721 - TRAIN-LOGGER - INFO - Epoch 222 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.882690 weight_norm_u: 25.218954 loss: 0.034640 grad_norm_before_clip: 0.782201 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 06:17:31,721 - TRAIN-LOGGER - INFO - Epoch 222 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.882706 weight_norm_u: 25.222990 loss: 0.026493 +RANK_0 - 2026-01-29 06:17:38,202 - TRAIN-LOGGER - INFO - Epoch 223 - TRAIN - Minibatch 0: weight_norm_model: 143.882706 loss: 0.034245 grad_norm_before_clip: 0.942380 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 06:17:39,361 - TRAIN-LOGGER - INFO - Epoch 223 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.882706 weight_norm_u: 25.218954 loss: 0.034245 grad_norm_before_clip: 0.942380 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 06:17:39,361 - TRAIN-LOGGER - INFO - Epoch 223 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.882736 weight_norm_u: 25.222990 loss: 0.026134 +RANK_0 - 2026-01-29 06:17:45,089 - TRAIN-LOGGER - INFO - Epoch 224 - TRAIN - Minibatch 0: weight_norm_model: 143.882736 loss: 0.031035 grad_norm_before_clip: 0.907527 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 06:17:46,299 - TRAIN-LOGGER - INFO - Epoch 224 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.882736 weight_norm_u: 25.218954 loss: 0.031035 grad_norm_before_clip: 0.907527 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 06:17:46,299 - TRAIN-LOGGER - INFO - Epoch 224 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.882751 weight_norm_u: 25.222990 loss: 0.025676 +RANK_0 - 2026-01-29 06:17:52,624 - TRAIN-LOGGER - INFO - Epoch 225 - TRAIN - Minibatch 0: weight_norm_model: 143.882751 loss: 0.031748 grad_norm_before_clip: 0.408103 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 06:17:53,884 - TRAIN-LOGGER - INFO - Epoch 225 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.882751 weight_norm_u: 25.218954 loss: 0.031748 grad_norm_before_clip: 0.408103 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 06:17:53,885 - TRAIN-LOGGER - INFO - Epoch 225 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.882782 weight_norm_u: 25.222990 loss: 0.026164 +RANK_0 - 2026-01-29 06:18:00,314 - TRAIN-LOGGER - INFO - Epoch 226 - TRAIN - Minibatch 0: weight_norm_model: 143.882782 loss: 0.036538 grad_norm_before_clip: 1.429953 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 06:18:01,593 - TRAIN-LOGGER - INFO - Epoch 226 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.882782 weight_norm_u: 25.218954 loss: 0.036538 grad_norm_before_clip: 1.429953 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 06:18:01,594 - TRAIN-LOGGER - INFO - Epoch 226 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.882812 weight_norm_u: 25.222990 loss: 0.026844 +RANK_0 - 2026-01-29 06:18:08,235 - TRAIN-LOGGER - INFO - Epoch 227 - TRAIN - Minibatch 0: weight_norm_model: 143.882812 loss: 0.036655 grad_norm_before_clip: 1.421429 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 06:18:09,578 - TRAIN-LOGGER - INFO - Epoch 227 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.882812 weight_norm_u: 25.218954 loss: 0.036655 grad_norm_before_clip: 1.421429 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 06:18:09,578 - TRAIN-LOGGER - INFO - Epoch 227 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.882828 weight_norm_u: 25.222990 loss: 0.026381 +RANK_0 - 2026-01-29 06:18:15,953 - TRAIN-LOGGER - INFO - Epoch 228 - TRAIN - Minibatch 0: weight_norm_model: 143.882828 loss: 0.036800 grad_norm_before_clip: 2.150038 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 06:18:17,242 - TRAIN-LOGGER - INFO - Epoch 228 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.882828 weight_norm_u: 25.218954 loss: 0.036800 grad_norm_before_clip: 2.150038 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 06:18:17,242 - TRAIN-LOGGER - INFO - Epoch 228 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.882843 weight_norm_u: 25.222990 loss: 0.024797 +RANK_0 - 2026-01-29 06:18:23,143 - TRAIN-LOGGER - INFO - Epoch 229 - TRAIN - Minibatch 0: weight_norm_model: 143.882843 loss: 0.027982 grad_norm_before_clip: 0.684177 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 06:18:24,505 - TRAIN-LOGGER - INFO - Epoch 229 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.882843 weight_norm_u: 25.218954 loss: 0.027982 grad_norm_before_clip: 0.684177 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 06:18:24,505 - TRAIN-LOGGER - INFO - Epoch 229 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.882843 weight_norm_u: 25.222990 loss: 0.023795 +RANK_0 - 2026-01-29 06:18:30,657 - TRAIN-LOGGER - INFO - Epoch 230 - TRAIN - Minibatch 0: weight_norm_model: 143.882843 loss: 0.034487 grad_norm_before_clip: 1.194312 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 06:18:31,875 - TRAIN-LOGGER - INFO - Epoch 230 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.882843 weight_norm_u: 25.218954 loss: 0.034487 grad_norm_before_clip: 1.194312 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 06:18:31,875 - TRAIN-LOGGER - INFO - Epoch 230 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.882843 weight_norm_u: 25.222990 loss: 0.023733 +RANK_0 - 2026-01-29 06:18:38,746 - TRAIN-LOGGER - INFO - Epoch 231 - TRAIN - Minibatch 0: weight_norm_model: 143.882843 loss: 0.031559 grad_norm_before_clip: 0.641286 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 06:18:39,995 - TRAIN-LOGGER - INFO - Epoch 231 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.882843 weight_norm_u: 25.218954 loss: 0.031559 grad_norm_before_clip: 0.641286 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 06:18:39,996 - TRAIN-LOGGER - INFO - Epoch 231 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.882843 weight_norm_u: 25.222990 loss: 0.024004 +RANK_0 - 2026-01-29 06:18:46,487 - TRAIN-LOGGER - INFO - Epoch 232 - TRAIN - Minibatch 0: weight_norm_model: 143.882843 loss: 0.031616 grad_norm_before_clip: 0.643010 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 06:18:47,825 - TRAIN-LOGGER - INFO - Epoch 232 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.882843 weight_norm_u: 25.218954 loss: 0.031616 grad_norm_before_clip: 0.643010 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 06:18:47,826 - TRAIN-LOGGER - INFO - Epoch 232 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.882858 weight_norm_u: 25.222990 loss: 0.024834 +RANK_0 - 2026-01-29 06:18:55,288 - TRAIN-LOGGER - INFO - Epoch 233 - TRAIN - Minibatch 0: weight_norm_model: 143.882858 loss: 0.036894 grad_norm_before_clip: 1.578373 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 06:18:56,733 - TRAIN-LOGGER - INFO - Epoch 233 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.882858 weight_norm_u: 25.218954 loss: 0.036894 grad_norm_before_clip: 1.578373 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 06:18:56,734 - TRAIN-LOGGER - INFO - Epoch 233 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.882874 weight_norm_u: 25.222990 loss: 0.024637 +RANK_0 - 2026-01-29 06:19:04,249 - TRAIN-LOGGER - INFO - Epoch 234 - TRAIN - Minibatch 0: weight_norm_model: 143.882874 loss: 0.037143 grad_norm_before_clip: 1.556531 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 06:19:05,745 - TRAIN-LOGGER - INFO - Epoch 234 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.882874 weight_norm_u: 25.218954 loss: 0.037143 grad_norm_before_clip: 1.556531 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 06:19:05,745 - TRAIN-LOGGER - INFO - Epoch 234 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.882919 weight_norm_u: 25.222990 loss: 0.023601 +RANK_0 - 2026-01-29 06:19:14,152 - TRAIN-LOGGER - INFO - Epoch 235 - TRAIN - Minibatch 0: weight_norm_model: 143.882919 loss: 0.028687 grad_norm_before_clip: 0.849561 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 06:19:15,445 - TRAIN-LOGGER - INFO - Epoch 235 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.882919 weight_norm_u: 25.218954 loss: 0.028687 grad_norm_before_clip: 0.849561 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 06:19:15,445 - TRAIN-LOGGER - INFO - Epoch 235 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.882965 weight_norm_u: 25.222990 loss: 0.022718 +RANK_0 - 2026-01-29 06:19:23,296 - TRAIN-LOGGER - INFO - Epoch 236 - TRAIN - Minibatch 0: weight_norm_model: 143.882965 loss: 0.033206 grad_norm_before_clip: 1.084353 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 06:19:24,660 - TRAIN-LOGGER - INFO - Epoch 236 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.882965 weight_norm_u: 25.218954 loss: 0.033206 grad_norm_before_clip: 1.084353 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 06:19:24,660 - TRAIN-LOGGER - INFO - Epoch 236 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.883026 weight_norm_u: 25.222990 loss: 0.024093 +RANK_0 - 2026-01-29 06:19:32,882 - TRAIN-LOGGER - INFO - Epoch 237 - TRAIN - Minibatch 0: weight_norm_model: 143.883026 loss: 0.037612 grad_norm_before_clip: 2.526495 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 06:19:34,583 - TRAIN-LOGGER - INFO - Epoch 237 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.883026 weight_norm_u: 25.218954 loss: 0.037612 grad_norm_before_clip: 2.526495 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 06:19:34,583 - TRAIN-LOGGER - INFO - Epoch 237 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.883057 weight_norm_u: 25.222990 loss: 0.025905 +RANK_0 - 2026-01-29 06:19:41,798 - TRAIN-LOGGER - INFO - Epoch 238 - TRAIN - Minibatch 0: weight_norm_model: 143.883057 loss: 0.034560 grad_norm_before_clip: 1.542553 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 06:19:43,412 - TRAIN-LOGGER - INFO - Epoch 238 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.883057 weight_norm_u: 25.218954 loss: 0.034560 grad_norm_before_clip: 1.542553 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 06:19:43,413 - TRAIN-LOGGER - INFO - Epoch 238 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.883087 weight_norm_u: 25.222990 loss: 0.025849 +RANK_0 - 2026-01-29 06:19:51,927 - TRAIN-LOGGER - INFO - Epoch 239 - TRAIN - Minibatch 0: weight_norm_model: 143.883087 loss: 0.040540 grad_norm_before_clip: 2.017598 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 06:19:53,847 - TRAIN-LOGGER - INFO - Epoch 239 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.883087 weight_norm_u: 25.218954 loss: 0.040540 grad_norm_before_clip: 2.017598 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 06:19:53,847 - TRAIN-LOGGER - INFO - Epoch 239 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.883087 weight_norm_u: 25.222990 loss: 0.024233 +RANK_0 - 2026-01-29 06:20:01,937 - TRAIN-LOGGER - INFO - Epoch 240 - TRAIN - Minibatch 0: weight_norm_model: 143.883087 loss: 0.028671 grad_norm_before_clip: 1.587774 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 06:20:03,350 - TRAIN-LOGGER - INFO - Epoch 240 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.883087 weight_norm_u: 25.218954 loss: 0.028671 grad_norm_before_clip: 1.587774 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 06:20:03,350 - TRAIN-LOGGER - INFO - Epoch 240 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.883087 weight_norm_u: 25.222990 loss: 0.022174 +RANK_0 - 2026-01-29 06:20:12,070 - TRAIN-LOGGER - INFO - Epoch 241 - TRAIN - Minibatch 0: weight_norm_model: 143.883087 loss: 0.027137 grad_norm_before_clip: 0.877698 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 06:20:13,492 - TRAIN-LOGGER - INFO - Epoch 241 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.883087 weight_norm_u: 25.218954 loss: 0.027137 grad_norm_before_clip: 0.877698 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 06:20:13,492 - TRAIN-LOGGER - INFO - Epoch 241 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.883072 weight_norm_u: 25.222990 loss: 0.021698 +RANK_0 - 2026-01-29 06:20:20,871 - TRAIN-LOGGER - INFO - Epoch 242 - TRAIN - Minibatch 0: weight_norm_model: 143.883072 loss: 0.035102 grad_norm_before_clip: 0.592797 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 06:20:22,335 - TRAIN-LOGGER - INFO - Epoch 242 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.883072 weight_norm_u: 25.218954 loss: 0.035102 grad_norm_before_clip: 0.592797 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 06:20:22,335 - TRAIN-LOGGER - INFO - Epoch 242 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.883072 weight_norm_u: 25.222990 loss: 0.023038 +RANK_0 - 2026-01-29 06:20:31,689 - TRAIN-LOGGER - INFO - Epoch 243 - TRAIN - Minibatch 0: weight_norm_model: 143.883072 loss: 0.028017 grad_norm_before_clip: 1.812115 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 06:20:33,194 - TRAIN-LOGGER - INFO - Epoch 243 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.883072 weight_norm_u: 25.218954 loss: 0.028017 grad_norm_before_clip: 1.812115 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 06:20:33,194 - TRAIN-LOGGER - INFO - Epoch 243 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.883057 weight_norm_u: 25.222990 loss: 0.023971 +RANK_0 - 2026-01-29 06:20:40,783 - TRAIN-LOGGER - INFO - Epoch 244 - TRAIN - Minibatch 0: weight_norm_model: 143.883057 loss: 0.026936 grad_norm_before_clip: 1.758460 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 06:20:42,154 - TRAIN-LOGGER - INFO - Epoch 244 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.883057 weight_norm_u: 25.218954 loss: 0.026936 grad_norm_before_clip: 1.758460 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 06:20:42,154 - TRAIN-LOGGER - INFO - Epoch 244 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.883072 weight_norm_u: 25.222990 loss: 0.023911 +RANK_0 - 2026-01-29 06:20:50,611 - TRAIN-LOGGER - INFO - Epoch 245 - TRAIN - Minibatch 0: weight_norm_model: 143.883072 loss: 0.036144 grad_norm_before_clip: 1.513840 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 06:20:52,134 - TRAIN-LOGGER - INFO - Epoch 245 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.883072 weight_norm_u: 25.218954 loss: 0.036144 grad_norm_before_clip: 1.513840 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 06:20:52,135 - TRAIN-LOGGER - INFO - Epoch 245 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.883102 weight_norm_u: 25.222990 loss: 0.023368 +RANK_0 - 2026-01-29 06:21:01,733 - TRAIN-LOGGER - INFO - Epoch 246 - TRAIN - Minibatch 0: weight_norm_model: 143.883102 loss: 0.044253 grad_norm_before_clip: 2.007157 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 06:21:03,350 - TRAIN-LOGGER - INFO - Epoch 246 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.883102 weight_norm_u: 25.218954 loss: 0.044253 grad_norm_before_clip: 2.007157 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 06:21:03,351 - TRAIN-LOGGER - INFO - Epoch 246 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.883133 weight_norm_u: 25.222990 loss: 0.022645 +RANK_0 - 2026-01-29 06:21:11,665 - TRAIN-LOGGER - INFO - Epoch 247 - TRAIN - Minibatch 0: weight_norm_model: 143.883133 loss: 0.026671 grad_norm_before_clip: 1.541921 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 06:21:13,357 - TRAIN-LOGGER - INFO - Epoch 247 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.883133 weight_norm_u: 25.218954 loss: 0.026671 grad_norm_before_clip: 1.541921 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 06:21:13,357 - TRAIN-LOGGER - INFO - Epoch 247 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.883179 weight_norm_u: 25.222990 loss: 0.022401 +RANK_0 - 2026-01-29 06:21:21,650 - TRAIN-LOGGER - INFO - Epoch 248 - TRAIN - Minibatch 0: weight_norm_model: 143.883179 loss: 0.024712 grad_norm_before_clip: 0.701388 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 06:21:23,246 - TRAIN-LOGGER - INFO - Epoch 248 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.883179 weight_norm_u: 25.218954 loss: 0.024712 grad_norm_before_clip: 0.701388 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 06:21:23,247 - TRAIN-LOGGER - INFO - Epoch 248 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.883194 weight_norm_u: 25.222990 loss: 0.022572 +RANK_0 - 2026-01-29 06:21:31,700 - TRAIN-LOGGER - INFO - Epoch 249 - TRAIN - Minibatch 0: weight_norm_model: 143.883194 loss: 0.025486 grad_norm_before_clip: 0.825228 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 06:21:33,374 - TRAIN-LOGGER - INFO - Epoch 249 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.883194 weight_norm_u: 25.218954 loss: 0.025486 grad_norm_before_clip: 0.825228 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 06:21:33,374 - TRAIN-LOGGER - INFO - Epoch 249 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.883224 weight_norm_u: 25.222990 loss: 0.022554 +RANK_0 - 2026-01-29 06:21:41,687 - TRAIN-LOGGER - INFO - Epoch 250 - TRAIN - Minibatch 0: weight_norm_model: 143.883224 loss: 0.036314 grad_norm_before_clip: 1.276713 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 06:21:43,138 - TRAIN-LOGGER - INFO - Epoch 250 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.883224 weight_norm_u: 25.218954 loss: 0.036314 grad_norm_before_clip: 1.276713 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 06:21:43,139 - TRAIN-LOGGER - INFO - Epoch 250 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.883240 weight_norm_u: 25.222990 loss: 0.022216 +RANK_0 - 2026-01-29 06:21:51,844 - TRAIN-LOGGER - INFO - Epoch 251 - TRAIN - Minibatch 0: weight_norm_model: 143.883240 loss: 0.028848 grad_norm_before_clip: 2.056568 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 06:21:53,135 - TRAIN-LOGGER - INFO - Epoch 251 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.883240 weight_norm_u: 25.218954 loss: 0.028848 grad_norm_before_clip: 2.056568 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 06:21:53,136 - TRAIN-LOGGER - INFO - Epoch 251 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.883224 weight_norm_u: 25.222990 loss: 0.021917 +RANK_0 - 2026-01-29 06:22:02,261 - TRAIN-LOGGER - INFO - Epoch 252 - TRAIN - Minibatch 0: weight_norm_model: 143.883224 loss: 0.034324 grad_norm_before_clip: 1.048041 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 06:22:03,617 - TRAIN-LOGGER - INFO - Epoch 252 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.883224 weight_norm_u: 25.218954 loss: 0.034324 grad_norm_before_clip: 1.048041 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 06:22:03,617 - TRAIN-LOGGER - INFO - Epoch 252 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.883224 weight_norm_u: 25.222990 loss: 0.022360 +RANK_0 - 2026-01-29 06:22:11,735 - TRAIN-LOGGER - INFO - Epoch 253 - TRAIN - Minibatch 0: weight_norm_model: 143.883224 loss: 0.033532 grad_norm_before_clip: 1.160440 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 06:22:13,482 - TRAIN-LOGGER - INFO - Epoch 253 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.883224 weight_norm_u: 25.218954 loss: 0.033532 grad_norm_before_clip: 1.160440 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 06:22:13,482 - TRAIN-LOGGER - INFO - Epoch 253 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.883224 weight_norm_u: 25.222990 loss: 0.022723 +RANK_0 - 2026-01-29 06:22:21,592 - TRAIN-LOGGER - INFO - Epoch 254 - TRAIN - Minibatch 0: weight_norm_model: 143.883224 loss: 0.037679 grad_norm_before_clip: 3.035667 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 06:22:23,516 - TRAIN-LOGGER - INFO - Epoch 254 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.883224 weight_norm_u: 25.218954 loss: 0.037679 grad_norm_before_clip: 3.035667 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 06:22:23,517 - TRAIN-LOGGER - INFO - Epoch 254 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.883224 weight_norm_u: 25.222990 loss: 0.022610 +RANK_0 - 2026-01-29 06:22:31,871 - TRAIN-LOGGER - INFO - Epoch 255 - TRAIN - Minibatch 0: weight_norm_model: 143.883224 loss: 0.027892 grad_norm_before_clip: 1.291915 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 06:22:33,655 - TRAIN-LOGGER - INFO - Epoch 255 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.883224 weight_norm_u: 25.218954 loss: 0.027892 grad_norm_before_clip: 1.291915 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 06:22:33,655 - TRAIN-LOGGER - INFO - Epoch 255 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.883240 weight_norm_u: 25.222990 loss: 0.021914 +RANK_0 - 2026-01-29 06:22:41,709 - TRAIN-LOGGER - INFO - Epoch 256 - TRAIN - Minibatch 0: weight_norm_model: 143.883240 loss: 0.030334 grad_norm_before_clip: 1.188066 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 06:22:43,448 - TRAIN-LOGGER - INFO - Epoch 256 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.883240 weight_norm_u: 25.218954 loss: 0.030334 grad_norm_before_clip: 1.188066 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 06:22:43,449 - TRAIN-LOGGER - INFO - Epoch 256 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.883255 weight_norm_u: 25.222990 loss: 0.021247 +RANK_0 - 2026-01-29 06:22:51,958 - TRAIN-LOGGER - INFO - Epoch 257 - TRAIN - Minibatch 0: weight_norm_model: 143.883255 loss: 0.027513 grad_norm_before_clip: 1.249340 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 06:22:53,429 - TRAIN-LOGGER - INFO - Epoch 257 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.883255 weight_norm_u: 25.218954 loss: 0.027513 grad_norm_before_clip: 1.249340 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 06:22:53,430 - TRAIN-LOGGER - INFO - Epoch 257 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.883301 weight_norm_u: 25.222990 loss: 0.020774 +RANK_0 - 2026-01-29 06:23:02,049 - TRAIN-LOGGER - INFO - Epoch 258 - TRAIN - Minibatch 0: weight_norm_model: 143.883301 loss: 0.031416 grad_norm_before_clip: 1.091362 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 06:23:03,311 - TRAIN-LOGGER - INFO - Epoch 258 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.883301 weight_norm_u: 25.218954 loss: 0.031416 grad_norm_before_clip: 1.091362 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 06:23:03,311 - TRAIN-LOGGER - INFO - Epoch 258 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.883316 weight_norm_u: 25.222990 loss: 0.020420 +RANK_0 - 2026-01-29 06:23:11,434 - TRAIN-LOGGER - INFO - Epoch 259 - TRAIN - Minibatch 0: weight_norm_model: 143.883316 loss: 0.029723 grad_norm_before_clip: 0.874723 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 06:23:13,125 - TRAIN-LOGGER - INFO - Epoch 259 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.883316 weight_norm_u: 25.218954 loss: 0.029723 grad_norm_before_clip: 0.874723 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 06:23:13,126 - TRAIN-LOGGER - INFO - Epoch 259 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.883347 weight_norm_u: 25.222990 loss: 0.019780 +RANK_0 - 2026-01-29 06:23:21,254 - TRAIN-LOGGER - INFO - Epoch 260 - TRAIN - Minibatch 0: weight_norm_model: 143.883347 loss: 0.027328 grad_norm_before_clip: 0.640642 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 06:23:22,681 - TRAIN-LOGGER - INFO - Epoch 260 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.883347 weight_norm_u: 25.218954 loss: 0.027328 grad_norm_before_clip: 0.640642 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 06:23:22,681 - TRAIN-LOGGER - INFO - Epoch 260 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.883377 weight_norm_u: 25.222990 loss: 0.019614 +RANK_0 - 2026-01-29 06:23:32,431 - TRAIN-LOGGER - INFO - Epoch 261 - TRAIN - Minibatch 0: weight_norm_model: 143.883377 loss: 0.029527 grad_norm_before_clip: 0.624046 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 06:23:33,650 - TRAIN-LOGGER - INFO - Epoch 261 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.883377 weight_norm_u: 25.218954 loss: 0.029527 grad_norm_before_clip: 0.624046 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 06:23:33,650 - TRAIN-LOGGER - INFO - Epoch 261 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.883392 weight_norm_u: 25.222990 loss: 0.020053 +RANK_0 - 2026-01-29 06:23:41,184 - TRAIN-LOGGER - INFO - Epoch 262 - TRAIN - Minibatch 0: weight_norm_model: 143.883392 loss: 0.028566 grad_norm_before_clip: 1.654964 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 06:23:42,497 - TRAIN-LOGGER - INFO - Epoch 262 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.883392 weight_norm_u: 25.218954 loss: 0.028566 grad_norm_before_clip: 1.654964 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 06:23:42,498 - TRAIN-LOGGER - INFO - Epoch 262 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.883423 weight_norm_u: 25.222990 loss: 0.020434 +RANK_0 - 2026-01-29 06:23:50,656 - TRAIN-LOGGER - INFO - Epoch 263 - TRAIN - Minibatch 0: weight_norm_model: 143.883423 loss: 0.024347 grad_norm_before_clip: 0.776359 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 06:23:52,130 - TRAIN-LOGGER - INFO - Epoch 263 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.883423 weight_norm_u: 25.218954 loss: 0.024347 grad_norm_before_clip: 0.776359 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 06:23:52,130 - TRAIN-LOGGER - INFO - Epoch 263 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.883423 weight_norm_u: 25.222990 loss: 0.020203 +RANK_0 - 2026-01-29 06:24:00,927 - TRAIN-LOGGER - INFO - Epoch 264 - TRAIN - Minibatch 0: weight_norm_model: 143.883423 loss: 0.034863 grad_norm_before_clip: 0.694872 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 06:24:02,298 - TRAIN-LOGGER - INFO - Epoch 264 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.883423 weight_norm_u: 25.218954 loss: 0.034863 grad_norm_before_clip: 0.694872 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 06:24:02,298 - TRAIN-LOGGER - INFO - Epoch 264 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.883438 weight_norm_u: 25.222990 loss: 0.019718 +RANK_0 - 2026-01-29 06:24:10,759 - TRAIN-LOGGER - INFO - Epoch 265 - TRAIN - Minibatch 0: weight_norm_model: 143.883438 loss: 0.024598 grad_norm_before_clip: 0.515095 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 06:24:12,178 - TRAIN-LOGGER - INFO - Epoch 265 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.883438 weight_norm_u: 25.218954 loss: 0.024598 grad_norm_before_clip: 0.515095 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 06:24:12,179 - TRAIN-LOGGER - INFO - Epoch 265 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.883453 weight_norm_u: 25.222990 loss: 0.019208 +RANK_0 - 2026-01-29 06:24:20,756 - TRAIN-LOGGER - INFO - Epoch 266 - TRAIN - Minibatch 0: weight_norm_model: 143.883453 loss: 0.031095 grad_norm_before_clip: 0.947601 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 06:24:22,225 - TRAIN-LOGGER - INFO - Epoch 266 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.883453 weight_norm_u: 25.218954 loss: 0.031095 grad_norm_before_clip: 0.947601 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 06:24:22,226 - TRAIN-LOGGER - INFO - Epoch 266 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.883469 weight_norm_u: 25.222990 loss: 0.019099 +RANK_0 - 2026-01-29 06:24:31,150 - TRAIN-LOGGER - INFO - Epoch 267 - TRAIN - Minibatch 0: weight_norm_model: 143.883469 loss: 0.023446 grad_norm_before_clip: 0.788825 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 06:24:32,662 - TRAIN-LOGGER - INFO - Epoch 267 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.883469 weight_norm_u: 25.218954 loss: 0.023446 grad_norm_before_clip: 0.788825 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 06:24:32,662 - TRAIN-LOGGER - INFO - Epoch 267 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.883484 weight_norm_u: 25.222990 loss: 0.019326 +RANK_0 - 2026-01-29 06:24:41,094 - TRAIN-LOGGER - INFO - Epoch 268 - TRAIN - Minibatch 0: weight_norm_model: 143.883484 loss: 0.026574 grad_norm_before_clip: 1.100778 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 06:24:42,573 - TRAIN-LOGGER - INFO - Epoch 268 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.883484 weight_norm_u: 25.218954 loss: 0.026574 grad_norm_before_clip: 1.100778 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 06:24:42,574 - TRAIN-LOGGER - INFO - Epoch 268 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.883514 weight_norm_u: 25.222990 loss: 0.019366 +RANK_0 - 2026-01-29 06:24:50,604 - TRAIN-LOGGER - INFO - Epoch 269 - TRAIN - Minibatch 0: weight_norm_model: 143.883514 loss: 0.030343 grad_norm_before_clip: 0.899641 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 06:24:52,291 - TRAIN-LOGGER - INFO - Epoch 269 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.883514 weight_norm_u: 25.218954 loss: 0.030343 grad_norm_before_clip: 0.899641 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 06:24:52,291 - TRAIN-LOGGER - INFO - Epoch 269 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.883514 weight_norm_u: 25.222990 loss: 0.019051 +RANK_0 - 2026-01-29 06:25:01,508 - TRAIN-LOGGER - INFO - Epoch 270 - TRAIN - Minibatch 0: weight_norm_model: 143.883514 loss: 0.033626 grad_norm_before_clip: 1.179606 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 06:25:03,061 - TRAIN-LOGGER - INFO - Epoch 270 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.883514 weight_norm_u: 25.218954 loss: 0.033626 grad_norm_before_clip: 1.179606 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 06:25:03,061 - TRAIN-LOGGER - INFO - Epoch 270 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.883545 weight_norm_u: 25.222990 loss: 0.019325 +RANK_0 - 2026-01-29 06:25:11,783 - TRAIN-LOGGER - INFO - Epoch 271 - TRAIN - Minibatch 0: weight_norm_model: 143.883545 loss: 0.028269 grad_norm_before_clip: 0.638643 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 06:25:13,476 - TRAIN-LOGGER - INFO - Epoch 271 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.883545 weight_norm_u: 25.218954 loss: 0.028269 grad_norm_before_clip: 0.638643 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 06:25:13,476 - TRAIN-LOGGER - INFO - Epoch 271 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.883545 weight_norm_u: 25.222990 loss: 0.020009 +RANK_0 - 2026-01-29 06:25:22,093 - TRAIN-LOGGER - INFO - Epoch 272 - TRAIN - Minibatch 0: weight_norm_model: 143.883545 loss: 0.026563 grad_norm_before_clip: 0.837013 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 06:25:23,738 - TRAIN-LOGGER - INFO - Epoch 272 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.883545 weight_norm_u: 25.218954 loss: 0.026563 grad_norm_before_clip: 0.837013 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 06:25:23,739 - TRAIN-LOGGER - INFO - Epoch 272 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.883575 weight_norm_u: 25.222990 loss: 0.020456 +RANK_0 - 2026-01-29 06:25:34,036 - TRAIN-LOGGER - INFO - Epoch 273 - TRAIN - Minibatch 0: weight_norm_model: 143.883575 loss: 0.030914 grad_norm_before_clip: 1.377878 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 06:25:35,433 - TRAIN-LOGGER - INFO - Epoch 273 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.883575 weight_norm_u: 25.218954 loss: 0.030914 grad_norm_before_clip: 1.377878 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 06:25:35,433 - TRAIN-LOGGER - INFO - Epoch 273 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.883606 weight_norm_u: 25.222990 loss: 0.020093 +RANK_0 - 2026-01-29 06:25:43,342 - TRAIN-LOGGER - INFO - Epoch 274 - TRAIN - Minibatch 0: weight_norm_model: 143.883606 loss: 0.027715 grad_norm_before_clip: 1.345277 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 06:25:44,948 - TRAIN-LOGGER - INFO - Epoch 274 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.883606 weight_norm_u: 25.218954 loss: 0.027715 grad_norm_before_clip: 1.345277 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 06:25:44,948 - TRAIN-LOGGER - INFO - Epoch 274 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.883652 weight_norm_u: 25.222990 loss: 0.019280 +RANK_0 - 2026-01-29 06:25:52,497 - TRAIN-LOGGER - INFO - Epoch 275 - TRAIN - Minibatch 0: weight_norm_model: 143.883652 loss: 0.027555 grad_norm_before_clip: 1.389945 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 06:25:53,788 - TRAIN-LOGGER - INFO - Epoch 275 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.883652 weight_norm_u: 25.218954 loss: 0.027555 grad_norm_before_clip: 1.389945 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 06:25:53,789 - TRAIN-LOGGER - INFO - Epoch 275 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.883682 weight_norm_u: 25.222990 loss: 0.018734 +RANK_0 - 2026-01-29 06:26:01,937 - TRAIN-LOGGER - INFO - Epoch 276 - TRAIN - Minibatch 0: weight_norm_model: 143.883682 loss: 0.027915 grad_norm_before_clip: 1.152060 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 06:26:03,203 - TRAIN-LOGGER - INFO - Epoch 276 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.883682 weight_norm_u: 25.218954 loss: 0.027915 grad_norm_before_clip: 1.152060 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 06:26:03,203 - TRAIN-LOGGER - INFO - Epoch 276 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.883728 weight_norm_u: 25.222990 loss: 0.018388 +RANK_0 - 2026-01-29 06:26:11,747 - TRAIN-LOGGER - INFO - Epoch 277 - TRAIN - Minibatch 0: weight_norm_model: 143.883728 loss: 0.035164 grad_norm_before_clip: 1.329578 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 06:26:13,265 - TRAIN-LOGGER - INFO - Epoch 277 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.883728 weight_norm_u: 25.218954 loss: 0.035164 grad_norm_before_clip: 1.329578 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 06:26:13,266 - TRAIN-LOGGER - INFO - Epoch 277 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.883759 weight_norm_u: 25.222990 loss: 0.017831 +RANK_0 - 2026-01-29 06:26:21,871 - TRAIN-LOGGER - INFO - Epoch 278 - TRAIN - Minibatch 0: weight_norm_model: 143.883759 loss: 0.021576 grad_norm_before_clip: 0.723528 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 06:26:23,730 - TRAIN-LOGGER - INFO - Epoch 278 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.883759 weight_norm_u: 25.218954 loss: 0.021576 grad_norm_before_clip: 0.723528 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 06:26:23,731 - TRAIN-LOGGER - INFO - Epoch 278 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.883789 weight_norm_u: 25.222990 loss: 0.018213 +RANK_0 - 2026-01-29 06:26:32,480 - TRAIN-LOGGER - INFO - Epoch 279 - TRAIN - Minibatch 0: weight_norm_model: 143.883789 loss: 0.022919 grad_norm_before_clip: 1.743294 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 06:26:34,095 - TRAIN-LOGGER - INFO - Epoch 279 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.883789 weight_norm_u: 25.218954 loss: 0.022919 grad_norm_before_clip: 1.743294 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 06:26:34,095 - TRAIN-LOGGER - INFO - Epoch 279 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.883820 weight_norm_u: 25.222990 loss: 0.018175 +RANK_0 - 2026-01-29 06:26:41,503 - TRAIN-LOGGER - INFO - Epoch 280 - TRAIN - Minibatch 0: weight_norm_model: 143.883820 loss: 0.025009 grad_norm_before_clip: 1.264281 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 06:26:42,782 - TRAIN-LOGGER - INFO - Epoch 280 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.883820 weight_norm_u: 25.218954 loss: 0.025009 grad_norm_before_clip: 1.264281 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 06:26:42,783 - TRAIN-LOGGER - INFO - Epoch 280 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.883835 weight_norm_u: 25.222990 loss: 0.017891 +RANK_0 - 2026-01-29 06:26:49,937 - TRAIN-LOGGER - INFO - Epoch 281 - TRAIN - Minibatch 0: weight_norm_model: 143.883835 loss: 0.025350 grad_norm_before_clip: 1.467865 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 06:26:51,536 - TRAIN-LOGGER - INFO - Epoch 281 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.883835 weight_norm_u: 25.218954 loss: 0.025350 grad_norm_before_clip: 1.467865 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 06:26:51,537 - TRAIN-LOGGER - INFO - Epoch 281 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.883850 weight_norm_u: 25.222990 loss: 0.017466 +RANK_0 - 2026-01-29 06:27:00,483 - TRAIN-LOGGER - INFO - Epoch 282 - TRAIN - Minibatch 0: weight_norm_model: 143.883850 loss: 0.022037 grad_norm_before_clip: 0.807202 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 06:27:01,786 - TRAIN-LOGGER - INFO - Epoch 282 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.883850 weight_norm_u: 25.218954 loss: 0.022037 grad_norm_before_clip: 0.807202 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 06:27:01,787 - TRAIN-LOGGER - INFO - Epoch 282 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.883865 weight_norm_u: 25.222990 loss: 0.017094 +RANK_0 - 2026-01-29 06:27:09,741 - TRAIN-LOGGER - INFO - Epoch 283 - TRAIN - Minibatch 0: weight_norm_model: 143.883865 loss: 0.023359 grad_norm_before_clip: 1.082619 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 06:27:11,025 - TRAIN-LOGGER - INFO - Epoch 283 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.883865 weight_norm_u: 25.218954 loss: 0.023359 grad_norm_before_clip: 1.082619 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 06:27:11,025 - TRAIN-LOGGER - INFO - Epoch 283 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.883896 weight_norm_u: 25.222990 loss: 0.016808 +RANK_0 - 2026-01-29 06:27:19,826 - TRAIN-LOGGER - INFO - Epoch 284 - TRAIN - Minibatch 0: weight_norm_model: 143.883896 loss: 0.022180 grad_norm_before_clip: 1.098451 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 06:27:21,458 - TRAIN-LOGGER - INFO - Epoch 284 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.883896 weight_norm_u: 25.218954 loss: 0.022180 grad_norm_before_clip: 1.098451 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 06:27:21,458 - TRAIN-LOGGER - INFO - Epoch 284 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.883911 weight_norm_u: 25.222990 loss: 0.016927 +RANK_0 - 2026-01-29 06:27:31,581 - TRAIN-LOGGER - INFO - Epoch 285 - TRAIN - Minibatch 0: weight_norm_model: 143.883911 loss: 0.020894 grad_norm_before_clip: 1.427075 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 06:27:33,034 - TRAIN-LOGGER - INFO - Epoch 285 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.883911 weight_norm_u: 25.218954 loss: 0.020894 grad_norm_before_clip: 1.427075 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 06:27:33,035 - TRAIN-LOGGER - INFO - Epoch 285 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.883926 weight_norm_u: 25.222990 loss: 0.016744 +RANK_0 - 2026-01-29 06:27:41,414 - TRAIN-LOGGER - INFO - Epoch 286 - TRAIN - Minibatch 0: weight_norm_model: 143.883926 loss: 0.026651 grad_norm_before_clip: 1.512306 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 06:27:42,884 - TRAIN-LOGGER - INFO - Epoch 286 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.883926 weight_norm_u: 25.218954 loss: 0.026651 grad_norm_before_clip: 1.512306 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 06:27:42,884 - TRAIN-LOGGER - INFO - Epoch 286 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.883942 weight_norm_u: 25.222990 loss: 0.016421 +RANK_0 - 2026-01-29 06:27:51,247 - TRAIN-LOGGER - INFO - Epoch 287 - TRAIN - Minibatch 0: weight_norm_model: 143.883942 loss: 0.026629 grad_norm_before_clip: 0.778149 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 06:27:52,535 - TRAIN-LOGGER - INFO - Epoch 287 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.883942 weight_norm_u: 25.218954 loss: 0.026629 grad_norm_before_clip: 0.778149 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 06:27:52,535 - TRAIN-LOGGER - INFO - Epoch 287 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.883972 weight_norm_u: 25.222990 loss: 0.016146 +RANK_0 - 2026-01-29 06:28:01,662 - TRAIN-LOGGER - INFO - Epoch 288 - TRAIN - Minibatch 0: weight_norm_model: 143.883972 loss: 0.026047 grad_norm_before_clip: 1.049872 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 06:28:02,900 - TRAIN-LOGGER - INFO - Epoch 288 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.883972 weight_norm_u: 25.218954 loss: 0.026047 grad_norm_before_clip: 1.049872 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 06:28:02,900 - TRAIN-LOGGER - INFO - Epoch 288 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.883987 weight_norm_u: 25.222990 loss: 0.016122 +RANK_0 - 2026-01-29 06:28:10,799 - TRAIN-LOGGER - INFO - Epoch 289 - TRAIN - Minibatch 0: weight_norm_model: 143.883987 loss: 0.025044 grad_norm_before_clip: 0.771801 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 06:28:12,218 - TRAIN-LOGGER - INFO - Epoch 289 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.883987 weight_norm_u: 25.218954 loss: 0.025044 grad_norm_before_clip: 0.771801 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 06:28:12,219 - TRAIN-LOGGER - INFO - Epoch 289 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.884033 weight_norm_u: 25.222990 loss: 0.016202 +RANK_0 - 2026-01-29 06:28:20,567 - TRAIN-LOGGER - INFO - Epoch 290 - TRAIN - Minibatch 0: weight_norm_model: 143.884033 loss: 0.026453 grad_norm_before_clip: 1.359103 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 06:28:21,964 - TRAIN-LOGGER - INFO - Epoch 290 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.884033 weight_norm_u: 25.218954 loss: 0.026453 grad_norm_before_clip: 1.359103 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 06:28:21,964 - TRAIN-LOGGER - INFO - Epoch 290 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.884064 weight_norm_u: 25.222990 loss: 0.016130 +RANK_0 - 2026-01-29 06:28:30,719 - TRAIN-LOGGER - INFO - Epoch 291 - TRAIN - Minibatch 0: weight_norm_model: 143.884064 loss: 0.024294 grad_norm_before_clip: 0.879554 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 06:28:32,306 - TRAIN-LOGGER - INFO - Epoch 291 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.884064 weight_norm_u: 25.218954 loss: 0.024294 grad_norm_before_clip: 0.879554 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 06:28:32,306 - TRAIN-LOGGER - INFO - Epoch 291 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.884109 weight_norm_u: 25.222990 loss: 0.016068 +RANK_0 - 2026-01-29 06:28:40,036 - TRAIN-LOGGER - INFO - Epoch 292 - TRAIN - Minibatch 0: weight_norm_model: 143.884109 loss: 0.023707 grad_norm_before_clip: 0.974670 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 06:28:41,570 - TRAIN-LOGGER - INFO - Epoch 292 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.884109 weight_norm_u: 25.218954 loss: 0.023707 grad_norm_before_clip: 0.974670 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 06:28:41,570 - TRAIN-LOGGER - INFO - Epoch 292 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.884140 weight_norm_u: 25.222990 loss: 0.015886 +RANK_0 - 2026-01-29 06:28:49,594 - TRAIN-LOGGER - INFO - Epoch 293 - TRAIN - Minibatch 0: weight_norm_model: 143.884140 loss: 0.026014 grad_norm_before_clip: 1.092059 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 06:28:51,027 - TRAIN-LOGGER - INFO - Epoch 293 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.884140 weight_norm_u: 25.218954 loss: 0.026014 grad_norm_before_clip: 1.092059 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 06:28:51,027 - TRAIN-LOGGER - INFO - Epoch 293 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.884155 weight_norm_u: 25.222990 loss: 0.016015 +RANK_0 - 2026-01-29 06:28:58,934 - TRAIN-LOGGER - INFO - Epoch 294 - TRAIN - Minibatch 0: weight_norm_model: 143.884155 loss: 0.017418 grad_norm_before_clip: 0.571003 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 06:29:00,436 - TRAIN-LOGGER - INFO - Epoch 294 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.884155 weight_norm_u: 25.218954 loss: 0.017418 grad_norm_before_clip: 0.571003 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 06:29:00,436 - TRAIN-LOGGER - INFO - Epoch 294 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.884155 weight_norm_u: 25.222990 loss: 0.016573 +RANK_0 - 2026-01-29 06:29:08,103 - TRAIN-LOGGER - INFO - Epoch 295 - TRAIN - Minibatch 0: weight_norm_model: 143.884155 loss: 0.028268 grad_norm_before_clip: 1.912754 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 06:29:09,893 - TRAIN-LOGGER - INFO - Epoch 295 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.884155 weight_norm_u: 25.218954 loss: 0.028268 grad_norm_before_clip: 1.912754 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 06:29:09,893 - TRAIN-LOGGER - INFO - Epoch 295 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.884171 weight_norm_u: 25.222990 loss: 0.016493 +RANK_0 - 2026-01-29 06:29:18,405 - TRAIN-LOGGER - INFO - Epoch 296 - TRAIN - Minibatch 0: weight_norm_model: 143.884171 loss: 0.026732 grad_norm_before_clip: 0.933277 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 06:29:19,864 - TRAIN-LOGGER - INFO - Epoch 296 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.884171 weight_norm_u: 25.218954 loss: 0.026732 grad_norm_before_clip: 0.933277 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 06:29:19,864 - TRAIN-LOGGER - INFO - Epoch 296 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.884201 weight_norm_u: 25.222990 loss: 0.015847 +RANK_0 - 2026-01-29 06:29:30,091 - TRAIN-LOGGER - INFO - Epoch 297 - TRAIN - Minibatch 0: weight_norm_model: 143.884201 loss: 0.020771 grad_norm_before_clip: 0.602456 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 06:29:31,565 - TRAIN-LOGGER - INFO - Epoch 297 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.884201 weight_norm_u: 25.218954 loss: 0.020771 grad_norm_before_clip: 0.602456 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 06:29:31,565 - TRAIN-LOGGER - INFO - Epoch 297 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.884232 weight_norm_u: 25.222990 loss: 0.015583 +RANK_0 - 2026-01-29 06:29:39,597 - TRAIN-LOGGER - INFO - Epoch 298 - TRAIN - Minibatch 0: weight_norm_model: 143.884232 loss: 0.020500 grad_norm_before_clip: 0.911745 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 06:29:41,128 - TRAIN-LOGGER - INFO - Epoch 298 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.884232 weight_norm_u: 25.218954 loss: 0.020500 grad_norm_before_clip: 0.911745 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 06:29:41,128 - TRAIN-LOGGER - INFO - Epoch 298 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.884262 weight_norm_u: 25.222990 loss: 0.015535 +RANK_0 - 2026-01-29 06:29:49,020 - TRAIN-LOGGER - INFO - Epoch 299 - TRAIN - Minibatch 0: weight_norm_model: 143.884262 loss: 0.023089 grad_norm_before_clip: 1.338794 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 06:29:50,707 - TRAIN-LOGGER - INFO - Epoch 299 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.884262 weight_norm_u: 25.218954 loss: 0.023089 grad_norm_before_clip: 1.338794 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 06:29:50,707 - TRAIN-LOGGER - INFO - Epoch 299 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.884293 weight_norm_u: 25.222990 loss: 0.015521 +RANK_0 - 2026-01-29 06:29:59,867 - TRAIN-LOGGER - INFO - Epoch 300 - TRAIN - Minibatch 0: weight_norm_model: 143.884293 loss: 0.021760 grad_norm_before_clip: 1.330818 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 06:30:01,558 - TRAIN-LOGGER - INFO - Epoch 300 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.884293 weight_norm_u: 25.218954 loss: 0.021760 grad_norm_before_clip: 1.330818 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 06:30:01,558 - TRAIN-LOGGER - INFO - Epoch 300 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.884338 weight_norm_u: 25.222990 loss: 0.015097 +RANK_0 - 2026-01-29 06:30:08,991 - TRAIN-LOGGER - INFO - Epoch 301 - TRAIN - Minibatch 0: weight_norm_model: 143.884338 loss: 0.025072 grad_norm_before_clip: 0.665851 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 06:30:10,695 - TRAIN-LOGGER - INFO - Epoch 301 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.884338 weight_norm_u: 25.218954 loss: 0.025072 grad_norm_before_clip: 0.665851 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 06:30:10,695 - TRAIN-LOGGER - INFO - Epoch 301 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.884384 weight_norm_u: 25.222990 loss: 0.014882 +RANK_0 - 2026-01-29 06:30:19,225 - TRAIN-LOGGER - INFO - Epoch 302 - TRAIN - Minibatch 0: weight_norm_model: 143.884384 loss: 0.020309 grad_norm_before_clip: 0.423546 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 06:30:20,773 - TRAIN-LOGGER - INFO - Epoch 302 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.884384 weight_norm_u: 25.218954 loss: 0.020309 grad_norm_before_clip: 0.423546 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 06:30:20,774 - TRAIN-LOGGER - INFO - Epoch 302 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.884415 weight_norm_u: 25.222990 loss: 0.015034 +RANK_0 - 2026-01-29 06:30:29,104 - TRAIN-LOGGER - INFO - Epoch 303 - TRAIN - Minibatch 0: weight_norm_model: 143.884415 loss: 0.023755 grad_norm_before_clip: 1.135013 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 06:30:30,414 - TRAIN-LOGGER - INFO - Epoch 303 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.884415 weight_norm_u: 25.218954 loss: 0.023755 grad_norm_before_clip: 1.135013 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 06:30:30,415 - TRAIN-LOGGER - INFO - Epoch 303 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.884445 weight_norm_u: 25.222990 loss: 0.015743 +RANK_0 - 2026-01-29 06:30:39,044 - TRAIN-LOGGER - INFO - Epoch 304 - TRAIN - Minibatch 0: weight_norm_model: 143.884445 loss: 0.024024 grad_norm_before_clip: 0.968311 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 06:30:40,263 - TRAIN-LOGGER - INFO - Epoch 304 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.884445 weight_norm_u: 25.218954 loss: 0.024024 grad_norm_before_clip: 0.968311 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 06:30:40,263 - TRAIN-LOGGER - INFO - Epoch 304 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.884476 weight_norm_u: 25.222990 loss: 0.015047 +RANK_0 - 2026-01-29 06:30:49,169 - TRAIN-LOGGER - INFO - Epoch 305 - TRAIN - Minibatch 0: weight_norm_model: 143.884476 loss: 0.025267 grad_norm_before_clip: 1.218353 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 06:30:50,928 - TRAIN-LOGGER - INFO - Epoch 305 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.884476 weight_norm_u: 25.218954 loss: 0.025267 grad_norm_before_clip: 1.218353 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 06:30:50,928 - TRAIN-LOGGER - INFO - Epoch 305 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.884491 weight_norm_u: 25.222990 loss: 0.014189 +RANK_0 - 2026-01-29 06:31:00,027 - TRAIN-LOGGER - INFO - Epoch 306 - TRAIN - Minibatch 0: weight_norm_model: 143.884491 loss: 0.024403 grad_norm_before_clip: 1.086208 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 06:31:01,410 - TRAIN-LOGGER - INFO - Epoch 306 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.884491 weight_norm_u: 25.218954 loss: 0.024403 grad_norm_before_clip: 1.086208 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 06:31:01,411 - TRAIN-LOGGER - INFO - Epoch 306 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.884521 weight_norm_u: 25.222990 loss: 0.014081 +RANK_0 - 2026-01-29 06:31:09,898 - TRAIN-LOGGER - INFO - Epoch 307 - TRAIN - Minibatch 0: weight_norm_model: 143.884521 loss: 0.021666 grad_norm_before_clip: 1.180670 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 06:31:11,443 - TRAIN-LOGGER - INFO - Epoch 307 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.884521 weight_norm_u: 25.218954 loss: 0.021666 grad_norm_before_clip: 1.180670 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 06:31:11,443 - TRAIN-LOGGER - INFO - Epoch 307 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.884537 weight_norm_u: 25.222990 loss: 0.014948 +RANK_0 - 2026-01-29 06:31:20,680 - TRAIN-LOGGER - INFO - Epoch 308 - TRAIN - Minibatch 0: weight_norm_model: 143.884537 loss: 0.026562 grad_norm_before_clip: 1.579873 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 06:31:22,577 - TRAIN-LOGGER - INFO - Epoch 308 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.884537 weight_norm_u: 25.218954 loss: 0.026562 grad_norm_before_clip: 1.579873 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 06:31:22,577 - TRAIN-LOGGER - INFO - Epoch 308 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.884583 weight_norm_u: 25.222990 loss: 0.015101 +RANK_0 - 2026-01-29 06:31:31,423 - TRAIN-LOGGER - INFO - Epoch 309 - TRAIN - Minibatch 0: weight_norm_model: 143.884583 loss: 0.020356 grad_norm_before_clip: 2.255831 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 06:31:33,122 - TRAIN-LOGGER - INFO - Epoch 309 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.884583 weight_norm_u: 25.218954 loss: 0.020356 grad_norm_before_clip: 2.255831 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 06:31:33,122 - TRAIN-LOGGER - INFO - Epoch 309 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.884628 weight_norm_u: 25.222990 loss: 0.014010 +RANK_0 - 2026-01-29 06:31:40,439 - TRAIN-LOGGER - INFO - Epoch 310 - TRAIN - Minibatch 0: weight_norm_model: 143.884628 loss: 0.025964 grad_norm_before_clip: 1.907614 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 06:31:42,015 - TRAIN-LOGGER - INFO - Epoch 310 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.884628 weight_norm_u: 25.218954 loss: 0.025964 grad_norm_before_clip: 1.907614 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 06:31:42,016 - TRAIN-LOGGER - INFO - Epoch 310 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.884659 weight_norm_u: 25.222990 loss: 0.013551 +RANK_0 - 2026-01-29 06:31:50,609 - TRAIN-LOGGER - INFO - Epoch 311 - TRAIN - Minibatch 0: weight_norm_model: 143.884659 loss: 0.022060 grad_norm_before_clip: 1.519666 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 06:31:52,274 - TRAIN-LOGGER - INFO - Epoch 311 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.884659 weight_norm_u: 25.218954 loss: 0.022060 grad_norm_before_clip: 1.519666 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 06:31:52,274 - TRAIN-LOGGER - INFO - Epoch 311 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.884705 weight_norm_u: 25.222990 loss: 0.014159 +RANK_0 - 2026-01-29 06:32:00,556 - TRAIN-LOGGER - INFO - Epoch 312 - TRAIN - Minibatch 0: weight_norm_model: 143.884705 loss: 0.024130 grad_norm_before_clip: 1.414353 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 06:32:02,080 - TRAIN-LOGGER - INFO - Epoch 312 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.884705 weight_norm_u: 25.218954 loss: 0.024130 grad_norm_before_clip: 1.414353 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 06:32:02,080 - TRAIN-LOGGER - INFO - Epoch 312 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.884735 weight_norm_u: 25.222990 loss: 0.014654 +RANK_0 - 2026-01-29 06:32:10,697 - TRAIN-LOGGER - INFO - Epoch 313 - TRAIN - Minibatch 0: weight_norm_model: 143.884735 loss: 0.020286 grad_norm_before_clip: 1.019638 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 06:32:12,213 - TRAIN-LOGGER - INFO - Epoch 313 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.884735 weight_norm_u: 25.218954 loss: 0.020286 grad_norm_before_clip: 1.019638 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 06:32:12,213 - TRAIN-LOGGER - INFO - Epoch 313 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.884766 weight_norm_u: 25.222990 loss: 0.015513 +RANK_0 - 2026-01-29 06:32:20,710 - TRAIN-LOGGER - INFO - Epoch 314 - TRAIN - Minibatch 0: weight_norm_model: 143.884766 loss: 0.023776 grad_norm_before_clip: 1.065922 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 06:32:22,440 - TRAIN-LOGGER - INFO - Epoch 314 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.884766 weight_norm_u: 25.218954 loss: 0.023776 grad_norm_before_clip: 1.065922 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 06:32:22,440 - TRAIN-LOGGER - INFO - Epoch 314 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.884796 weight_norm_u: 25.222990 loss: 0.014865 +RANK_0 - 2026-01-29 06:32:31,347 - TRAIN-LOGGER - INFO - Epoch 315 - TRAIN - Minibatch 0: weight_norm_model: 143.884796 loss: 0.024016 grad_norm_before_clip: 1.299114 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 06:32:32,735 - TRAIN-LOGGER - INFO - Epoch 315 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.884796 weight_norm_u: 25.218954 loss: 0.024016 grad_norm_before_clip: 1.299114 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 06:32:32,736 - TRAIN-LOGGER - INFO - Epoch 315 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.884811 weight_norm_u: 25.222990 loss: 0.013744 +RANK_0 - 2026-01-29 06:32:40,907 - TRAIN-LOGGER - INFO - Epoch 316 - TRAIN - Minibatch 0: weight_norm_model: 143.884811 loss: 0.017634 grad_norm_before_clip: 1.018610 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 06:32:42,480 - TRAIN-LOGGER - INFO - Epoch 316 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.884811 weight_norm_u: 25.218954 loss: 0.017634 grad_norm_before_clip: 1.018610 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 06:32:42,481 - TRAIN-LOGGER - INFO - Epoch 316 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.884827 weight_norm_u: 25.222990 loss: 0.014230 +RANK_0 - 2026-01-29 06:32:50,634 - TRAIN-LOGGER - INFO - Epoch 317 - TRAIN - Minibatch 0: weight_norm_model: 143.884827 loss: 0.025935 grad_norm_before_clip: 0.702949 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 06:32:52,226 - TRAIN-LOGGER - INFO - Epoch 317 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.884827 weight_norm_u: 25.218954 loss: 0.025935 grad_norm_before_clip: 0.702949 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 06:32:52,226 - TRAIN-LOGGER - INFO - Epoch 317 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.884842 weight_norm_u: 25.222990 loss: 0.015881 +RANK_0 - 2026-01-29 06:33:01,400 - TRAIN-LOGGER - INFO - Epoch 318 - TRAIN - Minibatch 0: weight_norm_model: 143.884842 loss: 0.021242 grad_norm_before_clip: 1.950198 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 06:33:02,987 - TRAIN-LOGGER - INFO - Epoch 318 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.884842 weight_norm_u: 25.218954 loss: 0.021242 grad_norm_before_clip: 1.950198 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 06:33:02,988 - TRAIN-LOGGER - INFO - Epoch 318 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.884857 weight_norm_u: 25.222990 loss: 0.017189 +RANK_0 - 2026-01-29 06:33:10,383 - TRAIN-LOGGER - INFO - Epoch 319 - TRAIN - Minibatch 0: weight_norm_model: 143.884857 loss: 0.024124 grad_norm_before_clip: 1.655797 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 06:33:11,813 - TRAIN-LOGGER - INFO - Epoch 319 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.884857 weight_norm_u: 25.218954 loss: 0.024124 grad_norm_before_clip: 1.655797 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 06:33:11,814 - TRAIN-LOGGER - INFO - Epoch 319 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.884888 weight_norm_u: 25.222990 loss: 0.016806 +RANK_0 - 2026-01-29 06:33:20,299 - TRAIN-LOGGER - INFO - Epoch 320 - TRAIN - Minibatch 0: weight_norm_model: 143.884888 loss: 0.023414 grad_norm_before_clip: 1.871309 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 06:33:21,851 - TRAIN-LOGGER - INFO - Epoch 320 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.884888 weight_norm_u: 25.218954 loss: 0.023414 grad_norm_before_clip: 1.871309 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 06:33:21,852 - TRAIN-LOGGER - INFO - Epoch 320 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.884903 weight_norm_u: 25.222990 loss: 0.015084 +RANK_0 - 2026-01-29 06:33:31,709 - TRAIN-LOGGER - INFO - Epoch 321 - TRAIN - Minibatch 0: weight_norm_model: 143.884903 loss: 0.021509 grad_norm_before_clip: 0.914526 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 06:33:33,522 - TRAIN-LOGGER - INFO - Epoch 321 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.884903 weight_norm_u: 25.218954 loss: 0.021509 grad_norm_before_clip: 0.914526 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 06:33:33,523 - TRAIN-LOGGER - INFO - Epoch 321 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.884933 weight_norm_u: 25.222990 loss: 0.013999 +RANK_0 - 2026-01-29 06:33:42,258 - TRAIN-LOGGER - INFO - Epoch 322 - TRAIN - Minibatch 0: weight_norm_model: 143.884933 loss: 0.021558 grad_norm_before_clip: 0.849473 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 06:33:44,004 - TRAIN-LOGGER - INFO - Epoch 322 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.884933 weight_norm_u: 25.218954 loss: 0.021558 grad_norm_before_clip: 0.849473 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 06:33:44,005 - TRAIN-LOGGER - INFO - Epoch 322 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.884979 weight_norm_u: 25.222990 loss: 0.013910 +RANK_0 - 2026-01-29 06:33:51,756 - TRAIN-LOGGER - INFO - Epoch 323 - TRAIN - Minibatch 0: weight_norm_model: 143.884979 loss: 0.022326 grad_norm_before_clip: 1.881486 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 06:33:52,992 - TRAIN-LOGGER - INFO - Epoch 323 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.884979 weight_norm_u: 25.218954 loss: 0.022326 grad_norm_before_clip: 1.881486 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 06:33:52,992 - TRAIN-LOGGER - INFO - Epoch 323 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.885010 weight_norm_u: 25.222990 loss: 0.014014 +RANK_0 - 2026-01-29 06:34:00,793 - TRAIN-LOGGER - INFO - Epoch 324 - TRAIN - Minibatch 0: weight_norm_model: 143.885010 loss: 0.022159 grad_norm_before_clip: 0.858784 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 06:34:02,219 - TRAIN-LOGGER - INFO - Epoch 324 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.885010 weight_norm_u: 25.218954 loss: 0.022159 grad_norm_before_clip: 0.858784 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 06:34:02,220 - TRAIN-LOGGER - INFO - Epoch 324 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.885056 weight_norm_u: 25.222990 loss: 0.013892 +RANK_0 - 2026-01-29 06:34:11,019 - TRAIN-LOGGER - INFO - Epoch 325 - TRAIN - Minibatch 0: weight_norm_model: 143.885056 loss: 0.024098 grad_norm_before_clip: 2.325926 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 06:34:12,293 - TRAIN-LOGGER - INFO - Epoch 325 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.885056 weight_norm_u: 25.218954 loss: 0.024098 grad_norm_before_clip: 2.325926 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 06:34:12,294 - TRAIN-LOGGER - INFO - Epoch 325 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.885086 weight_norm_u: 25.222990 loss: 0.013417 +RANK_0 - 2026-01-29 06:34:20,944 - TRAIN-LOGGER - INFO - Epoch 326 - TRAIN - Minibatch 0: weight_norm_model: 143.885086 loss: 0.020158 grad_norm_before_clip: 0.963795 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 06:34:22,613 - TRAIN-LOGGER - INFO - Epoch 326 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.885086 weight_norm_u: 25.218954 loss: 0.020158 grad_norm_before_clip: 0.963795 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 06:34:22,614 - TRAIN-LOGGER - INFO - Epoch 326 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.885117 weight_norm_u: 25.222990 loss: 0.013109 +RANK_0 - 2026-01-29 06:34:31,115 - TRAIN-LOGGER - INFO - Epoch 327 - TRAIN - Minibatch 0: weight_norm_model: 143.885117 loss: 0.024019 grad_norm_before_clip: 1.785885 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 06:34:32,512 - TRAIN-LOGGER - INFO - Epoch 327 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.885117 weight_norm_u: 25.218954 loss: 0.024019 grad_norm_before_clip: 1.785885 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 06:34:32,512 - TRAIN-LOGGER - INFO - Epoch 327 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.885132 weight_norm_u: 25.222990 loss: 0.013227 +RANK_0 - 2026-01-29 06:34:40,473 - TRAIN-LOGGER - INFO - Epoch 328 - TRAIN - Minibatch 0: weight_norm_model: 143.885132 loss: 0.021337 grad_norm_before_clip: 1.486191 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 06:34:41,911 - TRAIN-LOGGER - INFO - Epoch 328 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.885132 weight_norm_u: 25.218954 loss: 0.021337 grad_norm_before_clip: 1.486191 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 06:34:41,912 - TRAIN-LOGGER - INFO - Epoch 328 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.885132 weight_norm_u: 25.222990 loss: 0.013064 +RANK_0 - 2026-01-29 06:34:50,846 - TRAIN-LOGGER - INFO - Epoch 329 - TRAIN - Minibatch 0: weight_norm_model: 143.885132 loss: 0.017565 grad_norm_before_clip: 1.073020 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 06:34:52,375 - TRAIN-LOGGER - INFO - Epoch 329 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.885132 weight_norm_u: 25.218954 loss: 0.017565 grad_norm_before_clip: 1.073020 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 06:34:52,375 - TRAIN-LOGGER - INFO - Epoch 329 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.885147 weight_norm_u: 25.222990 loss: 0.012694 +RANK_0 - 2026-01-29 06:35:01,501 - TRAIN-LOGGER - INFO - Epoch 330 - TRAIN - Minibatch 0: weight_norm_model: 143.885147 loss: 0.019748 grad_norm_before_clip: 0.567474 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 06:35:02,730 - TRAIN-LOGGER - INFO - Epoch 330 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.885147 weight_norm_u: 25.218954 loss: 0.019748 grad_norm_before_clip: 0.567474 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 06:35:02,730 - TRAIN-LOGGER - INFO - Epoch 330 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.885147 weight_norm_u: 25.222990 loss: 0.012602 +RANK_0 - 2026-01-29 06:35:10,301 - TRAIN-LOGGER - INFO - Epoch 331 - TRAIN - Minibatch 0: weight_norm_model: 143.885147 loss: 0.016720 grad_norm_before_clip: 0.660340 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 06:35:11,758 - TRAIN-LOGGER - INFO - Epoch 331 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.885147 weight_norm_u: 25.218954 loss: 0.016720 grad_norm_before_clip: 0.660340 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 06:35:11,758 - TRAIN-LOGGER - INFO - Epoch 331 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.885178 weight_norm_u: 25.222990 loss: 0.012732 +RANK_0 - 2026-01-29 06:35:19,627 - TRAIN-LOGGER - INFO - Epoch 332 - TRAIN - Minibatch 0: weight_norm_model: 143.885178 loss: 0.019106 grad_norm_before_clip: 1.338406 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 06:35:20,881 - TRAIN-LOGGER - INFO - Epoch 332 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.885178 weight_norm_u: 25.218954 loss: 0.019106 grad_norm_before_clip: 1.338406 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 06:35:20,882 - TRAIN-LOGGER - INFO - Epoch 332 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.885193 weight_norm_u: 25.222990 loss: 0.012668 +RANK_0 - 2026-01-29 06:35:28,177 - TRAIN-LOGGER - INFO - Epoch 333 - TRAIN - Minibatch 0: weight_norm_model: 143.885193 loss: 0.018807 grad_norm_before_clip: 0.957135 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 06:35:29,608 - TRAIN-LOGGER - INFO - Epoch 333 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.885193 weight_norm_u: 25.218954 loss: 0.018807 grad_norm_before_clip: 0.957135 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 06:35:29,608 - TRAIN-LOGGER - INFO - Epoch 333 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.885223 weight_norm_u: 25.222990 loss: 0.012641 +RANK_0 - 2026-01-29 06:35:36,616 - TRAIN-LOGGER - INFO - Epoch 334 - TRAIN - Minibatch 0: weight_norm_model: 143.885223 loss: 0.022719 grad_norm_before_clip: 1.188577 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 06:35:37,886 - TRAIN-LOGGER - INFO - Epoch 334 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.885223 weight_norm_u: 25.218954 loss: 0.022719 grad_norm_before_clip: 1.188577 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 06:35:37,886 - TRAIN-LOGGER - INFO - Epoch 334 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.885254 weight_norm_u: 25.222990 loss: 0.012263 +RANK_0 - 2026-01-29 06:35:44,626 - TRAIN-LOGGER - INFO - Epoch 335 - TRAIN - Minibatch 0: weight_norm_model: 143.885254 loss: 0.020856 grad_norm_before_clip: 0.829767 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 06:35:45,787 - TRAIN-LOGGER - INFO - Epoch 335 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.885254 weight_norm_u: 25.218954 loss: 0.020856 grad_norm_before_clip: 0.829767 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 06:35:45,788 - TRAIN-LOGGER - INFO - Epoch 335 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.885300 weight_norm_u: 25.222990 loss: 0.012177 +RANK_0 - 2026-01-29 06:35:53,871 - TRAIN-LOGGER - INFO - Epoch 336 - TRAIN - Minibatch 0: weight_norm_model: 143.885300 loss: 0.017074 grad_norm_before_clip: 0.898678 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 06:35:54,971 - TRAIN-LOGGER - INFO - Epoch 336 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.885300 weight_norm_u: 25.218954 loss: 0.017074 grad_norm_before_clip: 0.898678 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 06:35:54,971 - TRAIN-LOGGER - INFO - Epoch 336 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.885345 weight_norm_u: 25.222990 loss: 0.012079 +RANK_0 - 2026-01-29 06:36:02,138 - TRAIN-LOGGER - INFO - Epoch 337 - TRAIN - Minibatch 0: weight_norm_model: 143.885345 loss: 0.022247 grad_norm_before_clip: 1.845953 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 06:36:03,292 - TRAIN-LOGGER - INFO - Epoch 337 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.885345 weight_norm_u: 25.218954 loss: 0.022247 grad_norm_before_clip: 1.845953 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 06:36:03,292 - TRAIN-LOGGER - INFO - Epoch 337 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.885391 weight_norm_u: 25.222990 loss: 0.011690 +RANK_0 - 2026-01-29 06:36:10,697 - TRAIN-LOGGER - INFO - Epoch 338 - TRAIN - Minibatch 0: weight_norm_model: 143.885391 loss: 0.017774 grad_norm_before_clip: 0.498073 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 06:36:11,954 - TRAIN-LOGGER - INFO - Epoch 338 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.885391 weight_norm_u: 25.218954 loss: 0.017774 grad_norm_before_clip: 0.498073 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 06:36:11,955 - TRAIN-LOGGER - INFO - Epoch 338 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.885406 weight_norm_u: 25.222990 loss: 0.011638 +RANK_0 - 2026-01-29 06:36:19,692 - TRAIN-LOGGER - INFO - Epoch 339 - TRAIN - Minibatch 0: weight_norm_model: 143.885406 loss: 0.027509 grad_norm_before_clip: 0.811899 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 06:36:21,125 - TRAIN-LOGGER - INFO - Epoch 339 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.885406 weight_norm_u: 25.218954 loss: 0.027509 grad_norm_before_clip: 0.811899 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 06:36:21,125 - TRAIN-LOGGER - INFO - Epoch 339 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.885437 weight_norm_u: 25.222990 loss: 0.012017 +RANK_0 - 2026-01-29 06:36:28,825 - TRAIN-LOGGER - INFO - Epoch 340 - TRAIN - Minibatch 0: weight_norm_model: 143.885437 loss: 0.020804 grad_norm_before_clip: 2.181888 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 06:36:30,305 - TRAIN-LOGGER - INFO - Epoch 340 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.885437 weight_norm_u: 25.218954 loss: 0.020804 grad_norm_before_clip: 2.181888 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 06:36:30,306 - TRAIN-LOGGER - INFO - Epoch 340 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.885452 weight_norm_u: 25.222990 loss: 0.012065 +RANK_0 - 2026-01-29 06:36:37,810 - TRAIN-LOGGER - INFO - Epoch 341 - TRAIN - Minibatch 0: weight_norm_model: 143.885452 loss: 0.021629 grad_norm_before_clip: 1.075059 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 06:36:39,438 - TRAIN-LOGGER - INFO - Epoch 341 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.885452 weight_norm_u: 25.218954 loss: 0.021629 grad_norm_before_clip: 1.075059 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 06:36:39,439 - TRAIN-LOGGER - INFO - Epoch 341 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.885468 weight_norm_u: 25.222990 loss: 0.011794 +RANK_0 - 2026-01-29 06:36:47,277 - TRAIN-LOGGER - INFO - Epoch 342 - TRAIN - Minibatch 0: weight_norm_model: 143.885468 loss: 0.019038 grad_norm_before_clip: 1.815610 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 06:36:48,527 - TRAIN-LOGGER - INFO - Epoch 342 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.885468 weight_norm_u: 25.218954 loss: 0.019038 grad_norm_before_clip: 1.815610 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 06:36:48,527 - TRAIN-LOGGER - INFO - Epoch 342 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.885483 weight_norm_u: 25.222990 loss: 0.011734 +RANK_0 - 2026-01-29 06:36:55,819 - TRAIN-LOGGER - INFO - Epoch 343 - TRAIN - Minibatch 0: weight_norm_model: 143.885483 loss: 0.020019 grad_norm_before_clip: 2.078596 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 06:36:57,157 - TRAIN-LOGGER - INFO - Epoch 343 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.885483 weight_norm_u: 25.218954 loss: 0.020019 grad_norm_before_clip: 2.078596 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 06:36:57,157 - TRAIN-LOGGER - INFO - Epoch 343 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.885498 weight_norm_u: 25.222990 loss: 0.011512 +RANK_0 - 2026-01-29 06:37:05,002 - TRAIN-LOGGER - INFO - Epoch 344 - TRAIN - Minibatch 0: weight_norm_model: 143.885498 loss: 0.022766 grad_norm_before_clip: 1.262144 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 06:37:06,335 - TRAIN-LOGGER - INFO - Epoch 344 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.885498 weight_norm_u: 25.218954 loss: 0.022766 grad_norm_before_clip: 1.262144 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 06:37:06,335 - TRAIN-LOGGER - INFO - Epoch 344 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.885513 weight_norm_u: 25.222990 loss: 0.011591 +RANK_0 - 2026-01-29 06:37:12,603 - TRAIN-LOGGER - INFO - Epoch 345 - TRAIN - Minibatch 0: weight_norm_model: 143.885513 loss: 0.016163 grad_norm_before_clip: 1.283363 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 06:37:13,897 - TRAIN-LOGGER - INFO - Epoch 345 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.885513 weight_norm_u: 25.218954 loss: 0.016163 grad_norm_before_clip: 1.283363 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 06:37:13,897 - TRAIN-LOGGER - INFO - Epoch 345 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.885544 weight_norm_u: 25.222990 loss: 0.011620 +RANK_0 - 2026-01-29 06:37:21,688 - TRAIN-LOGGER - INFO - Epoch 346 - TRAIN - Minibatch 0: weight_norm_model: 143.885544 loss: 0.019813 grad_norm_before_clip: 1.523711 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 06:37:22,986 - TRAIN-LOGGER - INFO - Epoch 346 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.885544 weight_norm_u: 25.218954 loss: 0.019813 grad_norm_before_clip: 1.523711 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 06:37:22,986 - TRAIN-LOGGER - INFO - Epoch 346 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.885590 weight_norm_u: 25.222990 loss: 0.011451 +RANK_0 - 2026-01-29 06:37:30,110 - TRAIN-LOGGER - INFO - Epoch 347 - TRAIN - Minibatch 0: weight_norm_model: 143.885590 loss: 0.019002 grad_norm_before_clip: 1.156227 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 06:37:31,475 - TRAIN-LOGGER - INFO - Epoch 347 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.885590 weight_norm_u: 25.218954 loss: 0.019002 grad_norm_before_clip: 1.156227 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 06:37:31,475 - TRAIN-LOGGER - INFO - Epoch 347 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.885605 weight_norm_u: 25.222990 loss: 0.011345 +RANK_0 - 2026-01-29 06:37:38,258 - TRAIN-LOGGER - INFO - Epoch 348 - TRAIN - Minibatch 0: weight_norm_model: 143.885605 loss: 0.018902 grad_norm_before_clip: 0.997681 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 06:37:39,541 - TRAIN-LOGGER - INFO - Epoch 348 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.885605 weight_norm_u: 25.218954 loss: 0.018902 grad_norm_before_clip: 0.997681 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 06:37:39,541 - TRAIN-LOGGER - INFO - Epoch 348 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.885635 weight_norm_u: 25.222990 loss: 0.011485 +RANK_0 - 2026-01-29 06:37:46,339 - TRAIN-LOGGER - INFO - Epoch 349 - TRAIN - Minibatch 0: weight_norm_model: 143.885635 loss: 0.017927 grad_norm_before_clip: 1.136050 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 06:37:47,836 - TRAIN-LOGGER - INFO - Epoch 349 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.885635 weight_norm_u: 25.218954 loss: 0.017927 grad_norm_before_clip: 1.136050 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 06:37:47,836 - TRAIN-LOGGER - INFO - Epoch 349 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.885666 weight_norm_u: 25.222990 loss: 0.011217 +RANK_0 - 2026-01-29 06:37:53,946 - TRAIN-LOGGER - INFO - Epoch 350 - TRAIN - Minibatch 0: weight_norm_model: 143.885666 loss: 0.017290 grad_norm_before_clip: 1.148602 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 06:37:55,134 - TRAIN-LOGGER - INFO - Epoch 350 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.885666 weight_norm_u: 25.218954 loss: 0.017290 grad_norm_before_clip: 1.148602 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 06:37:55,134 - TRAIN-LOGGER - INFO - Epoch 350 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.885681 weight_norm_u: 25.222990 loss: 0.011411 +RANK_0 - 2026-01-29 06:38:00,755 - TRAIN-LOGGER - INFO - Epoch 351 - TRAIN - Minibatch 0: weight_norm_model: 143.885681 loss: 0.016087 grad_norm_before_clip: 0.751471 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 06:38:01,970 - TRAIN-LOGGER - INFO - Epoch 351 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.885681 weight_norm_u: 25.218954 loss: 0.016087 grad_norm_before_clip: 0.751471 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 06:38:01,970 - TRAIN-LOGGER - INFO - Epoch 351 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.885712 weight_norm_u: 25.222990 loss: 0.012079 +RANK_0 - 2026-01-29 06:38:08,432 - TRAIN-LOGGER - INFO - Epoch 352 - TRAIN - Minibatch 0: weight_norm_model: 143.885712 loss: 0.020120 grad_norm_before_clip: 1.452802 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 06:38:09,565 - TRAIN-LOGGER - INFO - Epoch 352 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.885712 weight_norm_u: 25.218954 loss: 0.020120 grad_norm_before_clip: 1.452802 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 06:38:09,565 - TRAIN-LOGGER - INFO - Epoch 352 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.885742 weight_norm_u: 25.222990 loss: 0.012307 +RANK_0 - 2026-01-29 06:38:15,908 - TRAIN-LOGGER - INFO - Epoch 353 - TRAIN - Minibatch 0: weight_norm_model: 143.885742 loss: 0.018887 grad_norm_before_clip: 1.687139 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 06:38:17,101 - TRAIN-LOGGER - INFO - Epoch 353 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.885742 weight_norm_u: 25.218954 loss: 0.018887 grad_norm_before_clip: 1.687139 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 06:38:17,101 - TRAIN-LOGGER - INFO - Epoch 353 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.885773 weight_norm_u: 25.222990 loss: 0.011529 +RANK_0 - 2026-01-29 06:38:23,048 - TRAIN-LOGGER - INFO - Epoch 354 - TRAIN - Minibatch 0: weight_norm_model: 143.885773 loss: 0.017709 grad_norm_before_clip: 0.970114 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 06:38:24,205 - TRAIN-LOGGER - INFO - Epoch 354 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.885773 weight_norm_u: 25.218954 loss: 0.017709 grad_norm_before_clip: 0.970114 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 06:38:24,205 - TRAIN-LOGGER - INFO - Epoch 354 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.885788 weight_norm_u: 25.222990 loss: 0.010740 +RANK_0 - 2026-01-29 06:38:30,835 - TRAIN-LOGGER - INFO - Epoch 355 - TRAIN - Minibatch 0: weight_norm_model: 143.885788 loss: 0.017288 grad_norm_before_clip: 0.935165 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 06:38:32,160 - TRAIN-LOGGER - INFO - Epoch 355 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.885788 weight_norm_u: 25.218954 loss: 0.017288 grad_norm_before_clip: 0.935165 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 06:38:32,160 - TRAIN-LOGGER - INFO - Epoch 355 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.885818 weight_norm_u: 25.222990 loss: 0.010432 +RANK_0 - 2026-01-29 06:38:39,048 - TRAIN-LOGGER - INFO - Epoch 356 - TRAIN - Minibatch 0: weight_norm_model: 143.885818 loss: 0.018549 grad_norm_before_clip: 0.864425 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 06:38:40,346 - TRAIN-LOGGER - INFO - Epoch 356 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.885818 weight_norm_u: 25.218954 loss: 0.018549 grad_norm_before_clip: 0.864425 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 06:38:40,346 - TRAIN-LOGGER - INFO - Epoch 356 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.885849 weight_norm_u: 25.222990 loss: 0.010648 +RANK_0 - 2026-01-29 06:38:47,313 - TRAIN-LOGGER - INFO - Epoch 357 - TRAIN - Minibatch 0: weight_norm_model: 143.885849 loss: 0.019141 grad_norm_before_clip: 1.242254 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 06:38:48,712 - TRAIN-LOGGER - INFO - Epoch 357 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.885849 weight_norm_u: 25.218954 loss: 0.019141 grad_norm_before_clip: 1.242254 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 06:38:48,712 - TRAIN-LOGGER - INFO - Epoch 357 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.885864 weight_norm_u: 25.222990 loss: 0.010745 +RANK_0 - 2026-01-29 06:38:55,818 - TRAIN-LOGGER - INFO - Epoch 358 - TRAIN - Minibatch 0: weight_norm_model: 143.885864 loss: 0.019055 grad_norm_before_clip: 1.423969 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 06:38:57,016 - TRAIN-LOGGER - INFO - Epoch 358 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.885864 weight_norm_u: 25.218954 loss: 0.019055 grad_norm_before_clip: 1.423969 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 06:38:57,016 - TRAIN-LOGGER - INFO - Epoch 358 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.885864 weight_norm_u: 25.222990 loss: 0.011126 +RANK_0 - 2026-01-29 06:39:03,558 - TRAIN-LOGGER - INFO - Epoch 359 - TRAIN - Minibatch 0: weight_norm_model: 143.885864 loss: 0.016302 grad_norm_before_clip: 0.921555 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 06:39:04,835 - TRAIN-LOGGER - INFO - Epoch 359 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.885864 weight_norm_u: 25.218954 loss: 0.016302 grad_norm_before_clip: 0.921555 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 06:39:04,836 - TRAIN-LOGGER - INFO - Epoch 359 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.885880 weight_norm_u: 25.222990 loss: 0.011415 +RANK_0 - 2026-01-29 06:39:11,319 - TRAIN-LOGGER - INFO - Epoch 360 - TRAIN - Minibatch 0: weight_norm_model: 143.885880 loss: 0.020207 grad_norm_before_clip: 1.224129 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 06:39:12,453 - TRAIN-LOGGER - INFO - Epoch 360 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.885880 weight_norm_u: 25.218954 loss: 0.020207 grad_norm_before_clip: 1.224129 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 06:39:12,453 - TRAIN-LOGGER - INFO - Epoch 360 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.885910 weight_norm_u: 25.222990 loss: 0.011635 +RANK_0 - 2026-01-29 06:39:19,047 - TRAIN-LOGGER - INFO - Epoch 361 - TRAIN - Minibatch 0: weight_norm_model: 143.885910 loss: 0.018922 grad_norm_before_clip: 1.572691 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 06:39:20,307 - TRAIN-LOGGER - INFO - Epoch 361 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.885910 weight_norm_u: 25.218954 loss: 0.018922 grad_norm_before_clip: 1.572691 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 06:39:20,308 - TRAIN-LOGGER - INFO - Epoch 361 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.885956 weight_norm_u: 25.222990 loss: 0.011482 +RANK_0 - 2026-01-29 06:39:27,021 - TRAIN-LOGGER - INFO - Epoch 362 - TRAIN - Minibatch 0: weight_norm_model: 143.885956 loss: 0.016937 grad_norm_before_clip: 1.151972 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 06:39:28,265 - TRAIN-LOGGER - INFO - Epoch 362 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.885956 weight_norm_u: 25.218954 loss: 0.016937 grad_norm_before_clip: 1.151972 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 06:39:28,266 - TRAIN-LOGGER - INFO - Epoch 362 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.886002 weight_norm_u: 25.222990 loss: 0.010967 +RANK_0 - 2026-01-29 06:39:34,972 - TRAIN-LOGGER - INFO - Epoch 363 - TRAIN - Minibatch 0: weight_norm_model: 143.886002 loss: 0.017856 grad_norm_before_clip: 1.177799 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 06:39:36,084 - TRAIN-LOGGER - INFO - Epoch 363 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.886002 weight_norm_u: 25.218954 loss: 0.017856 grad_norm_before_clip: 1.177799 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 06:39:36,084 - TRAIN-LOGGER - INFO - Epoch 363 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.886047 weight_norm_u: 25.222990 loss: 0.010270 +RANK_0 - 2026-01-29 06:39:42,181 - TRAIN-LOGGER - INFO - Epoch 364 - TRAIN - Minibatch 0: weight_norm_model: 143.886047 loss: 0.014344 grad_norm_before_clip: 0.548594 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 06:39:43,415 - TRAIN-LOGGER - INFO - Epoch 364 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.886047 weight_norm_u: 25.218954 loss: 0.014344 grad_norm_before_clip: 0.548594 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 06:39:43,415 - TRAIN-LOGGER - INFO - Epoch 364 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.886093 weight_norm_u: 25.222990 loss: 0.010458 +RANK_0 - 2026-01-29 06:39:49,824 - TRAIN-LOGGER - INFO - Epoch 365 - TRAIN - Minibatch 0: weight_norm_model: 143.886093 loss: 0.015360 grad_norm_before_clip: 0.944395 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 06:39:51,069 - TRAIN-LOGGER - INFO - Epoch 365 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.886093 weight_norm_u: 25.218954 loss: 0.015360 grad_norm_before_clip: 0.944395 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 06:39:51,069 - TRAIN-LOGGER - INFO - Epoch 365 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.886124 weight_norm_u: 25.222990 loss: 0.010391 +RANK_0 - 2026-01-29 06:39:58,216 - TRAIN-LOGGER - INFO - Epoch 366 - TRAIN - Minibatch 0: weight_norm_model: 143.886124 loss: 0.016849 grad_norm_before_clip: 1.293263 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 06:39:59,715 - TRAIN-LOGGER - INFO - Epoch 366 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.886124 weight_norm_u: 25.218954 loss: 0.016849 grad_norm_before_clip: 1.293263 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 06:39:59,716 - TRAIN-LOGGER - INFO - Epoch 366 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.886154 weight_norm_u: 25.222990 loss: 0.009825 +RANK_0 - 2026-01-29 06:40:06,817 - TRAIN-LOGGER - INFO - Epoch 367 - TRAIN - Minibatch 0: weight_norm_model: 143.886154 loss: 0.016493 grad_norm_before_clip: 0.938129 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 06:40:08,128 - TRAIN-LOGGER - INFO - Epoch 367 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.886154 weight_norm_u: 25.218954 loss: 0.016493 grad_norm_before_clip: 0.938129 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 06:40:08,128 - TRAIN-LOGGER - INFO - Epoch 367 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.886185 weight_norm_u: 25.222990 loss: 0.009543 +RANK_0 - 2026-01-29 06:40:14,066 - TRAIN-LOGGER - INFO - Epoch 368 - TRAIN - Minibatch 0: weight_norm_model: 143.886185 loss: 0.011233 grad_norm_before_clip: 0.347552 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 06:40:15,200 - TRAIN-LOGGER - INFO - Epoch 368 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.886185 weight_norm_u: 25.218954 loss: 0.011233 grad_norm_before_clip: 0.347552 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 06:40:15,200 - TRAIN-LOGGER - INFO - Epoch 368 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.886200 weight_norm_u: 25.222990 loss: 0.010139 +RANK_0 - 2026-01-29 06:40:21,704 - TRAIN-LOGGER - INFO - Epoch 369 - TRAIN - Minibatch 0: weight_norm_model: 143.886200 loss: 0.015787 grad_norm_before_clip: 1.180021 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 06:40:22,887 - TRAIN-LOGGER - INFO - Epoch 369 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.886200 weight_norm_u: 25.218954 loss: 0.015787 grad_norm_before_clip: 1.180021 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 06:40:22,888 - TRAIN-LOGGER - INFO - Epoch 369 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.886246 weight_norm_u: 25.222990 loss: 0.010265 +RANK_0 - 2026-01-29 06:40:29,577 - TRAIN-LOGGER - INFO - Epoch 370 - TRAIN - Minibatch 0: weight_norm_model: 143.886246 loss: 0.016075 grad_norm_before_clip: 0.740706 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 06:40:30,839 - TRAIN-LOGGER - INFO - Epoch 370 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.886246 weight_norm_u: 25.218954 loss: 0.016075 grad_norm_before_clip: 0.740706 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 06:40:30,839 - TRAIN-LOGGER - INFO - Epoch 370 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.886261 weight_norm_u: 25.222990 loss: 0.010193 +RANK_0 - 2026-01-29 06:40:37,631 - TRAIN-LOGGER - INFO - Epoch 371 - TRAIN - Minibatch 0: weight_norm_model: 143.886261 loss: 0.019777 grad_norm_before_clip: 1.066838 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 06:40:38,890 - TRAIN-LOGGER - INFO - Epoch 371 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.886261 weight_norm_u: 25.218954 loss: 0.019777 grad_norm_before_clip: 1.066838 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 06:40:38,890 - TRAIN-LOGGER - INFO - Epoch 371 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.886292 weight_norm_u: 25.222990 loss: 0.009809 +RANK_0 - 2026-01-29 06:40:45,495 - TRAIN-LOGGER - INFO - Epoch 372 - TRAIN - Minibatch 0: weight_norm_model: 143.886292 loss: 0.020089 grad_norm_before_clip: 0.924940 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 06:40:46,643 - TRAIN-LOGGER - INFO - Epoch 372 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.886292 weight_norm_u: 25.218954 loss: 0.020089 grad_norm_before_clip: 0.924940 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 06:40:46,643 - TRAIN-LOGGER - INFO - Epoch 372 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.886337 weight_norm_u: 25.222990 loss: 0.010311 +RANK_0 - 2026-01-29 06:40:53,648 - TRAIN-LOGGER - INFO - Epoch 373 - TRAIN - Minibatch 0: weight_norm_model: 143.886337 loss: 0.019317 grad_norm_before_clip: 1.814615 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 06:40:54,758 - TRAIN-LOGGER - INFO - Epoch 373 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.886337 weight_norm_u: 25.218954 loss: 0.019317 grad_norm_before_clip: 1.814615 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 06:40:54,758 - TRAIN-LOGGER - INFO - Epoch 373 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.886368 weight_norm_u: 25.222990 loss: 0.010647 +RANK_0 - 2026-01-29 06:41:00,970 - TRAIN-LOGGER - INFO - Epoch 374 - TRAIN - Minibatch 0: weight_norm_model: 143.886368 loss: 0.015633 grad_norm_before_clip: 1.210129 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 06:41:02,254 - TRAIN-LOGGER - INFO - Epoch 374 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.886368 weight_norm_u: 25.218954 loss: 0.015633 grad_norm_before_clip: 1.210129 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 06:41:02,254 - TRAIN-LOGGER - INFO - Epoch 374 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.886383 weight_norm_u: 25.222990 loss: 0.009906 +RANK_0 - 2026-01-29 06:41:09,646 - TRAIN-LOGGER - INFO - Epoch 375 - TRAIN - Minibatch 0: weight_norm_model: 143.886383 loss: 0.015212 grad_norm_before_clip: 1.277565 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 06:41:10,923 - TRAIN-LOGGER - INFO - Epoch 375 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.886383 weight_norm_u: 25.218954 loss: 0.015212 grad_norm_before_clip: 1.277565 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 06:41:10,923 - TRAIN-LOGGER - INFO - Epoch 375 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.886414 weight_norm_u: 25.222990 loss: 0.009465 +RANK_0 - 2026-01-29 06:41:18,084 - TRAIN-LOGGER - INFO - Epoch 376 - TRAIN - Minibatch 0: weight_norm_model: 143.886414 loss: 0.015718 grad_norm_before_clip: 1.009454 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 06:41:19,361 - TRAIN-LOGGER - INFO - Epoch 376 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.886414 weight_norm_u: 25.218954 loss: 0.015718 grad_norm_before_clip: 1.009454 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 06:41:19,361 - TRAIN-LOGGER - INFO - Epoch 376 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.886444 weight_norm_u: 25.222990 loss: 0.009820 +RANK_0 - 2026-01-29 06:41:25,954 - TRAIN-LOGGER - INFO - Epoch 377 - TRAIN - Minibatch 0: weight_norm_model: 143.886444 loss: 0.016372 grad_norm_before_clip: 1.021015 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 06:41:27,177 - TRAIN-LOGGER - INFO - Epoch 377 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.886444 weight_norm_u: 25.218954 loss: 0.016372 grad_norm_before_clip: 1.021015 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 06:41:27,177 - TRAIN-LOGGER - INFO - Epoch 377 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.886459 weight_norm_u: 25.222990 loss: 0.010902 +RANK_0 - 2026-01-29 06:41:32,785 - TRAIN-LOGGER - INFO - Epoch 378 - TRAIN - Minibatch 0: weight_norm_model: 143.886459 loss: 0.016289 grad_norm_before_clip: 0.964309 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 06:41:33,896 - TRAIN-LOGGER - INFO - Epoch 378 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.886459 weight_norm_u: 25.218954 loss: 0.016289 grad_norm_before_clip: 0.964309 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 06:41:33,896 - TRAIN-LOGGER - INFO - Epoch 378 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.886475 weight_norm_u: 25.222990 loss: 0.011868 +RANK_0 - 2026-01-29 06:41:40,468 - TRAIN-LOGGER - INFO - Epoch 379 - TRAIN - Minibatch 0: weight_norm_model: 143.886475 loss: 0.024339 grad_norm_before_clip: 2.933733 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 06:41:41,702 - TRAIN-LOGGER - INFO - Epoch 379 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.886475 weight_norm_u: 25.218954 loss: 0.024339 grad_norm_before_clip: 2.933733 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 06:41:41,702 - TRAIN-LOGGER - INFO - Epoch 379 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.886475 weight_norm_u: 25.222990 loss: 0.011997 +RANK_0 - 2026-01-29 06:41:48,377 - TRAIN-LOGGER - INFO - Epoch 380 - TRAIN - Minibatch 0: weight_norm_model: 143.886475 loss: 0.019685 grad_norm_before_clip: 1.228557 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 06:41:49,622 - TRAIN-LOGGER - INFO - Epoch 380 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.886475 weight_norm_u: 25.218954 loss: 0.019685 grad_norm_before_clip: 1.228557 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 06:41:49,622 - TRAIN-LOGGER - INFO - Epoch 380 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.886490 weight_norm_u: 25.222990 loss: 0.010884 +RANK_0 - 2026-01-29 06:41:56,508 - TRAIN-LOGGER - INFO - Epoch 381 - TRAIN - Minibatch 0: weight_norm_model: 143.886490 loss: 0.018642 grad_norm_before_clip: 1.878325 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 06:41:57,756 - TRAIN-LOGGER - INFO - Epoch 381 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.886490 weight_norm_u: 25.218954 loss: 0.018642 grad_norm_before_clip: 1.878325 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 06:41:57,756 - TRAIN-LOGGER - INFO - Epoch 381 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.886490 weight_norm_u: 25.222990 loss: 0.010004 +RANK_0 - 2026-01-29 06:42:04,235 - TRAIN-LOGGER - INFO - Epoch 382 - TRAIN - Minibatch 0: weight_norm_model: 143.886490 loss: 0.016256 grad_norm_before_clip: 1.535150 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 06:42:05,359 - TRAIN-LOGGER - INFO - Epoch 382 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.886490 weight_norm_u: 25.218954 loss: 0.016256 grad_norm_before_clip: 1.535150 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 06:42:05,359 - TRAIN-LOGGER - INFO - Epoch 382 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.886505 weight_norm_u: 25.222990 loss: 0.009731 +RANK_0 - 2026-01-29 06:42:11,190 - TRAIN-LOGGER - INFO - Epoch 383 - TRAIN - Minibatch 0: weight_norm_model: 143.886505 loss: 0.017998 grad_norm_before_clip: 0.818067 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 06:42:12,395 - TRAIN-LOGGER - INFO - Epoch 383 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.886505 weight_norm_u: 25.218954 loss: 0.017998 grad_norm_before_clip: 0.818067 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 06:42:12,395 - TRAIN-LOGGER - INFO - Epoch 383 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.886505 weight_norm_u: 25.222990 loss: 0.010361 +RANK_0 - 2026-01-29 06:42:19,221 - TRAIN-LOGGER - INFO - Epoch 384 - TRAIN - Minibatch 0: weight_norm_model: 143.886505 loss: 0.017802 grad_norm_before_clip: 1.668149 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 06:42:20,561 - TRAIN-LOGGER - INFO - Epoch 384 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.886505 weight_norm_u: 25.218954 loss: 0.017802 grad_norm_before_clip: 1.668149 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 06:42:20,561 - TRAIN-LOGGER - INFO - Epoch 384 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.886536 weight_norm_u: 25.222990 loss: 0.011094 +RANK_0 - 2026-01-29 06:42:26,974 - TRAIN-LOGGER - INFO - Epoch 385 - TRAIN - Minibatch 0: weight_norm_model: 143.886536 loss: 0.017205 grad_norm_before_clip: 1.441930 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 06:42:28,305 - TRAIN-LOGGER - INFO - Epoch 385 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.886536 weight_norm_u: 25.218954 loss: 0.017205 grad_norm_before_clip: 1.441930 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 06:42:28,305 - TRAIN-LOGGER - INFO - Epoch 385 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.886536 weight_norm_u: 25.222990 loss: 0.011045 +RANK_0 - 2026-01-29 06:42:34,765 - TRAIN-LOGGER - INFO - Epoch 386 - TRAIN - Minibatch 0: weight_norm_model: 143.886536 loss: 0.015947 grad_norm_before_clip: 0.782879 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 06:42:36,050 - TRAIN-LOGGER - INFO - Epoch 386 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.886536 weight_norm_u: 25.218954 loss: 0.015947 grad_norm_before_clip: 0.782879 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 06:42:36,050 - TRAIN-LOGGER - INFO - Epoch 386 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.886566 weight_norm_u: 25.222990 loss: 0.010317 +RANK_0 - 2026-01-29 06:42:42,751 - TRAIN-LOGGER - INFO - Epoch 387 - TRAIN - Minibatch 0: weight_norm_model: 143.886566 loss: 0.016191 grad_norm_before_clip: 1.138733 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 06:42:43,985 - TRAIN-LOGGER - INFO - Epoch 387 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.886566 weight_norm_u: 25.218954 loss: 0.016191 grad_norm_before_clip: 1.138733 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 06:42:43,986 - TRAIN-LOGGER - INFO - Epoch 387 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.886581 weight_norm_u: 25.222990 loss: 0.009398 +RANK_0 - 2026-01-29 06:42:50,487 - TRAIN-LOGGER - INFO - Epoch 388 - TRAIN - Minibatch 0: weight_norm_model: 143.886581 loss: 0.013727 grad_norm_before_clip: 1.004143 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 06:42:51,689 - TRAIN-LOGGER - INFO - Epoch 388 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.886581 weight_norm_u: 25.218954 loss: 0.013727 grad_norm_before_clip: 1.004143 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 06:42:51,689 - TRAIN-LOGGER - INFO - Epoch 388 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.886597 weight_norm_u: 25.222990 loss: 0.009474 +RANK_0 - 2026-01-29 06:42:58,716 - TRAIN-LOGGER - INFO - Epoch 389 - TRAIN - Minibatch 0: weight_norm_model: 143.886597 loss: 0.015095 grad_norm_before_clip: 0.893710 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 06:42:59,961 - TRAIN-LOGGER - INFO - Epoch 389 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.886597 weight_norm_u: 25.218954 loss: 0.015095 grad_norm_before_clip: 0.893710 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 06:42:59,961 - TRAIN-LOGGER - INFO - Epoch 389 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.886612 weight_norm_u: 25.222990 loss: 0.010488 +RANK_0 - 2026-01-29 06:43:06,791 - TRAIN-LOGGER - INFO - Epoch 390 - TRAIN - Minibatch 0: weight_norm_model: 143.886612 loss: 0.018618 grad_norm_before_clip: 1.269950 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 06:43:08,122 - TRAIN-LOGGER - INFO - Epoch 390 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.886612 weight_norm_u: 25.218954 loss: 0.018618 grad_norm_before_clip: 1.269950 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 06:43:08,122 - TRAIN-LOGGER - INFO - Epoch 390 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.886642 weight_norm_u: 25.222990 loss: 0.011076 +RANK_0 - 2026-01-29 06:43:13,867 - TRAIN-LOGGER - INFO - Epoch 391 - TRAIN - Minibatch 0: weight_norm_model: 143.886642 loss: 0.017378 grad_norm_before_clip: 1.464506 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 06:43:15,207 - TRAIN-LOGGER - INFO - Epoch 391 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.886642 weight_norm_u: 25.218954 loss: 0.017378 grad_norm_before_clip: 1.464506 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 06:43:15,208 - TRAIN-LOGGER - INFO - Epoch 391 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.886673 weight_norm_u: 25.222990 loss: 0.010709 +RANK_0 - 2026-01-29 06:43:21,656 - TRAIN-LOGGER - INFO - Epoch 392 - TRAIN - Minibatch 0: weight_norm_model: 143.886673 loss: 0.016714 grad_norm_before_clip: 1.418280 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 06:43:22,781 - TRAIN-LOGGER - INFO - Epoch 392 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.886673 weight_norm_u: 25.218954 loss: 0.016714 grad_norm_before_clip: 1.418280 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 06:43:22,781 - TRAIN-LOGGER - INFO - Epoch 392 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.886703 weight_norm_u: 25.222990 loss: 0.009723 +RANK_0 - 2026-01-29 06:43:29,717 - TRAIN-LOGGER - INFO - Epoch 393 - TRAIN - Minibatch 0: weight_norm_model: 143.886703 loss: 0.013973 grad_norm_before_clip: 1.045274 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 06:43:30,941 - TRAIN-LOGGER - INFO - Epoch 393 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.886703 weight_norm_u: 25.218954 loss: 0.013973 grad_norm_before_clip: 1.045274 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 06:43:30,941 - TRAIN-LOGGER - INFO - Epoch 393 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.886734 weight_norm_u: 25.222990 loss: 0.009275 +RANK_0 - 2026-01-29 06:43:37,786 - TRAIN-LOGGER - INFO - Epoch 394 - TRAIN - Minibatch 0: weight_norm_model: 143.886734 loss: 0.016539 grad_norm_before_clip: 1.337043 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 06:43:38,988 - TRAIN-LOGGER - INFO - Epoch 394 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.886734 weight_norm_u: 25.218954 loss: 0.016539 grad_norm_before_clip: 1.337043 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 06:43:38,988 - TRAIN-LOGGER - INFO - Epoch 394 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.886749 weight_norm_u: 25.222990 loss: 0.009416 +RANK_0 - 2026-01-29 06:43:45,555 - TRAIN-LOGGER - INFO - Epoch 395 - TRAIN - Minibatch 0: weight_norm_model: 143.886749 loss: 0.015332 grad_norm_before_clip: 0.616711 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 06:43:46,775 - TRAIN-LOGGER - INFO - Epoch 395 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.886749 weight_norm_u: 25.218954 loss: 0.015332 grad_norm_before_clip: 0.616711 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 06:43:46,776 - TRAIN-LOGGER - INFO - Epoch 395 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.886780 weight_norm_u: 25.222990 loss: 0.009641 +RANK_0 - 2026-01-29 06:43:53,631 - TRAIN-LOGGER - INFO - Epoch 396 - TRAIN - Minibatch 0: weight_norm_model: 143.886780 loss: 0.016526 grad_norm_before_clip: 1.504740 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 06:43:54,806 - TRAIN-LOGGER - INFO - Epoch 396 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.886780 weight_norm_u: 25.218954 loss: 0.016526 grad_norm_before_clip: 1.504740 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 06:43:54,806 - TRAIN-LOGGER - INFO - Epoch 396 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.886795 weight_norm_u: 25.222990 loss: 0.009403 +RANK_0 - 2026-01-29 06:44:00,653 - TRAIN-LOGGER - INFO - Epoch 397 - TRAIN - Minibatch 0: weight_norm_model: 143.886795 loss: 0.026558 grad_norm_before_clip: 7.098713 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 06:44:01,903 - TRAIN-LOGGER - INFO - Epoch 397 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.886795 weight_norm_u: 25.218954 loss: 0.026558 grad_norm_before_clip: 7.098713 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 06:44:01,903 - TRAIN-LOGGER - INFO - Epoch 397 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.886826 weight_norm_u: 25.222990 loss: 0.009086 +RANK_0 - 2026-01-29 06:44:08,326 - TRAIN-LOGGER - INFO - Epoch 398 - TRAIN - Minibatch 0: weight_norm_model: 143.886826 loss: 0.012537 grad_norm_before_clip: 0.868462 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 06:44:09,516 - TRAIN-LOGGER - INFO - Epoch 398 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.886826 weight_norm_u: 25.218954 loss: 0.012537 grad_norm_before_clip: 0.868462 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 06:44:09,516 - TRAIN-LOGGER - INFO - Epoch 398 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.886856 weight_norm_u: 25.222990 loss: 0.009047 +RANK_0 - 2026-01-29 06:44:16,285 - TRAIN-LOGGER - INFO - Epoch 399 - TRAIN - Minibatch 0: weight_norm_model: 143.886856 loss: 0.014855 grad_norm_before_clip: 0.659608 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 06:44:17,535 - TRAIN-LOGGER - INFO - Epoch 399 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.886856 weight_norm_u: 25.218954 loss: 0.014855 grad_norm_before_clip: 0.659608 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 06:44:17,535 - TRAIN-LOGGER - INFO - Epoch 399 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.886871 weight_norm_u: 25.222990 loss: 0.009454 +RANK_0 - 2026-01-29 06:44:23,960 - TRAIN-LOGGER - INFO - Epoch 400 - TRAIN - Minibatch 0: weight_norm_model: 143.886871 loss: 0.015363 grad_norm_before_clip: 0.705203 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 06:44:25,227 - TRAIN-LOGGER - INFO - Epoch 400 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.886871 weight_norm_u: 25.218954 loss: 0.015363 grad_norm_before_clip: 0.705203 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 06:44:25,228 - TRAIN-LOGGER - INFO - Epoch 400 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.886917 weight_norm_u: 25.222990 loss: 0.009725