diff --git "a/mocap09short/mocap09short_01-29-0610/logging/train.log" "b/mocap09short/mocap09short_01-29-0610/logging/train.log" new file mode 100644--- /dev/null +++ "b/mocap09short/mocap09short_01-29-0610/logging/train.log" @@ -0,0 +1,600 @@ +RANK_0 - 2026-01-29 06:10:47,928 - TRAIN-LOGGER - INFO - Epoch 201 - TRAIN - Minibatch 0: weight_norm_model: 143.882523 loss: 0.091128 grad_norm_before_clip: 4.118011 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 06:10:49,113 - TRAIN-LOGGER - INFO - Epoch 201 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.882523 weight_norm_u: 25.218954 loss: 0.091128 grad_norm_before_clip: 4.118011 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 06:10:49,113 - TRAIN-LOGGER - INFO - Epoch 201 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.882462 weight_norm_u: 25.222990 loss: 0.103621 +RANK_0 - 2026-01-29 06:10:53,782 - TRAIN-LOGGER - INFO - Epoch 202 - TRAIN - Minibatch 0: weight_norm_model: 143.882462 loss: 0.129016 grad_norm_before_clip: 8.267133 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 06:10:54,939 - TRAIN-LOGGER - INFO - Epoch 202 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.882462 weight_norm_u: 25.218954 loss: 0.129016 grad_norm_before_clip: 8.267133 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 06:10:54,939 - TRAIN-LOGGER - INFO - Epoch 202 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.882462 weight_norm_u: 25.222990 loss: 0.093231 +RANK_0 - 2026-01-29 06:10:59,838 - TRAIN-LOGGER - INFO - Epoch 203 - TRAIN - Minibatch 0: weight_norm_model: 143.882462 loss: 0.105320 grad_norm_before_clip: 9.456820 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 06:11:01,006 - TRAIN-LOGGER - INFO - Epoch 203 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.882462 weight_norm_u: 25.218954 loss: 0.105320 grad_norm_before_clip: 9.456820 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 06:11:01,007 - TRAIN-LOGGER - INFO - Epoch 203 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.882507 weight_norm_u: 25.222990 loss: 0.070960 +RANK_0 - 2026-01-29 06:11:06,090 - TRAIN-LOGGER - INFO - Epoch 204 - TRAIN - Minibatch 0: weight_norm_model: 143.882507 loss: 0.112817 grad_norm_before_clip: 8.145647 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 06:11:07,262 - TRAIN-LOGGER - INFO - Epoch 204 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.882507 weight_norm_u: 25.218954 loss: 0.112817 grad_norm_before_clip: 8.145647 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 06:11:07,262 - TRAIN-LOGGER - INFO - Epoch 204 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.882538 weight_norm_u: 25.222990 loss: 0.061096 +RANK_0 - 2026-01-29 06:11:12,170 - TRAIN-LOGGER - INFO - Epoch 205 - TRAIN - Minibatch 0: weight_norm_model: 143.882538 loss: 0.079729 grad_norm_before_clip: 5.046020 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 06:11:13,348 - TRAIN-LOGGER - INFO - Epoch 205 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.882538 weight_norm_u: 25.218954 loss: 0.079729 grad_norm_before_clip: 5.046020 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 06:11:13,348 - TRAIN-LOGGER - INFO - Epoch 205 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.882538 weight_norm_u: 25.222990 loss: 0.070636 +RANK_0 - 2026-01-29 06:11:17,982 - TRAIN-LOGGER - INFO - Epoch 206 - TRAIN - Minibatch 0: weight_norm_model: 143.882538 loss: 0.101154 grad_norm_before_clip: 7.432445 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 06:11:19,090 - TRAIN-LOGGER - INFO - Epoch 206 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.882538 weight_norm_u: 25.218954 loss: 0.101154 grad_norm_before_clip: 7.432445 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 06:11:19,090 - TRAIN-LOGGER - INFO - Epoch 206 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.882538 weight_norm_u: 25.222990 loss: 0.074133 +RANK_0 - 2026-01-29 06:11:23,918 - TRAIN-LOGGER - INFO - Epoch 207 - TRAIN - Minibatch 0: weight_norm_model: 143.882538 loss: 0.097196 grad_norm_before_clip: 5.714380 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 06:11:25,042 - TRAIN-LOGGER - INFO - Epoch 207 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.882538 weight_norm_u: 25.218954 loss: 0.097196 grad_norm_before_clip: 5.714380 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 06:11:25,042 - TRAIN-LOGGER - INFO - Epoch 207 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.882523 weight_norm_u: 25.222990 loss: 0.068900 +RANK_0 - 2026-01-29 06:11:29,253 - TRAIN-LOGGER - INFO - Epoch 208 - TRAIN - Minibatch 0: weight_norm_model: 143.882523 loss: 0.086572 grad_norm_before_clip: 4.269865 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 06:11:30,432 - TRAIN-LOGGER - INFO - Epoch 208 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.882523 weight_norm_u: 25.218954 loss: 0.086572 grad_norm_before_clip: 4.269865 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 06:11:30,432 - TRAIN-LOGGER - INFO - Epoch 208 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.882507 weight_norm_u: 25.222990 loss: 0.063288 +RANK_0 - 2026-01-29 06:11:35,191 - TRAIN-LOGGER - INFO - Epoch 209 - TRAIN - Minibatch 0: weight_norm_model: 143.882507 loss: 0.094755 grad_norm_before_clip: 4.435645 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 06:11:36,333 - TRAIN-LOGGER - INFO - Epoch 209 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.882507 weight_norm_u: 25.218954 loss: 0.094755 grad_norm_before_clip: 4.435645 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 06:11:36,333 - TRAIN-LOGGER - INFO - Epoch 209 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.882492 weight_norm_u: 25.222990 loss: 0.056494 +RANK_0 - 2026-01-29 06:11:41,188 - TRAIN-LOGGER - INFO - Epoch 210 - TRAIN - Minibatch 0: weight_norm_model: 143.882492 loss: 0.074480 grad_norm_before_clip: 5.153675 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 06:11:42,297 - TRAIN-LOGGER - INFO - Epoch 210 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.882492 weight_norm_u: 25.218954 loss: 0.074480 grad_norm_before_clip: 5.153675 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 06:11:42,297 - TRAIN-LOGGER - INFO - Epoch 210 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.882492 weight_norm_u: 25.222990 loss: 0.052148 +RANK_0 - 2026-01-29 06:11:47,195 - TRAIN-LOGGER - INFO - Epoch 211 - TRAIN - Minibatch 0: weight_norm_model: 143.882492 loss: 0.082617 grad_norm_before_clip: 2.546691 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 06:11:48,299 - TRAIN-LOGGER - INFO - Epoch 211 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.882492 weight_norm_u: 25.218954 loss: 0.082617 grad_norm_before_clip: 2.546691 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 06:11:48,299 - TRAIN-LOGGER - INFO - Epoch 211 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.882507 weight_norm_u: 25.222990 loss: 0.054638 +RANK_0 - 2026-01-29 06:11:52,692 - TRAIN-LOGGER - INFO - Epoch 212 - TRAIN - Minibatch 0: weight_norm_model: 143.882507 loss: 0.092122 grad_norm_before_clip: 2.613146 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 06:11:53,863 - TRAIN-LOGGER - INFO - Epoch 212 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.882507 weight_norm_u: 25.218954 loss: 0.092122 grad_norm_before_clip: 2.613146 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 06:11:53,864 - TRAIN-LOGGER - INFO - Epoch 212 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.882507 weight_norm_u: 25.222990 loss: 0.056631 +RANK_0 - 2026-01-29 06:11:58,712 - TRAIN-LOGGER - INFO - Epoch 213 - TRAIN - Minibatch 0: weight_norm_model: 143.882507 loss: 0.090432 grad_norm_before_clip: 4.997403 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 06:11:59,820 - TRAIN-LOGGER - INFO - Epoch 213 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.882507 weight_norm_u: 25.218954 loss: 0.090432 grad_norm_before_clip: 4.997403 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 06:11:59,820 - TRAIN-LOGGER - INFO - Epoch 213 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.882507 weight_norm_u: 25.222990 loss: 0.060380 +RANK_0 - 2026-01-29 06:12:04,400 - TRAIN-LOGGER - INFO - Epoch 214 - TRAIN - Minibatch 0: weight_norm_model: 143.882507 loss: 0.085219 grad_norm_before_clip: 4.607562 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 06:12:05,504 - TRAIN-LOGGER - INFO - Epoch 214 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.882507 weight_norm_u: 25.218954 loss: 0.085219 grad_norm_before_clip: 4.607562 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 06:12:05,504 - TRAIN-LOGGER - INFO - Epoch 214 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.882523 weight_norm_u: 25.222990 loss: 0.060513 +RANK_0 - 2026-01-29 06:12:10,173 - TRAIN-LOGGER - INFO - Epoch 215 - TRAIN - Minibatch 0: weight_norm_model: 143.882523 loss: 0.082793 grad_norm_before_clip: 3.463787 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 06:12:11,259 - TRAIN-LOGGER - INFO - Epoch 215 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.882523 weight_norm_u: 25.218954 loss: 0.082793 grad_norm_before_clip: 3.463787 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 06:12:11,259 - TRAIN-LOGGER - INFO - Epoch 215 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.882523 weight_norm_u: 25.222990 loss: 0.056925 +RANK_0 - 2026-01-29 06:12:15,638 - TRAIN-LOGGER - INFO - Epoch 216 - TRAIN - Minibatch 0: weight_norm_model: 143.882523 loss: 0.074711 grad_norm_before_clip: 5.011795 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 06:12:16,830 - TRAIN-LOGGER - INFO - Epoch 216 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.882523 weight_norm_u: 25.218954 loss: 0.074711 grad_norm_before_clip: 5.011795 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 06:12:16,830 - TRAIN-LOGGER - INFO - Epoch 216 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.882523 weight_norm_u: 25.222990 loss: 0.051724 +RANK_0 - 2026-01-29 06:12:21,692 - TRAIN-LOGGER - INFO - Epoch 217 - TRAIN - Minibatch 0: weight_norm_model: 143.882523 loss: 0.080707 grad_norm_before_clip: 2.874346 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 06:12:22,795 - TRAIN-LOGGER - INFO - Epoch 217 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.882523 weight_norm_u: 25.218954 loss: 0.080707 grad_norm_before_clip: 2.874346 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 06:12:22,795 - TRAIN-LOGGER - INFO - Epoch 217 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.882553 weight_norm_u: 25.222990 loss: 0.052635 +RANK_0 - 2026-01-29 06:12:27,536 - TRAIN-LOGGER - INFO - Epoch 218 - TRAIN - Minibatch 0: weight_norm_model: 143.882553 loss: 0.069831 grad_norm_before_clip: 2.959546 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 06:12:28,748 - TRAIN-LOGGER - INFO - Epoch 218 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.882553 weight_norm_u: 25.218954 loss: 0.069831 grad_norm_before_clip: 2.959546 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 06:12:28,748 - TRAIN-LOGGER - INFO - Epoch 218 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.882553 weight_norm_u: 25.222990 loss: 0.055083 +RANK_0 - 2026-01-29 06:12:33,546 - TRAIN-LOGGER - INFO - Epoch 219 - TRAIN - Minibatch 0: weight_norm_model: 143.882553 loss: 0.084411 grad_norm_before_clip: 3.362638 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 06:12:34,728 - TRAIN-LOGGER - INFO - Epoch 219 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.882553 weight_norm_u: 25.218954 loss: 0.084411 grad_norm_before_clip: 3.362638 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 06:12:34,728 - TRAIN-LOGGER - INFO - Epoch 219 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.882553 weight_norm_u: 25.222990 loss: 0.057342 +RANK_0 - 2026-01-29 06:12:39,577 - TRAIN-LOGGER - INFO - Epoch 220 - TRAIN - Minibatch 0: weight_norm_model: 143.882553 loss: 0.087868 grad_norm_before_clip: 5.118343 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 06:12:40,693 - TRAIN-LOGGER - INFO - Epoch 220 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.882553 weight_norm_u: 25.218954 loss: 0.087868 grad_norm_before_clip: 5.118343 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 06:12:40,693 - TRAIN-LOGGER - INFO - Epoch 220 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.882553 weight_norm_u: 25.222990 loss: 0.056489 +RANK_0 - 2026-01-29 06:12:45,522 - TRAIN-LOGGER - INFO - Epoch 221 - TRAIN - Minibatch 0: weight_norm_model: 143.882553 loss: 0.078224 grad_norm_before_clip: 4.406193 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 06:12:46,739 - TRAIN-LOGGER - INFO - Epoch 221 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.882553 weight_norm_u: 25.218954 loss: 0.078224 grad_norm_before_clip: 4.406193 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 06:12:46,739 - TRAIN-LOGGER - INFO - Epoch 221 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.882553 weight_norm_u: 25.222990 loss: 0.054026 +RANK_0 - 2026-01-29 06:12:51,756 - TRAIN-LOGGER - INFO - Epoch 222 - TRAIN - Minibatch 0: weight_norm_model: 143.882553 loss: 0.076211 grad_norm_before_clip: 5.060658 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 06:12:52,912 - TRAIN-LOGGER - INFO - Epoch 222 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.882553 weight_norm_u: 25.218954 loss: 0.076211 grad_norm_before_clip: 5.060658 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 06:12:52,912 - TRAIN-LOGGER - INFO - Epoch 222 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.882553 weight_norm_u: 25.222990 loss: 0.051684 +RANK_0 - 2026-01-29 06:12:58,102 - TRAIN-LOGGER - INFO - Epoch 223 - TRAIN - Minibatch 0: weight_norm_model: 143.882553 loss: 0.074369 grad_norm_before_clip: 1.752375 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 06:12:59,349 - TRAIN-LOGGER - INFO - Epoch 223 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.882553 weight_norm_u: 25.218954 loss: 0.074369 grad_norm_before_clip: 1.752375 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 06:12:59,349 - TRAIN-LOGGER - INFO - Epoch 223 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.882568 weight_norm_u: 25.222990 loss: 0.050607 +RANK_0 - 2026-01-29 06:13:04,303 - TRAIN-LOGGER - INFO - Epoch 224 - TRAIN - Minibatch 0: weight_norm_model: 143.882568 loss: 0.089732 grad_norm_before_clip: 6.881398 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 06:13:05,469 - TRAIN-LOGGER - INFO - Epoch 224 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.882568 weight_norm_u: 25.218954 loss: 0.089732 grad_norm_before_clip: 6.881398 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 06:13:05,469 - TRAIN-LOGGER - INFO - Epoch 224 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.882568 weight_norm_u: 25.222990 loss: 0.050499 +RANK_0 - 2026-01-29 06:13:10,487 - TRAIN-LOGGER - INFO - Epoch 225 - TRAIN - Minibatch 0: weight_norm_model: 143.882568 loss: 0.080581 grad_norm_before_clip: 4.698662 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 06:13:11,682 - TRAIN-LOGGER - INFO - Epoch 225 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.882568 weight_norm_u: 25.218954 loss: 0.080581 grad_norm_before_clip: 4.698662 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 06:13:11,682 - TRAIN-LOGGER - INFO - Epoch 225 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.882568 weight_norm_u: 25.222990 loss: 0.050999 +RANK_0 - 2026-01-29 06:13:16,553 - TRAIN-LOGGER - INFO - Epoch 226 - TRAIN - Minibatch 0: weight_norm_model: 143.882568 loss: 0.081968 grad_norm_before_clip: 7.091703 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 06:13:17,720 - TRAIN-LOGGER - INFO - Epoch 226 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.882568 weight_norm_u: 25.218954 loss: 0.081968 grad_norm_before_clip: 7.091703 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 06:13:17,721 - TRAIN-LOGGER - INFO - Epoch 226 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.882553 weight_norm_u: 25.222990 loss: 0.049743 +RANK_0 - 2026-01-29 06:13:22,661 - TRAIN-LOGGER - INFO - Epoch 227 - TRAIN - Minibatch 0: weight_norm_model: 143.882553 loss: 0.078096 grad_norm_before_clip: 3.630522 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 06:13:23,747 - TRAIN-LOGGER - INFO - Epoch 227 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.882553 weight_norm_u: 25.218954 loss: 0.078096 grad_norm_before_clip: 3.630522 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 06:13:23,747 - TRAIN-LOGGER - INFO - Epoch 227 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.882553 weight_norm_u: 25.222990 loss: 0.047850 +RANK_0 - 2026-01-29 06:13:28,156 - TRAIN-LOGGER - INFO - Epoch 228 - TRAIN - Minibatch 0: weight_norm_model: 143.882553 loss: 0.068410 grad_norm_before_clip: 6.558546 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 06:13:29,264 - TRAIN-LOGGER - INFO - Epoch 228 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.882553 weight_norm_u: 25.218954 loss: 0.068410 grad_norm_before_clip: 6.558546 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 06:13:29,264 - TRAIN-LOGGER - INFO - Epoch 228 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.882568 weight_norm_u: 25.222990 loss: 0.048319 +RANK_0 - 2026-01-29 06:13:34,035 - TRAIN-LOGGER - INFO - Epoch 229 - TRAIN - Minibatch 0: weight_norm_model: 143.882568 loss: 0.078961 grad_norm_before_clip: 5.426413 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 06:13:35,150 - TRAIN-LOGGER - INFO - Epoch 229 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.882568 weight_norm_u: 25.218954 loss: 0.078961 grad_norm_before_clip: 5.426413 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 06:13:35,150 - TRAIN-LOGGER - INFO - Epoch 229 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.882568 weight_norm_u: 25.222990 loss: 0.048539 +RANK_0 - 2026-01-29 06:13:39,891 - TRAIN-LOGGER - INFO - Epoch 230 - TRAIN - Minibatch 0: weight_norm_model: 143.882568 loss: 0.073618 grad_norm_before_clip: 3.015783 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 06:13:41,023 - TRAIN-LOGGER - INFO - Epoch 230 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.882568 weight_norm_u: 25.218954 loss: 0.073618 grad_norm_before_clip: 3.015783 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 06:13:41,023 - TRAIN-LOGGER - INFO - Epoch 230 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.882584 weight_norm_u: 25.222990 loss: 0.050257 +RANK_0 - 2026-01-29 06:13:46,068 - TRAIN-LOGGER - INFO - Epoch 231 - TRAIN - Minibatch 0: weight_norm_model: 143.882584 loss: 0.064835 grad_norm_before_clip: 5.313970 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 06:13:47,291 - TRAIN-LOGGER - INFO - Epoch 231 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.882584 weight_norm_u: 25.218954 loss: 0.064835 grad_norm_before_clip: 5.313970 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 06:13:47,292 - TRAIN-LOGGER - INFO - Epoch 231 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.882599 weight_norm_u: 25.222990 loss: 0.051728 +RANK_0 - 2026-01-29 06:13:52,088 - TRAIN-LOGGER - INFO - Epoch 232 - TRAIN - Minibatch 0: weight_norm_model: 143.882599 loss: 0.075073 grad_norm_before_clip: 5.025896 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 06:13:53,203 - TRAIN-LOGGER - INFO - Epoch 232 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.882599 weight_norm_u: 25.218954 loss: 0.075073 grad_norm_before_clip: 5.025896 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 06:13:53,203 - TRAIN-LOGGER - INFO - Epoch 232 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.882614 weight_norm_u: 25.222990 loss: 0.054744 +RANK_0 - 2026-01-29 06:13:58,286 - TRAIN-LOGGER - INFO - Epoch 233 - TRAIN - Minibatch 0: weight_norm_model: 143.882614 loss: 0.074072 grad_norm_before_clip: 7.389863 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 06:13:59,431 - TRAIN-LOGGER - INFO - Epoch 233 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.882614 weight_norm_u: 25.218954 loss: 0.074072 grad_norm_before_clip: 7.389863 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 06:13:59,431 - TRAIN-LOGGER - INFO - Epoch 233 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.882629 weight_norm_u: 25.222990 loss: 0.057397 +RANK_0 - 2026-01-29 06:14:04,512 - TRAIN-LOGGER - INFO - Epoch 234 - TRAIN - Minibatch 0: weight_norm_model: 143.882629 loss: 0.090834 grad_norm_before_clip: 6.880458 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 06:14:05,725 - TRAIN-LOGGER - INFO - Epoch 234 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.882629 weight_norm_u: 25.218954 loss: 0.090834 grad_norm_before_clip: 6.880458 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 06:14:05,725 - TRAIN-LOGGER - INFO - Epoch 234 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.882629 weight_norm_u: 25.222990 loss: 0.054754 +RANK_0 - 2026-01-29 06:14:10,074 - TRAIN-LOGGER - INFO - Epoch 235 - TRAIN - Minibatch 0: weight_norm_model: 143.882629 loss: 0.084786 grad_norm_before_clip: 4.414435 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 06:14:11,262 - TRAIN-LOGGER - INFO - Epoch 235 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.882629 weight_norm_u: 25.218954 loss: 0.084786 grad_norm_before_clip: 4.414435 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 06:14:11,263 - TRAIN-LOGGER - INFO - Epoch 235 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.882645 weight_norm_u: 25.222990 loss: 0.049171 +RANK_0 - 2026-01-29 06:14:16,246 - TRAIN-LOGGER - INFO - Epoch 236 - TRAIN - Minibatch 0: weight_norm_model: 143.882645 loss: 0.065086 grad_norm_before_clip: 2.746821 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 06:14:17,465 - TRAIN-LOGGER - INFO - Epoch 236 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.882645 weight_norm_u: 25.218954 loss: 0.065086 grad_norm_before_clip: 2.746821 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 06:14:17,465 - TRAIN-LOGGER - INFO - Epoch 236 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.882660 weight_norm_u: 25.222990 loss: 0.050318 +RANK_0 - 2026-01-29 06:14:22,350 - TRAIN-LOGGER - INFO - Epoch 237 - TRAIN - Minibatch 0: weight_norm_model: 143.882660 loss: 0.081385 grad_norm_before_clip: 5.134715 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 06:14:23,450 - TRAIN-LOGGER - INFO - Epoch 237 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.882660 weight_norm_u: 25.218954 loss: 0.081385 grad_norm_before_clip: 5.134715 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 06:14:23,450 - TRAIN-LOGGER - INFO - Epoch 237 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.882660 weight_norm_u: 25.222990 loss: 0.053264 +RANK_0 - 2026-01-29 06:14:28,463 - TRAIN-LOGGER - INFO - Epoch 238 - TRAIN - Minibatch 0: weight_norm_model: 143.882660 loss: 0.077270 grad_norm_before_clip: 5.571516 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 06:14:29,657 - TRAIN-LOGGER - INFO - Epoch 238 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.882660 weight_norm_u: 25.218954 loss: 0.077270 grad_norm_before_clip: 5.571516 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 06:14:29,658 - TRAIN-LOGGER - INFO - Epoch 238 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.882660 weight_norm_u: 25.222990 loss: 0.055903 +RANK_0 - 2026-01-29 06:14:34,518 - TRAIN-LOGGER - INFO - Epoch 239 - TRAIN - Minibatch 0: weight_norm_model: 143.882660 loss: 0.070487 grad_norm_before_clip: 7.238018 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 06:14:35,710 - TRAIN-LOGGER - INFO - Epoch 239 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.882660 weight_norm_u: 25.218954 loss: 0.070487 grad_norm_before_clip: 7.238018 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 06:14:35,710 - TRAIN-LOGGER - INFO - Epoch 239 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.882645 weight_norm_u: 25.222990 loss: 0.058092 +RANK_0 - 2026-01-29 06:14:40,730 - TRAIN-LOGGER - INFO - Epoch 240 - TRAIN - Minibatch 0: weight_norm_model: 143.882645 loss: 0.073484 grad_norm_before_clip: 6.472335 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 06:14:41,883 - TRAIN-LOGGER - INFO - Epoch 240 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.882645 weight_norm_u: 25.218954 loss: 0.073484 grad_norm_before_clip: 6.472335 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 06:14:41,883 - TRAIN-LOGGER - INFO - Epoch 240 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.882645 weight_norm_u: 25.222990 loss: 0.058032 +RANK_0 - 2026-01-29 06:14:47,088 - TRAIN-LOGGER - INFO - Epoch 241 - TRAIN - Minibatch 0: weight_norm_model: 143.882645 loss: 0.094773 grad_norm_before_clip: 6.892994 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 06:14:48,470 - TRAIN-LOGGER - INFO - Epoch 241 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.882645 weight_norm_u: 25.218954 loss: 0.094773 grad_norm_before_clip: 6.892994 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 06:14:48,470 - TRAIN-LOGGER - INFO - Epoch 241 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.882645 weight_norm_u: 25.222990 loss: 0.054370 +RANK_0 - 2026-01-29 06:14:53,334 - TRAIN-LOGGER - INFO - Epoch 242 - TRAIN - Minibatch 0: weight_norm_model: 143.882645 loss: 0.076949 grad_norm_before_clip: 6.326024 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 06:14:54,602 - TRAIN-LOGGER - INFO - Epoch 242 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.882645 weight_norm_u: 25.218954 loss: 0.076949 grad_norm_before_clip: 6.326024 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 06:14:54,602 - TRAIN-LOGGER - INFO - Epoch 242 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.882675 weight_norm_u: 25.222990 loss: 0.048184 +RANK_0 - 2026-01-29 06:14:59,609 - TRAIN-LOGGER - INFO - Epoch 243 - TRAIN - Minibatch 0: weight_norm_model: 143.882675 loss: 0.075502 grad_norm_before_clip: 4.285368 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 06:15:00,844 - TRAIN-LOGGER - INFO - Epoch 243 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.882675 weight_norm_u: 25.218954 loss: 0.075502 grad_norm_before_clip: 4.285368 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 06:15:00,845 - TRAIN-LOGGER - INFO - Epoch 243 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.882690 weight_norm_u: 25.222990 loss: 0.043576 +RANK_0 - 2026-01-29 06:15:06,191 - TRAIN-LOGGER - INFO - Epoch 244 - TRAIN - Minibatch 0: weight_norm_model: 143.882690 loss: 0.061144 grad_norm_before_clip: 1.525608 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 06:15:07,418 - TRAIN-LOGGER - INFO - Epoch 244 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.882690 weight_norm_u: 25.218954 loss: 0.061144 grad_norm_before_clip: 1.525608 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 06:15:07,418 - TRAIN-LOGGER - INFO - Epoch 244 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.882736 weight_norm_u: 25.222990 loss: 0.052266 +RANK_0 - 2026-01-29 06:15:12,267 - TRAIN-LOGGER - INFO - Epoch 245 - TRAIN - Minibatch 0: weight_norm_model: 143.882736 loss: 0.066736 grad_norm_before_clip: 6.139614 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 06:15:13,515 - TRAIN-LOGGER - INFO - Epoch 245 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.882736 weight_norm_u: 25.218954 loss: 0.066736 grad_norm_before_clip: 6.139614 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 06:15:13,515 - TRAIN-LOGGER - INFO - Epoch 245 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.882751 weight_norm_u: 25.222990 loss: 0.061255 +RANK_0 - 2026-01-29 06:15:18,564 - TRAIN-LOGGER - INFO - Epoch 246 - TRAIN - Minibatch 0: weight_norm_model: 143.882751 loss: 0.069133 grad_norm_before_clip: 4.895175 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 06:15:19,735 - TRAIN-LOGGER - INFO - Epoch 246 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.882751 weight_norm_u: 25.218954 loss: 0.069133 grad_norm_before_clip: 4.895175 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 06:15:19,735 - TRAIN-LOGGER - INFO - Epoch 246 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.882767 weight_norm_u: 25.222990 loss: 0.065742 +RANK_0 - 2026-01-29 06:15:24,985 - TRAIN-LOGGER - INFO - Epoch 247 - TRAIN - Minibatch 0: weight_norm_model: 143.882767 loss: 0.100201 grad_norm_before_clip: 11.125077 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 06:15:26,213 - TRAIN-LOGGER - INFO - Epoch 247 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.882767 weight_norm_u: 25.218954 loss: 0.100201 grad_norm_before_clip: 11.125077 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 06:15:26,213 - TRAIN-LOGGER - INFO - Epoch 247 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.882751 weight_norm_u: 25.222990 loss: 0.063628 +RANK_0 - 2026-01-29 06:15:31,170 - TRAIN-LOGGER - INFO - Epoch 248 - TRAIN - Minibatch 0: weight_norm_model: 143.882751 loss: 0.069397 grad_norm_before_clip: 6.412019 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 06:15:32,326 - TRAIN-LOGGER - INFO - Epoch 248 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.882751 weight_norm_u: 25.218954 loss: 0.069397 grad_norm_before_clip: 6.412019 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 06:15:32,326 - TRAIN-LOGGER - INFO - Epoch 248 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.882736 weight_norm_u: 25.222990 loss: 0.055575 +RANK_0 - 2026-01-29 06:15:37,806 - TRAIN-LOGGER - INFO - Epoch 249 - TRAIN - Minibatch 0: weight_norm_model: 143.882736 loss: 0.076954 grad_norm_before_clip: 5.437313 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 06:15:39,046 - TRAIN-LOGGER - INFO - Epoch 249 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.882736 weight_norm_u: 25.218954 loss: 0.076954 grad_norm_before_clip: 5.437313 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 06:15:39,046 - TRAIN-LOGGER - INFO - Epoch 249 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.882721 weight_norm_u: 25.222990 loss: 0.048524 +RANK_0 - 2026-01-29 06:15:43,962 - TRAIN-LOGGER - INFO - Epoch 250 - TRAIN - Minibatch 0: weight_norm_model: 143.882721 loss: 0.071913 grad_norm_before_clip: 3.722538 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 06:15:45,155 - TRAIN-LOGGER - INFO - Epoch 250 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.882721 weight_norm_u: 25.218954 loss: 0.071913 grad_norm_before_clip: 3.722538 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 06:15:45,156 - TRAIN-LOGGER - INFO - Epoch 250 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.882706 weight_norm_u: 25.222990 loss: 0.048053 +RANK_0 - 2026-01-29 06:15:50,425 - TRAIN-LOGGER - INFO - Epoch 251 - TRAIN - Minibatch 0: weight_norm_model: 143.882706 loss: 0.072103 grad_norm_before_clip: 2.852268 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 06:15:51,711 - TRAIN-LOGGER - INFO - Epoch 251 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.882706 weight_norm_u: 25.218954 loss: 0.072103 grad_norm_before_clip: 2.852268 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 06:15:51,712 - TRAIN-LOGGER - INFO - Epoch 251 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.882706 weight_norm_u: 25.222990 loss: 0.051622 +RANK_0 - 2026-01-29 06:15:56,917 - TRAIN-LOGGER - INFO - Epoch 252 - TRAIN - Minibatch 0: weight_norm_model: 143.882706 loss: 0.084275 grad_norm_before_clip: 6.235590 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 06:15:58,210 - TRAIN-LOGGER - INFO - Epoch 252 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.882706 weight_norm_u: 25.218954 loss: 0.084275 grad_norm_before_clip: 6.235590 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 06:15:58,210 - TRAIN-LOGGER - INFO - Epoch 252 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.882721 weight_norm_u: 25.222990 loss: 0.053348 +RANK_0 - 2026-01-29 06:16:03,287 - TRAIN-LOGGER - INFO - Epoch 253 - TRAIN - Minibatch 0: weight_norm_model: 143.882721 loss: 0.083830 grad_norm_before_clip: 8.129601 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 06:16:04,689 - TRAIN-LOGGER - INFO - Epoch 253 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.882721 weight_norm_u: 25.218954 loss: 0.083830 grad_norm_before_clip: 8.129601 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 06:16:04,690 - TRAIN-LOGGER - INFO - Epoch 253 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.882751 weight_norm_u: 25.222990 loss: 0.053266 +RANK_0 - 2026-01-29 06:16:10,222 - TRAIN-LOGGER - INFO - Epoch 254 - TRAIN - Minibatch 0: weight_norm_model: 143.882751 loss: 0.086835 grad_norm_before_clip: 6.597581 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 06:16:11,518 - TRAIN-LOGGER - INFO - Epoch 254 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.882751 weight_norm_u: 25.218954 loss: 0.086835 grad_norm_before_clip: 6.597581 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 06:16:11,519 - TRAIN-LOGGER - INFO - Epoch 254 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.882797 weight_norm_u: 25.222990 loss: 0.052373 +RANK_0 - 2026-01-29 06:16:16,173 - TRAIN-LOGGER - INFO - Epoch 255 - TRAIN - Minibatch 0: weight_norm_model: 143.882797 loss: 0.081515 grad_norm_before_clip: 5.767548 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 06:16:17,353 - TRAIN-LOGGER - INFO - Epoch 255 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.882797 weight_norm_u: 25.218954 loss: 0.081515 grad_norm_before_clip: 5.767548 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 06:16:17,353 - TRAIN-LOGGER - INFO - Epoch 255 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.882828 weight_norm_u: 25.222990 loss: 0.052094 +RANK_0 - 2026-01-29 06:16:23,037 - TRAIN-LOGGER - INFO - Epoch 256 - TRAIN - Minibatch 0: weight_norm_model: 143.882828 loss: 0.076157 grad_norm_before_clip: 5.255727 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 06:16:24,210 - TRAIN-LOGGER - INFO - Epoch 256 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.882828 weight_norm_u: 25.218954 loss: 0.076157 grad_norm_before_clip: 5.255727 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 06:16:24,210 - TRAIN-LOGGER - INFO - Epoch 256 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.882858 weight_norm_u: 25.222990 loss: 0.051741 +RANK_0 - 2026-01-29 06:16:29,400 - TRAIN-LOGGER - INFO - Epoch 257 - TRAIN - Minibatch 0: weight_norm_model: 143.882858 loss: 0.069037 grad_norm_before_clip: 8.929213 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 06:16:30,683 - TRAIN-LOGGER - INFO - Epoch 257 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.882858 weight_norm_u: 25.218954 loss: 0.069037 grad_norm_before_clip: 8.929213 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 06:16:30,683 - TRAIN-LOGGER - INFO - Epoch 257 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.882843 weight_norm_u: 25.222990 loss: 0.048277 +RANK_0 - 2026-01-29 06:16:35,959 - TRAIN-LOGGER - INFO - Epoch 258 - TRAIN - Minibatch 0: weight_norm_model: 143.882843 loss: 0.071508 grad_norm_before_clip: 5.510832 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 06:16:37,253 - TRAIN-LOGGER - INFO - Epoch 258 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.882843 weight_norm_u: 25.218954 loss: 0.071508 grad_norm_before_clip: 5.510832 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 06:16:37,253 - TRAIN-LOGGER - INFO - Epoch 258 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.882843 weight_norm_u: 25.222990 loss: 0.044374 +RANK_0 - 2026-01-29 06:16:42,556 - TRAIN-LOGGER - INFO - Epoch 259 - TRAIN - Minibatch 0: weight_norm_model: 143.882843 loss: 0.063023 grad_norm_before_clip: 5.015406 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 06:16:43,791 - TRAIN-LOGGER - INFO - Epoch 259 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.882843 weight_norm_u: 25.218954 loss: 0.063023 grad_norm_before_clip: 5.015406 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 06:16:43,791 - TRAIN-LOGGER - INFO - Epoch 259 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.882828 weight_norm_u: 25.222990 loss: 0.044317 +RANK_0 - 2026-01-29 06:16:48,960 - TRAIN-LOGGER - INFO - Epoch 260 - TRAIN - Minibatch 0: weight_norm_model: 143.882828 loss: 0.066364 grad_norm_before_clip: 5.672312 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 06:16:50,187 - TRAIN-LOGGER - INFO - Epoch 260 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.882828 weight_norm_u: 25.218954 loss: 0.066364 grad_norm_before_clip: 5.672312 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 06:16:50,187 - TRAIN-LOGGER - INFO - Epoch 260 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.882812 weight_norm_u: 25.222990 loss: 0.045488 +RANK_0 - 2026-01-29 06:16:55,668 - TRAIN-LOGGER - INFO - Epoch 261 - TRAIN - Minibatch 0: weight_norm_model: 143.882812 loss: 0.070445 grad_norm_before_clip: 3.828708 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 06:16:56,838 - TRAIN-LOGGER - INFO - Epoch 261 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.882812 weight_norm_u: 25.218954 loss: 0.070445 grad_norm_before_clip: 3.828708 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 06:16:56,838 - TRAIN-LOGGER - INFO - Epoch 261 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.882797 weight_norm_u: 25.222990 loss: 0.047850 +RANK_0 - 2026-01-29 06:17:02,052 - TRAIN-LOGGER - INFO - Epoch 262 - TRAIN - Minibatch 0: weight_norm_model: 143.882797 loss: 0.065157 grad_norm_before_clip: 5.619667 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 06:17:03,370 - TRAIN-LOGGER - INFO - Epoch 262 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.882797 weight_norm_u: 25.218954 loss: 0.065157 grad_norm_before_clip: 5.619667 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 06:17:03,370 - TRAIN-LOGGER - INFO - Epoch 262 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.882812 weight_norm_u: 25.222990 loss: 0.047176 +RANK_0 - 2026-01-29 06:17:08,519 - TRAIN-LOGGER - INFO - Epoch 263 - TRAIN - Minibatch 0: weight_norm_model: 143.882812 loss: 0.071667 grad_norm_before_clip: 5.452256 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 06:17:09,748 - TRAIN-LOGGER - INFO - Epoch 263 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.882812 weight_norm_u: 25.218954 loss: 0.071667 grad_norm_before_clip: 5.452256 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 06:17:09,748 - TRAIN-LOGGER - INFO - Epoch 263 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.882812 weight_norm_u: 25.222990 loss: 0.043920 +RANK_0 - 2026-01-29 06:17:15,608 - TRAIN-LOGGER - INFO - Epoch 264 - TRAIN - Minibatch 0: weight_norm_model: 143.882812 loss: 0.069269 grad_norm_before_clip: 4.345649 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 06:17:16,838 - TRAIN-LOGGER - INFO - Epoch 264 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.882812 weight_norm_u: 25.218954 loss: 0.069269 grad_norm_before_clip: 4.345649 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 06:17:16,838 - TRAIN-LOGGER - INFO - Epoch 264 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.882858 weight_norm_u: 25.222990 loss: 0.043085 +RANK_0 - 2026-01-29 06:17:22,417 - TRAIN-LOGGER - INFO - Epoch 265 - TRAIN - Minibatch 0: weight_norm_model: 143.882858 loss: 0.081125 grad_norm_before_clip: 4.339257 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 06:17:23,728 - TRAIN-LOGGER - INFO - Epoch 265 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.882858 weight_norm_u: 25.218954 loss: 0.081125 grad_norm_before_clip: 4.339257 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 06:17:23,728 - TRAIN-LOGGER - INFO - Epoch 265 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.882874 weight_norm_u: 25.222990 loss: 0.045340 +RANK_0 - 2026-01-29 06:17:29,054 - TRAIN-LOGGER - INFO - Epoch 266 - TRAIN - Minibatch 0: weight_norm_model: 143.882874 loss: 0.072972 grad_norm_before_clip: 4.804296 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 06:17:30,259 - TRAIN-LOGGER - INFO - Epoch 266 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.882874 weight_norm_u: 25.218954 loss: 0.072972 grad_norm_before_clip: 4.804296 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 06:17:30,259 - TRAIN-LOGGER - INFO - Epoch 266 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.882919 weight_norm_u: 25.222990 loss: 0.054108 +RANK_0 - 2026-01-29 06:17:35,311 - TRAIN-LOGGER - INFO - Epoch 267 - TRAIN - Minibatch 0: weight_norm_model: 143.882919 loss: 0.084153 grad_norm_before_clip: 10.614285 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 06:17:36,553 - TRAIN-LOGGER - INFO - Epoch 267 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.882919 weight_norm_u: 25.218954 loss: 0.084153 grad_norm_before_clip: 10.614285 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 06:17:36,553 - TRAIN-LOGGER - INFO - Epoch 267 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.882935 weight_norm_u: 25.222990 loss: 0.058378 +RANK_0 - 2026-01-29 06:17:41,504 - TRAIN-LOGGER - INFO - Epoch 268 - TRAIN - Minibatch 0: weight_norm_model: 143.882935 loss: 0.076771 grad_norm_before_clip: 10.061653 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 06:17:42,660 - TRAIN-LOGGER - INFO - Epoch 268 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.882935 weight_norm_u: 25.218954 loss: 0.076771 grad_norm_before_clip: 10.061653 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 06:17:42,660 - TRAIN-LOGGER - INFO - Epoch 268 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.882935 weight_norm_u: 25.222990 loss: 0.055684 +RANK_0 - 2026-01-29 06:17:47,892 - TRAIN-LOGGER - INFO - Epoch 269 - TRAIN - Minibatch 0: weight_norm_model: 143.882935 loss: 0.086963 grad_norm_before_clip: 9.052341 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 06:17:49,074 - TRAIN-LOGGER - INFO - Epoch 269 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.882935 weight_norm_u: 25.218954 loss: 0.086963 grad_norm_before_clip: 9.052341 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 06:17:49,074 - TRAIN-LOGGER - INFO - Epoch 269 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.882904 weight_norm_u: 25.222990 loss: 0.047490 +RANK_0 - 2026-01-29 06:17:54,221 - TRAIN-LOGGER - INFO - Epoch 270 - TRAIN - Minibatch 0: weight_norm_model: 143.882904 loss: 0.071765 grad_norm_before_clip: 4.789957 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 06:17:55,349 - TRAIN-LOGGER - INFO - Epoch 270 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.882904 weight_norm_u: 25.218954 loss: 0.071765 grad_norm_before_clip: 4.789957 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 06:17:55,350 - TRAIN-LOGGER - INFO - Epoch 270 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.882874 weight_norm_u: 25.222990 loss: 0.042613 +RANK_0 - 2026-01-29 06:18:00,704 - TRAIN-LOGGER - INFO - Epoch 271 - TRAIN - Minibatch 0: weight_norm_model: 143.882874 loss: 0.074289 grad_norm_before_clip: 2.882898 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 06:18:02,101 - TRAIN-LOGGER - INFO - Epoch 271 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.882874 weight_norm_u: 25.218954 loss: 0.074289 grad_norm_before_clip: 2.882898 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 06:18:02,101 - TRAIN-LOGGER - INFO - Epoch 271 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.882843 weight_norm_u: 25.222990 loss: 0.044262 +RANK_0 - 2026-01-29 06:18:07,839 - TRAIN-LOGGER - INFO - Epoch 272 - TRAIN - Minibatch 0: weight_norm_model: 143.882843 loss: 0.082919 grad_norm_before_clip: 5.532194 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 06:18:09,150 - TRAIN-LOGGER - INFO - Epoch 272 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.882843 weight_norm_u: 25.218954 loss: 0.082919 grad_norm_before_clip: 5.532194 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 06:18:09,151 - TRAIN-LOGGER - INFO - Epoch 272 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.882843 weight_norm_u: 25.222990 loss: 0.047170 +RANK_0 - 2026-01-29 06:18:14,218 - TRAIN-LOGGER - INFO - Epoch 273 - TRAIN - Minibatch 0: weight_norm_model: 143.882843 loss: 0.065576 grad_norm_before_clip: 6.416017 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 06:18:15,392 - TRAIN-LOGGER - INFO - Epoch 273 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.882843 weight_norm_u: 25.218954 loss: 0.065576 grad_norm_before_clip: 6.416017 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 06:18:15,393 - TRAIN-LOGGER - INFO - Epoch 273 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.882843 weight_norm_u: 25.222990 loss: 0.048714 +RANK_0 - 2026-01-29 06:18:20,033 - TRAIN-LOGGER - INFO - Epoch 274 - TRAIN - Minibatch 0: weight_norm_model: 143.882843 loss: 0.083245 grad_norm_before_clip: 6.279256 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 06:18:21,200 - TRAIN-LOGGER - INFO - Epoch 274 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.882843 weight_norm_u: 25.218954 loss: 0.083245 grad_norm_before_clip: 6.279256 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 06:18:21,200 - TRAIN-LOGGER - INFO - Epoch 274 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.882874 weight_norm_u: 25.222990 loss: 0.051403 +RANK_0 - 2026-01-29 06:18:27,170 - TRAIN-LOGGER - INFO - Epoch 275 - TRAIN - Minibatch 0: weight_norm_model: 143.882874 loss: 0.064257 grad_norm_before_clip: 5.486085 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 06:18:28,383 - TRAIN-LOGGER - INFO - Epoch 275 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.882874 weight_norm_u: 25.218954 loss: 0.064257 grad_norm_before_clip: 5.486085 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 06:18:28,384 - TRAIN-LOGGER - INFO - Epoch 275 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.882919 weight_norm_u: 25.222990 loss: 0.049827 +RANK_0 - 2026-01-29 06:18:33,747 - TRAIN-LOGGER - INFO - Epoch 276 - TRAIN - Minibatch 0: weight_norm_model: 143.882919 loss: 0.076542 grad_norm_before_clip: 6.228782 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 06:18:35,061 - TRAIN-LOGGER - INFO - Epoch 276 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.882919 weight_norm_u: 25.218954 loss: 0.076542 grad_norm_before_clip: 6.228782 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 06:18:35,061 - TRAIN-LOGGER - INFO - Epoch 276 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.882950 weight_norm_u: 25.222990 loss: 0.048809 +RANK_0 - 2026-01-29 06:18:40,240 - TRAIN-LOGGER - INFO - Epoch 277 - TRAIN - Minibatch 0: weight_norm_model: 143.882950 loss: 0.080722 grad_norm_before_clip: 3.629990 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 06:18:41,442 - TRAIN-LOGGER - INFO - Epoch 277 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.882950 weight_norm_u: 25.218954 loss: 0.080722 grad_norm_before_clip: 3.629990 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 06:18:41,443 - TRAIN-LOGGER - INFO - Epoch 277 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.882980 weight_norm_u: 25.222990 loss: 0.051993 +RANK_0 - 2026-01-29 06:18:46,679 - TRAIN-LOGGER - INFO - Epoch 278 - TRAIN - Minibatch 0: weight_norm_model: 143.882980 loss: 0.077047 grad_norm_before_clip: 5.256445 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 06:18:48,123 - TRAIN-LOGGER - INFO - Epoch 278 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.882980 weight_norm_u: 25.218954 loss: 0.077047 grad_norm_before_clip: 5.256445 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 06:18:48,124 - TRAIN-LOGGER - INFO - Epoch 278 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.882996 weight_norm_u: 25.222990 loss: 0.054372 +RANK_0 - 2026-01-29 06:18:54,356 - TRAIN-LOGGER - INFO - Epoch 279 - TRAIN - Minibatch 0: weight_norm_model: 143.882996 loss: 0.067811 grad_norm_before_clip: 5.659521 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 06:18:55,642 - TRAIN-LOGGER - INFO - Epoch 279 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.882996 weight_norm_u: 25.218954 loss: 0.067811 grad_norm_before_clip: 5.659521 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 06:18:55,642 - TRAIN-LOGGER - INFO - Epoch 279 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.882996 weight_norm_u: 25.222990 loss: 0.053037 +RANK_0 - 2026-01-29 06:19:01,346 - TRAIN-LOGGER - INFO - Epoch 280 - TRAIN - Minibatch 0: weight_norm_model: 143.882996 loss: 0.088634 grad_norm_before_clip: 6.382757 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 06:19:02,659 - TRAIN-LOGGER - INFO - Epoch 280 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.882996 weight_norm_u: 25.218954 loss: 0.088634 grad_norm_before_clip: 6.382757 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 06:19:02,660 - TRAIN-LOGGER - INFO - Epoch 280 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.882996 weight_norm_u: 25.222990 loss: 0.046473 +RANK_0 - 2026-01-29 06:19:08,091 - TRAIN-LOGGER - INFO - Epoch 281 - TRAIN - Minibatch 0: weight_norm_model: 143.882996 loss: 0.073396 grad_norm_before_clip: 6.691931 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 06:19:09,602 - TRAIN-LOGGER - INFO - Epoch 281 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.882996 weight_norm_u: 25.218954 loss: 0.073396 grad_norm_before_clip: 6.691931 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 06:19:09,602 - TRAIN-LOGGER - INFO - Epoch 281 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.882980 weight_norm_u: 25.222990 loss: 0.039945 +RANK_0 - 2026-01-29 06:19:15,740 - TRAIN-LOGGER - INFO - Epoch 282 - TRAIN - Minibatch 0: weight_norm_model: 143.882980 loss: 0.068790 grad_norm_before_clip: 2.737377 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 06:19:17,071 - TRAIN-LOGGER - INFO - Epoch 282 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.882980 weight_norm_u: 25.218954 loss: 0.068790 grad_norm_before_clip: 2.737377 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 06:19:17,072 - TRAIN-LOGGER - INFO - Epoch 282 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.882965 weight_norm_u: 25.222990 loss: 0.040241 +RANK_0 - 2026-01-29 06:19:23,890 - TRAIN-LOGGER - INFO - Epoch 283 - TRAIN - Minibatch 0: weight_norm_model: 143.882965 loss: 0.073706 grad_norm_before_clip: 4.714820 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 06:19:25,131 - TRAIN-LOGGER - INFO - Epoch 283 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.882965 weight_norm_u: 25.218954 loss: 0.073706 grad_norm_before_clip: 4.714820 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 06:19:25,131 - TRAIN-LOGGER - INFO - Epoch 283 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.882965 weight_norm_u: 25.222990 loss: 0.043453 +RANK_0 - 2026-01-29 06:19:30,881 - TRAIN-LOGGER - INFO - Epoch 284 - TRAIN - Minibatch 0: weight_norm_model: 143.882965 loss: 0.066522 grad_norm_before_clip: 4.638680 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 06:19:32,432 - TRAIN-LOGGER - INFO - Epoch 284 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.882965 weight_norm_u: 25.218954 loss: 0.066522 grad_norm_before_clip: 4.638680 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 06:19:32,432 - TRAIN-LOGGER - INFO - Epoch 284 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.882980 weight_norm_u: 25.222990 loss: 0.044407 +RANK_0 - 2026-01-29 06:19:38,615 - TRAIN-LOGGER - INFO - Epoch 285 - TRAIN - Minibatch 0: weight_norm_model: 143.882980 loss: 0.079892 grad_norm_before_clip: 4.427885 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 06:19:40,121 - TRAIN-LOGGER - INFO - Epoch 285 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.882980 weight_norm_u: 25.218954 loss: 0.079892 grad_norm_before_clip: 4.427885 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 06:19:40,121 - TRAIN-LOGGER - INFO - Epoch 285 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.882996 weight_norm_u: 25.222990 loss: 0.043046 +RANK_0 - 2026-01-29 06:19:46,109 - TRAIN-LOGGER - INFO - Epoch 286 - TRAIN - Minibatch 0: weight_norm_model: 143.882996 loss: 0.070066 grad_norm_before_clip: 5.859819 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 06:19:47,555 - TRAIN-LOGGER - INFO - Epoch 286 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.882996 weight_norm_u: 25.218954 loss: 0.070066 grad_norm_before_clip: 5.859819 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 06:19:47,555 - TRAIN-LOGGER - INFO - Epoch 286 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.883011 weight_norm_u: 25.222990 loss: 0.040544 +RANK_0 - 2026-01-29 06:19:54,485 - TRAIN-LOGGER - INFO - Epoch 287 - TRAIN - Minibatch 0: weight_norm_model: 143.883011 loss: 0.068998 grad_norm_before_clip: 5.501777 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 06:19:55,852 - TRAIN-LOGGER - INFO - Epoch 287 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.883011 weight_norm_u: 25.218954 loss: 0.068998 grad_norm_before_clip: 5.501777 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 06:19:55,852 - TRAIN-LOGGER - INFO - Epoch 287 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.883041 weight_norm_u: 25.222990 loss: 0.042918 +RANK_0 - 2026-01-29 06:20:01,849 - TRAIN-LOGGER - INFO - Epoch 288 - TRAIN - Minibatch 0: weight_norm_model: 143.883041 loss: 0.062878 grad_norm_before_clip: 3.727001 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 06:20:03,404 - TRAIN-LOGGER - INFO - Epoch 288 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.883041 weight_norm_u: 25.218954 loss: 0.062878 grad_norm_before_clip: 3.727001 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 06:20:03,404 - TRAIN-LOGGER - INFO - Epoch 288 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.883041 weight_norm_u: 25.222990 loss: 0.047053 +RANK_0 - 2026-01-29 06:20:10,715 - TRAIN-LOGGER - INFO - Epoch 289 - TRAIN - Minibatch 0: weight_norm_model: 143.883041 loss: 0.075565 grad_norm_before_clip: 5.246312 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 06:20:12,412 - TRAIN-LOGGER - INFO - Epoch 289 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.883041 weight_norm_u: 25.218954 loss: 0.075565 grad_norm_before_clip: 5.246312 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 06:20:12,412 - TRAIN-LOGGER - INFO - Epoch 289 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.883026 weight_norm_u: 25.222990 loss: 0.047144 +RANK_0 - 2026-01-29 06:20:19,011 - TRAIN-LOGGER - INFO - Epoch 290 - TRAIN - Minibatch 0: weight_norm_model: 143.883026 loss: 0.080314 grad_norm_before_clip: 4.565568 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 06:20:20,800 - TRAIN-LOGGER - INFO - Epoch 290 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.883026 weight_norm_u: 25.218954 loss: 0.080314 grad_norm_before_clip: 4.565568 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 06:20:20,800 - TRAIN-LOGGER - INFO - Epoch 290 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.883011 weight_norm_u: 25.222990 loss: 0.046704 +RANK_0 - 2026-01-29 06:20:27,105 - TRAIN-LOGGER - INFO - Epoch 291 - TRAIN - Minibatch 0: weight_norm_model: 143.883011 loss: 0.076390 grad_norm_before_clip: 2.580358 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 06:20:28,545 - TRAIN-LOGGER - INFO - Epoch 291 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.883011 weight_norm_u: 25.218954 loss: 0.076390 grad_norm_before_clip: 2.580358 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 06:20:28,545 - TRAIN-LOGGER - INFO - Epoch 291 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.883011 weight_norm_u: 25.222990 loss: 0.044817 +RANK_0 - 2026-01-29 06:20:35,362 - TRAIN-LOGGER - INFO - Epoch 292 - TRAIN - Minibatch 0: weight_norm_model: 143.883011 loss: 0.070206 grad_norm_before_clip: 2.452737 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 06:20:36,867 - TRAIN-LOGGER - INFO - Epoch 292 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.883011 weight_norm_u: 25.218954 loss: 0.070206 grad_norm_before_clip: 2.452737 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 06:20:36,868 - TRAIN-LOGGER - INFO - Epoch 292 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.883011 weight_norm_u: 25.222990 loss: 0.044152 +RANK_0 - 2026-01-29 06:20:43,696 - TRAIN-LOGGER - INFO - Epoch 293 - TRAIN - Minibatch 0: weight_norm_model: 143.883011 loss: 0.068296 grad_norm_before_clip: 5.024526 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 06:20:44,988 - TRAIN-LOGGER - INFO - Epoch 293 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.883011 weight_norm_u: 25.218954 loss: 0.068296 grad_norm_before_clip: 5.024526 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 06:20:44,989 - TRAIN-LOGGER - INFO - Epoch 293 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.883041 weight_norm_u: 25.222990 loss: 0.045489 +RANK_0 - 2026-01-29 06:20:50,790 - TRAIN-LOGGER - INFO - Epoch 294 - TRAIN - Minibatch 0: weight_norm_model: 143.883041 loss: 0.076005 grad_norm_before_clip: 5.339447 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 06:20:52,459 - TRAIN-LOGGER - INFO - Epoch 294 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.883041 weight_norm_u: 25.218954 loss: 0.076005 grad_norm_before_clip: 5.339447 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 06:20:52,460 - TRAIN-LOGGER - INFO - Epoch 294 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.883072 weight_norm_u: 25.222990 loss: 0.044332 +RANK_0 - 2026-01-29 06:20:58,737 - TRAIN-LOGGER - INFO - Epoch 295 - TRAIN - Minibatch 0: weight_norm_model: 143.883072 loss: 0.065134 grad_norm_before_clip: 4.217087 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 06:21:00,277 - TRAIN-LOGGER - INFO - Epoch 295 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.883072 weight_norm_u: 25.218954 loss: 0.065134 grad_norm_before_clip: 4.217087 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 06:21:00,277 - TRAIN-LOGGER - INFO - Epoch 295 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.883102 weight_norm_u: 25.222990 loss: 0.040924 +RANK_0 - 2026-01-29 06:21:06,971 - TRAIN-LOGGER - INFO - Epoch 296 - TRAIN - Minibatch 0: weight_norm_model: 143.883102 loss: 0.068539 grad_norm_before_clip: 1.913159 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 06:21:08,577 - TRAIN-LOGGER - INFO - Epoch 296 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.883102 weight_norm_u: 25.218954 loss: 0.068539 grad_norm_before_clip: 1.913159 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 06:21:08,577 - TRAIN-LOGGER - INFO - Epoch 296 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.883133 weight_norm_u: 25.222990 loss: 0.040195 +RANK_0 - 2026-01-29 06:21:14,880 - TRAIN-LOGGER - INFO - Epoch 297 - TRAIN - Minibatch 0: weight_norm_model: 143.883133 loss: 0.069755 grad_norm_before_clip: 2.860994 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 06:21:16,167 - TRAIN-LOGGER - INFO - Epoch 297 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.883133 weight_norm_u: 25.218954 loss: 0.069755 grad_norm_before_clip: 2.860994 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 06:21:16,167 - TRAIN-LOGGER - INFO - Epoch 297 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.883133 weight_norm_u: 25.222990 loss: 0.040954 +RANK_0 - 2026-01-29 06:21:22,154 - TRAIN-LOGGER - INFO - Epoch 298 - TRAIN - Minibatch 0: weight_norm_model: 143.883133 loss: 0.059483 grad_norm_before_clip: 1.591952 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 06:21:23,707 - TRAIN-LOGGER - INFO - Epoch 298 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.883133 weight_norm_u: 25.218954 loss: 0.059483 grad_norm_before_clip: 1.591952 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 06:21:23,707 - TRAIN-LOGGER - INFO - Epoch 298 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.883133 weight_norm_u: 25.222990 loss: 0.046436 +RANK_0 - 2026-01-29 06:21:30,717 - TRAIN-LOGGER - INFO - Epoch 299 - TRAIN - Minibatch 0: weight_norm_model: 143.883133 loss: 0.066419 grad_norm_before_clip: 4.546567 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 06:21:32,321 - TRAIN-LOGGER - INFO - Epoch 299 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.883133 weight_norm_u: 25.218954 loss: 0.066419 grad_norm_before_clip: 4.546567 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 06:21:32,321 - TRAIN-LOGGER - INFO - Epoch 299 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.883133 weight_norm_u: 25.222990 loss: 0.048936 +RANK_0 - 2026-01-29 06:21:38,258 - TRAIN-LOGGER - INFO - Epoch 300 - TRAIN - Minibatch 0: weight_norm_model: 143.883133 loss: 0.080023 grad_norm_before_clip: 4.984536 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 06:21:39,583 - TRAIN-LOGGER - INFO - Epoch 300 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.883133 weight_norm_u: 25.218954 loss: 0.080023 grad_norm_before_clip: 4.984536 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 06:21:39,583 - TRAIN-LOGGER - INFO - Epoch 300 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.883133 weight_norm_u: 25.222990 loss: 0.047309 +RANK_0 - 2026-01-29 06:21:46,355 - TRAIN-LOGGER - INFO - Epoch 301 - TRAIN - Minibatch 0: weight_norm_model: 143.883133 loss: 0.065379 grad_norm_before_clip: 3.658383 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 06:21:47,642 - TRAIN-LOGGER - INFO - Epoch 301 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.883133 weight_norm_u: 25.218954 loss: 0.065379 grad_norm_before_clip: 3.658383 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 06:21:47,642 - TRAIN-LOGGER - INFO - Epoch 301 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.883148 weight_norm_u: 25.222990 loss: 0.043698 +RANK_0 - 2026-01-29 06:21:53,775 - TRAIN-LOGGER - INFO - Epoch 302 - TRAIN - Minibatch 0: weight_norm_model: 143.883148 loss: 0.071282 grad_norm_before_clip: 4.376911 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 06:21:55,126 - TRAIN-LOGGER - INFO - Epoch 302 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.883148 weight_norm_u: 25.218954 loss: 0.071282 grad_norm_before_clip: 4.376911 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 06:21:55,126 - TRAIN-LOGGER - INFO - Epoch 302 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.883148 weight_norm_u: 25.222990 loss: 0.042491 +RANK_0 - 2026-01-29 06:22:01,939 - TRAIN-LOGGER - INFO - Epoch 303 - TRAIN - Minibatch 0: weight_norm_model: 143.883148 loss: 0.067227 grad_norm_before_clip: 2.905426 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 06:22:03,832 - TRAIN-LOGGER - INFO - Epoch 303 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.883148 weight_norm_u: 25.218954 loss: 0.067227 grad_norm_before_clip: 2.905426 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 06:22:03,832 - TRAIN-LOGGER - INFO - Epoch 303 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.883179 weight_norm_u: 25.222990 loss: 0.045175 +RANK_0 - 2026-01-29 06:22:10,205 - TRAIN-LOGGER - INFO - Epoch 304 - TRAIN - Minibatch 0: weight_norm_model: 143.883179 loss: 0.069711 grad_norm_before_clip: 4.290107 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 06:22:11,740 - TRAIN-LOGGER - INFO - Epoch 304 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.883179 weight_norm_u: 25.218954 loss: 0.069711 grad_norm_before_clip: 4.290107 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 06:22:11,741 - TRAIN-LOGGER - INFO - Epoch 304 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.883194 weight_norm_u: 25.222990 loss: 0.047643 +RANK_0 - 2026-01-29 06:22:18,732 - TRAIN-LOGGER - INFO - Epoch 305 - TRAIN - Minibatch 0: weight_norm_model: 143.883194 loss: 0.061099 grad_norm_before_clip: 3.625621 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 06:22:20,144 - TRAIN-LOGGER - INFO - Epoch 305 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.883194 weight_norm_u: 25.218954 loss: 0.061099 grad_norm_before_clip: 3.625621 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 06:22:20,145 - TRAIN-LOGGER - INFO - Epoch 305 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.883224 weight_norm_u: 25.222990 loss: 0.048291 +RANK_0 - 2026-01-29 06:22:27,143 - TRAIN-LOGGER - INFO - Epoch 306 - TRAIN - Minibatch 0: weight_norm_model: 143.883224 loss: 0.085271 grad_norm_before_clip: 6.657516 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 06:22:28,808 - TRAIN-LOGGER - INFO - Epoch 306 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.883224 weight_norm_u: 25.218954 loss: 0.085271 grad_norm_before_clip: 6.657516 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 06:22:28,809 - TRAIN-LOGGER - INFO - Epoch 306 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.883240 weight_norm_u: 25.222990 loss: 0.043436 +RANK_0 - 2026-01-29 06:22:36,229 - TRAIN-LOGGER - INFO - Epoch 307 - TRAIN - Minibatch 0: weight_norm_model: 143.883240 loss: 0.068264 grad_norm_before_clip: 3.597324 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 06:22:37,544 - TRAIN-LOGGER - INFO - Epoch 307 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.883240 weight_norm_u: 25.218954 loss: 0.068264 grad_norm_before_clip: 3.597324 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 06:22:37,545 - TRAIN-LOGGER - INFO - Epoch 307 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.883255 weight_norm_u: 25.222990 loss: 0.039672 +RANK_0 - 2026-01-29 06:22:44,187 - TRAIN-LOGGER - INFO - Epoch 308 - TRAIN - Minibatch 0: weight_norm_model: 143.883255 loss: 0.067839 grad_norm_before_clip: 3.486828 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 06:22:45,479 - TRAIN-LOGGER - INFO - Epoch 308 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.883255 weight_norm_u: 25.218954 loss: 0.067839 grad_norm_before_clip: 3.486828 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 06:22:45,479 - TRAIN-LOGGER - INFO - Epoch 308 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.883255 weight_norm_u: 25.222990 loss: 0.036656 +RANK_0 - 2026-01-29 06:22:51,669 - TRAIN-LOGGER - INFO - Epoch 309 - TRAIN - Minibatch 0: weight_norm_model: 143.883255 loss: 0.061230 grad_norm_before_clip: 2.684871 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 06:22:53,053 - TRAIN-LOGGER - INFO - Epoch 309 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.883255 weight_norm_u: 25.218954 loss: 0.061230 grad_norm_before_clip: 2.684871 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 06:22:53,054 - TRAIN-LOGGER - INFO - Epoch 309 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.883255 weight_norm_u: 25.222990 loss: 0.042207 +RANK_0 - 2026-01-29 06:23:00,593 - TRAIN-LOGGER - INFO - Epoch 310 - TRAIN - Minibatch 0: weight_norm_model: 143.883255 loss: 0.069861 grad_norm_before_clip: 2.697728 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 06:23:02,037 - TRAIN-LOGGER - INFO - Epoch 310 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.883255 weight_norm_u: 25.218954 loss: 0.069861 grad_norm_before_clip: 2.697728 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 06:23:02,038 - TRAIN-LOGGER - INFO - Epoch 310 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.883270 weight_norm_u: 25.222990 loss: 0.049758 +RANK_0 - 2026-01-29 06:23:08,700 - TRAIN-LOGGER - INFO - Epoch 311 - TRAIN - Minibatch 0: weight_norm_model: 143.883270 loss: 0.066189 grad_norm_before_clip: 5.333312 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 06:23:10,159 - TRAIN-LOGGER - INFO - Epoch 311 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.883270 weight_norm_u: 25.218954 loss: 0.066189 grad_norm_before_clip: 5.333312 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 06:23:10,159 - TRAIN-LOGGER - INFO - Epoch 311 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.883286 weight_norm_u: 25.222990 loss: 0.052136 +RANK_0 - 2026-01-29 06:23:16,539 - TRAIN-LOGGER - INFO - Epoch 312 - TRAIN - Minibatch 0: weight_norm_model: 143.883286 loss: 0.069900 grad_norm_before_clip: 6.504792 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 06:23:17,838 - TRAIN-LOGGER - INFO - Epoch 312 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.883286 weight_norm_u: 25.218954 loss: 0.069900 grad_norm_before_clip: 6.504792 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 06:23:17,839 - TRAIN-LOGGER - INFO - Epoch 312 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.883301 weight_norm_u: 25.222990 loss: 0.050209 +RANK_0 - 2026-01-29 06:23:24,442 - TRAIN-LOGGER - INFO - Epoch 313 - TRAIN - Minibatch 0: weight_norm_model: 143.883301 loss: 0.080758 grad_norm_before_clip: 3.144161 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 06:23:25,732 - TRAIN-LOGGER - INFO - Epoch 313 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.883301 weight_norm_u: 25.218954 loss: 0.080758 grad_norm_before_clip: 3.144161 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 06:23:25,733 - TRAIN-LOGGER - INFO - Epoch 313 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.883347 weight_norm_u: 25.222990 loss: 0.045801 +RANK_0 - 2026-01-29 06:23:30,971 - TRAIN-LOGGER - INFO - Epoch 314 - TRAIN - Minibatch 0: weight_norm_model: 143.883347 loss: 0.067178 grad_norm_before_clip: 4.554863 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 06:23:32,572 - TRAIN-LOGGER - INFO - Epoch 314 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.883347 weight_norm_u: 25.218954 loss: 0.067178 grad_norm_before_clip: 4.554863 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 06:23:32,573 - TRAIN-LOGGER - INFO - Epoch 314 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.883362 weight_norm_u: 25.222990 loss: 0.044251 +RANK_0 - 2026-01-29 06:23:39,418 - TRAIN-LOGGER - INFO - Epoch 315 - TRAIN - Minibatch 0: weight_norm_model: 143.883362 loss: 0.068463 grad_norm_before_clip: 4.930518 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 06:23:40,914 - TRAIN-LOGGER - INFO - Epoch 315 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.883362 weight_norm_u: 25.218954 loss: 0.068463 grad_norm_before_clip: 4.930518 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 06:23:40,915 - TRAIN-LOGGER - INFO - Epoch 315 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.883362 weight_norm_u: 25.222990 loss: 0.045107 +RANK_0 - 2026-01-29 06:23:48,014 - TRAIN-LOGGER - INFO - Epoch 316 - TRAIN - Minibatch 0: weight_norm_model: 143.883362 loss: 0.065558 grad_norm_before_clip: 3.955374 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 06:23:49,296 - TRAIN-LOGGER - INFO - Epoch 316 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.883362 weight_norm_u: 25.218954 loss: 0.065558 grad_norm_before_clip: 3.955374 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 06:23:49,297 - TRAIN-LOGGER - INFO - Epoch 316 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.883362 weight_norm_u: 25.222990 loss: 0.048392 +RANK_0 - 2026-01-29 06:23:56,491 - TRAIN-LOGGER - INFO - Epoch 317 - TRAIN - Minibatch 0: weight_norm_model: 143.883362 loss: 0.074020 grad_norm_before_clip: 4.799233 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 06:23:58,309 - TRAIN-LOGGER - INFO - Epoch 317 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.883362 weight_norm_u: 25.218954 loss: 0.074020 grad_norm_before_clip: 4.799233 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 06:23:58,309 - TRAIN-LOGGER - INFO - Epoch 317 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.883331 weight_norm_u: 25.222990 loss: 0.054431 +RANK_0 - 2026-01-29 06:24:04,137 - TRAIN-LOGGER - INFO - Epoch 318 - TRAIN - Minibatch 0: weight_norm_model: 143.883331 loss: 0.081714 grad_norm_before_clip: 5.332095 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 06:24:05,688 - TRAIN-LOGGER - INFO - Epoch 318 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.883331 weight_norm_u: 25.218954 loss: 0.081714 grad_norm_before_clip: 5.332095 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 06:24:05,688 - TRAIN-LOGGER - INFO - Epoch 318 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.883331 weight_norm_u: 25.222990 loss: 0.053614 +RANK_0 - 2026-01-29 06:24:11,498 - TRAIN-LOGGER - INFO - Epoch 319 - TRAIN - Minibatch 0: weight_norm_model: 143.883331 loss: 0.079111 grad_norm_before_clip: 4.222140 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 06:24:12,987 - TRAIN-LOGGER - INFO - Epoch 319 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.883331 weight_norm_u: 25.218954 loss: 0.079111 grad_norm_before_clip: 4.222140 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 06:24:12,987 - TRAIN-LOGGER - INFO - Epoch 319 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.883347 weight_norm_u: 25.222990 loss: 0.046858 +RANK_0 - 2026-01-29 06:24:19,596 - TRAIN-LOGGER - INFO - Epoch 320 - TRAIN - Minibatch 0: weight_norm_model: 143.883347 loss: 0.085472 grad_norm_before_clip: 5.798397 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 06:24:21,349 - TRAIN-LOGGER - INFO - Epoch 320 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.883347 weight_norm_u: 25.218954 loss: 0.085472 grad_norm_before_clip: 5.798397 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 06:24:21,349 - TRAIN-LOGGER - INFO - Epoch 320 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.883362 weight_norm_u: 25.222990 loss: 0.039776 +RANK_0 - 2026-01-29 06:24:27,808 - TRAIN-LOGGER - INFO - Epoch 321 - TRAIN - Minibatch 0: weight_norm_model: 143.883362 loss: 0.079142 grad_norm_before_clip: 4.989261 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 06:24:29,289 - TRAIN-LOGGER - INFO - Epoch 321 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.883362 weight_norm_u: 25.218954 loss: 0.079142 grad_norm_before_clip: 4.989261 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 06:24:29,290 - TRAIN-LOGGER - INFO - Epoch 321 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.883377 weight_norm_u: 25.222990 loss: 0.039893 +RANK_0 - 2026-01-29 06:24:35,390 - TRAIN-LOGGER - INFO - Epoch 322 - TRAIN - Minibatch 0: weight_norm_model: 143.883377 loss: 0.066031 grad_norm_before_clip: 3.888098 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 06:24:36,847 - TRAIN-LOGGER - INFO - Epoch 322 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.883377 weight_norm_u: 25.218954 loss: 0.066031 grad_norm_before_clip: 3.888098 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 06:24:36,847 - TRAIN-LOGGER - INFO - Epoch 322 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.883392 weight_norm_u: 25.222990 loss: 0.043321 +RANK_0 - 2026-01-29 06:24:43,723 - TRAIN-LOGGER - INFO - Epoch 323 - TRAIN - Minibatch 0: weight_norm_model: 143.883392 loss: 0.070914 grad_norm_before_clip: 4.328291 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 06:24:44,966 - TRAIN-LOGGER - INFO - Epoch 323 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.883392 weight_norm_u: 25.218954 loss: 0.070914 grad_norm_before_clip: 4.328291 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 06:24:44,966 - TRAIN-LOGGER - INFO - Epoch 323 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.883408 weight_norm_u: 25.222990 loss: 0.045411 +RANK_0 - 2026-01-29 06:24:51,899 - TRAIN-LOGGER - INFO - Epoch 324 - TRAIN - Minibatch 0: weight_norm_model: 143.883408 loss: 0.077519 grad_norm_before_clip: 4.035014 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 06:24:53,275 - TRAIN-LOGGER - INFO - Epoch 324 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.883408 weight_norm_u: 25.218954 loss: 0.077519 grad_norm_before_clip: 4.035014 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 06:24:53,276 - TRAIN-LOGGER - INFO - Epoch 324 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.883408 weight_norm_u: 25.222990 loss: 0.043467 +RANK_0 - 2026-01-29 06:25:01,253 - TRAIN-LOGGER - INFO - Epoch 325 - TRAIN - Minibatch 0: weight_norm_model: 143.883408 loss: 0.075146 grad_norm_before_clip: 4.567671 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 06:25:02,969 - TRAIN-LOGGER - INFO - Epoch 325 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.883408 weight_norm_u: 25.218954 loss: 0.075146 grad_norm_before_clip: 4.567671 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 06:25:02,969 - TRAIN-LOGGER - INFO - Epoch 325 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.883423 weight_norm_u: 25.222990 loss: 0.041462 +RANK_0 - 2026-01-29 06:25:09,015 - TRAIN-LOGGER - INFO - Epoch 326 - TRAIN - Minibatch 0: weight_norm_model: 143.883423 loss: 0.070456 grad_norm_before_clip: 4.950870 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 06:25:10,870 - TRAIN-LOGGER - INFO - Epoch 326 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.883423 weight_norm_u: 25.218954 loss: 0.070456 grad_norm_before_clip: 4.950870 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 06:25:10,871 - TRAIN-LOGGER - INFO - Epoch 326 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.883438 weight_norm_u: 25.222990 loss: 0.041570 +RANK_0 - 2026-01-29 06:25:16,895 - TRAIN-LOGGER - INFO - Epoch 327 - TRAIN - Minibatch 0: weight_norm_model: 143.883438 loss: 0.067967 grad_norm_before_clip: 2.835335 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 06:25:18,717 - TRAIN-LOGGER - INFO - Epoch 327 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.883438 weight_norm_u: 25.218954 loss: 0.067967 grad_norm_before_clip: 2.835335 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 06:25:18,717 - TRAIN-LOGGER - INFO - Epoch 327 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.883453 weight_norm_u: 25.222990 loss: 0.040376 +RANK_0 - 2026-01-29 06:25:25,207 - TRAIN-LOGGER - INFO - Epoch 328 - TRAIN - Minibatch 0: weight_norm_model: 143.883453 loss: 0.067116 grad_norm_before_clip: 4.255139 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 06:25:26,462 - TRAIN-LOGGER - INFO - Epoch 328 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.883453 weight_norm_u: 25.218954 loss: 0.067116 grad_norm_before_clip: 4.255139 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 06:25:26,462 - TRAIN-LOGGER - INFO - Epoch 328 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.883469 weight_norm_u: 25.222990 loss: 0.039007 +RANK_0 - 2026-01-29 06:25:33,953 - TRAIN-LOGGER - INFO - Epoch 329 - TRAIN - Minibatch 0: weight_norm_model: 143.883469 loss: 0.062272 grad_norm_before_clip: 4.214606 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 06:25:35,440 - TRAIN-LOGGER - INFO - Epoch 329 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.883469 weight_norm_u: 25.218954 loss: 0.062272 grad_norm_before_clip: 4.214606 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 06:25:35,441 - TRAIN-LOGGER - INFO - Epoch 329 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.883469 weight_norm_u: 25.222990 loss: 0.038157 +RANK_0 - 2026-01-29 06:25:42,528 - TRAIN-LOGGER - INFO - Epoch 330 - TRAIN - Minibatch 0: weight_norm_model: 143.883469 loss: 0.058891 grad_norm_before_clip: 3.702457 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 06:25:44,234 - TRAIN-LOGGER - INFO - Epoch 330 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.883469 weight_norm_u: 25.218954 loss: 0.058891 grad_norm_before_clip: 3.702457 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 06:25:44,235 - TRAIN-LOGGER - INFO - Epoch 330 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.883484 weight_norm_u: 25.222990 loss: 0.041741 +RANK_0 - 2026-01-29 06:25:50,918 - TRAIN-LOGGER - INFO - Epoch 331 - TRAIN - Minibatch 0: weight_norm_model: 143.883484 loss: 0.064551 grad_norm_before_clip: 2.755979 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 06:25:52,205 - TRAIN-LOGGER - INFO - Epoch 331 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.883484 weight_norm_u: 25.218954 loss: 0.064551 grad_norm_before_clip: 2.755979 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 06:25:52,205 - TRAIN-LOGGER - INFO - Epoch 331 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.883484 weight_norm_u: 25.222990 loss: 0.042873 +RANK_0 - 2026-01-29 06:25:59,412 - TRAIN-LOGGER - INFO - Epoch 332 - TRAIN - Minibatch 0: weight_norm_model: 143.883484 loss: 0.072774 grad_norm_before_clip: 3.796427 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 06:26:01,028 - TRAIN-LOGGER - INFO - Epoch 332 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.883484 weight_norm_u: 25.218954 loss: 0.072774 grad_norm_before_clip: 3.796427 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 06:26:01,029 - TRAIN-LOGGER - INFO - Epoch 332 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.883484 weight_norm_u: 25.222990 loss: 0.040107 +RANK_0 - 2026-01-29 06:26:07,184 - TRAIN-LOGGER - INFO - Epoch 333 - TRAIN - Minibatch 0: weight_norm_model: 143.883484 loss: 0.070107 grad_norm_before_clip: 1.724533 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 06:26:08,602 - TRAIN-LOGGER - INFO - Epoch 333 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.883484 weight_norm_u: 25.218954 loss: 0.070107 grad_norm_before_clip: 1.724533 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 06:26:08,603 - TRAIN-LOGGER - INFO - Epoch 333 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.883499 weight_norm_u: 25.222990 loss: 0.037485 +RANK_0 - 2026-01-29 06:26:15,354 - TRAIN-LOGGER - INFO - Epoch 334 - TRAIN - Minibatch 0: weight_norm_model: 143.883499 loss: 0.066206 grad_norm_before_clip: 2.500867 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 06:26:16,731 - TRAIN-LOGGER - INFO - Epoch 334 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.883499 weight_norm_u: 25.218954 loss: 0.066206 grad_norm_before_clip: 2.500867 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 06:26:16,731 - TRAIN-LOGGER - INFO - Epoch 334 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.883530 weight_norm_u: 25.222990 loss: 0.039324 +RANK_0 - 2026-01-29 06:26:22,885 - TRAIN-LOGGER - INFO - Epoch 335 - TRAIN - Minibatch 0: weight_norm_model: 143.883530 loss: 0.057163 grad_norm_before_clip: 3.577238 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 06:26:24,602 - TRAIN-LOGGER - INFO - Epoch 335 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.883530 weight_norm_u: 25.218954 loss: 0.057163 grad_norm_before_clip: 3.577238 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 06:26:24,602 - TRAIN-LOGGER - INFO - Epoch 335 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.883530 weight_norm_u: 25.222990 loss: 0.040995 +RANK_0 - 2026-01-29 06:26:30,869 - TRAIN-LOGGER - INFO - Epoch 336 - TRAIN - Minibatch 0: weight_norm_model: 143.883530 loss: 0.071439 grad_norm_before_clip: 3.568688 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 06:26:32,531 - TRAIN-LOGGER - INFO - Epoch 336 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.883530 weight_norm_u: 25.218954 loss: 0.071439 grad_norm_before_clip: 3.568688 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 06:26:32,532 - TRAIN-LOGGER - INFO - Epoch 336 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.883545 weight_norm_u: 25.222990 loss: 0.041243 +RANK_0 - 2026-01-29 06:26:38,328 - TRAIN-LOGGER - INFO - Epoch 337 - TRAIN - Minibatch 0: weight_norm_model: 143.883545 loss: 0.065189 grad_norm_before_clip: 3.814162 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 06:26:39,886 - TRAIN-LOGGER - INFO - Epoch 337 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.883545 weight_norm_u: 25.218954 loss: 0.065189 grad_norm_before_clip: 3.814162 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 06:26:39,886 - TRAIN-LOGGER - INFO - Epoch 337 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.883545 weight_norm_u: 25.222990 loss: 0.039352 +RANK_0 - 2026-01-29 06:26:46,871 - TRAIN-LOGGER - INFO - Epoch 338 - TRAIN - Minibatch 0: weight_norm_model: 143.883545 loss: 0.067411 grad_norm_before_clip: 2.981003 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 06:26:48,192 - TRAIN-LOGGER - INFO - Epoch 338 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.883545 weight_norm_u: 25.218954 loss: 0.067411 grad_norm_before_clip: 2.981003 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 06:26:48,192 - TRAIN-LOGGER - INFO - Epoch 338 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.883545 weight_norm_u: 25.222990 loss: 0.036894 +RANK_0 - 2026-01-29 06:26:55,071 - TRAIN-LOGGER - INFO - Epoch 339 - TRAIN - Minibatch 0: weight_norm_model: 143.883545 loss: 0.067823 grad_norm_before_clip: 2.988628 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 06:26:56,847 - TRAIN-LOGGER - INFO - Epoch 339 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.883545 weight_norm_u: 25.218954 loss: 0.067823 grad_norm_before_clip: 2.988628 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 06:26:56,847 - TRAIN-LOGGER - INFO - Epoch 339 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.883545 weight_norm_u: 25.222990 loss: 0.042015 +RANK_0 - 2026-01-29 06:27:03,424 - TRAIN-LOGGER - INFO - Epoch 340 - TRAIN - Minibatch 0: weight_norm_model: 143.883545 loss: 0.076276 grad_norm_before_clip: 6.049209 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 06:27:04,600 - TRAIN-LOGGER - INFO - Epoch 340 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.883545 weight_norm_u: 25.218954 loss: 0.076276 grad_norm_before_clip: 6.049209 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 06:27:04,600 - TRAIN-LOGGER - INFO - Epoch 340 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.883545 weight_norm_u: 25.222990 loss: 0.046517 +RANK_0 - 2026-01-29 06:27:11,262 - TRAIN-LOGGER - INFO - Epoch 341 - TRAIN - Minibatch 0: weight_norm_model: 143.883545 loss: 0.073094 grad_norm_before_clip: 4.843443 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 06:27:12,701 - TRAIN-LOGGER - INFO - Epoch 341 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.883545 weight_norm_u: 25.218954 loss: 0.073094 grad_norm_before_clip: 4.843443 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 06:27:12,702 - TRAIN-LOGGER - INFO - Epoch 341 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.883560 weight_norm_u: 25.222990 loss: 0.046067 +RANK_0 - 2026-01-29 06:27:18,925 - TRAIN-LOGGER - INFO - Epoch 342 - TRAIN - Minibatch 0: weight_norm_model: 143.883560 loss: 0.076624 grad_norm_before_clip: 4.954204 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 06:27:20,568 - TRAIN-LOGGER - INFO - Epoch 342 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.883560 weight_norm_u: 25.218954 loss: 0.076624 grad_norm_before_clip: 4.954204 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 06:27:20,569 - TRAIN-LOGGER - INFO - Epoch 342 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.883575 weight_norm_u: 25.222990 loss: 0.045368 +RANK_0 - 2026-01-29 06:27:26,812 - TRAIN-LOGGER - INFO - Epoch 343 - TRAIN - Minibatch 0: weight_norm_model: 143.883575 loss: 0.070498 grad_norm_before_clip: 3.967070 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 06:27:28,240 - TRAIN-LOGGER - INFO - Epoch 343 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.883575 weight_norm_u: 25.218954 loss: 0.070498 grad_norm_before_clip: 3.967070 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 06:27:28,240 - TRAIN-LOGGER - INFO - Epoch 343 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.883606 weight_norm_u: 25.222990 loss: 0.042225 +RANK_0 - 2026-01-29 06:27:34,554 - TRAIN-LOGGER - INFO - Epoch 344 - TRAIN - Minibatch 0: weight_norm_model: 143.883606 loss: 0.061235 grad_norm_before_clip: 2.613994 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 06:27:36,005 - TRAIN-LOGGER - INFO - Epoch 344 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.883606 weight_norm_u: 25.218954 loss: 0.061235 grad_norm_before_clip: 2.613994 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 06:27:36,005 - TRAIN-LOGGER - INFO - Epoch 344 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.883621 weight_norm_u: 25.222990 loss: 0.037539 +RANK_0 - 2026-01-29 06:27:43,009 - TRAIN-LOGGER - INFO - Epoch 345 - TRAIN - Minibatch 0: weight_norm_model: 143.883621 loss: 0.077374 grad_norm_before_clip: 3.184721 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 06:27:44,431 - TRAIN-LOGGER - INFO - Epoch 345 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.883621 weight_norm_u: 25.218954 loss: 0.077374 grad_norm_before_clip: 3.184721 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 06:27:44,431 - TRAIN-LOGGER - INFO - Epoch 345 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.883667 weight_norm_u: 25.222990 loss: 0.039658 +RANK_0 - 2026-01-29 06:27:51,219 - TRAIN-LOGGER - INFO - Epoch 346 - TRAIN - Minibatch 0: weight_norm_model: 143.883667 loss: 0.064573 grad_norm_before_clip: 4.940575 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 06:27:52,530 - TRAIN-LOGGER - INFO - Epoch 346 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.883667 weight_norm_u: 25.218954 loss: 0.064573 grad_norm_before_clip: 4.940575 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 06:27:52,530 - TRAIN-LOGGER - INFO - Epoch 346 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.883682 weight_norm_u: 25.222990 loss: 0.044311 +RANK_0 - 2026-01-29 06:27:59,265 - TRAIN-LOGGER - INFO - Epoch 347 - TRAIN - Minibatch 0: weight_norm_model: 143.883682 loss: 0.070070 grad_norm_before_clip: 4.656394 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 06:28:01,150 - TRAIN-LOGGER - INFO - Epoch 347 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.883682 weight_norm_u: 25.218954 loss: 0.070070 grad_norm_before_clip: 4.656394 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 06:28:01,151 - TRAIN-LOGGER - INFO - Epoch 347 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.883682 weight_norm_u: 25.222990 loss: 0.045403 +RANK_0 - 2026-01-29 06:28:07,378 - TRAIN-LOGGER - INFO - Epoch 348 - TRAIN - Minibatch 0: weight_norm_model: 143.883682 loss: 0.077100 grad_norm_before_clip: 4.053572 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 06:28:09,192 - TRAIN-LOGGER - INFO - Epoch 348 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.883682 weight_norm_u: 25.218954 loss: 0.077100 grad_norm_before_clip: 4.053572 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 06:28:09,192 - TRAIN-LOGGER - INFO - Epoch 348 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.883682 weight_norm_u: 25.222990 loss: 0.043521 +RANK_0 - 2026-01-29 06:28:15,307 - TRAIN-LOGGER - INFO - Epoch 349 - TRAIN - Minibatch 0: weight_norm_model: 143.883682 loss: 0.064768 grad_norm_before_clip: 3.730318 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 06:28:16,830 - TRAIN-LOGGER - INFO - Epoch 349 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.883682 weight_norm_u: 25.218954 loss: 0.064768 grad_norm_before_clip: 3.730318 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 06:28:16,830 - TRAIN-LOGGER - INFO - Epoch 349 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.883667 weight_norm_u: 25.222990 loss: 0.039916 +RANK_0 - 2026-01-29 06:28:23,770 - TRAIN-LOGGER - INFO - Epoch 350 - TRAIN - Minibatch 0: weight_norm_model: 143.883667 loss: 0.064763 grad_norm_before_clip: 4.945670 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 06:28:25,031 - TRAIN-LOGGER - INFO - Epoch 350 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.883667 weight_norm_u: 25.218954 loss: 0.064763 grad_norm_before_clip: 4.945670 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 06:28:25,031 - TRAIN-LOGGER - INFO - Epoch 350 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.883636 weight_norm_u: 25.222990 loss: 0.039628 +RANK_0 - 2026-01-29 06:28:31,939 - TRAIN-LOGGER - INFO - Epoch 351 - TRAIN - Minibatch 0: weight_norm_model: 143.883636 loss: 0.071114 grad_norm_before_clip: 3.731550 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 06:28:33,393 - TRAIN-LOGGER - INFO - Epoch 351 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.883636 weight_norm_u: 25.218954 loss: 0.071114 grad_norm_before_clip: 3.731550 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 06:28:33,393 - TRAIN-LOGGER - INFO - Epoch 351 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.883621 weight_norm_u: 25.222990 loss: 0.043943 +RANK_0 - 2026-01-29 06:28:39,856 - TRAIN-LOGGER - INFO - Epoch 352 - TRAIN - Minibatch 0: weight_norm_model: 143.883621 loss: 0.065463 grad_norm_before_clip: 4.242713 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 06:28:41,495 - TRAIN-LOGGER - INFO - Epoch 352 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.883621 weight_norm_u: 25.218954 loss: 0.065463 grad_norm_before_clip: 4.242713 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 06:28:41,495 - TRAIN-LOGGER - INFO - Epoch 352 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.883621 weight_norm_u: 25.222990 loss: 0.045825 +RANK_0 - 2026-01-29 06:28:48,271 - TRAIN-LOGGER - INFO - Epoch 353 - TRAIN - Minibatch 0: weight_norm_model: 143.883621 loss: 0.074032 grad_norm_before_clip: 4.269428 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 06:28:49,832 - TRAIN-LOGGER - INFO - Epoch 353 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.883621 weight_norm_u: 25.218954 loss: 0.074032 grad_norm_before_clip: 4.269428 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 06:28:49,832 - TRAIN-LOGGER - INFO - Epoch 353 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.883636 weight_norm_u: 25.222990 loss: 0.041133 +RANK_0 - 2026-01-29 06:28:57,052 - TRAIN-LOGGER - INFO - Epoch 354 - TRAIN - Minibatch 0: weight_norm_model: 143.883636 loss: 0.063130 grad_norm_before_clip: 4.175549 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 06:28:58,407 - TRAIN-LOGGER - INFO - Epoch 354 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.883636 weight_norm_u: 25.218954 loss: 0.063130 grad_norm_before_clip: 4.175549 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 06:28:58,407 - TRAIN-LOGGER - INFO - Epoch 354 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.883667 weight_norm_u: 25.222990 loss: 0.035827 +RANK_0 - 2026-01-29 06:29:05,498 - TRAIN-LOGGER - INFO - Epoch 355 - TRAIN - Minibatch 0: weight_norm_model: 143.883667 loss: 0.062613 grad_norm_before_clip: 2.452325 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 06:29:06,797 - TRAIN-LOGGER - INFO - Epoch 355 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.883667 weight_norm_u: 25.218954 loss: 0.062613 grad_norm_before_clip: 2.452325 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 06:29:06,797 - TRAIN-LOGGER - INFO - Epoch 355 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.883713 weight_norm_u: 25.222990 loss: 0.040364 +RANK_0 - 2026-01-29 06:29:13,102 - TRAIN-LOGGER - INFO - Epoch 356 - TRAIN - Minibatch 0: weight_norm_model: 143.883713 loss: 0.067075 grad_norm_before_clip: 5.119182 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 06:29:14,650 - TRAIN-LOGGER - INFO - Epoch 356 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.883713 weight_norm_u: 25.218954 loss: 0.067075 grad_norm_before_clip: 5.119182 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 06:29:14,651 - TRAIN-LOGGER - INFO - Epoch 356 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.883743 weight_norm_u: 25.222990 loss: 0.047305 +RANK_0 - 2026-01-29 06:29:21,537 - TRAIN-LOGGER - INFO - Epoch 357 - TRAIN - Minibatch 0: weight_norm_model: 143.883743 loss: 0.075308 grad_norm_before_clip: 5.531221 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 06:29:22,749 - TRAIN-LOGGER - INFO - Epoch 357 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.883743 weight_norm_u: 25.218954 loss: 0.075308 grad_norm_before_clip: 5.531221 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 06:29:22,749 - TRAIN-LOGGER - INFO - Epoch 357 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.883743 weight_norm_u: 25.222990 loss: 0.047288 +RANK_0 - 2026-01-29 06:29:30,188 - TRAIN-LOGGER - INFO - Epoch 358 - TRAIN - Minibatch 0: weight_norm_model: 143.883743 loss: 0.075458 grad_norm_before_clip: 3.685409 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 06:29:31,853 - TRAIN-LOGGER - INFO - Epoch 358 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.883743 weight_norm_u: 25.218954 loss: 0.075458 grad_norm_before_clip: 3.685409 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 06:29:31,853 - TRAIN-LOGGER - INFO - Epoch 358 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.883728 weight_norm_u: 25.222990 loss: 0.042856 +RANK_0 - 2026-01-29 06:29:38,423 - TRAIN-LOGGER - INFO - Epoch 359 - TRAIN - Minibatch 0: weight_norm_model: 143.883728 loss: 0.072801 grad_norm_before_clip: 6.269476 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 06:29:39,975 - TRAIN-LOGGER - INFO - Epoch 359 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.883728 weight_norm_u: 25.218954 loss: 0.072801 grad_norm_before_clip: 6.269476 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 06:29:39,975 - TRAIN-LOGGER - INFO - Epoch 359 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.883698 weight_norm_u: 25.222990 loss: 0.040751 +RANK_0 - 2026-01-29 06:29:46,135 - TRAIN-LOGGER - INFO - Epoch 360 - TRAIN - Minibatch 0: weight_norm_model: 143.883698 loss: 0.071944 grad_norm_before_clip: 3.707925 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 06:29:47,592 - TRAIN-LOGGER - INFO - Epoch 360 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.883698 weight_norm_u: 25.218954 loss: 0.071944 grad_norm_before_clip: 3.707925 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 06:29:47,592 - TRAIN-LOGGER - INFO - Epoch 360 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.883682 weight_norm_u: 25.222990 loss: 0.042372 +RANK_0 - 2026-01-29 06:29:54,190 - TRAIN-LOGGER - INFO - Epoch 361 - TRAIN - Minibatch 0: weight_norm_model: 143.883682 loss: 0.060467 grad_norm_before_clip: 2.705796 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 06:29:55,520 - TRAIN-LOGGER - INFO - Epoch 361 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.883682 weight_norm_u: 25.218954 loss: 0.060467 grad_norm_before_clip: 2.705796 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 06:29:55,521 - TRAIN-LOGGER - INFO - Epoch 361 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.883667 weight_norm_u: 25.222990 loss: 0.043660 +RANK_0 - 2026-01-29 06:30:01,875 - TRAIN-LOGGER - INFO - Epoch 362 - TRAIN - Minibatch 0: weight_norm_model: 143.883667 loss: 0.069036 grad_norm_before_clip: 5.062470 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 06:30:03,138 - TRAIN-LOGGER - INFO - Epoch 362 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.883667 weight_norm_u: 25.218954 loss: 0.069036 grad_norm_before_clip: 5.062470 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 06:30:03,139 - TRAIN-LOGGER - INFO - Epoch 362 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.883667 weight_norm_u: 25.222990 loss: 0.041285 +RANK_0 - 2026-01-29 06:30:09,221 - TRAIN-LOGGER - INFO - Epoch 363 - TRAIN - Minibatch 0: weight_norm_model: 143.883667 loss: 0.070965 grad_norm_before_clip: 5.644104 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 06:30:10,857 - TRAIN-LOGGER - INFO - Epoch 363 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.883667 weight_norm_u: 25.218954 loss: 0.070965 grad_norm_before_clip: 5.644104 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 06:30:10,857 - TRAIN-LOGGER - INFO - Epoch 363 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.883682 weight_norm_u: 25.222990 loss: 0.037692 +RANK_0 - 2026-01-29 06:30:17,478 - TRAIN-LOGGER - INFO - Epoch 364 - TRAIN - Minibatch 0: weight_norm_model: 143.883682 loss: 0.071273 grad_norm_before_clip: 3.179399 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 06:30:19,023 - TRAIN-LOGGER - INFO - Epoch 364 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.883682 weight_norm_u: 25.218954 loss: 0.071273 grad_norm_before_clip: 3.179399 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 06:30:19,024 - TRAIN-LOGGER - INFO - Epoch 364 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.883728 weight_norm_u: 25.222990 loss: 0.041734 +RANK_0 - 2026-01-29 06:30:25,720 - TRAIN-LOGGER - INFO - Epoch 365 - TRAIN - Minibatch 0: weight_norm_model: 143.883728 loss: 0.061298 grad_norm_before_clip: 5.038080 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 06:30:27,438 - TRAIN-LOGGER - INFO - Epoch 365 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.883728 weight_norm_u: 25.218954 loss: 0.061298 grad_norm_before_clip: 5.038080 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 06:30:27,439 - TRAIN-LOGGER - INFO - Epoch 365 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.883759 weight_norm_u: 25.222990 loss: 0.047772 +RANK_0 - 2026-01-29 06:30:33,853 - TRAIN-LOGGER - INFO - Epoch 366 - TRAIN - Minibatch 0: weight_norm_model: 143.883759 loss: 0.081242 grad_norm_before_clip: 7.236573 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 06:30:35,377 - TRAIN-LOGGER - INFO - Epoch 366 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.883759 weight_norm_u: 25.218954 loss: 0.081242 grad_norm_before_clip: 7.236573 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 06:30:35,377 - TRAIN-LOGGER - INFO - Epoch 366 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.883759 weight_norm_u: 25.222990 loss: 0.048147 +RANK_0 - 2026-01-29 06:30:41,796 - TRAIN-LOGGER - INFO - Epoch 367 - TRAIN - Minibatch 0: weight_norm_model: 143.883759 loss: 0.072050 grad_norm_before_clip: 4.149615 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 06:30:43,038 - TRAIN-LOGGER - INFO - Epoch 367 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.883759 weight_norm_u: 25.218954 loss: 0.072050 grad_norm_before_clip: 4.149615 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 06:30:43,038 - TRAIN-LOGGER - INFO - Epoch 367 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.883759 weight_norm_u: 25.222990 loss: 0.044764 +RANK_0 - 2026-01-29 06:30:50,275 - TRAIN-LOGGER - INFO - Epoch 368 - TRAIN - Minibatch 0: weight_norm_model: 143.883759 loss: 0.074511 grad_norm_before_clip: 3.706291 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 06:30:51,466 - TRAIN-LOGGER - INFO - Epoch 368 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.883759 weight_norm_u: 25.218954 loss: 0.074511 grad_norm_before_clip: 3.706291 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 06:30:51,467 - TRAIN-LOGGER - INFO - Epoch 368 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.883759 weight_norm_u: 25.222990 loss: 0.040604 +RANK_0 - 2026-01-29 06:30:59,213 - TRAIN-LOGGER - INFO - Epoch 369 - TRAIN - Minibatch 0: weight_norm_model: 143.883759 loss: 0.063996 grad_norm_before_clip: 4.632854 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 06:31:00,727 - TRAIN-LOGGER - INFO - Epoch 369 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.883759 weight_norm_u: 25.218954 loss: 0.063996 grad_norm_before_clip: 4.632854 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 06:31:00,727 - TRAIN-LOGGER - INFO - Epoch 369 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.883728 weight_norm_u: 25.222990 loss: 0.042833 +RANK_0 - 2026-01-29 06:31:07,168 - TRAIN-LOGGER - INFO - Epoch 370 - TRAIN - Minibatch 0: weight_norm_model: 143.883728 loss: 0.064547 grad_norm_before_clip: 4.630463 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 06:31:08,758 - TRAIN-LOGGER - INFO - Epoch 370 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.883728 weight_norm_u: 25.218954 loss: 0.064547 grad_norm_before_clip: 4.630463 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 06:31:08,759 - TRAIN-LOGGER - INFO - Epoch 370 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.883728 weight_norm_u: 25.222990 loss: 0.046312 +RANK_0 - 2026-01-29 06:31:14,869 - TRAIN-LOGGER - INFO - Epoch 371 - TRAIN - Minibatch 0: weight_norm_model: 143.883728 loss: 0.077274 grad_norm_before_clip: 4.234354 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 06:31:16,240 - TRAIN-LOGGER - INFO - Epoch 371 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.883728 weight_norm_u: 25.218954 loss: 0.077274 grad_norm_before_clip: 4.234354 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 06:31:16,240 - TRAIN-LOGGER - INFO - Epoch 371 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.883743 weight_norm_u: 25.222990 loss: 0.047238 +RANK_0 - 2026-01-29 06:31:23,348 - TRAIN-LOGGER - INFO - Epoch 372 - TRAIN - Minibatch 0: weight_norm_model: 143.883743 loss: 0.077607 grad_norm_before_clip: 5.610840 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 06:31:24,652 - TRAIN-LOGGER - INFO - Epoch 372 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.883743 weight_norm_u: 25.218954 loss: 0.077607 grad_norm_before_clip: 5.610840 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 06:31:24,652 - TRAIN-LOGGER - INFO - Epoch 372 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.883789 weight_norm_u: 25.222990 loss: 0.047683 +RANK_0 - 2026-01-29 06:31:30,879 - TRAIN-LOGGER - INFO - Epoch 373 - TRAIN - Minibatch 0: weight_norm_model: 143.883789 loss: 0.072558 grad_norm_before_clip: 3.656278 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 06:31:32,443 - TRAIN-LOGGER - INFO - Epoch 373 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.883789 weight_norm_u: 25.218954 loss: 0.072558 grad_norm_before_clip: 3.656278 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 06:31:32,444 - TRAIN-LOGGER - INFO - Epoch 373 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.883789 weight_norm_u: 25.222990 loss: 0.046844 +RANK_0 - 2026-01-29 06:31:38,047 - TRAIN-LOGGER - INFO - Epoch 374 - TRAIN - Minibatch 0: weight_norm_model: 143.883789 loss: 0.068121 grad_norm_before_clip: 5.648566 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 06:31:39,438 - TRAIN-LOGGER - INFO - Epoch 374 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.883789 weight_norm_u: 25.218954 loss: 0.068121 grad_norm_before_clip: 5.648566 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 06:31:39,439 - TRAIN-LOGGER - INFO - Epoch 374 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.883820 weight_norm_u: 25.222990 loss: 0.043321 +RANK_0 - 2026-01-29 06:31:46,004 - TRAIN-LOGGER - INFO - Epoch 375 - TRAIN - Minibatch 0: weight_norm_model: 143.883820 loss: 0.069183 grad_norm_before_clip: 6.029124 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 06:31:47,531 - TRAIN-LOGGER - INFO - Epoch 375 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.883820 weight_norm_u: 25.218954 loss: 0.069183 grad_norm_before_clip: 6.029124 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 06:31:47,532 - TRAIN-LOGGER - INFO - Epoch 375 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.883835 weight_norm_u: 25.222990 loss: 0.042054 +RANK_0 - 2026-01-29 06:31:53,917 - TRAIN-LOGGER - INFO - Epoch 376 - TRAIN - Minibatch 0: weight_norm_model: 143.883835 loss: 0.064699 grad_norm_before_clip: 4.557192 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 06:31:55,509 - TRAIN-LOGGER - INFO - Epoch 376 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.883835 weight_norm_u: 25.218954 loss: 0.064699 grad_norm_before_clip: 4.557192 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 06:31:55,510 - TRAIN-LOGGER - INFO - Epoch 376 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.883820 weight_norm_u: 25.222990 loss: 0.043478 +RANK_0 - 2026-01-29 06:32:02,460 - TRAIN-LOGGER - INFO - Epoch 377 - TRAIN - Minibatch 0: weight_norm_model: 143.883820 loss: 0.057806 grad_norm_before_clip: 2.917084 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 06:32:03,862 - TRAIN-LOGGER - INFO - Epoch 377 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.883820 weight_norm_u: 25.218954 loss: 0.057806 grad_norm_before_clip: 2.917084 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 06:32:03,862 - TRAIN-LOGGER - INFO - Epoch 377 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.883804 weight_norm_u: 25.222990 loss: 0.045296 +RANK_0 - 2026-01-29 06:32:10,709 - TRAIN-LOGGER - INFO - Epoch 378 - TRAIN - Minibatch 0: weight_norm_model: 143.883804 loss: 0.072428 grad_norm_before_clip: 5.244622 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 06:32:12,329 - TRAIN-LOGGER - INFO - Epoch 378 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.883804 weight_norm_u: 25.218954 loss: 0.072428 grad_norm_before_clip: 5.244622 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 06:32:12,329 - TRAIN-LOGGER - INFO - Epoch 378 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.883789 weight_norm_u: 25.222990 loss: 0.045612 +RANK_0 - 2026-01-29 06:32:18,909 - TRAIN-LOGGER - INFO - Epoch 379 - TRAIN - Minibatch 0: weight_norm_model: 143.883789 loss: 0.075279 grad_norm_before_clip: 5.544892 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 06:32:20,265 - TRAIN-LOGGER - INFO - Epoch 379 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.883789 weight_norm_u: 25.218954 loss: 0.075279 grad_norm_before_clip: 5.544892 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 06:32:20,265 - TRAIN-LOGGER - INFO - Epoch 379 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.883759 weight_norm_u: 25.222990 loss: 0.043471 +RANK_0 - 2026-01-29 06:32:27,093 - TRAIN-LOGGER - INFO - Epoch 380 - TRAIN - Minibatch 0: weight_norm_model: 143.883759 loss: 0.065005 grad_norm_before_clip: 4.004513 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 06:32:28,892 - TRAIN-LOGGER - INFO - Epoch 380 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.883759 weight_norm_u: 25.218954 loss: 0.065005 grad_norm_before_clip: 4.004513 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 06:32:28,893 - TRAIN-LOGGER - INFO - Epoch 380 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.883743 weight_norm_u: 25.222990 loss: 0.041148 +RANK_0 - 2026-01-29 06:32:35,753 - TRAIN-LOGGER - INFO - Epoch 381 - TRAIN - Minibatch 0: weight_norm_model: 143.883743 loss: 0.057333 grad_norm_before_clip: 4.889503 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 06:32:37,196 - TRAIN-LOGGER - INFO - Epoch 381 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.883743 weight_norm_u: 25.218954 loss: 0.057333 grad_norm_before_clip: 4.889503 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 06:32:37,196 - TRAIN-LOGGER - INFO - Epoch 381 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.883728 weight_norm_u: 25.222990 loss: 0.043700 +RANK_0 - 2026-01-29 06:32:43,585 - TRAIN-LOGGER - INFO - Epoch 382 - TRAIN - Minibatch 0: weight_norm_model: 143.883728 loss: 0.070171 grad_norm_before_clip: 6.078573 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 06:32:44,911 - TRAIN-LOGGER - INFO - Epoch 382 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.883728 weight_norm_u: 25.218954 loss: 0.070171 grad_norm_before_clip: 6.078573 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 06:32:44,912 - TRAIN-LOGGER - INFO - Epoch 382 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.883759 weight_norm_u: 25.222990 loss: 0.046404 +RANK_0 - 2026-01-29 06:32:51,215 - TRAIN-LOGGER - INFO - Epoch 383 - TRAIN - Minibatch 0: weight_norm_model: 143.883759 loss: 0.068571 grad_norm_before_clip: 5.070679 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 06:32:52,904 - TRAIN-LOGGER - INFO - Epoch 383 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.883759 weight_norm_u: 25.218954 loss: 0.068571 grad_norm_before_clip: 5.070679 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 06:32:52,904 - TRAIN-LOGGER - INFO - Epoch 383 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.883789 weight_norm_u: 25.222990 loss: 0.048548 +RANK_0 - 2026-01-29 06:33:00,485 - TRAIN-LOGGER - INFO - Epoch 384 - TRAIN - Minibatch 0: weight_norm_model: 143.883789 loss: 0.065263 grad_norm_before_clip: 4.785520 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 06:33:02,027 - TRAIN-LOGGER - INFO - Epoch 384 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.883789 weight_norm_u: 25.218954 loss: 0.065263 grad_norm_before_clip: 4.785520 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 06:33:02,027 - TRAIN-LOGGER - INFO - Epoch 384 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.883820 weight_norm_u: 25.222990 loss: 0.047339 +RANK_0 - 2026-01-29 06:33:08,639 - TRAIN-LOGGER - INFO - Epoch 385 - TRAIN - Minibatch 0: weight_norm_model: 143.883820 loss: 0.071569 grad_norm_before_clip: 5.918777 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 06:33:10,327 - TRAIN-LOGGER - INFO - Epoch 385 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.883820 weight_norm_u: 25.218954 loss: 0.071569 grad_norm_before_clip: 5.918777 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 06:33:10,327 - TRAIN-LOGGER - INFO - Epoch 385 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.883850 weight_norm_u: 25.222990 loss: 0.046911 +RANK_0 - 2026-01-29 06:33:17,090 - TRAIN-LOGGER - INFO - Epoch 386 - TRAIN - Minibatch 0: weight_norm_model: 143.883850 loss: 0.063730 grad_norm_before_clip: 4.588505 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 06:33:18,729 - TRAIN-LOGGER - INFO - Epoch 386 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.883850 weight_norm_u: 25.218954 loss: 0.063730 grad_norm_before_clip: 4.588505 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 06:33:18,730 - TRAIN-LOGGER - INFO - Epoch 386 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.883865 weight_norm_u: 25.222990 loss: 0.046310 +RANK_0 - 2026-01-29 06:33:25,440 - TRAIN-LOGGER - INFO - Epoch 387 - TRAIN - Minibatch 0: weight_norm_model: 143.883865 loss: 0.072765 grad_norm_before_clip: 6.860919 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 06:33:26,784 - TRAIN-LOGGER - INFO - Epoch 387 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.883865 weight_norm_u: 25.218954 loss: 0.072765 grad_norm_before_clip: 6.860919 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 06:33:26,784 - TRAIN-LOGGER - INFO - Epoch 387 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.883850 weight_norm_u: 25.222990 loss: 0.044334 +RANK_0 - 2026-01-29 06:33:33,501 - TRAIN-LOGGER - INFO - Epoch 388 - TRAIN - Minibatch 0: weight_norm_model: 143.883850 loss: 0.058506 grad_norm_before_clip: 3.376342 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 06:33:35,016 - TRAIN-LOGGER - INFO - Epoch 388 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.883850 weight_norm_u: 25.218954 loss: 0.058506 grad_norm_before_clip: 3.376342 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 06:33:35,017 - TRAIN-LOGGER - INFO - Epoch 388 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.883835 weight_norm_u: 25.222990 loss: 0.046345 +RANK_0 - 2026-01-29 06:33:41,062 - TRAIN-LOGGER - INFO - Epoch 389 - TRAIN - Minibatch 0: weight_norm_model: 143.883835 loss: 0.064992 grad_norm_before_clip: 4.453968 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 06:33:42,448 - TRAIN-LOGGER - INFO - Epoch 389 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.883835 weight_norm_u: 25.218954 loss: 0.064992 grad_norm_before_clip: 4.453968 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 06:33:42,448 - TRAIN-LOGGER - INFO - Epoch 389 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.883820 weight_norm_u: 25.222990 loss: 0.049782 +RANK_0 - 2026-01-29 06:33:48,676 - TRAIN-LOGGER - INFO - Epoch 390 - TRAIN - Minibatch 0: weight_norm_model: 143.883820 loss: 0.075416 grad_norm_before_clip: 5.160914 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 06:33:50,392 - TRAIN-LOGGER - INFO - Epoch 390 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.883820 weight_norm_u: 25.218954 loss: 0.075416 grad_norm_before_clip: 5.160914 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 06:33:50,393 - TRAIN-LOGGER - INFO - Epoch 390 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.883789 weight_norm_u: 25.222990 loss: 0.050321 +RANK_0 - 2026-01-29 06:33:56,998 - TRAIN-LOGGER - INFO - Epoch 391 - TRAIN - Minibatch 0: weight_norm_model: 143.883789 loss: 0.067155 grad_norm_before_clip: 4.904115 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 06:33:58,467 - TRAIN-LOGGER - INFO - Epoch 391 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.883789 weight_norm_u: 25.218954 loss: 0.067155 grad_norm_before_clip: 4.904115 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 06:33:58,467 - TRAIN-LOGGER - INFO - Epoch 391 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.883789 weight_norm_u: 25.222990 loss: 0.046021 +RANK_0 - 2026-01-29 06:34:05,485 - TRAIN-LOGGER - INFO - Epoch 392 - TRAIN - Minibatch 0: weight_norm_model: 143.883789 loss: 0.074112 grad_norm_before_clip: 3.937498 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 06:34:06,768 - TRAIN-LOGGER - INFO - Epoch 392 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.883789 weight_norm_u: 25.218954 loss: 0.074112 grad_norm_before_clip: 3.937498 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 06:34:06,768 - TRAIN-LOGGER - INFO - Epoch 392 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.883820 weight_norm_u: 25.222990 loss: 0.038259 +RANK_0 - 2026-01-29 06:34:13,369 - TRAIN-LOGGER - INFO - Epoch 393 - TRAIN - Minibatch 0: weight_norm_model: 143.883820 loss: 0.065922 grad_norm_before_clip: 2.829703 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 06:34:15,088 - TRAIN-LOGGER - INFO - Epoch 393 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.883820 weight_norm_u: 25.218954 loss: 0.065922 grad_norm_before_clip: 2.829703 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 06:34:15,088 - TRAIN-LOGGER - INFO - Epoch 393 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.883850 weight_norm_u: 25.222990 loss: 0.036092 +RANK_0 - 2026-01-29 06:34:20,448 - TRAIN-LOGGER - INFO - Epoch 394 - TRAIN - Minibatch 0: weight_norm_model: 143.883850 loss: 0.053923 grad_norm_before_clip: 2.179358 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 06:34:21,854 - TRAIN-LOGGER - INFO - Epoch 394 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.883850 weight_norm_u: 25.218954 loss: 0.053923 grad_norm_before_clip: 2.179358 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 06:34:21,855 - TRAIN-LOGGER - INFO - Epoch 394 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.883881 weight_norm_u: 25.222990 loss: 0.043010 +RANK_0 - 2026-01-29 06:34:28,815 - TRAIN-LOGGER - INFO - Epoch 395 - TRAIN - Minibatch 0: weight_norm_model: 143.883881 loss: 0.070252 grad_norm_before_clip: 2.867358 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 06:34:30,540 - TRAIN-LOGGER - INFO - Epoch 395 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.883881 weight_norm_u: 25.218954 loss: 0.070252 grad_norm_before_clip: 2.867358 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 06:34:30,540 - TRAIN-LOGGER - INFO - Epoch 395 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.883896 weight_norm_u: 25.222990 loss: 0.047955 +RANK_0 - 2026-01-29 06:34:37,020 - TRAIN-LOGGER - INFO - Epoch 396 - TRAIN - Minibatch 0: weight_norm_model: 143.883896 loss: 0.068657 grad_norm_before_clip: 4.898356 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 06:34:38,543 - TRAIN-LOGGER - INFO - Epoch 396 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.883896 weight_norm_u: 25.218954 loss: 0.068657 grad_norm_before_clip: 4.898356 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 06:34:38,543 - TRAIN-LOGGER - INFO - Epoch 396 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.883896 weight_norm_u: 25.222990 loss: 0.046810 +RANK_0 - 2026-01-29 06:34:44,340 - TRAIN-LOGGER - INFO - Epoch 397 - TRAIN - Minibatch 0: weight_norm_model: 143.883896 loss: 0.064263 grad_norm_before_clip: 6.633598 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 06:34:45,953 - TRAIN-LOGGER - INFO - Epoch 397 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.883896 weight_norm_u: 25.218954 loss: 0.064263 grad_norm_before_clip: 6.633598 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 06:34:45,953 - TRAIN-LOGGER - INFO - Epoch 397 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.883881 weight_norm_u: 25.222990 loss: 0.040218 +RANK_0 - 2026-01-29 06:34:51,927 - TRAIN-LOGGER - INFO - Epoch 398 - TRAIN - Minibatch 0: weight_norm_model: 143.883881 loss: 0.072027 grad_norm_before_clip: 4.478304 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 06:34:53,358 - TRAIN-LOGGER - INFO - Epoch 398 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.883881 weight_norm_u: 25.218954 loss: 0.072027 grad_norm_before_clip: 4.478304 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 06:34:53,358 - TRAIN-LOGGER - INFO - Epoch 398 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.883850 weight_norm_u: 25.222990 loss: 0.034073 +RANK_0 - 2026-01-29 06:35:00,267 - TRAIN-LOGGER - INFO - Epoch 399 - TRAIN - Minibatch 0: weight_norm_model: 143.883850 loss: 0.069307 grad_norm_before_clip: 4.388728 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 06:35:01,664 - TRAIN-LOGGER - INFO - Epoch 399 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.883850 weight_norm_u: 25.218954 loss: 0.069307 grad_norm_before_clip: 4.388728 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 06:35:01,664 - TRAIN-LOGGER - INFO - Epoch 399 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.883820 weight_norm_u: 25.222990 loss: 0.039111 +RANK_0 - 2026-01-29 06:35:08,801 - TRAIN-LOGGER - INFO - Epoch 400 - TRAIN - Minibatch 0: weight_norm_model: 143.883820 loss: 0.066878 grad_norm_before_clip: 3.960065 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 06:35:10,387 - TRAIN-LOGGER - INFO - Epoch 400 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.883820 weight_norm_u: 25.218954 loss: 0.066878 grad_norm_before_clip: 3.960065 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 06:35:10,388 - TRAIN-LOGGER - INFO - Epoch 400 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.883789 weight_norm_u: 25.222990 loss: 0.050184