diff --git "a/vdp2/vdp2_01-29-0223/logging/train.log" "b/vdp2/vdp2_01-29-0223/logging/train.log" new file mode 100644--- /dev/null +++ "b/vdp2/vdp2_01-29-0223/logging/train.log" @@ -0,0 +1,2400 @@ +RANK_0 - 2026-01-29 02:23:57,972 - TRAIN-LOGGER - INFO - Epoch 201 - TRAIN - Minibatch 0: weight_norm_model: 143.882523 loss: 1.158142 grad_norm_before_clip: 15.064606 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 02:23:59,222 - TRAIN-LOGGER - INFO - Epoch 201 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.882523 weight_norm_u: 25.218954 loss: 1.158142 grad_norm_before_clip: 15.064606 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 02:23:59,223 - TRAIN-LOGGER - INFO - Epoch 201 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.882385 weight_norm_u: 25.222990 loss: 1.049163 +RANK_0 - 2026-01-29 02:24:04,772 - TRAIN-LOGGER - INFO - Epoch 202 - TRAIN - Minibatch 0: weight_norm_model: 143.882385 loss: 1.049163 grad_norm_before_clip: 6.827514 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 02:24:05,971 - TRAIN-LOGGER - INFO - Epoch 202 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.882385 weight_norm_u: 25.218954 loss: 1.049163 grad_norm_before_clip: 6.827514 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 02:24:05,971 - TRAIN-LOGGER - INFO - Epoch 202 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.882263 weight_norm_u: 25.222990 loss: 1.051041 +RANK_0 - 2026-01-29 02:24:11,424 - TRAIN-LOGGER - INFO - Epoch 203 - TRAIN - Minibatch 0: weight_norm_model: 143.882263 loss: 1.051041 grad_norm_before_clip: 6.002395 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 02:24:12,588 - TRAIN-LOGGER - INFO - Epoch 203 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.882263 weight_norm_u: 25.218954 loss: 1.051041 grad_norm_before_clip: 6.002395 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 02:24:12,589 - TRAIN-LOGGER - INFO - Epoch 203 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.882202 weight_norm_u: 25.222990 loss: 1.051009 +RANK_0 - 2026-01-29 02:24:17,671 - TRAIN-LOGGER - INFO - Epoch 204 - TRAIN - Minibatch 0: weight_norm_model: 143.882202 loss: 1.051009 grad_norm_before_clip: 8.895806 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 02:24:19,023 - TRAIN-LOGGER - INFO - Epoch 204 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.882202 weight_norm_u: 25.218954 loss: 1.051009 grad_norm_before_clip: 8.895806 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 02:24:19,023 - TRAIN-LOGGER - INFO - Epoch 204 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.882202 weight_norm_u: 25.222990 loss: 1.033557 +RANK_0 - 2026-01-29 02:24:23,473 - TRAIN-LOGGER - INFO - Epoch 205 - TRAIN - Minibatch 0: weight_norm_model: 143.882202 loss: 1.033557 grad_norm_before_clip: 6.625247 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 02:24:24,595 - TRAIN-LOGGER - INFO - Epoch 205 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.882202 weight_norm_u: 25.218954 loss: 1.033557 grad_norm_before_clip: 6.625247 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 02:24:24,595 - TRAIN-LOGGER - INFO - Epoch 205 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.882217 weight_norm_u: 25.222990 loss: 1.014428 +RANK_0 - 2026-01-29 02:24:29,483 - TRAIN-LOGGER - INFO - Epoch 206 - TRAIN - Minibatch 0: weight_norm_model: 143.882217 loss: 1.014428 grad_norm_before_clip: 4.224920 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 02:24:30,716 - TRAIN-LOGGER - INFO - Epoch 206 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.882217 weight_norm_u: 25.218954 loss: 1.014428 grad_norm_before_clip: 4.224920 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 02:24:30,716 - TRAIN-LOGGER - INFO - Epoch 206 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.882263 weight_norm_u: 25.222990 loss: 1.018200 +RANK_0 - 2026-01-29 02:24:35,319 - TRAIN-LOGGER - INFO - Epoch 207 - TRAIN - Minibatch 0: weight_norm_model: 143.882263 loss: 1.018200 grad_norm_before_clip: 5.329910 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 02:24:36,544 - TRAIN-LOGGER - INFO - Epoch 207 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.882263 weight_norm_u: 25.218954 loss: 1.018200 grad_norm_before_clip: 5.329910 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 02:24:36,544 - TRAIN-LOGGER - INFO - Epoch 207 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.882278 weight_norm_u: 25.222990 loss: 1.023750 +RANK_0 - 2026-01-29 02:24:40,971 - TRAIN-LOGGER - INFO - Epoch 208 - TRAIN - Minibatch 0: weight_norm_model: 143.882278 loss: 1.023750 grad_norm_before_clip: 7.797914 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 02:24:42,174 - TRAIN-LOGGER - INFO - Epoch 208 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.882278 weight_norm_u: 25.218954 loss: 1.023750 grad_norm_before_clip: 7.797914 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 02:24:42,174 - TRAIN-LOGGER - INFO - Epoch 208 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.882278 weight_norm_u: 25.222990 loss: 1.017168 +RANK_0 - 2026-01-29 02:24:47,064 - TRAIN-LOGGER - INFO - Epoch 209 - TRAIN - Minibatch 0: weight_norm_model: 143.882278 loss: 1.017168 grad_norm_before_clip: 8.033554 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 02:24:48,388 - TRAIN-LOGGER - INFO - Epoch 209 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.882278 weight_norm_u: 25.218954 loss: 1.017168 grad_norm_before_clip: 8.033554 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 02:24:48,388 - TRAIN-LOGGER - INFO - Epoch 209 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.882263 weight_norm_u: 25.222990 loss: 1.005317 +RANK_0 - 2026-01-29 02:24:53,265 - TRAIN-LOGGER - INFO - Epoch 210 - TRAIN - Minibatch 0: weight_norm_model: 143.882263 loss: 1.005317 grad_norm_before_clip: 4.729166 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 02:24:54,580 - TRAIN-LOGGER - INFO - Epoch 210 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.882263 weight_norm_u: 25.218954 loss: 1.005317 grad_norm_before_clip: 4.729166 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 02:24:54,581 - TRAIN-LOGGER - INFO - Epoch 210 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.882202 weight_norm_u: 25.222990 loss: 1.002940 +RANK_0 - 2026-01-29 02:25:00,184 - TRAIN-LOGGER - INFO - Epoch 211 - TRAIN - Minibatch 0: weight_norm_model: 143.882202 loss: 1.002940 grad_norm_before_clip: 3.862727 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 02:25:01,294 - TRAIN-LOGGER - INFO - Epoch 211 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.882202 weight_norm_u: 25.218954 loss: 1.002940 grad_norm_before_clip: 3.862727 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 02:25:01,295 - TRAIN-LOGGER - INFO - Epoch 211 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.882187 weight_norm_u: 25.222990 loss: 1.007749 +RANK_0 - 2026-01-29 02:25:05,791 - TRAIN-LOGGER - INFO - Epoch 212 - TRAIN - Minibatch 0: weight_norm_model: 143.882187 loss: 1.007749 grad_norm_before_clip: 4.917280 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 02:25:06,911 - TRAIN-LOGGER - INFO - Epoch 212 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.882187 weight_norm_u: 25.218954 loss: 1.007749 grad_norm_before_clip: 4.917280 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 02:25:06,911 - TRAIN-LOGGER - INFO - Epoch 212 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.882187 weight_norm_u: 25.222990 loss: 1.006944 +RANK_0 - 2026-01-29 02:25:11,482 - TRAIN-LOGGER - INFO - Epoch 213 - TRAIN - Minibatch 0: weight_norm_model: 143.882187 loss: 1.006944 grad_norm_before_clip: 4.947704 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 02:25:12,715 - TRAIN-LOGGER - INFO - Epoch 213 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.882187 weight_norm_u: 25.218954 loss: 1.006944 grad_norm_before_clip: 4.947704 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 02:25:12,716 - TRAIN-LOGGER - INFO - Epoch 213 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.882202 weight_norm_u: 25.222990 loss: 0.998565 +RANK_0 - 2026-01-29 02:25:17,588 - TRAIN-LOGGER - INFO - Epoch 214 - TRAIN - Minibatch 0: weight_norm_model: 143.882202 loss: 0.998565 grad_norm_before_clip: 2.925486 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 02:25:19,030 - TRAIN-LOGGER - INFO - Epoch 214 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.882202 weight_norm_u: 25.218954 loss: 0.998565 grad_norm_before_clip: 2.925486 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 02:25:19,030 - TRAIN-LOGGER - INFO - Epoch 214 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.882217 weight_norm_u: 25.222990 loss: 0.994695 +RANK_0 - 2026-01-29 02:25:24,136 - TRAIN-LOGGER - INFO - Epoch 215 - TRAIN - Minibatch 0: weight_norm_model: 143.882217 loss: 0.994695 grad_norm_before_clip: 1.054446 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 02:25:25,352 - TRAIN-LOGGER - INFO - Epoch 215 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.882217 weight_norm_u: 25.218954 loss: 0.994695 grad_norm_before_clip: 1.054446 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 02:25:25,352 - TRAIN-LOGGER - INFO - Epoch 215 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.882233 weight_norm_u: 25.222990 loss: 1.000306 +RANK_0 - 2026-01-29 02:25:30,432 - TRAIN-LOGGER - INFO - Epoch 216 - TRAIN - Minibatch 0: weight_norm_model: 143.882233 loss: 1.000306 grad_norm_before_clip: 5.237498 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 02:25:31,582 - TRAIN-LOGGER - INFO - Epoch 216 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.882233 weight_norm_u: 25.218954 loss: 1.000306 grad_norm_before_clip: 5.237498 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 02:25:31,582 - TRAIN-LOGGER - INFO - Epoch 216 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.882233 weight_norm_u: 25.222990 loss: 1.001533 +RANK_0 - 2026-01-29 02:25:37,232 - TRAIN-LOGGER - INFO - Epoch 217 - TRAIN - Minibatch 0: weight_norm_model: 143.882233 loss: 1.001533 grad_norm_before_clip: 4.896365 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 02:25:38,631 - TRAIN-LOGGER - INFO - Epoch 217 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.882233 weight_norm_u: 25.218954 loss: 1.001533 grad_norm_before_clip: 4.896365 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 02:25:38,631 - TRAIN-LOGGER - INFO - Epoch 217 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.882217 weight_norm_u: 25.222990 loss: 0.998840 +RANK_0 - 2026-01-29 02:25:42,854 - TRAIN-LOGGER - INFO - Epoch 218 - TRAIN - Minibatch 0: weight_norm_model: 143.882217 loss: 0.998840 grad_norm_before_clip: 3.220479 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 02:25:44,066 - TRAIN-LOGGER - INFO - Epoch 218 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.882217 weight_norm_u: 25.218954 loss: 0.998840 grad_norm_before_clip: 3.220479 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 02:25:44,066 - TRAIN-LOGGER - INFO - Epoch 218 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.882187 weight_norm_u: 25.222990 loss: 0.996641 +RANK_0 - 2026-01-29 02:25:48,915 - TRAIN-LOGGER - INFO - Epoch 219 - TRAIN - Minibatch 0: weight_norm_model: 143.882187 loss: 0.996641 grad_norm_before_clip: 2.295606 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 02:25:50,051 - TRAIN-LOGGER - INFO - Epoch 219 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.882187 weight_norm_u: 25.218954 loss: 0.996641 grad_norm_before_clip: 2.295606 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 02:25:50,051 - TRAIN-LOGGER - INFO - Epoch 219 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.882172 weight_norm_u: 25.222990 loss: 0.996054 +RANK_0 - 2026-01-29 02:25:54,477 - TRAIN-LOGGER - INFO - Epoch 220 - TRAIN - Minibatch 0: weight_norm_model: 143.882172 loss: 0.996054 grad_norm_before_clip: 2.663164 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 02:25:55,696 - TRAIN-LOGGER - INFO - Epoch 220 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.882172 weight_norm_u: 25.218954 loss: 0.996054 grad_norm_before_clip: 2.663164 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 02:25:55,696 - TRAIN-LOGGER - INFO - Epoch 220 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.882172 weight_norm_u: 25.222990 loss: 0.995019 +RANK_0 - 2026-01-29 02:26:00,163 - TRAIN-LOGGER - INFO - Epoch 221 - TRAIN - Minibatch 0: weight_norm_model: 143.882172 loss: 0.995019 grad_norm_before_clip: 2.934274 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 02:26:01,367 - TRAIN-LOGGER - INFO - Epoch 221 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.882172 weight_norm_u: 25.218954 loss: 0.995019 grad_norm_before_clip: 2.934274 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 02:26:01,367 - TRAIN-LOGGER - INFO - Epoch 221 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.882187 weight_norm_u: 25.222990 loss: 0.995861 +RANK_0 - 2026-01-29 02:26:05,928 - TRAIN-LOGGER - INFO - Epoch 222 - TRAIN - Minibatch 0: weight_norm_model: 143.882187 loss: 0.995861 grad_norm_before_clip: 2.390234 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 02:26:07,144 - TRAIN-LOGGER - INFO - Epoch 222 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.882187 weight_norm_u: 25.218954 loss: 0.995861 grad_norm_before_clip: 2.390234 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 02:26:07,144 - TRAIN-LOGGER - INFO - Epoch 222 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.882187 weight_norm_u: 25.222990 loss: 0.995670 +RANK_0 - 2026-01-29 02:26:11,582 - TRAIN-LOGGER - INFO - Epoch 223 - TRAIN - Minibatch 0: weight_norm_model: 143.882187 loss: 0.995670 grad_norm_before_clip: 3.676242 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 02:26:12,751 - TRAIN-LOGGER - INFO - Epoch 223 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.882187 weight_norm_u: 25.218954 loss: 0.995670 grad_norm_before_clip: 3.676242 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 02:26:12,751 - TRAIN-LOGGER - INFO - Epoch 223 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.882187 weight_norm_u: 25.222990 loss: 0.993564 +RANK_0 - 2026-01-29 02:26:17,715 - TRAIN-LOGGER - INFO - Epoch 224 - TRAIN - Minibatch 0: weight_norm_model: 143.882187 loss: 0.993564 grad_norm_before_clip: 2.452753 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 02:26:18,962 - TRAIN-LOGGER - INFO - Epoch 224 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.882187 weight_norm_u: 25.218954 loss: 0.993564 grad_norm_before_clip: 2.452753 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 02:26:18,962 - TRAIN-LOGGER - INFO - Epoch 224 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.882156 weight_norm_u: 25.222990 loss: 0.991864 +RANK_0 - 2026-01-29 02:26:23,807 - TRAIN-LOGGER - INFO - Epoch 225 - TRAIN - Minibatch 0: weight_norm_model: 143.882156 loss: 0.991864 grad_norm_before_clip: 1.315581 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 02:26:25,058 - TRAIN-LOGGER - INFO - Epoch 225 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.882156 weight_norm_u: 25.218954 loss: 0.991864 grad_norm_before_clip: 1.315581 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 02:26:25,059 - TRAIN-LOGGER - INFO - Epoch 225 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.882156 weight_norm_u: 25.222990 loss: 0.991166 +RANK_0 - 2026-01-29 02:26:30,259 - TRAIN-LOGGER - INFO - Epoch 226 - TRAIN - Minibatch 0: weight_norm_model: 143.882156 loss: 0.991166 grad_norm_before_clip: 1.970792 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 02:26:31,517 - TRAIN-LOGGER - INFO - Epoch 226 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.882156 weight_norm_u: 25.218954 loss: 0.991166 grad_norm_before_clip: 1.970792 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 02:26:31,517 - TRAIN-LOGGER - INFO - Epoch 226 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.882172 weight_norm_u: 25.222990 loss: 0.992331 +RANK_0 - 2026-01-29 02:26:35,773 - TRAIN-LOGGER - INFO - Epoch 227 - TRAIN - Minibatch 0: weight_norm_model: 143.882172 loss: 0.992331 grad_norm_before_clip: 3.100587 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 02:26:37,114 - TRAIN-LOGGER - INFO - Epoch 227 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.882172 weight_norm_u: 25.218954 loss: 0.992331 grad_norm_before_clip: 3.100587 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 02:26:37,114 - TRAIN-LOGGER - INFO - Epoch 227 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.882172 weight_norm_u: 25.222990 loss: 0.992201 +RANK_0 - 2026-01-29 02:26:41,654 - TRAIN-LOGGER - INFO - Epoch 228 - TRAIN - Minibatch 0: weight_norm_model: 143.882172 loss: 0.992201 grad_norm_before_clip: 2.995393 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 02:26:42,818 - TRAIN-LOGGER - INFO - Epoch 228 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.882172 weight_norm_u: 25.218954 loss: 0.992201 grad_norm_before_clip: 2.995393 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 02:26:42,818 - TRAIN-LOGGER - INFO - Epoch 228 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.882156 weight_norm_u: 25.222990 loss: 0.990950 +RANK_0 - 2026-01-29 02:26:48,514 - TRAIN-LOGGER - INFO - Epoch 229 - TRAIN - Minibatch 0: weight_norm_model: 143.882156 loss: 0.990950 grad_norm_before_clip: 2.100479 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 02:26:49,737 - TRAIN-LOGGER - INFO - Epoch 229 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.882156 weight_norm_u: 25.218954 loss: 0.990950 grad_norm_before_clip: 2.100479 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 02:26:49,738 - TRAIN-LOGGER - INFO - Epoch 229 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.882141 weight_norm_u: 25.222990 loss: 0.990939 +RANK_0 - 2026-01-29 02:26:54,810 - TRAIN-LOGGER - INFO - Epoch 230 - TRAIN - Minibatch 0: weight_norm_model: 143.882141 loss: 0.990939 grad_norm_before_clip: 1.901257 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 02:26:56,036 - TRAIN-LOGGER - INFO - Epoch 230 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.882141 weight_norm_u: 25.218954 loss: 0.990939 grad_norm_before_clip: 1.901257 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 02:26:56,036 - TRAIN-LOGGER - INFO - Epoch 230 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.882156 weight_norm_u: 25.222990 loss: 0.988540 +RANK_0 - 2026-01-29 02:27:01,471 - TRAIN-LOGGER - INFO - Epoch 231 - TRAIN - Minibatch 0: weight_norm_model: 143.882156 loss: 0.988540 grad_norm_before_clip: 1.387248 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 02:27:02,617 - TRAIN-LOGGER - INFO - Epoch 231 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.882156 weight_norm_u: 25.218954 loss: 0.988540 grad_norm_before_clip: 1.387248 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 02:27:02,617 - TRAIN-LOGGER - INFO - Epoch 231 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.882187 weight_norm_u: 25.222990 loss: 0.992316 +RANK_0 - 2026-01-29 02:27:07,175 - TRAIN-LOGGER - INFO - Epoch 232 - TRAIN - Minibatch 0: weight_norm_model: 143.882187 loss: 0.992316 grad_norm_before_clip: 4.561409 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 02:27:08,677 - TRAIN-LOGGER - INFO - Epoch 232 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.882187 weight_norm_u: 25.218954 loss: 0.992316 grad_norm_before_clip: 4.561409 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 02:27:08,678 - TRAIN-LOGGER - INFO - Epoch 232 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.882202 weight_norm_u: 25.222990 loss: 0.993853 +RANK_0 - 2026-01-29 02:27:12,876 - TRAIN-LOGGER - INFO - Epoch 233 - TRAIN - Minibatch 0: weight_norm_model: 143.882202 loss: 0.993853 grad_norm_before_clip: 4.469794 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 02:27:14,061 - TRAIN-LOGGER - INFO - Epoch 233 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.882202 weight_norm_u: 25.218954 loss: 0.993853 grad_norm_before_clip: 4.469794 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 02:27:14,061 - TRAIN-LOGGER - INFO - Epoch 233 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.882187 weight_norm_u: 25.222990 loss: 0.991559 +RANK_0 - 2026-01-29 02:27:18,892 - TRAIN-LOGGER - INFO - Epoch 234 - TRAIN - Minibatch 0: weight_norm_model: 143.882187 loss: 0.991559 grad_norm_before_clip: 3.345315 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 02:27:20,145 - TRAIN-LOGGER - INFO - Epoch 234 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.882187 weight_norm_u: 25.218954 loss: 0.991559 grad_norm_before_clip: 3.345315 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 02:27:20,146 - TRAIN-LOGGER - INFO - Epoch 234 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.882172 weight_norm_u: 25.222990 loss: 0.990039 +RANK_0 - 2026-01-29 02:27:24,652 - TRAIN-LOGGER - INFO - Epoch 235 - TRAIN - Minibatch 0: weight_norm_model: 143.882172 loss: 0.990039 grad_norm_before_clip: 1.298661 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 02:27:25,848 - TRAIN-LOGGER - INFO - Epoch 235 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.882172 weight_norm_u: 25.218954 loss: 0.990039 grad_norm_before_clip: 1.298661 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 02:27:25,848 - TRAIN-LOGGER - INFO - Epoch 235 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.882156 weight_norm_u: 25.222990 loss: 0.993080 +RANK_0 - 2026-01-29 02:27:30,433 - TRAIN-LOGGER - INFO - Epoch 236 - TRAIN - Minibatch 0: weight_norm_model: 143.882156 loss: 0.993080 grad_norm_before_clip: 4.050813 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 02:27:31,561 - TRAIN-LOGGER - INFO - Epoch 236 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.882156 weight_norm_u: 25.218954 loss: 0.993080 grad_norm_before_clip: 4.050813 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 02:27:31,561 - TRAIN-LOGGER - INFO - Epoch 236 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.882156 weight_norm_u: 25.222990 loss: 0.993422 +RANK_0 - 2026-01-29 02:27:36,240 - TRAIN-LOGGER - INFO - Epoch 237 - TRAIN - Minibatch 0: weight_norm_model: 143.882156 loss: 0.993422 grad_norm_before_clip: 4.240654 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 02:27:37,368 - TRAIN-LOGGER - INFO - Epoch 237 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.882156 weight_norm_u: 25.218954 loss: 0.993422 grad_norm_before_clip: 4.240654 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 02:27:37,368 - TRAIN-LOGGER - INFO - Epoch 237 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.882172 weight_norm_u: 25.222990 loss: 0.990268 +RANK_0 - 2026-01-29 02:27:41,969 - TRAIN-LOGGER - INFO - Epoch 238 - TRAIN - Minibatch 0: weight_norm_model: 143.882172 loss: 0.990268 grad_norm_before_clip: 2.975950 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 02:27:43,181 - TRAIN-LOGGER - INFO - Epoch 238 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.882172 weight_norm_u: 25.218954 loss: 0.990268 grad_norm_before_clip: 2.975950 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 02:27:43,181 - TRAIN-LOGGER - INFO - Epoch 238 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.882202 weight_norm_u: 25.222990 loss: 0.986767 +RANK_0 - 2026-01-29 02:27:47,974 - TRAIN-LOGGER - INFO - Epoch 239 - TRAIN - Minibatch 0: weight_norm_model: 143.882202 loss: 0.986767 grad_norm_before_clip: 2.663596 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 02:27:49,106 - TRAIN-LOGGER - INFO - Epoch 239 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.882202 weight_norm_u: 25.218954 loss: 0.986767 grad_norm_before_clip: 2.663596 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 02:27:49,106 - TRAIN-LOGGER - INFO - Epoch 239 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.882233 weight_norm_u: 25.222990 loss: 0.990485 +RANK_0 - 2026-01-29 02:27:53,937 - TRAIN-LOGGER - INFO - Epoch 240 - TRAIN - Minibatch 0: weight_norm_model: 143.882233 loss: 0.990485 grad_norm_before_clip: 3.620294 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 02:27:55,135 - TRAIN-LOGGER - INFO - Epoch 240 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.882233 weight_norm_u: 25.218954 loss: 0.990485 grad_norm_before_clip: 3.620294 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 02:27:55,135 - TRAIN-LOGGER - INFO - Epoch 240 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.882263 weight_norm_u: 25.222990 loss: 0.995131 +RANK_0 - 2026-01-29 02:27:59,982 - TRAIN-LOGGER - INFO - Epoch 241 - TRAIN - Minibatch 0: weight_norm_model: 143.882263 loss: 0.995131 grad_norm_before_clip: 7.041083 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 02:28:01,467 - TRAIN-LOGGER - INFO - Epoch 241 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.882263 weight_norm_u: 25.218954 loss: 0.995131 grad_norm_before_clip: 7.041083 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 02:28:01,467 - TRAIN-LOGGER - INFO - Epoch 241 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.882263 weight_norm_u: 25.222990 loss: 0.994901 +RANK_0 - 2026-01-29 02:28:06,058 - TRAIN-LOGGER - INFO - Epoch 242 - TRAIN - Minibatch 0: weight_norm_model: 143.882263 loss: 0.994901 grad_norm_before_clip: 7.887178 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 02:28:07,161 - TRAIN-LOGGER - INFO - Epoch 242 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.882263 weight_norm_u: 25.218954 loss: 0.994901 grad_norm_before_clip: 7.887178 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 02:28:07,161 - TRAIN-LOGGER - INFO - Epoch 242 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.882263 weight_norm_u: 25.222990 loss: 0.989059 +RANK_0 - 2026-01-29 02:28:13,116 - TRAIN-LOGGER - INFO - Epoch 243 - TRAIN - Minibatch 0: weight_norm_model: 143.882263 loss: 0.989059 grad_norm_before_clip: 3.433634 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 02:28:14,337 - TRAIN-LOGGER - INFO - Epoch 243 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.882263 weight_norm_u: 25.218954 loss: 0.989059 grad_norm_before_clip: 3.433634 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 02:28:14,338 - TRAIN-LOGGER - INFO - Epoch 243 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.882248 weight_norm_u: 25.222990 loss: 0.985358 +RANK_0 - 2026-01-29 02:28:19,214 - TRAIN-LOGGER - INFO - Epoch 244 - TRAIN - Minibatch 0: weight_norm_model: 143.882248 loss: 0.985358 grad_norm_before_clip: 1.955416 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 02:28:20,399 - TRAIN-LOGGER - INFO - Epoch 244 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.882248 weight_norm_u: 25.218954 loss: 0.985358 grad_norm_before_clip: 1.955416 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 02:28:20,399 - TRAIN-LOGGER - INFO - Epoch 244 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.882248 weight_norm_u: 25.222990 loss: 0.987120 +RANK_0 - 2026-01-29 02:28:26,026 - TRAIN-LOGGER - INFO - Epoch 245 - TRAIN - Minibatch 0: weight_norm_model: 143.882248 loss: 0.987120 grad_norm_before_clip: 2.929922 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 02:28:27,171 - TRAIN-LOGGER - INFO - Epoch 245 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.882248 weight_norm_u: 25.218954 loss: 0.987120 grad_norm_before_clip: 2.929922 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 02:28:27,171 - TRAIN-LOGGER - INFO - Epoch 245 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.882278 weight_norm_u: 25.222990 loss: 0.985503 +RANK_0 - 2026-01-29 02:28:31,678 - TRAIN-LOGGER - INFO - Epoch 246 - TRAIN - Minibatch 0: weight_norm_model: 143.882278 loss: 0.985503 grad_norm_before_clip: 2.260369 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 02:28:33,112 - TRAIN-LOGGER - INFO - Epoch 246 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.882278 weight_norm_u: 25.218954 loss: 0.985503 grad_norm_before_clip: 2.260369 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 02:28:33,112 - TRAIN-LOGGER - INFO - Epoch 246 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.882309 weight_norm_u: 25.222990 loss: 0.984150 +RANK_0 - 2026-01-29 02:28:37,503 - TRAIN-LOGGER - INFO - Epoch 247 - TRAIN - Minibatch 0: weight_norm_model: 143.882309 loss: 0.984150 grad_norm_before_clip: 3.926208 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 02:28:38,672 - TRAIN-LOGGER - INFO - Epoch 247 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.882309 weight_norm_u: 25.218954 loss: 0.984150 grad_norm_before_clip: 3.926208 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 02:28:38,673 - TRAIN-LOGGER - INFO - Epoch 247 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.882324 weight_norm_u: 25.222990 loss: 0.984087 +RANK_0 - 2026-01-29 02:28:43,708 - TRAIN-LOGGER - INFO - Epoch 248 - TRAIN - Minibatch 0: weight_norm_model: 143.882324 loss: 0.984087 grad_norm_before_clip: 3.421010 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 02:28:44,846 - TRAIN-LOGGER - INFO - Epoch 248 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.882324 weight_norm_u: 25.218954 loss: 0.984087 grad_norm_before_clip: 3.421010 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 02:28:44,846 - TRAIN-LOGGER - INFO - Epoch 248 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.882324 weight_norm_u: 25.222990 loss: 0.983605 +RANK_0 - 2026-01-29 02:28:49,110 - TRAIN-LOGGER - INFO - Epoch 249 - TRAIN - Minibatch 0: weight_norm_model: 143.882324 loss: 0.983605 grad_norm_before_clip: 1.211942 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 02:28:50,310 - TRAIN-LOGGER - INFO - Epoch 249 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.882324 weight_norm_u: 25.218954 loss: 0.983605 grad_norm_before_clip: 1.211942 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 02:28:50,310 - TRAIN-LOGGER - INFO - Epoch 249 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.882324 weight_norm_u: 25.222990 loss: 0.983256 +RANK_0 - 2026-01-29 02:28:55,094 - TRAIN-LOGGER - INFO - Epoch 250 - TRAIN - Minibatch 0: weight_norm_model: 143.882324 loss: 0.983256 grad_norm_before_clip: 1.461972 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 02:28:56,248 - TRAIN-LOGGER - INFO - Epoch 250 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.882324 weight_norm_u: 25.218954 loss: 0.983256 grad_norm_before_clip: 1.461972 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 02:28:56,248 - TRAIN-LOGGER - INFO - Epoch 250 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.882339 weight_norm_u: 25.222990 loss: 0.984041 +RANK_0 - 2026-01-29 02:29:00,778 - TRAIN-LOGGER - INFO - Epoch 251 - TRAIN - Minibatch 0: weight_norm_model: 143.882339 loss: 0.984041 grad_norm_before_clip: 3.294659 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 02:29:01,924 - TRAIN-LOGGER - INFO - Epoch 251 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.882339 weight_norm_u: 25.218954 loss: 0.984041 grad_norm_before_clip: 3.294659 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 02:29:01,924 - TRAIN-LOGGER - INFO - Epoch 251 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.882339 weight_norm_u: 25.222990 loss: 0.983159 +RANK_0 - 2026-01-29 02:29:07,288 - TRAIN-LOGGER - INFO - Epoch 252 - TRAIN - Minibatch 0: weight_norm_model: 143.882339 loss: 0.983159 grad_norm_before_clip: 2.656765 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 02:29:08,535 - TRAIN-LOGGER - INFO - Epoch 252 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.882339 weight_norm_u: 25.218954 loss: 0.983159 grad_norm_before_clip: 2.656765 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 02:29:08,535 - TRAIN-LOGGER - INFO - Epoch 252 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.882324 weight_norm_u: 25.222990 loss: 0.983258 +RANK_0 - 2026-01-29 02:29:12,811 - TRAIN-LOGGER - INFO - Epoch 253 - TRAIN - Minibatch 0: weight_norm_model: 143.882324 loss: 0.983258 grad_norm_before_clip: 1.686794 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 02:29:14,019 - TRAIN-LOGGER - INFO - Epoch 253 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.882324 weight_norm_u: 25.218954 loss: 0.983258 grad_norm_before_clip: 1.686794 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 02:29:14,019 - TRAIN-LOGGER - INFO - Epoch 253 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.882324 weight_norm_u: 25.222990 loss: 0.983264 +RANK_0 - 2026-01-29 02:29:18,743 - TRAIN-LOGGER - INFO - Epoch 254 - TRAIN - Minibatch 0: weight_norm_model: 143.882324 loss: 0.983264 grad_norm_before_clip: 2.200669 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 02:29:20,043 - TRAIN-LOGGER - INFO - Epoch 254 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.882324 weight_norm_u: 25.218954 loss: 0.983264 grad_norm_before_clip: 2.200669 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 02:29:20,043 - TRAIN-LOGGER - INFO - Epoch 254 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.882339 weight_norm_u: 25.222990 loss: 0.982137 +RANK_0 - 2026-01-29 02:29:24,798 - TRAIN-LOGGER - INFO - Epoch 255 - TRAIN - Minibatch 0: weight_norm_model: 143.882339 loss: 0.982137 grad_norm_before_clip: 1.016075 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 02:29:25,987 - TRAIN-LOGGER - INFO - Epoch 255 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.882339 weight_norm_u: 25.218954 loss: 0.982137 grad_norm_before_clip: 1.016075 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 02:29:25,987 - TRAIN-LOGGER - INFO - Epoch 255 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.882370 weight_norm_u: 25.222990 loss: 0.987623 +RANK_0 - 2026-01-29 02:29:31,165 - TRAIN-LOGGER - INFO - Epoch 256 - TRAIN - Minibatch 0: weight_norm_model: 143.882370 loss: 0.987623 grad_norm_before_clip: 4.612750 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 02:29:32,357 - TRAIN-LOGGER - INFO - Epoch 256 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.882370 weight_norm_u: 25.218954 loss: 0.987623 grad_norm_before_clip: 4.612750 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 02:29:32,358 - TRAIN-LOGGER - INFO - Epoch 256 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.882370 weight_norm_u: 25.222990 loss: 0.989585 +RANK_0 - 2026-01-29 02:29:37,199 - TRAIN-LOGGER - INFO - Epoch 257 - TRAIN - Minibatch 0: weight_norm_model: 143.882370 loss: 0.989585 grad_norm_before_clip: 4.918383 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 02:29:38,354 - TRAIN-LOGGER - INFO - Epoch 257 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.882370 weight_norm_u: 25.218954 loss: 0.989585 grad_norm_before_clip: 4.918383 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 02:29:38,355 - TRAIN-LOGGER - INFO - Epoch 257 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.882370 weight_norm_u: 25.222990 loss: 0.985353 +RANK_0 - 2026-01-29 02:29:43,211 - TRAIN-LOGGER - INFO - Epoch 258 - TRAIN - Minibatch 0: weight_norm_model: 143.882370 loss: 0.985353 grad_norm_before_clip: 3.915471 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 02:29:44,445 - TRAIN-LOGGER - INFO - Epoch 258 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.882370 weight_norm_u: 25.218954 loss: 0.985353 grad_norm_before_clip: 3.915471 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 02:29:44,445 - TRAIN-LOGGER - INFO - Epoch 258 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.882339 weight_norm_u: 25.222990 loss: 0.983233 +RANK_0 - 2026-01-29 02:29:49,479 - TRAIN-LOGGER - INFO - Epoch 259 - TRAIN - Minibatch 0: weight_norm_model: 143.882339 loss: 0.983233 grad_norm_before_clip: 2.370028 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 02:29:50,749 - TRAIN-LOGGER - INFO - Epoch 259 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.882339 weight_norm_u: 25.218954 loss: 0.983233 grad_norm_before_clip: 2.370028 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 02:29:50,749 - TRAIN-LOGGER - INFO - Epoch 259 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.882339 weight_norm_u: 25.222990 loss: 0.984328 +RANK_0 - 2026-01-29 02:29:55,309 - TRAIN-LOGGER - INFO - Epoch 260 - TRAIN - Minibatch 0: weight_norm_model: 143.882339 loss: 0.984328 grad_norm_before_clip: 2.582655 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 02:29:56,457 - TRAIN-LOGGER - INFO - Epoch 260 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.882339 weight_norm_u: 25.218954 loss: 0.984328 grad_norm_before_clip: 2.582655 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 02:29:56,457 - TRAIN-LOGGER - INFO - Epoch 260 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.882355 weight_norm_u: 25.222990 loss: 0.982689 +RANK_0 - 2026-01-29 02:30:01,252 - TRAIN-LOGGER - INFO - Epoch 261 - TRAIN - Minibatch 0: weight_norm_model: 143.882355 loss: 0.982689 grad_norm_before_clip: 2.566282 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 02:30:02,435 - TRAIN-LOGGER - INFO - Epoch 261 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.882355 weight_norm_u: 25.218954 loss: 0.982689 grad_norm_before_clip: 2.566282 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 02:30:02,435 - TRAIN-LOGGER - INFO - Epoch 261 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.882385 weight_norm_u: 25.222990 loss: 0.982207 +RANK_0 - 2026-01-29 02:30:06,304 - TRAIN-LOGGER - INFO - Epoch 262 - TRAIN - Minibatch 0: weight_norm_model: 143.882385 loss: 0.982207 grad_norm_before_clip: 3.385978 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 02:30:07,424 - TRAIN-LOGGER - INFO - Epoch 262 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.882385 weight_norm_u: 25.218954 loss: 0.982207 grad_norm_before_clip: 3.385978 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 02:30:07,424 - TRAIN-LOGGER - INFO - Epoch 262 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.882385 weight_norm_u: 25.222990 loss: 0.982888 +RANK_0 - 2026-01-29 02:30:12,169 - TRAIN-LOGGER - INFO - Epoch 263 - TRAIN - Minibatch 0: weight_norm_model: 143.882385 loss: 0.982888 grad_norm_before_clip: 4.327093 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 02:30:13,331 - TRAIN-LOGGER - INFO - Epoch 263 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.882385 weight_norm_u: 25.218954 loss: 0.982888 grad_norm_before_clip: 4.327093 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 02:30:13,331 - TRAIN-LOGGER - INFO - Epoch 263 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.882385 weight_norm_u: 25.222990 loss: 0.982476 +RANK_0 - 2026-01-29 02:30:18,124 - TRAIN-LOGGER - INFO - Epoch 264 - TRAIN - Minibatch 0: weight_norm_model: 143.882385 loss: 0.982476 grad_norm_before_clip: 2.058598 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 02:30:19,239 - TRAIN-LOGGER - INFO - Epoch 264 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.882385 weight_norm_u: 25.218954 loss: 0.982476 grad_norm_before_clip: 2.058598 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 02:30:19,239 - TRAIN-LOGGER - INFO - Epoch 264 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.882385 weight_norm_u: 25.222990 loss: 0.982608 +RANK_0 - 2026-01-29 02:30:23,925 - TRAIN-LOGGER - INFO - Epoch 265 - TRAIN - Minibatch 0: weight_norm_model: 143.882385 loss: 0.982608 grad_norm_before_clip: 3.558254 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 02:30:25,065 - TRAIN-LOGGER - INFO - Epoch 265 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.882385 weight_norm_u: 25.218954 loss: 0.982608 grad_norm_before_clip: 3.558254 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 02:30:25,066 - TRAIN-LOGGER - INFO - Epoch 265 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.882401 weight_norm_u: 25.222990 loss: 0.981984 +RANK_0 - 2026-01-29 02:30:30,040 - TRAIN-LOGGER - INFO - Epoch 266 - TRAIN - Minibatch 0: weight_norm_model: 143.882401 loss: 0.981984 grad_norm_before_clip: 1.959135 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 02:30:31,284 - TRAIN-LOGGER - INFO - Epoch 266 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.882401 weight_norm_u: 25.218954 loss: 0.981984 grad_norm_before_clip: 1.959135 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 02:30:31,284 - TRAIN-LOGGER - INFO - Epoch 266 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.882416 weight_norm_u: 25.222990 loss: 0.983021 +RANK_0 - 2026-01-29 02:30:35,926 - TRAIN-LOGGER - INFO - Epoch 267 - TRAIN - Minibatch 0: weight_norm_model: 143.882416 loss: 0.983021 grad_norm_before_clip: 3.919225 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 02:30:37,044 - TRAIN-LOGGER - INFO - Epoch 267 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.882416 weight_norm_u: 25.218954 loss: 0.983021 grad_norm_before_clip: 3.919225 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 02:30:37,045 - TRAIN-LOGGER - INFO - Epoch 267 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.882416 weight_norm_u: 25.222990 loss: 0.981159 +RANK_0 - 2026-01-29 02:30:41,959 - TRAIN-LOGGER - INFO - Epoch 268 - TRAIN - Minibatch 0: weight_norm_model: 143.882416 loss: 0.981159 grad_norm_before_clip: 2.162080 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 02:30:43,186 - TRAIN-LOGGER - INFO - Epoch 268 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.882416 weight_norm_u: 25.218954 loss: 0.981159 grad_norm_before_clip: 2.162080 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 02:30:43,187 - TRAIN-LOGGER - INFO - Epoch 268 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.882401 weight_norm_u: 25.222990 loss: 0.981077 +RANK_0 - 2026-01-29 02:30:47,994 - TRAIN-LOGGER - INFO - Epoch 269 - TRAIN - Minibatch 0: weight_norm_model: 143.882401 loss: 0.981077 grad_norm_before_clip: 1.976025 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 02:30:49,296 - TRAIN-LOGGER - INFO - Epoch 269 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.882401 weight_norm_u: 25.218954 loss: 0.981077 grad_norm_before_clip: 1.976025 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 02:30:49,297 - TRAIN-LOGGER - INFO - Epoch 269 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.882416 weight_norm_u: 25.222990 loss: 0.980999 +RANK_0 - 2026-01-29 02:30:54,227 - TRAIN-LOGGER - INFO - Epoch 270 - TRAIN - Minibatch 0: weight_norm_model: 143.882416 loss: 0.980999 grad_norm_before_clip: 2.228281 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 02:30:55,548 - TRAIN-LOGGER - INFO - Epoch 270 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.882416 weight_norm_u: 25.218954 loss: 0.980999 grad_norm_before_clip: 2.228281 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 02:30:55,548 - TRAIN-LOGGER - INFO - Epoch 270 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.882446 weight_norm_u: 25.222990 loss: 0.981125 +RANK_0 - 2026-01-29 02:30:59,884 - TRAIN-LOGGER - INFO - Epoch 271 - TRAIN - Minibatch 0: weight_norm_model: 143.882446 loss: 0.981125 grad_norm_before_clip: 2.106451 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 02:31:01,119 - TRAIN-LOGGER - INFO - Epoch 271 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.882446 weight_norm_u: 25.218954 loss: 0.981125 grad_norm_before_clip: 2.106451 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 02:31:01,119 - TRAIN-LOGGER - INFO - Epoch 271 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.882446 weight_norm_u: 25.222990 loss: 0.980535 +RANK_0 - 2026-01-29 02:31:06,188 - TRAIN-LOGGER - INFO - Epoch 272 - TRAIN - Minibatch 0: weight_norm_model: 143.882446 loss: 0.980535 grad_norm_before_clip: 2.611448 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 02:31:07,471 - TRAIN-LOGGER - INFO - Epoch 272 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.882446 weight_norm_u: 25.218954 loss: 0.980535 grad_norm_before_clip: 2.611448 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 02:31:07,471 - TRAIN-LOGGER - INFO - Epoch 272 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.882446 weight_norm_u: 25.222990 loss: 0.981543 +RANK_0 - 2026-01-29 02:31:12,140 - TRAIN-LOGGER - INFO - Epoch 273 - TRAIN - Minibatch 0: weight_norm_model: 143.882446 loss: 0.981543 grad_norm_before_clip: 2.209373 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 02:31:13,348 - TRAIN-LOGGER - INFO - Epoch 273 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.882446 weight_norm_u: 25.218954 loss: 0.981543 grad_norm_before_clip: 2.209373 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 02:31:13,349 - TRAIN-LOGGER - INFO - Epoch 273 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.882446 weight_norm_u: 25.222990 loss: 0.981687 +RANK_0 - 2026-01-29 02:31:18,363 - TRAIN-LOGGER - INFO - Epoch 274 - TRAIN - Minibatch 0: weight_norm_model: 143.882446 loss: 0.981687 grad_norm_before_clip: 2.546505 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 02:31:19,571 - TRAIN-LOGGER - INFO - Epoch 274 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.882446 weight_norm_u: 25.218954 loss: 0.981687 grad_norm_before_clip: 2.546505 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 02:31:19,571 - TRAIN-LOGGER - INFO - Epoch 274 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.882446 weight_norm_u: 25.222990 loss: 0.980119 +RANK_0 - 2026-01-29 02:31:24,260 - TRAIN-LOGGER - INFO - Epoch 275 - TRAIN - Minibatch 0: weight_norm_model: 143.882446 loss: 0.980119 grad_norm_before_clip: 1.656742 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 02:31:25,410 - TRAIN-LOGGER - INFO - Epoch 275 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.882446 weight_norm_u: 25.218954 loss: 0.980119 grad_norm_before_clip: 1.656742 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 02:31:25,411 - TRAIN-LOGGER - INFO - Epoch 275 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.882477 weight_norm_u: 25.222990 loss: 0.985922 +RANK_0 - 2026-01-29 02:31:30,032 - TRAIN-LOGGER - INFO - Epoch 276 - TRAIN - Minibatch 0: weight_norm_model: 143.882477 loss: 0.985922 grad_norm_before_clip: 4.382802 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 02:31:31,177 - TRAIN-LOGGER - INFO - Epoch 276 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.882477 weight_norm_u: 25.218954 loss: 0.985922 grad_norm_before_clip: 4.382802 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 02:31:31,177 - TRAIN-LOGGER - INFO - Epoch 276 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.882492 weight_norm_u: 25.222990 loss: 0.989582 +RANK_0 - 2026-01-29 02:31:35,228 - TRAIN-LOGGER - INFO - Epoch 277 - TRAIN - Minibatch 0: weight_norm_model: 143.882492 loss: 0.989582 grad_norm_before_clip: 5.040561 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 02:31:36,400 - TRAIN-LOGGER - INFO - Epoch 277 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.882492 weight_norm_u: 25.218954 loss: 0.989582 grad_norm_before_clip: 5.040561 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 02:31:36,401 - TRAIN-LOGGER - INFO - Epoch 277 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.882492 weight_norm_u: 25.222990 loss: 0.986629 +RANK_0 - 2026-01-29 02:31:40,968 - TRAIN-LOGGER - INFO - Epoch 278 - TRAIN - Minibatch 0: weight_norm_model: 143.882492 loss: 0.986629 grad_norm_before_clip: 5.107530 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 02:31:42,181 - TRAIN-LOGGER - INFO - Epoch 278 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.882492 weight_norm_u: 25.218954 loss: 0.986629 grad_norm_before_clip: 5.107530 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 02:31:42,181 - TRAIN-LOGGER - INFO - Epoch 278 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.882492 weight_norm_u: 25.222990 loss: 0.980966 +RANK_0 - 2026-01-29 02:31:46,884 - TRAIN-LOGGER - INFO - Epoch 279 - TRAIN - Minibatch 0: weight_norm_model: 143.882492 loss: 0.980966 grad_norm_before_clip: 2.627697 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 02:31:48,108 - TRAIN-LOGGER - INFO - Epoch 279 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.882492 weight_norm_u: 25.218954 loss: 0.980966 grad_norm_before_clip: 2.627697 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 02:31:48,108 - TRAIN-LOGGER - INFO - Epoch 279 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.882492 weight_norm_u: 25.222990 loss: 0.982126 +RANK_0 - 2026-01-29 02:31:53,459 - TRAIN-LOGGER - INFO - Epoch 280 - TRAIN - Minibatch 0: weight_norm_model: 143.882492 loss: 0.982126 grad_norm_before_clip: 3.702847 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 02:31:54,657 - TRAIN-LOGGER - INFO - Epoch 280 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.882492 weight_norm_u: 25.218954 loss: 0.982126 grad_norm_before_clip: 3.702847 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 02:31:54,657 - TRAIN-LOGGER - INFO - Epoch 280 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.882507 weight_norm_u: 25.222990 loss: 0.987683 +RANK_0 - 2026-01-29 02:31:59,129 - TRAIN-LOGGER - INFO - Epoch 281 - TRAIN - Minibatch 0: weight_norm_model: 143.882507 loss: 0.987683 grad_norm_before_clip: 6.024002 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 02:32:00,322 - TRAIN-LOGGER - INFO - Epoch 281 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.882507 weight_norm_u: 25.218954 loss: 0.987683 grad_norm_before_clip: 6.024002 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 02:32:00,322 - TRAIN-LOGGER - INFO - Epoch 281 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.882523 weight_norm_u: 25.222990 loss: 0.986246 +RANK_0 - 2026-01-29 02:32:05,733 - TRAIN-LOGGER - INFO - Epoch 282 - TRAIN - Minibatch 0: weight_norm_model: 143.882523 loss: 0.986246 grad_norm_before_clip: 5.014098 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 02:32:06,872 - TRAIN-LOGGER - INFO - Epoch 282 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.882523 weight_norm_u: 25.218954 loss: 0.986246 grad_norm_before_clip: 5.014098 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 02:32:06,872 - TRAIN-LOGGER - INFO - Epoch 282 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.882553 weight_norm_u: 25.222990 loss: 0.983076 +RANK_0 - 2026-01-29 02:32:11,501 - TRAIN-LOGGER - INFO - Epoch 283 - TRAIN - Minibatch 0: weight_norm_model: 143.882553 loss: 0.983076 grad_norm_before_clip: 1.824196 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 02:32:12,645 - TRAIN-LOGGER - INFO - Epoch 283 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.882553 weight_norm_u: 25.218954 loss: 0.983076 grad_norm_before_clip: 1.824196 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 02:32:12,645 - TRAIN-LOGGER - INFO - Epoch 283 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.882568 weight_norm_u: 25.222990 loss: 0.983468 +RANK_0 - 2026-01-29 02:32:17,571 - TRAIN-LOGGER - INFO - Epoch 284 - TRAIN - Minibatch 0: weight_norm_model: 143.882568 loss: 0.983468 grad_norm_before_clip: 3.148238 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 02:32:18,789 - TRAIN-LOGGER - INFO - Epoch 284 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.882568 weight_norm_u: 25.218954 loss: 0.983468 grad_norm_before_clip: 3.148238 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 02:32:18,790 - TRAIN-LOGGER - INFO - Epoch 284 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.882568 weight_norm_u: 25.222990 loss: 0.982754 +RANK_0 - 2026-01-29 02:32:22,969 - TRAIN-LOGGER - INFO - Epoch 285 - TRAIN - Minibatch 0: weight_norm_model: 143.882568 loss: 0.982754 grad_norm_before_clip: 3.791995 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 02:32:24,099 - TRAIN-LOGGER - INFO - Epoch 285 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.882568 weight_norm_u: 25.218954 loss: 0.982754 grad_norm_before_clip: 3.791995 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 02:32:24,100 - TRAIN-LOGGER - INFO - Epoch 285 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.882568 weight_norm_u: 25.222990 loss: 0.980997 +RANK_0 - 2026-01-29 02:32:28,535 - TRAIN-LOGGER - INFO - Epoch 286 - TRAIN - Minibatch 0: weight_norm_model: 143.882568 loss: 0.980997 grad_norm_before_clip: 2.575469 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 02:32:29,976 - TRAIN-LOGGER - INFO - Epoch 286 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.882568 weight_norm_u: 25.218954 loss: 0.980997 grad_norm_before_clip: 2.575469 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 02:32:29,976 - TRAIN-LOGGER - INFO - Epoch 286 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.882553 weight_norm_u: 25.222990 loss: 0.982119 +RANK_0 - 2026-01-29 02:32:34,584 - TRAIN-LOGGER - INFO - Epoch 287 - TRAIN - Minibatch 0: weight_norm_model: 143.882553 loss: 0.982119 grad_norm_before_clip: 3.087044 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 02:32:35,807 - TRAIN-LOGGER - INFO - Epoch 287 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.882553 weight_norm_u: 25.218954 loss: 0.982119 grad_norm_before_clip: 3.087044 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 02:32:35,808 - TRAIN-LOGGER - INFO - Epoch 287 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.882553 weight_norm_u: 25.222990 loss: 0.984532 +RANK_0 - 2026-01-29 02:32:40,123 - TRAIN-LOGGER - INFO - Epoch 288 - TRAIN - Minibatch 0: weight_norm_model: 143.882553 loss: 0.984532 grad_norm_before_clip: 5.345019 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 02:32:41,428 - TRAIN-LOGGER - INFO - Epoch 288 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.882553 weight_norm_u: 25.218954 loss: 0.984532 grad_norm_before_clip: 5.345019 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 02:32:41,428 - TRAIN-LOGGER - INFO - Epoch 288 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.882568 weight_norm_u: 25.222990 loss: 0.980792 +RANK_0 - 2026-01-29 02:32:46,465 - TRAIN-LOGGER - INFO - Epoch 289 - TRAIN - Minibatch 0: weight_norm_model: 143.882568 loss: 0.980792 grad_norm_before_clip: 3.220650 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 02:32:47,665 - TRAIN-LOGGER - INFO - Epoch 289 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.882568 weight_norm_u: 25.218954 loss: 0.980792 grad_norm_before_clip: 3.220650 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 02:32:47,665 - TRAIN-LOGGER - INFO - Epoch 289 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.882599 weight_norm_u: 25.222990 loss: 0.980656 +RANK_0 - 2026-01-29 02:32:52,039 - TRAIN-LOGGER - INFO - Epoch 290 - TRAIN - Minibatch 0: weight_norm_model: 143.882599 loss: 0.980656 grad_norm_before_clip: 3.913691 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 02:32:53,484 - TRAIN-LOGGER - INFO - Epoch 290 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.882599 weight_norm_u: 25.218954 loss: 0.980656 grad_norm_before_clip: 3.913691 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 02:32:53,484 - TRAIN-LOGGER - INFO - Epoch 290 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.882614 weight_norm_u: 25.222990 loss: 0.981335 +RANK_0 - 2026-01-29 02:32:58,104 - TRAIN-LOGGER - INFO - Epoch 291 - TRAIN - Minibatch 0: weight_norm_model: 143.882614 loss: 0.981335 grad_norm_before_clip: 4.381890 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 02:32:59,337 - TRAIN-LOGGER - INFO - Epoch 291 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.882614 weight_norm_u: 25.218954 loss: 0.981335 grad_norm_before_clip: 4.381890 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 02:32:59,337 - TRAIN-LOGGER - INFO - Epoch 291 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.882614 weight_norm_u: 25.222990 loss: 0.980353 +RANK_0 - 2026-01-29 02:33:03,781 - TRAIN-LOGGER - INFO - Epoch 292 - TRAIN - Minibatch 0: weight_norm_model: 143.882614 loss: 0.980353 grad_norm_before_clip: 2.482820 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 02:33:05,278 - TRAIN-LOGGER - INFO - Epoch 292 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.882614 weight_norm_u: 25.218954 loss: 0.980353 grad_norm_before_clip: 2.482820 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 02:33:05,278 - TRAIN-LOGGER - INFO - Epoch 292 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.882614 weight_norm_u: 25.222990 loss: 0.980199 +RANK_0 - 2026-01-29 02:33:09,865 - TRAIN-LOGGER - INFO - Epoch 293 - TRAIN - Minibatch 0: weight_norm_model: 143.882614 loss: 0.980199 grad_norm_before_clip: 2.835707 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 02:33:11,002 - TRAIN-LOGGER - INFO - Epoch 293 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.882614 weight_norm_u: 25.218954 loss: 0.980199 grad_norm_before_clip: 2.835707 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 02:33:11,002 - TRAIN-LOGGER - INFO - Epoch 293 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.882614 weight_norm_u: 25.222990 loss: 0.981909 +RANK_0 - 2026-01-29 02:33:15,331 - TRAIN-LOGGER - INFO - Epoch 294 - TRAIN - Minibatch 0: weight_norm_model: 143.882614 loss: 0.981909 grad_norm_before_clip: 3.762832 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 02:33:16,450 - TRAIN-LOGGER - INFO - Epoch 294 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.882614 weight_norm_u: 25.218954 loss: 0.981909 grad_norm_before_clip: 3.762832 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 02:33:16,450 - TRAIN-LOGGER - INFO - Epoch 294 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.882629 weight_norm_u: 25.222990 loss: 0.979830 +RANK_0 - 2026-01-29 02:33:21,506 - TRAIN-LOGGER - INFO - Epoch 295 - TRAIN - Minibatch 0: weight_norm_model: 143.882629 loss: 0.979830 grad_norm_before_clip: 2.119301 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 02:33:22,730 - TRAIN-LOGGER - INFO - Epoch 295 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.882629 weight_norm_u: 25.218954 loss: 0.979830 grad_norm_before_clip: 2.119301 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 02:33:22,730 - TRAIN-LOGGER - INFO - Epoch 295 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.882645 weight_norm_u: 25.222990 loss: 0.979658 +RANK_0 - 2026-01-29 02:33:27,380 - TRAIN-LOGGER - INFO - Epoch 296 - TRAIN - Minibatch 0: weight_norm_model: 143.882645 loss: 0.979658 grad_norm_before_clip: 2.501604 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 02:33:28,516 - TRAIN-LOGGER - INFO - Epoch 296 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.882645 weight_norm_u: 25.218954 loss: 0.979658 grad_norm_before_clip: 2.501604 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 02:33:28,516 - TRAIN-LOGGER - INFO - Epoch 296 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.882660 weight_norm_u: 25.222990 loss: 0.980046 +RANK_0 - 2026-01-29 02:33:33,395 - TRAIN-LOGGER - INFO - Epoch 297 - TRAIN - Minibatch 0: weight_norm_model: 143.882660 loss: 0.980046 grad_norm_before_clip: 3.903155 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 02:33:34,549 - TRAIN-LOGGER - INFO - Epoch 297 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.882660 weight_norm_u: 25.218954 loss: 0.980046 grad_norm_before_clip: 3.903155 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 02:33:34,549 - TRAIN-LOGGER - INFO - Epoch 297 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.882660 weight_norm_u: 25.222990 loss: 0.977776 +RANK_0 - 2026-01-29 02:33:39,203 - TRAIN-LOGGER - INFO - Epoch 298 - TRAIN - Minibatch 0: weight_norm_model: 143.882660 loss: 0.977776 grad_norm_before_clip: 1.664288 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 02:33:40,424 - TRAIN-LOGGER - INFO - Epoch 298 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.882660 weight_norm_u: 25.218954 loss: 0.977776 grad_norm_before_clip: 1.664288 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 02:33:40,425 - TRAIN-LOGGER - INFO - Epoch 298 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.882645 weight_norm_u: 25.222990 loss: 0.980707 +RANK_0 - 2026-01-29 02:33:44,871 - TRAIN-LOGGER - INFO - Epoch 299 - TRAIN - Minibatch 0: weight_norm_model: 143.882645 loss: 0.980707 grad_norm_before_clip: 3.848000 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 02:33:46,105 - TRAIN-LOGGER - INFO - Epoch 299 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.882645 weight_norm_u: 25.218954 loss: 0.980707 grad_norm_before_clip: 3.848000 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 02:33:46,105 - TRAIN-LOGGER - INFO - Epoch 299 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.882660 weight_norm_u: 25.222990 loss: 0.981943 +RANK_0 - 2026-01-29 02:33:50,156 - TRAIN-LOGGER - INFO - Epoch 300 - TRAIN - Minibatch 0: weight_norm_model: 143.882660 loss: 0.981943 grad_norm_before_clip: 4.786485 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 02:33:51,269 - TRAIN-LOGGER - INFO - Epoch 300 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.882660 weight_norm_u: 25.218954 loss: 0.981943 grad_norm_before_clip: 4.786485 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 02:33:51,270 - TRAIN-LOGGER - INFO - Epoch 300 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.882675 weight_norm_u: 25.222990 loss: 0.979291 +RANK_0 - 2026-01-29 02:33:55,457 - TRAIN-LOGGER - INFO - Epoch 301 - TRAIN - Minibatch 0: weight_norm_model: 143.882675 loss: 0.979291 grad_norm_before_clip: 2.414604 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 02:33:56,744 - TRAIN-LOGGER - INFO - Epoch 301 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.882675 weight_norm_u: 25.218954 loss: 0.979291 grad_norm_before_clip: 2.414604 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 02:33:56,747 - TRAIN-LOGGER - INFO - Epoch 301 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.882706 weight_norm_u: 25.222990 loss: 0.979882 +RANK_0 - 2026-01-29 02:34:01,021 - TRAIN-LOGGER - INFO - Epoch 302 - TRAIN - Minibatch 0: weight_norm_model: 143.882706 loss: 0.979882 grad_norm_before_clip: 4.204621 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 02:34:02,197 - TRAIN-LOGGER - INFO - Epoch 302 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.882706 weight_norm_u: 25.218954 loss: 0.979882 grad_norm_before_clip: 4.204621 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 02:34:02,197 - TRAIN-LOGGER - INFO - Epoch 302 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.882721 weight_norm_u: 25.222990 loss: 0.981811 +RANK_0 - 2026-01-29 02:34:06,836 - TRAIN-LOGGER - INFO - Epoch 303 - TRAIN - Minibatch 0: weight_norm_model: 143.882721 loss: 0.981811 grad_norm_before_clip: 4.345522 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 02:34:08,039 - TRAIN-LOGGER - INFO - Epoch 303 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.882721 weight_norm_u: 25.218954 loss: 0.981811 grad_norm_before_clip: 4.345522 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 02:34:08,039 - TRAIN-LOGGER - INFO - Epoch 303 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.882736 weight_norm_u: 25.222990 loss: 0.979100 +RANK_0 - 2026-01-29 02:34:12,691 - TRAIN-LOGGER - INFO - Epoch 304 - TRAIN - Minibatch 0: weight_norm_model: 143.882736 loss: 0.979100 grad_norm_before_clip: 2.661359 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 02:34:13,828 - TRAIN-LOGGER - INFO - Epoch 304 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.882736 weight_norm_u: 25.218954 loss: 0.979100 grad_norm_before_clip: 2.661359 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 02:34:13,829 - TRAIN-LOGGER - INFO - Epoch 304 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.882721 weight_norm_u: 25.222990 loss: 0.977842 +RANK_0 - 2026-01-29 02:34:18,437 - TRAIN-LOGGER - INFO - Epoch 305 - TRAIN - Minibatch 0: weight_norm_model: 143.882721 loss: 0.977842 grad_norm_before_clip: 1.674226 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 02:34:19,732 - TRAIN-LOGGER - INFO - Epoch 305 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.882721 weight_norm_u: 25.218954 loss: 0.977842 grad_norm_before_clip: 1.674226 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 02:34:19,732 - TRAIN-LOGGER - INFO - Epoch 305 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.882721 weight_norm_u: 25.222990 loss: 0.979390 +RANK_0 - 2026-01-29 02:34:24,861 - TRAIN-LOGGER - INFO - Epoch 306 - TRAIN - Minibatch 0: weight_norm_model: 143.882721 loss: 0.979390 grad_norm_before_clip: 4.000061 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 02:34:26,051 - TRAIN-LOGGER - INFO - Epoch 306 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.882721 weight_norm_u: 25.218954 loss: 0.979390 grad_norm_before_clip: 4.000061 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 02:34:26,051 - TRAIN-LOGGER - INFO - Epoch 306 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.882736 weight_norm_u: 25.222990 loss: 0.979255 +RANK_0 - 2026-01-29 02:34:30,465 - TRAIN-LOGGER - INFO - Epoch 307 - TRAIN - Minibatch 0: weight_norm_model: 143.882736 loss: 0.979255 grad_norm_before_clip: 4.008959 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 02:34:31,644 - TRAIN-LOGGER - INFO - Epoch 307 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.882736 weight_norm_u: 25.218954 loss: 0.979255 grad_norm_before_clip: 4.008959 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 02:34:31,644 - TRAIN-LOGGER - INFO - Epoch 307 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.882751 weight_norm_u: 25.222990 loss: 0.976802 +RANK_0 - 2026-01-29 02:34:36,955 - TRAIN-LOGGER - INFO - Epoch 308 - TRAIN - Minibatch 0: weight_norm_model: 143.882751 loss: 0.976802 grad_norm_before_clip: 2.027844 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 02:34:38,163 - TRAIN-LOGGER - INFO - Epoch 308 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.882751 weight_norm_u: 25.218954 loss: 0.976802 grad_norm_before_clip: 2.027844 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 02:34:38,163 - TRAIN-LOGGER - INFO - Epoch 308 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.882767 weight_norm_u: 25.222990 loss: 0.977698 +RANK_0 - 2026-01-29 02:34:42,974 - TRAIN-LOGGER - INFO - Epoch 309 - TRAIN - Minibatch 0: weight_norm_model: 143.882767 loss: 0.977698 grad_norm_before_clip: 3.556867 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 02:34:44,470 - TRAIN-LOGGER - INFO - Epoch 309 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.882767 weight_norm_u: 25.218954 loss: 0.977698 grad_norm_before_clip: 3.556867 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 02:34:44,471 - TRAIN-LOGGER - INFO - Epoch 309 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.882751 weight_norm_u: 25.222990 loss: 0.977015 +RANK_0 - 2026-01-29 02:34:49,816 - TRAIN-LOGGER - INFO - Epoch 310 - TRAIN - Minibatch 0: weight_norm_model: 143.882751 loss: 0.977015 grad_norm_before_clip: 1.615336 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 02:34:50,999 - TRAIN-LOGGER - INFO - Epoch 310 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.882751 weight_norm_u: 25.218954 loss: 0.977015 grad_norm_before_clip: 1.615336 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 02:34:50,999 - TRAIN-LOGGER - INFO - Epoch 310 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.882751 weight_norm_u: 25.222990 loss: 0.976621 +RANK_0 - 2026-01-29 02:34:56,108 - TRAIN-LOGGER - INFO - Epoch 311 - TRAIN - Minibatch 0: weight_norm_model: 143.882751 loss: 0.976621 grad_norm_before_clip: 1.377861 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 02:34:57,293 - TRAIN-LOGGER - INFO - Epoch 311 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.882751 weight_norm_u: 25.218954 loss: 0.976621 grad_norm_before_clip: 1.377861 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 02:34:57,294 - TRAIN-LOGGER - INFO - Epoch 311 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.882751 weight_norm_u: 25.222990 loss: 0.976430 +RANK_0 - 2026-01-29 02:35:01,743 - TRAIN-LOGGER - INFO - Epoch 312 - TRAIN - Minibatch 0: weight_norm_model: 143.882751 loss: 0.976430 grad_norm_before_clip: 1.347843 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 02:35:02,866 - TRAIN-LOGGER - INFO - Epoch 312 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.882751 weight_norm_u: 25.218954 loss: 0.976430 grad_norm_before_clip: 1.347843 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 02:35:02,866 - TRAIN-LOGGER - INFO - Epoch 312 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.882751 weight_norm_u: 25.222990 loss: 0.977288 +RANK_0 - 2026-01-29 02:35:07,131 - TRAIN-LOGGER - INFO - Epoch 313 - TRAIN - Minibatch 0: weight_norm_model: 143.882751 loss: 0.977288 grad_norm_before_clip: 2.403018 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 02:35:08,640 - TRAIN-LOGGER - INFO - Epoch 313 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.882751 weight_norm_u: 25.218954 loss: 0.977288 grad_norm_before_clip: 2.403018 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 02:35:08,640 - TRAIN-LOGGER - INFO - Epoch 313 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.882751 weight_norm_u: 25.222990 loss: 0.977123 +RANK_0 - 2026-01-29 02:35:12,692 - TRAIN-LOGGER - INFO - Epoch 314 - TRAIN - Minibatch 0: weight_norm_model: 143.882751 loss: 0.977123 grad_norm_before_clip: 2.512341 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 02:35:13,831 - TRAIN-LOGGER - INFO - Epoch 314 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.882751 weight_norm_u: 25.218954 loss: 0.977123 grad_norm_before_clip: 2.512341 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 02:35:13,832 - TRAIN-LOGGER - INFO - Epoch 314 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.882767 weight_norm_u: 25.222990 loss: 0.977985 +RANK_0 - 2026-01-29 02:35:18,177 - TRAIN-LOGGER - INFO - Epoch 315 - TRAIN - Minibatch 0: weight_norm_model: 143.882767 loss: 0.977985 grad_norm_before_clip: 3.733257 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 02:35:19,318 - TRAIN-LOGGER - INFO - Epoch 315 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.882767 weight_norm_u: 25.218954 loss: 0.977985 grad_norm_before_clip: 3.733257 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 02:35:19,318 - TRAIN-LOGGER - INFO - Epoch 315 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.882767 weight_norm_u: 25.222990 loss: 0.976277 +RANK_0 - 2026-01-29 02:35:23,739 - TRAIN-LOGGER - INFO - Epoch 316 - TRAIN - Minibatch 0: weight_norm_model: 143.882767 loss: 0.976277 grad_norm_before_clip: 1.342205 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 02:35:24,938 - TRAIN-LOGGER - INFO - Epoch 316 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.882767 weight_norm_u: 25.218954 loss: 0.976277 grad_norm_before_clip: 1.342205 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 02:35:24,938 - TRAIN-LOGGER - INFO - Epoch 316 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.882797 weight_norm_u: 25.222990 loss: 0.975391 +RANK_0 - 2026-01-29 02:35:29,230 - TRAIN-LOGGER - INFO - Epoch 317 - TRAIN - Minibatch 0: weight_norm_model: 143.882797 loss: 0.975391 grad_norm_before_clip: 2.289839 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 02:35:30,424 - TRAIN-LOGGER - INFO - Epoch 317 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.882797 weight_norm_u: 25.218954 loss: 0.975391 grad_norm_before_clip: 2.289839 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 02:35:30,424 - TRAIN-LOGGER - INFO - Epoch 317 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.882812 weight_norm_u: 25.222990 loss: 0.976201 +RANK_0 - 2026-01-29 02:35:34,570 - TRAIN-LOGGER - INFO - Epoch 318 - TRAIN - Minibatch 0: weight_norm_model: 143.882812 loss: 0.976201 grad_norm_before_clip: 1.582125 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 02:35:35,767 - TRAIN-LOGGER - INFO - Epoch 318 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.882812 weight_norm_u: 25.218954 loss: 0.976201 grad_norm_before_clip: 1.582125 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 02:35:35,767 - TRAIN-LOGGER - INFO - Epoch 318 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.882828 weight_norm_u: 25.222990 loss: 0.976566 +RANK_0 - 2026-01-29 02:35:40,134 - TRAIN-LOGGER - INFO - Epoch 319 - TRAIN - Minibatch 0: weight_norm_model: 143.882828 loss: 0.976566 grad_norm_before_clip: 1.876856 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 02:35:41,263 - TRAIN-LOGGER - INFO - Epoch 319 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.882828 weight_norm_u: 25.218954 loss: 0.976566 grad_norm_before_clip: 1.876856 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 02:35:41,264 - TRAIN-LOGGER - INFO - Epoch 319 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.882828 weight_norm_u: 25.222990 loss: 0.974712 +RANK_0 - 2026-01-29 02:35:45,715 - TRAIN-LOGGER - INFO - Epoch 320 - TRAIN - Minibatch 0: weight_norm_model: 143.882828 loss: 0.974712 grad_norm_before_clip: 1.330940 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 02:35:46,837 - TRAIN-LOGGER - INFO - Epoch 320 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.882828 weight_norm_u: 25.218954 loss: 0.974712 grad_norm_before_clip: 1.330940 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 02:35:46,837 - TRAIN-LOGGER - INFO - Epoch 320 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.882843 weight_norm_u: 25.222990 loss: 0.974178 +RANK_0 - 2026-01-29 02:35:51,391 - TRAIN-LOGGER - INFO - Epoch 321 - TRAIN - Minibatch 0: weight_norm_model: 143.882843 loss: 0.974178 grad_norm_before_clip: 1.942337 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 02:35:52,508 - TRAIN-LOGGER - INFO - Epoch 321 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.882843 weight_norm_u: 25.218954 loss: 0.974178 grad_norm_before_clip: 1.942337 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 02:35:52,508 - TRAIN-LOGGER - INFO - Epoch 321 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.882874 weight_norm_u: 25.222990 loss: 0.975578 +RANK_0 - 2026-01-29 02:35:57,092 - TRAIN-LOGGER - INFO - Epoch 322 - TRAIN - Minibatch 0: weight_norm_model: 143.882874 loss: 0.975578 grad_norm_before_clip: 3.099335 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 02:35:58,278 - TRAIN-LOGGER - INFO - Epoch 322 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.882874 weight_norm_u: 25.218954 loss: 0.975578 grad_norm_before_clip: 3.099335 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 02:35:58,279 - TRAIN-LOGGER - INFO - Epoch 322 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.882874 weight_norm_u: 25.222990 loss: 0.975094 +RANK_0 - 2026-01-29 02:36:02,733 - TRAIN-LOGGER - INFO - Epoch 323 - TRAIN - Minibatch 0: weight_norm_model: 143.882874 loss: 0.975094 grad_norm_before_clip: 1.982278 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 02:36:03,923 - TRAIN-LOGGER - INFO - Epoch 323 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.882874 weight_norm_u: 25.218954 loss: 0.975094 grad_norm_before_clip: 1.982278 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 02:36:03,923 - TRAIN-LOGGER - INFO - Epoch 323 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.882889 weight_norm_u: 25.222990 loss: 0.974513 +RANK_0 - 2026-01-29 02:36:08,702 - TRAIN-LOGGER - INFO - Epoch 324 - TRAIN - Minibatch 0: weight_norm_model: 143.882889 loss: 0.974513 grad_norm_before_clip: 1.366703 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 02:36:09,858 - TRAIN-LOGGER - INFO - Epoch 324 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.882889 weight_norm_u: 25.218954 loss: 0.974513 grad_norm_before_clip: 1.366703 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 02:36:09,859 - TRAIN-LOGGER - INFO - Epoch 324 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.882889 weight_norm_u: 25.222990 loss: 0.974518 +RANK_0 - 2026-01-29 02:36:14,718 - TRAIN-LOGGER - INFO - Epoch 325 - TRAIN - Minibatch 0: weight_norm_model: 143.882889 loss: 0.974518 grad_norm_before_clip: 1.884733 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 02:36:15,903 - TRAIN-LOGGER - INFO - Epoch 325 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.882889 weight_norm_u: 25.218954 loss: 0.974518 grad_norm_before_clip: 1.884733 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 02:36:15,903 - TRAIN-LOGGER - INFO - Epoch 325 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.882919 weight_norm_u: 25.222990 loss: 0.977011 +RANK_0 - 2026-01-29 02:36:20,756 - TRAIN-LOGGER - INFO - Epoch 326 - TRAIN - Minibatch 0: weight_norm_model: 143.882919 loss: 0.977011 grad_norm_before_clip: 5.312039 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 02:36:21,942 - TRAIN-LOGGER - INFO - Epoch 326 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.882919 weight_norm_u: 25.218954 loss: 0.977011 grad_norm_before_clip: 5.312039 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 02:36:21,942 - TRAIN-LOGGER - INFO - Epoch 326 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.882935 weight_norm_u: 25.222990 loss: 0.974183 +RANK_0 - 2026-01-29 02:36:26,711 - TRAIN-LOGGER - INFO - Epoch 327 - TRAIN - Minibatch 0: weight_norm_model: 143.882935 loss: 0.974183 grad_norm_before_clip: 2.282224 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 02:36:27,889 - TRAIN-LOGGER - INFO - Epoch 327 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.882935 weight_norm_u: 25.218954 loss: 0.974183 grad_norm_before_clip: 2.282224 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 02:36:27,889 - TRAIN-LOGGER - INFO - Epoch 327 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.882980 weight_norm_u: 25.222990 loss: 0.973851 +RANK_0 - 2026-01-29 02:36:32,170 - TRAIN-LOGGER - INFO - Epoch 328 - TRAIN - Minibatch 0: weight_norm_model: 143.882980 loss: 0.973851 grad_norm_before_clip: 1.494784 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 02:36:33,388 - TRAIN-LOGGER - INFO - Epoch 328 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.882980 weight_norm_u: 25.218954 loss: 0.973851 grad_norm_before_clip: 1.494784 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 02:36:33,389 - TRAIN-LOGGER - INFO - Epoch 328 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.882996 weight_norm_u: 25.222990 loss: 0.975014 +RANK_0 - 2026-01-29 02:36:37,954 - TRAIN-LOGGER - INFO - Epoch 329 - TRAIN - Minibatch 0: weight_norm_model: 143.882996 loss: 0.975014 grad_norm_before_clip: 3.374658 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 02:36:39,180 - TRAIN-LOGGER - INFO - Epoch 329 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.882996 weight_norm_u: 25.218954 loss: 0.975014 grad_norm_before_clip: 3.374658 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 02:36:39,181 - TRAIN-LOGGER - INFO - Epoch 329 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.883011 weight_norm_u: 25.222990 loss: 0.974219 +RANK_0 - 2026-01-29 02:36:43,557 - TRAIN-LOGGER - INFO - Epoch 330 - TRAIN - Minibatch 0: weight_norm_model: 143.883011 loss: 0.974219 grad_norm_before_clip: 2.274560 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 02:36:44,743 - TRAIN-LOGGER - INFO - Epoch 330 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.883011 weight_norm_u: 25.218954 loss: 0.974219 grad_norm_before_clip: 2.274560 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 02:36:44,743 - TRAIN-LOGGER - INFO - Epoch 330 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.883026 weight_norm_u: 25.222990 loss: 0.973635 +RANK_0 - 2026-01-29 02:36:49,024 - TRAIN-LOGGER - INFO - Epoch 331 - TRAIN - Minibatch 0: weight_norm_model: 143.883026 loss: 0.973635 grad_norm_before_clip: 3.177148 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 02:36:50,161 - TRAIN-LOGGER - INFO - Epoch 331 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.883026 weight_norm_u: 25.218954 loss: 0.973635 grad_norm_before_clip: 3.177148 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 02:36:50,161 - TRAIN-LOGGER - INFO - Epoch 331 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.883026 weight_norm_u: 25.222990 loss: 0.972202 +RANK_0 - 2026-01-29 02:36:54,457 - TRAIN-LOGGER - INFO - Epoch 332 - TRAIN - Minibatch 0: weight_norm_model: 143.883026 loss: 0.972202 grad_norm_before_clip: 1.094708 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 02:36:55,655 - TRAIN-LOGGER - INFO - Epoch 332 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.883026 weight_norm_u: 25.218954 loss: 0.972202 grad_norm_before_clip: 1.094708 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 02:36:55,656 - TRAIN-LOGGER - INFO - Epoch 332 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.883041 weight_norm_u: 25.222990 loss: 0.971921 +RANK_0 - 2026-01-29 02:37:00,282 - TRAIN-LOGGER - INFO - Epoch 333 - TRAIN - Minibatch 0: weight_norm_model: 143.883041 loss: 0.971921 grad_norm_before_clip: 4.160634 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 02:37:01,419 - TRAIN-LOGGER - INFO - Epoch 333 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.883041 weight_norm_u: 25.218954 loss: 0.971921 grad_norm_before_clip: 4.160634 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 02:37:01,419 - TRAIN-LOGGER - INFO - Epoch 333 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.883041 weight_norm_u: 25.222990 loss: 0.973616 +RANK_0 - 2026-01-29 02:37:05,757 - TRAIN-LOGGER - INFO - Epoch 334 - TRAIN - Minibatch 0: weight_norm_model: 143.883041 loss: 0.973616 grad_norm_before_clip: 3.403415 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 02:37:06,960 - TRAIN-LOGGER - INFO - Epoch 334 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.883041 weight_norm_u: 25.218954 loss: 0.973616 grad_norm_before_clip: 3.403415 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 02:37:06,960 - TRAIN-LOGGER - INFO - Epoch 334 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.883057 weight_norm_u: 25.222990 loss: 0.972616 +RANK_0 - 2026-01-29 02:37:11,186 - TRAIN-LOGGER - INFO - Epoch 335 - TRAIN - Minibatch 0: weight_norm_model: 143.883057 loss: 0.972616 grad_norm_before_clip: 2.231429 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 02:37:12,396 - TRAIN-LOGGER - INFO - Epoch 335 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.883057 weight_norm_u: 25.218954 loss: 0.972616 grad_norm_before_clip: 2.231429 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 02:37:12,396 - TRAIN-LOGGER - INFO - Epoch 335 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.883057 weight_norm_u: 25.222990 loss: 0.974005 +RANK_0 - 2026-01-29 02:37:16,765 - TRAIN-LOGGER - INFO - Epoch 336 - TRAIN - Minibatch 0: weight_norm_model: 143.883057 loss: 0.974005 grad_norm_before_clip: 4.790339 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 02:37:17,966 - TRAIN-LOGGER - INFO - Epoch 336 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.883057 weight_norm_u: 25.218954 loss: 0.974005 grad_norm_before_clip: 4.790339 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 02:37:17,967 - TRAIN-LOGGER - INFO - Epoch 336 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.883072 weight_norm_u: 25.222990 loss: 0.974590 +RANK_0 - 2026-01-29 02:37:22,734 - TRAIN-LOGGER - INFO - Epoch 337 - TRAIN - Minibatch 0: weight_norm_model: 143.883072 loss: 0.974590 grad_norm_before_clip: 4.467199 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 02:37:23,910 - TRAIN-LOGGER - INFO - Epoch 337 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.883072 weight_norm_u: 25.218954 loss: 0.974590 grad_norm_before_clip: 4.467199 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 02:37:23,910 - TRAIN-LOGGER - INFO - Epoch 337 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.883087 weight_norm_u: 25.222990 loss: 0.973153 +RANK_0 - 2026-01-29 02:37:28,383 - TRAIN-LOGGER - INFO - Epoch 338 - TRAIN - Minibatch 0: weight_norm_model: 143.883087 loss: 0.973153 grad_norm_before_clip: 2.848139 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 02:37:29,582 - TRAIN-LOGGER - INFO - Epoch 338 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.883087 weight_norm_u: 25.218954 loss: 0.973153 grad_norm_before_clip: 2.848139 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 02:37:29,582 - TRAIN-LOGGER - INFO - Epoch 338 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.883102 weight_norm_u: 25.222990 loss: 0.976668 +RANK_0 - 2026-01-29 02:37:34,351 - TRAIN-LOGGER - INFO - Epoch 339 - TRAIN - Minibatch 0: weight_norm_model: 143.883102 loss: 0.976668 grad_norm_before_clip: 5.038091 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 02:37:35,566 - TRAIN-LOGGER - INFO - Epoch 339 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.883102 weight_norm_u: 25.218954 loss: 0.976668 grad_norm_before_clip: 5.038091 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 02:37:35,567 - TRAIN-LOGGER - INFO - Epoch 339 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.883118 weight_norm_u: 25.222990 loss: 0.974417 +RANK_0 - 2026-01-29 02:37:40,525 - TRAIN-LOGGER - INFO - Epoch 340 - TRAIN - Minibatch 0: weight_norm_model: 143.883118 loss: 0.974417 grad_norm_before_clip: 4.629703 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 02:37:41,671 - TRAIN-LOGGER - INFO - Epoch 340 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.883118 weight_norm_u: 25.218954 loss: 0.974417 grad_norm_before_clip: 4.629703 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 02:37:41,672 - TRAIN-LOGGER - INFO - Epoch 340 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.883133 weight_norm_u: 25.222990 loss: 0.973801 +RANK_0 - 2026-01-29 02:37:46,367 - TRAIN-LOGGER - INFO - Epoch 341 - TRAIN - Minibatch 0: weight_norm_model: 143.883133 loss: 0.973801 grad_norm_before_clip: 2.152271 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 02:37:47,495 - TRAIN-LOGGER - INFO - Epoch 341 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.883133 weight_norm_u: 25.218954 loss: 0.973801 grad_norm_before_clip: 2.152271 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 02:37:47,496 - TRAIN-LOGGER - INFO - Epoch 341 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.883133 weight_norm_u: 25.222990 loss: 0.975248 +RANK_0 - 2026-01-29 02:37:52,385 - TRAIN-LOGGER - INFO - Epoch 342 - TRAIN - Minibatch 0: weight_norm_model: 143.883133 loss: 0.975248 grad_norm_before_clip: 6.421844 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 02:37:53,533 - TRAIN-LOGGER - INFO - Epoch 342 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.883133 weight_norm_u: 25.218954 loss: 0.975248 grad_norm_before_clip: 6.421844 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 02:37:53,533 - TRAIN-LOGGER - INFO - Epoch 342 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.883148 weight_norm_u: 25.222990 loss: 0.974798 +RANK_0 - 2026-01-29 02:37:57,819 - TRAIN-LOGGER - INFO - Epoch 343 - TRAIN - Minibatch 0: weight_norm_model: 143.883148 loss: 0.974798 grad_norm_before_clip: 5.803540 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 02:37:58,950 - TRAIN-LOGGER - INFO - Epoch 343 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.883148 weight_norm_u: 25.218954 loss: 0.974798 grad_norm_before_clip: 5.803540 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 02:37:58,950 - TRAIN-LOGGER - INFO - Epoch 343 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.883148 weight_norm_u: 25.222990 loss: 0.971622 +RANK_0 - 2026-01-29 02:38:03,552 - TRAIN-LOGGER - INFO - Epoch 344 - TRAIN - Minibatch 0: weight_norm_model: 143.883148 loss: 0.971622 grad_norm_before_clip: 1.540602 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 02:38:04,661 - TRAIN-LOGGER - INFO - Epoch 344 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.883148 weight_norm_u: 25.218954 loss: 0.971622 grad_norm_before_clip: 1.540602 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 02:38:04,662 - TRAIN-LOGGER - INFO - Epoch 344 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.883148 weight_norm_u: 25.222990 loss: 0.974544 +RANK_0 - 2026-01-29 02:38:08,821 - TRAIN-LOGGER - INFO - Epoch 345 - TRAIN - Minibatch 0: weight_norm_model: 143.883148 loss: 0.974544 grad_norm_before_clip: 4.002094 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 02:38:09,962 - TRAIN-LOGGER - INFO - Epoch 345 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.883148 weight_norm_u: 25.218954 loss: 0.974544 grad_norm_before_clip: 4.002094 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 02:38:09,962 - TRAIN-LOGGER - INFO - Epoch 345 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.883179 weight_norm_u: 25.222990 loss: 0.973831 +RANK_0 - 2026-01-29 02:38:14,229 - TRAIN-LOGGER - INFO - Epoch 346 - TRAIN - Minibatch 0: weight_norm_model: 143.883179 loss: 0.973831 grad_norm_before_clip: 3.746842 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 02:38:15,360 - TRAIN-LOGGER - INFO - Epoch 346 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.883179 weight_norm_u: 25.218954 loss: 0.973831 grad_norm_before_clip: 3.746842 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 02:38:15,360 - TRAIN-LOGGER - INFO - Epoch 346 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.883179 weight_norm_u: 25.222990 loss: 0.972699 +RANK_0 - 2026-01-29 02:38:19,514 - TRAIN-LOGGER - INFO - Epoch 347 - TRAIN - Minibatch 0: weight_norm_model: 143.883179 loss: 0.972699 grad_norm_before_clip: 2.947659 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 02:38:20,682 - TRAIN-LOGGER - INFO - Epoch 347 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.883179 weight_norm_u: 25.218954 loss: 0.972699 grad_norm_before_clip: 2.947659 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 02:38:20,683 - TRAIN-LOGGER - INFO - Epoch 347 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.883179 weight_norm_u: 25.222990 loss: 0.972569 +RANK_0 - 2026-01-29 02:38:24,975 - TRAIN-LOGGER - INFO - Epoch 348 - TRAIN - Minibatch 0: weight_norm_model: 143.883179 loss: 0.972569 grad_norm_before_clip: 3.758466 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 02:38:26,117 - TRAIN-LOGGER - INFO - Epoch 348 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.883179 weight_norm_u: 25.218954 loss: 0.972569 grad_norm_before_clip: 3.758466 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 02:38:26,117 - TRAIN-LOGGER - INFO - Epoch 348 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.883179 weight_norm_u: 25.222990 loss: 0.971014 +RANK_0 - 2026-01-29 02:38:30,582 - TRAIN-LOGGER - INFO - Epoch 349 - TRAIN - Minibatch 0: weight_norm_model: 143.883179 loss: 0.971014 grad_norm_before_clip: 1.963962 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 02:38:31,793 - TRAIN-LOGGER - INFO - Epoch 349 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.883179 weight_norm_u: 25.218954 loss: 0.971014 grad_norm_before_clip: 1.963962 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 02:38:31,793 - TRAIN-LOGGER - INFO - Epoch 349 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.883194 weight_norm_u: 25.222990 loss: 0.974375 +RANK_0 - 2026-01-29 02:38:36,046 - TRAIN-LOGGER - INFO - Epoch 350 - TRAIN - Minibatch 0: weight_norm_model: 143.883194 loss: 0.974375 grad_norm_before_clip: 5.232537 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 02:38:37,283 - TRAIN-LOGGER - INFO - Epoch 350 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.883194 weight_norm_u: 25.218954 loss: 0.974375 grad_norm_before_clip: 5.232537 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 02:38:37,284 - TRAIN-LOGGER - INFO - Epoch 350 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.883194 weight_norm_u: 25.222990 loss: 0.976988 +RANK_0 - 2026-01-29 02:38:41,600 - TRAIN-LOGGER - INFO - Epoch 351 - TRAIN - Minibatch 0: weight_norm_model: 143.883194 loss: 0.976988 grad_norm_before_clip: 4.464149 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 02:38:42,706 - TRAIN-LOGGER - INFO - Epoch 351 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.883194 weight_norm_u: 25.218954 loss: 0.976988 grad_norm_before_clip: 4.464149 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 02:38:42,707 - TRAIN-LOGGER - INFO - Epoch 351 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.883194 weight_norm_u: 25.222990 loss: 0.971441 +RANK_0 - 2026-01-29 02:38:46,996 - TRAIN-LOGGER - INFO - Epoch 352 - TRAIN - Minibatch 0: weight_norm_model: 143.883194 loss: 0.971441 grad_norm_before_clip: 2.130924 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 02:38:48,195 - TRAIN-LOGGER - INFO - Epoch 352 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.883194 weight_norm_u: 25.218954 loss: 0.971441 grad_norm_before_clip: 2.130924 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 02:38:48,196 - TRAIN-LOGGER - INFO - Epoch 352 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.883179 weight_norm_u: 25.222990 loss: 0.973492 +RANK_0 - 2026-01-29 02:38:52,516 - TRAIN-LOGGER - INFO - Epoch 353 - TRAIN - Minibatch 0: weight_norm_model: 143.883179 loss: 0.973492 grad_norm_before_clip: 4.925695 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 02:38:53,706 - TRAIN-LOGGER - INFO - Epoch 353 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.883179 weight_norm_u: 25.218954 loss: 0.973492 grad_norm_before_clip: 4.925695 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 02:38:53,706 - TRAIN-LOGGER - INFO - Epoch 353 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.883179 weight_norm_u: 25.222990 loss: 0.974420 +RANK_0 - 2026-01-29 02:38:58,656 - TRAIN-LOGGER - INFO - Epoch 354 - TRAIN - Minibatch 0: weight_norm_model: 143.883179 loss: 0.974420 grad_norm_before_clip: 4.834776 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 02:38:59,789 - TRAIN-LOGGER - INFO - Epoch 354 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.883179 weight_norm_u: 25.218954 loss: 0.974420 grad_norm_before_clip: 4.834776 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 02:38:59,789 - TRAIN-LOGGER - INFO - Epoch 354 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.883194 weight_norm_u: 25.222990 loss: 0.972496 +RANK_0 - 2026-01-29 02:39:04,788 - TRAIN-LOGGER - INFO - Epoch 355 - TRAIN - Minibatch 0: weight_norm_model: 143.883194 loss: 0.972496 grad_norm_before_clip: 2.917126 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 02:39:05,976 - TRAIN-LOGGER - INFO - Epoch 355 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.883194 weight_norm_u: 25.218954 loss: 0.972496 grad_norm_before_clip: 2.917126 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 02:39:05,976 - TRAIN-LOGGER - INFO - Epoch 355 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.883194 weight_norm_u: 25.222990 loss: 0.972121 +RANK_0 - 2026-01-29 02:39:10,857 - TRAIN-LOGGER - INFO - Epoch 356 - TRAIN - Minibatch 0: weight_norm_model: 143.883194 loss: 0.972121 grad_norm_before_clip: 4.056834 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 02:39:12,064 - TRAIN-LOGGER - INFO - Epoch 356 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.883194 weight_norm_u: 25.218954 loss: 0.972121 grad_norm_before_clip: 4.056834 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 02:39:12,064 - TRAIN-LOGGER - INFO - Epoch 356 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.883209 weight_norm_u: 25.222990 loss: 0.972672 +RANK_0 - 2026-01-29 02:39:16,856 - TRAIN-LOGGER - INFO - Epoch 357 - TRAIN - Minibatch 0: weight_norm_model: 143.883209 loss: 0.972672 grad_norm_before_clip: 4.533511 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 02:39:18,107 - TRAIN-LOGGER - INFO - Epoch 357 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.883209 weight_norm_u: 25.218954 loss: 0.972672 grad_norm_before_clip: 4.533511 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 02:39:18,108 - TRAIN-LOGGER - INFO - Epoch 357 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.883224 weight_norm_u: 25.222990 loss: 0.972004 +RANK_0 - 2026-01-29 02:39:22,513 - TRAIN-LOGGER - INFO - Epoch 358 - TRAIN - Minibatch 0: weight_norm_model: 143.883224 loss: 0.972004 grad_norm_before_clip: 2.700985 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 02:39:23,652 - TRAIN-LOGGER - INFO - Epoch 358 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.883224 weight_norm_u: 25.218954 loss: 0.972004 grad_norm_before_clip: 2.700985 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 02:39:23,653 - TRAIN-LOGGER - INFO - Epoch 358 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.883224 weight_norm_u: 25.222990 loss: 0.970600 +RANK_0 - 2026-01-29 02:39:28,229 - TRAIN-LOGGER - INFO - Epoch 359 - TRAIN - Minibatch 0: weight_norm_model: 143.883224 loss: 0.970600 grad_norm_before_clip: 2.697035 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 02:39:29,344 - TRAIN-LOGGER - INFO - Epoch 359 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.883224 weight_norm_u: 25.218954 loss: 0.970600 grad_norm_before_clip: 2.697035 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 02:39:29,344 - TRAIN-LOGGER - INFO - Epoch 359 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.883224 weight_norm_u: 25.222990 loss: 0.970591 +RANK_0 - 2026-01-29 02:39:33,970 - TRAIN-LOGGER - INFO - Epoch 360 - TRAIN - Minibatch 0: weight_norm_model: 143.883224 loss: 0.970591 grad_norm_before_clip: 2.521785 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 02:39:35,086 - TRAIN-LOGGER - INFO - Epoch 360 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.883224 weight_norm_u: 25.218954 loss: 0.970591 grad_norm_before_clip: 2.521785 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 02:39:35,086 - TRAIN-LOGGER - INFO - Epoch 360 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.883224 weight_norm_u: 25.222990 loss: 0.970468 +RANK_0 - 2026-01-29 02:39:39,273 - TRAIN-LOGGER - INFO - Epoch 361 - TRAIN - Minibatch 0: weight_norm_model: 143.883224 loss: 0.970468 grad_norm_before_clip: 2.157476 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 02:39:40,413 - TRAIN-LOGGER - INFO - Epoch 361 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.883224 weight_norm_u: 25.218954 loss: 0.970468 grad_norm_before_clip: 2.157476 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 02:39:40,413 - TRAIN-LOGGER - INFO - Epoch 361 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.883240 weight_norm_u: 25.222990 loss: 0.970586 +RANK_0 - 2026-01-29 02:39:44,628 - TRAIN-LOGGER - INFO - Epoch 362 - TRAIN - Minibatch 0: weight_norm_model: 143.883240 loss: 0.970586 grad_norm_before_clip: 4.824268 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 02:39:45,819 - TRAIN-LOGGER - INFO - Epoch 362 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.883240 weight_norm_u: 25.218954 loss: 0.970586 grad_norm_before_clip: 4.824268 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 02:39:45,820 - TRAIN-LOGGER - INFO - Epoch 362 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.883255 weight_norm_u: 25.222990 loss: 0.970928 +RANK_0 - 2026-01-29 02:39:50,101 - TRAIN-LOGGER - INFO - Epoch 363 - TRAIN - Minibatch 0: weight_norm_model: 143.883255 loss: 0.970928 grad_norm_before_clip: 0.922650 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 02:39:51,296 - TRAIN-LOGGER - INFO - Epoch 363 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.883255 weight_norm_u: 25.218954 loss: 0.970928 grad_norm_before_clip: 0.922650 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 02:39:51,296 - TRAIN-LOGGER - INFO - Epoch 363 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.883255 weight_norm_u: 25.222990 loss: 0.969794 +RANK_0 - 2026-01-29 02:39:55,699 - TRAIN-LOGGER - INFO - Epoch 364 - TRAIN - Minibatch 0: weight_norm_model: 143.883255 loss: 0.969794 grad_norm_before_clip: 3.060274 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 02:39:56,811 - TRAIN-LOGGER - INFO - Epoch 364 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.883255 weight_norm_u: 25.218954 loss: 0.969794 grad_norm_before_clip: 3.060274 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 02:39:56,811 - TRAIN-LOGGER - INFO - Epoch 364 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.883240 weight_norm_u: 25.222990 loss: 0.970793 +RANK_0 - 2026-01-29 02:40:01,358 - TRAIN-LOGGER - INFO - Epoch 365 - TRAIN - Minibatch 0: weight_norm_model: 143.883240 loss: 0.970793 grad_norm_before_clip: 3.789734 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 02:40:02,592 - TRAIN-LOGGER - INFO - Epoch 365 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.883240 weight_norm_u: 25.218954 loss: 0.970793 grad_norm_before_clip: 3.789734 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 02:40:02,593 - TRAIN-LOGGER - INFO - Epoch 365 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.883255 weight_norm_u: 25.222990 loss: 0.971867 +RANK_0 - 2026-01-29 02:40:06,984 - TRAIN-LOGGER - INFO - Epoch 366 - TRAIN - Minibatch 0: weight_norm_model: 143.883255 loss: 0.971867 grad_norm_before_clip: 3.818176 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 02:40:08,130 - TRAIN-LOGGER - INFO - Epoch 366 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.883255 weight_norm_u: 25.218954 loss: 0.971867 grad_norm_before_clip: 3.818176 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 02:40:08,130 - TRAIN-LOGGER - INFO - Epoch 366 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.883270 weight_norm_u: 25.222990 loss: 0.970553 +RANK_0 - 2026-01-29 02:40:12,554 - TRAIN-LOGGER - INFO - Epoch 367 - TRAIN - Minibatch 0: weight_norm_model: 143.883270 loss: 0.970553 grad_norm_before_clip: 1.775052 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 02:40:13,720 - TRAIN-LOGGER - INFO - Epoch 367 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.883270 weight_norm_u: 25.218954 loss: 0.970553 grad_norm_before_clip: 1.775052 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 02:40:13,720 - TRAIN-LOGGER - INFO - Epoch 367 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.883301 weight_norm_u: 25.222990 loss: 0.971905 +RANK_0 - 2026-01-29 02:40:18,046 - TRAIN-LOGGER - INFO - Epoch 368 - TRAIN - Minibatch 0: weight_norm_model: 143.883301 loss: 0.971905 grad_norm_before_clip: 4.970007 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 02:40:19,151 - TRAIN-LOGGER - INFO - Epoch 368 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.883301 weight_norm_u: 25.218954 loss: 0.971905 grad_norm_before_clip: 4.970007 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 02:40:19,151 - TRAIN-LOGGER - INFO - Epoch 368 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.883316 weight_norm_u: 25.222990 loss: 0.973028 +RANK_0 - 2026-01-29 02:40:23,433 - TRAIN-LOGGER - INFO - Epoch 369 - TRAIN - Minibatch 0: weight_norm_model: 143.883316 loss: 0.973028 grad_norm_before_clip: 5.167463 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 02:40:24,546 - TRAIN-LOGGER - INFO - Epoch 369 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.883316 weight_norm_u: 25.218954 loss: 0.973028 grad_norm_before_clip: 5.167463 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 02:40:24,546 - TRAIN-LOGGER - INFO - Epoch 369 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.883316 weight_norm_u: 25.222990 loss: 0.974003 +RANK_0 - 2026-01-29 02:40:29,265 - TRAIN-LOGGER - INFO - Epoch 370 - TRAIN - Minibatch 0: weight_norm_model: 143.883316 loss: 0.974003 grad_norm_before_clip: 3.608373 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 02:40:30,386 - TRAIN-LOGGER - INFO - Epoch 370 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.883316 weight_norm_u: 25.218954 loss: 0.974003 grad_norm_before_clip: 3.608373 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 02:40:30,386 - TRAIN-LOGGER - INFO - Epoch 370 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.883331 weight_norm_u: 25.222990 loss: 0.973449 +RANK_0 - 2026-01-29 02:40:35,204 - TRAIN-LOGGER - INFO - Epoch 371 - TRAIN - Minibatch 0: weight_norm_model: 143.883331 loss: 0.973449 grad_norm_before_clip: 3.739992 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 02:40:36,364 - TRAIN-LOGGER - INFO - Epoch 371 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.883331 weight_norm_u: 25.218954 loss: 0.973449 grad_norm_before_clip: 3.739992 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 02:40:36,365 - TRAIN-LOGGER - INFO - Epoch 371 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.883331 weight_norm_u: 25.222990 loss: 0.969763 +RANK_0 - 2026-01-29 02:40:41,156 - TRAIN-LOGGER - INFO - Epoch 372 - TRAIN - Minibatch 0: weight_norm_model: 143.883331 loss: 0.969763 grad_norm_before_clip: 3.675899 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 02:40:42,276 - TRAIN-LOGGER - INFO - Epoch 372 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.883331 weight_norm_u: 25.218954 loss: 0.969763 grad_norm_before_clip: 3.675899 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 02:40:42,276 - TRAIN-LOGGER - INFO - Epoch 372 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.883347 weight_norm_u: 25.222990 loss: 0.974908 +RANK_0 - 2026-01-29 02:40:46,943 - TRAIN-LOGGER - INFO - Epoch 373 - TRAIN - Minibatch 0: weight_norm_model: 143.883347 loss: 0.974908 grad_norm_before_clip: 5.179137 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 02:40:48,104 - TRAIN-LOGGER - INFO - Epoch 373 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.883347 weight_norm_u: 25.218954 loss: 0.974908 grad_norm_before_clip: 5.179137 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 02:40:48,105 - TRAIN-LOGGER - INFO - Epoch 373 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.883362 weight_norm_u: 25.222990 loss: 0.976714 +RANK_0 - 2026-01-29 02:40:52,458 - TRAIN-LOGGER - INFO - Epoch 374 - TRAIN - Minibatch 0: weight_norm_model: 143.883362 loss: 0.976714 grad_norm_before_clip: 5.151195 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 02:40:53,569 - TRAIN-LOGGER - INFO - Epoch 374 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.883362 weight_norm_u: 25.218954 loss: 0.976714 grad_norm_before_clip: 5.151195 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 02:40:53,569 - TRAIN-LOGGER - INFO - Epoch 374 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.883362 weight_norm_u: 25.222990 loss: 0.973021 +RANK_0 - 2026-01-29 02:40:57,832 - TRAIN-LOGGER - INFO - Epoch 375 - TRAIN - Minibatch 0: weight_norm_model: 143.883362 loss: 0.973021 grad_norm_before_clip: 4.633135 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 02:40:58,957 - TRAIN-LOGGER - INFO - Epoch 375 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.883362 weight_norm_u: 25.218954 loss: 0.973021 grad_norm_before_clip: 4.633135 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 02:40:58,957 - TRAIN-LOGGER - INFO - Epoch 375 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.883362 weight_norm_u: 25.222990 loss: 0.971063 +RANK_0 - 2026-01-29 02:41:03,248 - TRAIN-LOGGER - INFO - Epoch 376 - TRAIN - Minibatch 0: weight_norm_model: 143.883362 loss: 0.971063 grad_norm_before_clip: 2.016772 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 02:41:04,385 - TRAIN-LOGGER - INFO - Epoch 376 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.883362 weight_norm_u: 25.218954 loss: 0.971063 grad_norm_before_clip: 2.016772 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 02:41:04,385 - TRAIN-LOGGER - INFO - Epoch 376 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.883377 weight_norm_u: 25.222990 loss: 0.972723 +RANK_0 - 2026-01-29 02:41:08,904 - TRAIN-LOGGER - INFO - Epoch 377 - TRAIN - Minibatch 0: weight_norm_model: 143.883377 loss: 0.972723 grad_norm_before_clip: 6.182561 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 02:41:10,028 - TRAIN-LOGGER - INFO - Epoch 377 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.883377 weight_norm_u: 25.218954 loss: 0.972723 grad_norm_before_clip: 6.182561 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 02:41:10,029 - TRAIN-LOGGER - INFO - Epoch 377 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.883377 weight_norm_u: 25.222990 loss: 0.972215 +RANK_0 - 2026-01-29 02:41:14,400 - TRAIN-LOGGER - INFO - Epoch 378 - TRAIN - Minibatch 0: weight_norm_model: 143.883377 loss: 0.972215 grad_norm_before_clip: 4.881934 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 02:41:15,635 - TRAIN-LOGGER - INFO - Epoch 378 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.883377 weight_norm_u: 25.218954 loss: 0.972215 grad_norm_before_clip: 4.881934 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 02:41:15,635 - TRAIN-LOGGER - INFO - Epoch 378 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.883377 weight_norm_u: 25.222990 loss: 0.970115 +RANK_0 - 2026-01-29 02:41:20,213 - TRAIN-LOGGER - INFO - Epoch 379 - TRAIN - Minibatch 0: weight_norm_model: 143.883377 loss: 0.970115 grad_norm_before_clip: 3.696775 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 02:41:21,435 - TRAIN-LOGGER - INFO - Epoch 379 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.883377 weight_norm_u: 25.218954 loss: 0.970115 grad_norm_before_clip: 3.696775 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 02:41:21,435 - TRAIN-LOGGER - INFO - Epoch 379 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.883392 weight_norm_u: 25.222990 loss: 0.972024 +RANK_0 - 2026-01-29 02:41:25,884 - TRAIN-LOGGER - INFO - Epoch 380 - TRAIN - Minibatch 0: weight_norm_model: 143.883392 loss: 0.972024 grad_norm_before_clip: 5.139221 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 02:41:27,015 - TRAIN-LOGGER - INFO - Epoch 380 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.883392 weight_norm_u: 25.218954 loss: 0.972024 grad_norm_before_clip: 5.139221 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 02:41:27,015 - TRAIN-LOGGER - INFO - Epoch 380 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.883392 weight_norm_u: 25.222990 loss: 0.975130 +RANK_0 - 2026-01-29 02:41:31,559 - TRAIN-LOGGER - INFO - Epoch 381 - TRAIN - Minibatch 0: weight_norm_model: 143.883392 loss: 0.975130 grad_norm_before_clip: 5.081448 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 02:41:32,748 - TRAIN-LOGGER - INFO - Epoch 381 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.883392 weight_norm_u: 25.218954 loss: 0.975130 grad_norm_before_clip: 5.081448 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 02:41:32,748 - TRAIN-LOGGER - INFO - Epoch 381 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.883392 weight_norm_u: 25.222990 loss: 0.973597 +RANK_0 - 2026-01-29 02:41:37,168 - TRAIN-LOGGER - INFO - Epoch 382 - TRAIN - Minibatch 0: weight_norm_model: 143.883392 loss: 0.973597 grad_norm_before_clip: 5.021895 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 02:41:38,316 - TRAIN-LOGGER - INFO - Epoch 382 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.883392 weight_norm_u: 25.218954 loss: 0.973597 grad_norm_before_clip: 5.021895 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 02:41:38,316 - TRAIN-LOGGER - INFO - Epoch 382 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.883392 weight_norm_u: 25.222990 loss: 0.969437 +RANK_0 - 2026-01-29 02:41:43,049 - TRAIN-LOGGER - INFO - Epoch 383 - TRAIN - Minibatch 0: weight_norm_model: 143.883392 loss: 0.969437 grad_norm_before_clip: 1.586161 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 02:41:44,276 - TRAIN-LOGGER - INFO - Epoch 383 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.883392 weight_norm_u: 25.218954 loss: 0.969437 grad_norm_before_clip: 1.586161 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 02:41:44,276 - TRAIN-LOGGER - INFO - Epoch 383 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.883377 weight_norm_u: 25.222990 loss: 0.973598 +RANK_0 - 2026-01-29 02:41:48,768 - TRAIN-LOGGER - INFO - Epoch 384 - TRAIN - Minibatch 0: weight_norm_model: 143.883377 loss: 0.973598 grad_norm_before_clip: 4.992649 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 02:41:49,886 - TRAIN-LOGGER - INFO - Epoch 384 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.883377 weight_norm_u: 25.218954 loss: 0.973598 grad_norm_before_clip: 4.992649 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 02:41:49,886 - TRAIN-LOGGER - INFO - Epoch 384 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.883392 weight_norm_u: 25.222990 loss: 0.977217 +RANK_0 - 2026-01-29 02:41:54,359 - TRAIN-LOGGER - INFO - Epoch 385 - TRAIN - Minibatch 0: weight_norm_model: 143.883392 loss: 0.977217 grad_norm_before_clip: 6.219995 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 02:41:55,508 - TRAIN-LOGGER - INFO - Epoch 385 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.883392 weight_norm_u: 25.218954 loss: 0.977217 grad_norm_before_clip: 6.219995 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 02:41:55,508 - TRAIN-LOGGER - INFO - Epoch 385 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.883408 weight_norm_u: 25.222990 loss: 0.976009 +RANK_0 - 2026-01-29 02:41:59,661 - TRAIN-LOGGER - INFO - Epoch 386 - TRAIN - Minibatch 0: weight_norm_model: 143.883408 loss: 0.976009 grad_norm_before_clip: 6.030264 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 02:42:00,836 - TRAIN-LOGGER - INFO - Epoch 386 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.883408 weight_norm_u: 25.218954 loss: 0.976009 grad_norm_before_clip: 6.030264 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 02:42:00,836 - TRAIN-LOGGER - INFO - Epoch 386 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.883423 weight_norm_u: 25.222990 loss: 0.969204 +RANK_0 - 2026-01-29 02:42:05,389 - TRAIN-LOGGER - INFO - Epoch 387 - TRAIN - Minibatch 0: weight_norm_model: 143.883423 loss: 0.969204 grad_norm_before_clip: 2.183093 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 02:42:06,520 - TRAIN-LOGGER - INFO - Epoch 387 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.883423 weight_norm_u: 25.218954 loss: 0.969204 grad_norm_before_clip: 2.183093 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 02:42:06,520 - TRAIN-LOGGER - INFO - Epoch 387 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.883423 weight_norm_u: 25.222990 loss: 0.976775 +RANK_0 - 2026-01-29 02:42:11,096 - TRAIN-LOGGER - INFO - Epoch 388 - TRAIN - Minibatch 0: weight_norm_model: 143.883423 loss: 0.976775 grad_norm_before_clip: 5.124621 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 02:42:12,307 - TRAIN-LOGGER - INFO - Epoch 388 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.883423 weight_norm_u: 25.218954 loss: 0.976775 grad_norm_before_clip: 5.124621 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 02:42:12,307 - TRAIN-LOGGER - INFO - Epoch 388 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.883423 weight_norm_u: 25.222990 loss: 0.982757 +RANK_0 - 2026-01-29 02:42:16,812 - TRAIN-LOGGER - INFO - Epoch 389 - TRAIN - Minibatch 0: weight_norm_model: 143.883423 loss: 0.982757 grad_norm_before_clip: 6.385272 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 02:42:17,961 - TRAIN-LOGGER - INFO - Epoch 389 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.883423 weight_norm_u: 25.218954 loss: 0.982757 grad_norm_before_clip: 6.385272 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 02:42:17,961 - TRAIN-LOGGER - INFO - Epoch 389 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.883423 weight_norm_u: 25.222990 loss: 0.981008 +RANK_0 - 2026-01-29 02:42:22,108 - TRAIN-LOGGER - INFO - Epoch 390 - TRAIN - Minibatch 0: weight_norm_model: 143.883423 loss: 0.981008 grad_norm_before_clip: 6.405149 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 02:42:23,269 - TRAIN-LOGGER - INFO - Epoch 390 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.883423 weight_norm_u: 25.218954 loss: 0.981008 grad_norm_before_clip: 6.405149 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 02:42:23,269 - TRAIN-LOGGER - INFO - Epoch 390 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.883423 weight_norm_u: 25.222990 loss: 0.973929 +RANK_0 - 2026-01-29 02:42:27,494 - TRAIN-LOGGER - INFO - Epoch 391 - TRAIN - Minibatch 0: weight_norm_model: 143.883423 loss: 0.973929 grad_norm_before_clip: 4.755834 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 02:42:28,640 - TRAIN-LOGGER - INFO - Epoch 391 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.883423 weight_norm_u: 25.218954 loss: 0.973929 grad_norm_before_clip: 4.755834 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 02:42:28,640 - TRAIN-LOGGER - INFO - Epoch 391 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.883408 weight_norm_u: 25.222990 loss: 0.969797 +RANK_0 - 2026-01-29 02:42:32,725 - TRAIN-LOGGER - INFO - Epoch 392 - TRAIN - Minibatch 0: weight_norm_model: 143.883408 loss: 0.969797 grad_norm_before_clip: 2.314276 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 02:42:33,871 - TRAIN-LOGGER - INFO - Epoch 392 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.883408 weight_norm_u: 25.218954 loss: 0.969797 grad_norm_before_clip: 2.314276 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 02:42:33,871 - TRAIN-LOGGER - INFO - Epoch 392 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.883408 weight_norm_u: 25.222990 loss: 0.973519 +RANK_0 - 2026-01-29 02:42:37,993 - TRAIN-LOGGER - INFO - Epoch 393 - TRAIN - Minibatch 0: weight_norm_model: 143.883408 loss: 0.973519 grad_norm_before_clip: 4.980041 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 02:42:39,212 - TRAIN-LOGGER - INFO - Epoch 393 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.883408 weight_norm_u: 25.218954 loss: 0.973519 grad_norm_before_clip: 4.980041 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 02:42:39,213 - TRAIN-LOGGER - INFO - Epoch 393 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.883408 weight_norm_u: 25.222990 loss: 0.973526 +RANK_0 - 2026-01-29 02:42:43,191 - TRAIN-LOGGER - INFO - Epoch 394 - TRAIN - Minibatch 0: weight_norm_model: 143.883408 loss: 0.973526 grad_norm_before_clip: 4.899091 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 02:42:44,320 - TRAIN-LOGGER - INFO - Epoch 394 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.883408 weight_norm_u: 25.218954 loss: 0.973526 grad_norm_before_clip: 4.899091 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 02:42:44,321 - TRAIN-LOGGER - INFO - Epoch 394 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.883423 weight_norm_u: 25.222990 loss: 0.970555 +RANK_0 - 2026-01-29 02:42:48,499 - TRAIN-LOGGER - INFO - Epoch 395 - TRAIN - Minibatch 0: weight_norm_model: 143.883423 loss: 0.970555 grad_norm_before_clip: 2.005825 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 02:42:49,637 - TRAIN-LOGGER - INFO - Epoch 395 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.883423 weight_norm_u: 25.218954 loss: 0.970555 grad_norm_before_clip: 2.005825 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 02:42:49,637 - TRAIN-LOGGER - INFO - Epoch 395 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.883438 weight_norm_u: 25.222990 loss: 0.971019 +RANK_0 - 2026-01-29 02:42:53,886 - TRAIN-LOGGER - INFO - Epoch 396 - TRAIN - Minibatch 0: weight_norm_model: 143.883438 loss: 0.971019 grad_norm_before_clip: 3.087617 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 02:42:55,040 - TRAIN-LOGGER - INFO - Epoch 396 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.883438 weight_norm_u: 25.218954 loss: 0.971019 grad_norm_before_clip: 3.087617 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 02:42:55,041 - TRAIN-LOGGER - INFO - Epoch 396 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.883453 weight_norm_u: 25.222990 loss: 0.972048 +RANK_0 - 2026-01-29 02:42:59,374 - TRAIN-LOGGER - INFO - Epoch 397 - TRAIN - Minibatch 0: weight_norm_model: 143.883453 loss: 0.972048 grad_norm_before_clip: 4.350880 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 02:43:00,507 - TRAIN-LOGGER - INFO - Epoch 397 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.883453 weight_norm_u: 25.218954 loss: 0.972048 grad_norm_before_clip: 4.350880 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 02:43:00,507 - TRAIN-LOGGER - INFO - Epoch 397 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.883469 weight_norm_u: 25.222990 loss: 0.969206 +RANK_0 - 2026-01-29 02:43:04,592 - TRAIN-LOGGER - INFO - Epoch 398 - TRAIN - Minibatch 0: weight_norm_model: 143.883469 loss: 0.969206 grad_norm_before_clip: 1.688768 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 02:43:05,718 - TRAIN-LOGGER - INFO - Epoch 398 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.883469 weight_norm_u: 25.218954 loss: 0.969206 grad_norm_before_clip: 1.688768 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 02:43:05,718 - TRAIN-LOGGER - INFO - Epoch 398 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.883484 weight_norm_u: 25.222990 loss: 0.970789 +RANK_0 - 2026-01-29 02:43:09,804 - TRAIN-LOGGER - INFO - Epoch 399 - TRAIN - Minibatch 0: weight_norm_model: 143.883484 loss: 0.970789 grad_norm_before_clip: 3.614949 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 02:43:10,996 - TRAIN-LOGGER - INFO - Epoch 399 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.883484 weight_norm_u: 25.218954 loss: 0.970789 grad_norm_before_clip: 3.614949 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 02:43:10,996 - TRAIN-LOGGER - INFO - Epoch 399 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.883469 weight_norm_u: 25.222990 loss: 0.971885 +RANK_0 - 2026-01-29 02:43:15,158 - TRAIN-LOGGER - INFO - Epoch 400 - TRAIN - Minibatch 0: weight_norm_model: 143.883469 loss: 0.971885 grad_norm_before_clip: 4.058433 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 02:43:16,278 - TRAIN-LOGGER - INFO - Epoch 400 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.883469 weight_norm_u: 25.218954 loss: 0.971885 grad_norm_before_clip: 4.058433 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 02:43:16,278 - TRAIN-LOGGER - INFO - Epoch 400 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.883484 weight_norm_u: 25.222990 loss: 0.972180 +RANK_0 - 2026-01-29 02:43:20,848 - TRAIN-LOGGER - INFO - Epoch 401 - TRAIN - Minibatch 0: weight_norm_model: 143.883484 loss: 0.972180 grad_norm_before_clip: 4.279538 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 02:43:22,003 - TRAIN-LOGGER - INFO - Epoch 401 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.883484 weight_norm_u: 25.218954 loss: 0.972180 grad_norm_before_clip: 4.279538 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 02:43:22,003 - TRAIN-LOGGER - INFO - Epoch 401 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.883484 weight_norm_u: 25.222990 loss: 0.970794 +RANK_0 - 2026-01-29 02:43:26,214 - TRAIN-LOGGER - INFO - Epoch 402 - TRAIN - Minibatch 0: weight_norm_model: 143.883484 loss: 0.970794 grad_norm_before_clip: 1.735718 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 02:43:27,345 - TRAIN-LOGGER - INFO - Epoch 402 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.883484 weight_norm_u: 25.218954 loss: 0.970794 grad_norm_before_clip: 1.735718 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 02:43:27,345 - TRAIN-LOGGER - INFO - Epoch 402 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.883514 weight_norm_u: 25.222990 loss: 0.971525 +RANK_0 - 2026-01-29 02:43:31,960 - TRAIN-LOGGER - INFO - Epoch 403 - TRAIN - Minibatch 0: weight_norm_model: 143.883514 loss: 0.971525 grad_norm_before_clip: 2.391685 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 02:43:33,171 - TRAIN-LOGGER - INFO - Epoch 403 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.883514 weight_norm_u: 25.218954 loss: 0.971525 grad_norm_before_clip: 2.391685 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 02:43:33,172 - TRAIN-LOGGER - INFO - Epoch 403 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.883514 weight_norm_u: 25.222990 loss: 0.971340 +RANK_0 - 2026-01-29 02:43:37,227 - TRAIN-LOGGER - INFO - Epoch 404 - TRAIN - Minibatch 0: weight_norm_model: 143.883514 loss: 0.971340 grad_norm_before_clip: 3.201591 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 02:43:38,359 - TRAIN-LOGGER - INFO - Epoch 404 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.883514 weight_norm_u: 25.218954 loss: 0.971340 grad_norm_before_clip: 3.201591 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 02:43:38,359 - TRAIN-LOGGER - INFO - Epoch 404 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.883514 weight_norm_u: 25.222990 loss: 0.970418 +RANK_0 - 2026-01-29 02:43:42,363 - TRAIN-LOGGER - INFO - Epoch 405 - TRAIN - Minibatch 0: weight_norm_model: 143.883514 loss: 0.970418 grad_norm_before_clip: 1.704062 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 02:43:43,515 - TRAIN-LOGGER - INFO - Epoch 405 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.883514 weight_norm_u: 25.218954 loss: 0.970418 grad_norm_before_clip: 1.704062 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 02:43:43,515 - TRAIN-LOGGER - INFO - Epoch 405 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.883514 weight_norm_u: 25.222990 loss: 0.971576 +RANK_0 - 2026-01-29 02:43:48,049 - TRAIN-LOGGER - INFO - Epoch 406 - TRAIN - Minibatch 0: weight_norm_model: 143.883514 loss: 0.971576 grad_norm_before_clip: 3.188148 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 02:43:49,223 - TRAIN-LOGGER - INFO - Epoch 406 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.883514 weight_norm_u: 25.218954 loss: 0.971576 grad_norm_before_clip: 3.188148 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 02:43:49,223 - TRAIN-LOGGER - INFO - Epoch 406 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.883514 weight_norm_u: 25.222990 loss: 0.969616 +RANK_0 - 2026-01-29 02:43:53,769 - TRAIN-LOGGER - INFO - Epoch 407 - TRAIN - Minibatch 0: weight_norm_model: 143.883514 loss: 0.969616 grad_norm_before_clip: 3.218454 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 02:43:54,994 - TRAIN-LOGGER - INFO - Epoch 407 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.883514 weight_norm_u: 25.218954 loss: 0.969616 grad_norm_before_clip: 3.218454 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 02:43:54,994 - TRAIN-LOGGER - INFO - Epoch 407 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.883545 weight_norm_u: 25.222990 loss: 0.972000 +RANK_0 - 2026-01-29 02:43:59,302 - TRAIN-LOGGER - INFO - Epoch 408 - TRAIN - Minibatch 0: weight_norm_model: 143.883545 loss: 0.972000 grad_norm_before_clip: 4.354096 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 02:44:00,516 - TRAIN-LOGGER - INFO - Epoch 408 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.883545 weight_norm_u: 25.218954 loss: 0.972000 grad_norm_before_clip: 4.354096 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 02:44:00,516 - TRAIN-LOGGER - INFO - Epoch 408 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.883545 weight_norm_u: 25.222990 loss: 0.971321 +RANK_0 - 2026-01-29 02:44:04,952 - TRAIN-LOGGER - INFO - Epoch 409 - TRAIN - Minibatch 0: weight_norm_model: 143.883545 loss: 0.971321 grad_norm_before_clip: 3.904480 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 02:44:06,146 - TRAIN-LOGGER - INFO - Epoch 409 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.883545 weight_norm_u: 25.218954 loss: 0.971321 grad_norm_before_clip: 3.904480 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 02:44:06,146 - TRAIN-LOGGER - INFO - Epoch 409 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.883545 weight_norm_u: 25.222990 loss: 0.969481 +RANK_0 - 2026-01-29 02:44:10,585 - TRAIN-LOGGER - INFO - Epoch 410 - TRAIN - Minibatch 0: weight_norm_model: 143.883545 loss: 0.969481 grad_norm_before_clip: 2.681925 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 02:44:11,699 - TRAIN-LOGGER - INFO - Epoch 410 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.883545 weight_norm_u: 25.218954 loss: 0.969481 grad_norm_before_clip: 2.681925 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 02:44:11,699 - TRAIN-LOGGER - INFO - Epoch 410 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.883530 weight_norm_u: 25.222990 loss: 0.969658 +RANK_0 - 2026-01-29 02:44:15,913 - TRAIN-LOGGER - INFO - Epoch 411 - TRAIN - Minibatch 0: weight_norm_model: 143.883530 loss: 0.969658 grad_norm_before_clip: 3.095380 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 02:44:17,045 - TRAIN-LOGGER - INFO - Epoch 411 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.883530 weight_norm_u: 25.218954 loss: 0.969658 grad_norm_before_clip: 3.095380 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 02:44:17,045 - TRAIN-LOGGER - INFO - Epoch 411 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.883530 weight_norm_u: 25.222990 loss: 0.971893 +RANK_0 - 2026-01-29 02:44:21,303 - TRAIN-LOGGER - INFO - Epoch 412 - TRAIN - Minibatch 0: weight_norm_model: 143.883530 loss: 0.971893 grad_norm_before_clip: 4.410420 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 02:44:22,430 - TRAIN-LOGGER - INFO - Epoch 412 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.883530 weight_norm_u: 25.218954 loss: 0.971893 grad_norm_before_clip: 4.410420 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 02:44:22,430 - TRAIN-LOGGER - INFO - Epoch 412 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.883545 weight_norm_u: 25.222990 loss: 0.971576 +RANK_0 - 2026-01-29 02:44:26,512 - TRAIN-LOGGER - INFO - Epoch 413 - TRAIN - Minibatch 0: weight_norm_model: 143.883545 loss: 0.971576 grad_norm_before_clip: 2.425022 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 02:44:27,648 - TRAIN-LOGGER - INFO - Epoch 413 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.883545 weight_norm_u: 25.218954 loss: 0.971576 grad_norm_before_clip: 2.425022 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 02:44:27,649 - TRAIN-LOGGER - INFO - Epoch 413 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.883560 weight_norm_u: 25.222990 loss: 0.971095 +RANK_0 - 2026-01-29 02:44:31,674 - TRAIN-LOGGER - INFO - Epoch 414 - TRAIN - Minibatch 0: weight_norm_model: 143.883560 loss: 0.971095 grad_norm_before_clip: 2.002315 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 02:44:32,862 - TRAIN-LOGGER - INFO - Epoch 414 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.883560 weight_norm_u: 25.218954 loss: 0.971095 grad_norm_before_clip: 2.002315 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 02:44:32,862 - TRAIN-LOGGER - INFO - Epoch 414 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.883575 weight_norm_u: 25.222990 loss: 0.971569 +RANK_0 - 2026-01-29 02:44:37,002 - TRAIN-LOGGER - INFO - Epoch 415 - TRAIN - Minibatch 0: weight_norm_model: 143.883575 loss: 0.971569 grad_norm_before_clip: 4.262305 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 02:44:38,094 - TRAIN-LOGGER - INFO - Epoch 415 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.883575 weight_norm_u: 25.218954 loss: 0.971569 grad_norm_before_clip: 4.262305 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 02:44:38,094 - TRAIN-LOGGER - INFO - Epoch 415 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.883575 weight_norm_u: 25.222990 loss: 0.969461 +RANK_0 - 2026-01-29 02:44:42,307 - TRAIN-LOGGER - INFO - Epoch 416 - TRAIN - Minibatch 0: weight_norm_model: 143.883575 loss: 0.969461 grad_norm_before_clip: 4.072378 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 02:44:43,417 - TRAIN-LOGGER - INFO - Epoch 416 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.883575 weight_norm_u: 25.218954 loss: 0.969461 grad_norm_before_clip: 4.072378 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 02:44:43,418 - TRAIN-LOGGER - INFO - Epoch 416 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.883575 weight_norm_u: 25.222990 loss: 0.971782 +RANK_0 - 2026-01-29 02:44:47,723 - TRAIN-LOGGER - INFO - Epoch 417 - TRAIN - Minibatch 0: weight_norm_model: 143.883575 loss: 0.971782 grad_norm_before_clip: 4.688401 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 02:44:48,915 - TRAIN-LOGGER - INFO - Epoch 417 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.883575 weight_norm_u: 25.218954 loss: 0.971782 grad_norm_before_clip: 4.688401 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 02:44:48,915 - TRAIN-LOGGER - INFO - Epoch 417 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.883591 weight_norm_u: 25.222990 loss: 0.972921 +RANK_0 - 2026-01-29 02:44:53,396 - TRAIN-LOGGER - INFO - Epoch 418 - TRAIN - Minibatch 0: weight_norm_model: 143.883591 loss: 0.972921 grad_norm_before_clip: 4.379273 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 02:44:54,521 - TRAIN-LOGGER - INFO - Epoch 418 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.883591 weight_norm_u: 25.218954 loss: 0.972921 grad_norm_before_clip: 4.379273 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 02:44:54,522 - TRAIN-LOGGER - INFO - Epoch 418 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.883606 weight_norm_u: 25.222990 loss: 0.969723 +RANK_0 - 2026-01-29 02:44:58,861 - TRAIN-LOGGER - INFO - Epoch 419 - TRAIN - Minibatch 0: weight_norm_model: 143.883606 loss: 0.969723 grad_norm_before_clip: 3.401862 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 02:45:00,062 - TRAIN-LOGGER - INFO - Epoch 419 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.883606 weight_norm_u: 25.218954 loss: 0.969723 grad_norm_before_clip: 3.401862 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 02:45:00,062 - TRAIN-LOGGER - INFO - Epoch 419 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.883621 weight_norm_u: 25.222990 loss: 0.968013 +RANK_0 - 2026-01-29 02:45:04,857 - TRAIN-LOGGER - INFO - Epoch 420 - TRAIN - Minibatch 0: weight_norm_model: 143.883621 loss: 0.968013 grad_norm_before_clip: 2.082045 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 02:45:06,065 - TRAIN-LOGGER - INFO - Epoch 420 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.883621 weight_norm_u: 25.218954 loss: 0.968013 grad_norm_before_clip: 2.082045 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 02:45:06,065 - TRAIN-LOGGER - INFO - Epoch 420 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.883636 weight_norm_u: 25.222990 loss: 0.968516 +RANK_0 - 2026-01-29 02:45:10,556 - TRAIN-LOGGER - INFO - Epoch 421 - TRAIN - Minibatch 0: weight_norm_model: 143.883636 loss: 0.968516 grad_norm_before_clip: 1.804879 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 02:45:11,751 - TRAIN-LOGGER - INFO - Epoch 421 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.883636 weight_norm_u: 25.218954 loss: 0.968516 grad_norm_before_clip: 1.804879 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 02:45:11,751 - TRAIN-LOGGER - INFO - Epoch 421 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.883636 weight_norm_u: 25.222990 loss: 0.969489 +RANK_0 - 2026-01-29 02:45:16,115 - TRAIN-LOGGER - INFO - Epoch 422 - TRAIN - Minibatch 0: weight_norm_model: 143.883636 loss: 0.969489 grad_norm_before_clip: 4.660087 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 02:45:17,258 - TRAIN-LOGGER - INFO - Epoch 422 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.883636 weight_norm_u: 25.218954 loss: 0.969489 grad_norm_before_clip: 4.660087 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 02:45:17,259 - TRAIN-LOGGER - INFO - Epoch 422 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.883652 weight_norm_u: 25.222990 loss: 0.968777 +RANK_0 - 2026-01-29 02:45:21,752 - TRAIN-LOGGER - INFO - Epoch 423 - TRAIN - Minibatch 0: weight_norm_model: 143.883652 loss: 0.968777 grad_norm_before_clip: 2.240632 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 02:45:22,878 - TRAIN-LOGGER - INFO - Epoch 423 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.883652 weight_norm_u: 25.218954 loss: 0.968777 grad_norm_before_clip: 2.240632 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 02:45:22,878 - TRAIN-LOGGER - INFO - Epoch 423 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.883652 weight_norm_u: 25.222990 loss: 0.968259 +RANK_0 - 2026-01-29 02:45:27,662 - TRAIN-LOGGER - INFO - Epoch 424 - TRAIN - Minibatch 0: weight_norm_model: 143.883652 loss: 0.968259 grad_norm_before_clip: 2.335515 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 02:45:28,857 - TRAIN-LOGGER - INFO - Epoch 424 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.883652 weight_norm_u: 25.218954 loss: 0.968259 grad_norm_before_clip: 2.335515 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 02:45:28,857 - TRAIN-LOGGER - INFO - Epoch 424 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.883667 weight_norm_u: 25.222990 loss: 0.967781 +RANK_0 - 2026-01-29 02:45:34,004 - TRAIN-LOGGER - INFO - Epoch 425 - TRAIN - Minibatch 0: weight_norm_model: 143.883667 loss: 0.967781 grad_norm_before_clip: 2.742704 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 02:45:35,222 - TRAIN-LOGGER - INFO - Epoch 425 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.883667 weight_norm_u: 25.218954 loss: 0.967781 grad_norm_before_clip: 2.742704 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 02:45:35,223 - TRAIN-LOGGER - INFO - Epoch 425 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.883667 weight_norm_u: 25.222990 loss: 0.969711 +RANK_0 - 2026-01-29 02:45:40,052 - TRAIN-LOGGER - INFO - Epoch 426 - TRAIN - Minibatch 0: weight_norm_model: 143.883667 loss: 0.969711 grad_norm_before_clip: 4.838389 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 02:45:41,209 - TRAIN-LOGGER - INFO - Epoch 426 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.883667 weight_norm_u: 25.218954 loss: 0.969711 grad_norm_before_clip: 4.838389 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 02:45:41,209 - TRAIN-LOGGER - INFO - Epoch 426 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.883682 weight_norm_u: 25.222990 loss: 0.972693 +RANK_0 - 2026-01-29 02:45:45,791 - TRAIN-LOGGER - INFO - Epoch 427 - TRAIN - Minibatch 0: weight_norm_model: 143.883682 loss: 0.972693 grad_norm_before_clip: 4.771881 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 02:45:46,933 - TRAIN-LOGGER - INFO - Epoch 427 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.883682 weight_norm_u: 25.218954 loss: 0.972693 grad_norm_before_clip: 4.771881 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 02:45:46,933 - TRAIN-LOGGER - INFO - Epoch 427 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.883698 weight_norm_u: 25.222990 loss: 0.969037 +RANK_0 - 2026-01-29 02:45:51,475 - TRAIN-LOGGER - INFO - Epoch 428 - TRAIN - Minibatch 0: weight_norm_model: 143.883698 loss: 0.969037 grad_norm_before_clip: 2.534036 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 02:45:52,585 - TRAIN-LOGGER - INFO - Epoch 428 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.883698 weight_norm_u: 25.218954 loss: 0.969037 grad_norm_before_clip: 2.534036 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 02:45:52,585 - TRAIN-LOGGER - INFO - Epoch 428 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.883698 weight_norm_u: 25.222990 loss: 0.968500 +RANK_0 - 2026-01-29 02:45:56,740 - TRAIN-LOGGER - INFO - Epoch 429 - TRAIN - Minibatch 0: weight_norm_model: 143.883698 loss: 0.968500 grad_norm_before_clip: 4.533125 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 02:45:57,929 - TRAIN-LOGGER - INFO - Epoch 429 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.883698 weight_norm_u: 25.218954 loss: 0.968500 grad_norm_before_clip: 4.533125 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 02:45:57,929 - TRAIN-LOGGER - INFO - Epoch 429 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.883713 weight_norm_u: 25.222990 loss: 0.968237 +RANK_0 - 2026-01-29 02:46:02,079 - TRAIN-LOGGER - INFO - Epoch 430 - TRAIN - Minibatch 0: weight_norm_model: 143.883713 loss: 0.968237 grad_norm_before_clip: 1.800361 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 02:46:03,301 - TRAIN-LOGGER - INFO - Epoch 430 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.883713 weight_norm_u: 25.218954 loss: 0.968237 grad_norm_before_clip: 1.800361 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 02:46:03,301 - TRAIN-LOGGER - INFO - Epoch 430 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.883743 weight_norm_u: 25.222990 loss: 0.969393 +RANK_0 - 2026-01-29 02:46:07,503 - TRAIN-LOGGER - INFO - Epoch 431 - TRAIN - Minibatch 0: weight_norm_model: 143.883743 loss: 0.969393 grad_norm_before_clip: 2.450443 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 02:46:08,624 - TRAIN-LOGGER - INFO - Epoch 431 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.883743 weight_norm_u: 25.218954 loss: 0.969393 grad_norm_before_clip: 2.450443 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 02:46:08,624 - TRAIN-LOGGER - INFO - Epoch 431 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.883759 weight_norm_u: 25.222990 loss: 0.970199 +RANK_0 - 2026-01-29 02:46:12,828 - TRAIN-LOGGER - INFO - Epoch 432 - TRAIN - Minibatch 0: weight_norm_model: 143.883759 loss: 0.970199 grad_norm_before_clip: 4.338974 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 02:46:14,021 - TRAIN-LOGGER - INFO - Epoch 432 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.883759 weight_norm_u: 25.218954 loss: 0.970199 grad_norm_before_clip: 4.338974 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 02:46:14,021 - TRAIN-LOGGER - INFO - Epoch 432 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.883759 weight_norm_u: 25.222990 loss: 0.967911 +RANK_0 - 2026-01-29 02:46:18,718 - TRAIN-LOGGER - INFO - Epoch 433 - TRAIN - Minibatch 0: weight_norm_model: 143.883759 loss: 0.967911 grad_norm_before_clip: 1.877943 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 02:46:19,864 - TRAIN-LOGGER - INFO - Epoch 433 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.883759 weight_norm_u: 25.218954 loss: 0.967911 grad_norm_before_clip: 1.877943 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 02:46:19,864 - TRAIN-LOGGER - INFO - Epoch 433 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.883759 weight_norm_u: 25.222990 loss: 0.968341 +RANK_0 - 2026-01-29 02:46:24,098 - TRAIN-LOGGER - INFO - Epoch 434 - TRAIN - Minibatch 0: weight_norm_model: 143.883759 loss: 0.968341 grad_norm_before_clip: 3.033997 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 02:46:25,220 - TRAIN-LOGGER - INFO - Epoch 434 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.883759 weight_norm_u: 25.218954 loss: 0.968341 grad_norm_before_clip: 3.033997 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 02:46:25,220 - TRAIN-LOGGER - INFO - Epoch 434 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.883759 weight_norm_u: 25.222990 loss: 0.967739 +RANK_0 - 2026-01-29 02:46:29,890 - TRAIN-LOGGER - INFO - Epoch 435 - TRAIN - Minibatch 0: weight_norm_model: 143.883759 loss: 0.967739 grad_norm_before_clip: 3.059315 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 02:46:31,125 - TRAIN-LOGGER - INFO - Epoch 435 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.883759 weight_norm_u: 25.218954 loss: 0.967739 grad_norm_before_clip: 3.059315 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 02:46:31,126 - TRAIN-LOGGER - INFO - Epoch 435 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.883774 weight_norm_u: 25.222990 loss: 0.967543 +RANK_0 - 2026-01-29 02:46:35,188 - TRAIN-LOGGER - INFO - Epoch 436 - TRAIN - Minibatch 0: weight_norm_model: 143.883774 loss: 0.967543 grad_norm_before_clip: 2.156787 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 02:46:36,299 - TRAIN-LOGGER - INFO - Epoch 436 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.883774 weight_norm_u: 25.218954 loss: 0.967543 grad_norm_before_clip: 2.156787 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 02:46:36,299 - TRAIN-LOGGER - INFO - Epoch 436 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.883789 weight_norm_u: 25.222990 loss: 0.969261 +RANK_0 - 2026-01-29 02:46:40,599 - TRAIN-LOGGER - INFO - Epoch 437 - TRAIN - Minibatch 0: weight_norm_model: 143.883789 loss: 0.969261 grad_norm_before_clip: 2.430205 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 02:46:41,824 - TRAIN-LOGGER - INFO - Epoch 437 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.883789 weight_norm_u: 25.218954 loss: 0.969261 grad_norm_before_clip: 2.430205 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 02:46:41,824 - TRAIN-LOGGER - INFO - Epoch 437 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.883789 weight_norm_u: 25.222990 loss: 0.970586 +RANK_0 - 2026-01-29 02:46:50,023 - TRAIN-LOGGER - INFO - Epoch 438 - TRAIN - Minibatch 0: weight_norm_model: 143.883789 loss: 0.970586 grad_norm_before_clip: 3.546367 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 02:46:51,187 - TRAIN-LOGGER - INFO - Epoch 438 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.883789 weight_norm_u: 25.218954 loss: 0.970586 grad_norm_before_clip: 3.546367 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 02:46:51,187 - TRAIN-LOGGER - INFO - Epoch 438 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.883789 weight_norm_u: 25.222990 loss: 0.970061 +RANK_0 - 2026-01-29 02:46:56,874 - TRAIN-LOGGER - INFO - Epoch 439 - TRAIN - Minibatch 0: weight_norm_model: 143.883789 loss: 0.970061 grad_norm_before_clip: 3.801143 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 02:46:58,078 - TRAIN-LOGGER - INFO - Epoch 439 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.883789 weight_norm_u: 25.218954 loss: 0.970061 grad_norm_before_clip: 3.801143 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 02:46:58,079 - TRAIN-LOGGER - INFO - Epoch 439 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.883804 weight_norm_u: 25.222990 loss: 0.968836 +RANK_0 - 2026-01-29 02:47:02,980 - TRAIN-LOGGER - INFO - Epoch 440 - TRAIN - Minibatch 0: weight_norm_model: 143.883804 loss: 0.968836 grad_norm_before_clip: 2.285977 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 02:47:04,134 - TRAIN-LOGGER - INFO - Epoch 440 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.883804 weight_norm_u: 25.218954 loss: 0.968836 grad_norm_before_clip: 2.285977 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 02:47:04,134 - TRAIN-LOGGER - INFO - Epoch 440 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.883820 weight_norm_u: 25.222990 loss: 0.971154 +RANK_0 - 2026-01-29 02:47:08,989 - TRAIN-LOGGER - INFO - Epoch 441 - TRAIN - Minibatch 0: weight_norm_model: 143.883820 loss: 0.971154 grad_norm_before_clip: 4.904223 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 02:47:10,190 - TRAIN-LOGGER - INFO - Epoch 441 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.883820 weight_norm_u: 25.218954 loss: 0.971154 grad_norm_before_clip: 4.904223 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 02:47:10,190 - TRAIN-LOGGER - INFO - Epoch 441 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.883850 weight_norm_u: 25.222990 loss: 0.973169 +RANK_0 - 2026-01-29 02:47:14,308 - TRAIN-LOGGER - INFO - Epoch 442 - TRAIN - Minibatch 0: weight_norm_model: 143.883850 loss: 0.973169 grad_norm_before_clip: 5.199629 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 02:47:15,555 - TRAIN-LOGGER - INFO - Epoch 442 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.883850 weight_norm_u: 25.218954 loss: 0.973169 grad_norm_before_clip: 5.199629 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 02:47:15,555 - TRAIN-LOGGER - INFO - Epoch 442 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.883850 weight_norm_u: 25.222990 loss: 0.970129 +RANK_0 - 2026-01-29 02:47:19,712 - TRAIN-LOGGER - INFO - Epoch 443 - TRAIN - Minibatch 0: weight_norm_model: 143.883850 loss: 0.970129 grad_norm_before_clip: 2.525506 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 02:47:20,852 - TRAIN-LOGGER - INFO - Epoch 443 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.883850 weight_norm_u: 25.218954 loss: 0.970129 grad_norm_before_clip: 2.525506 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 02:47:20,853 - TRAIN-LOGGER - INFO - Epoch 443 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.883850 weight_norm_u: 25.222990 loss: 0.972733 +RANK_0 - 2026-01-29 02:47:25,061 - TRAIN-LOGGER - INFO - Epoch 444 - TRAIN - Minibatch 0: weight_norm_model: 143.883850 loss: 0.972733 grad_norm_before_clip: 5.120247 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 02:47:26,173 - TRAIN-LOGGER - INFO - Epoch 444 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.883850 weight_norm_u: 25.218954 loss: 0.972733 grad_norm_before_clip: 5.120247 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 02:47:26,174 - TRAIN-LOGGER - INFO - Epoch 444 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.883865 weight_norm_u: 25.222990 loss: 0.967644 +RANK_0 - 2026-01-29 02:47:30,314 - TRAIN-LOGGER - INFO - Epoch 445 - TRAIN - Minibatch 0: weight_norm_model: 143.883865 loss: 0.967644 grad_norm_before_clip: 4.370812 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 02:47:31,422 - TRAIN-LOGGER - INFO - Epoch 445 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.883865 weight_norm_u: 25.218954 loss: 0.967644 grad_norm_before_clip: 4.370812 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 02:47:31,422 - TRAIN-LOGGER - INFO - Epoch 445 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.883881 weight_norm_u: 25.222990 loss: 0.968682 +RANK_0 - 2026-01-29 02:47:35,678 - TRAIN-LOGGER - INFO - Epoch 446 - TRAIN - Minibatch 0: weight_norm_model: 143.883881 loss: 0.968682 grad_norm_before_clip: 3.939969 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 02:47:36,804 - TRAIN-LOGGER - INFO - Epoch 446 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.883881 weight_norm_u: 25.218954 loss: 0.968682 grad_norm_before_clip: 3.939969 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 02:47:36,804 - TRAIN-LOGGER - INFO - Epoch 446 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.883896 weight_norm_u: 25.222990 loss: 0.968861 +RANK_0 - 2026-01-29 02:47:41,070 - TRAIN-LOGGER - INFO - Epoch 447 - TRAIN - Minibatch 0: weight_norm_model: 143.883896 loss: 0.968861 grad_norm_before_clip: 4.539585 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 02:47:42,184 - TRAIN-LOGGER - INFO - Epoch 447 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.883896 weight_norm_u: 25.218954 loss: 0.968861 grad_norm_before_clip: 4.539585 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 02:47:42,185 - TRAIN-LOGGER - INFO - Epoch 447 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.883911 weight_norm_u: 25.222990 loss: 0.967813 +RANK_0 - 2026-01-29 02:47:46,391 - TRAIN-LOGGER - INFO - Epoch 448 - TRAIN - Minibatch 0: weight_norm_model: 143.883911 loss: 0.967813 grad_norm_before_clip: 1.429762 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 02:47:47,574 - TRAIN-LOGGER - INFO - Epoch 448 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.883911 weight_norm_u: 25.218954 loss: 0.967813 grad_norm_before_clip: 1.429762 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 02:47:47,574 - TRAIN-LOGGER - INFO - Epoch 448 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.883911 weight_norm_u: 25.222990 loss: 0.966703 +RANK_0 - 2026-01-29 02:47:51,880 - TRAIN-LOGGER - INFO - Epoch 449 - TRAIN - Minibatch 0: weight_norm_model: 143.883911 loss: 0.966703 grad_norm_before_clip: 1.345650 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 02:47:53,012 - TRAIN-LOGGER - INFO - Epoch 449 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.883911 weight_norm_u: 25.218954 loss: 0.966703 grad_norm_before_clip: 1.345650 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 02:47:53,013 - TRAIN-LOGGER - INFO - Epoch 449 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.883911 weight_norm_u: 25.222990 loss: 0.968963 +RANK_0 - 2026-01-29 02:47:57,524 - TRAIN-LOGGER - INFO - Epoch 450 - TRAIN - Minibatch 0: weight_norm_model: 143.883911 loss: 0.968963 grad_norm_before_clip: 4.062405 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 02:47:58,722 - TRAIN-LOGGER - INFO - Epoch 450 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.883911 weight_norm_u: 25.218954 loss: 0.968963 grad_norm_before_clip: 4.062405 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 02:47:58,722 - TRAIN-LOGGER - INFO - Epoch 450 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.883911 weight_norm_u: 25.222990 loss: 0.969554 +RANK_0 - 2026-01-29 02:48:03,162 - TRAIN-LOGGER - INFO - Epoch 451 - TRAIN - Minibatch 0: weight_norm_model: 143.883911 loss: 0.969554 grad_norm_before_clip: 3.708669 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 02:48:04,313 - TRAIN-LOGGER - INFO - Epoch 451 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.883911 weight_norm_u: 25.218954 loss: 0.969554 grad_norm_before_clip: 3.708669 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 02:48:04,314 - TRAIN-LOGGER - INFO - Epoch 451 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.883926 weight_norm_u: 25.222990 loss: 0.970441 +RANK_0 - 2026-01-29 02:48:08,363 - TRAIN-LOGGER - INFO - Epoch 452 - TRAIN - Minibatch 0: weight_norm_model: 143.883926 loss: 0.970441 grad_norm_before_clip: 3.194953 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 02:48:09,486 - TRAIN-LOGGER - INFO - Epoch 452 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.883926 weight_norm_u: 25.218954 loss: 0.970441 grad_norm_before_clip: 3.194953 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 02:48:09,486 - TRAIN-LOGGER - INFO - Epoch 452 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.883942 weight_norm_u: 25.222990 loss: 0.968699 +RANK_0 - 2026-01-29 02:48:13,722 - TRAIN-LOGGER - INFO - Epoch 453 - TRAIN - Minibatch 0: weight_norm_model: 143.883942 loss: 0.968699 grad_norm_before_clip: 2.495042 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 02:48:15,005 - TRAIN-LOGGER - INFO - Epoch 453 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.883942 weight_norm_u: 25.218954 loss: 0.968699 grad_norm_before_clip: 2.495042 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 02:48:15,006 - TRAIN-LOGGER - INFO - Epoch 453 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.883957 weight_norm_u: 25.222990 loss: 0.968339 +RANK_0 - 2026-01-29 02:48:20,630 - TRAIN-LOGGER - INFO - Epoch 454 - TRAIN - Minibatch 0: weight_norm_model: 143.883957 loss: 0.968339 grad_norm_before_clip: 3.204031 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 02:48:21,857 - TRAIN-LOGGER - INFO - Epoch 454 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.883957 weight_norm_u: 25.218954 loss: 0.968339 grad_norm_before_clip: 3.204031 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 02:48:21,857 - TRAIN-LOGGER - INFO - Epoch 454 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.883972 weight_norm_u: 25.222990 loss: 0.967962 +RANK_0 - 2026-01-29 02:48:26,887 - TRAIN-LOGGER - INFO - Epoch 455 - TRAIN - Minibatch 0: weight_norm_model: 143.883972 loss: 0.967962 grad_norm_before_clip: 4.221749 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 02:48:28,421 - TRAIN-LOGGER - INFO - Epoch 455 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.883972 weight_norm_u: 25.218954 loss: 0.967962 grad_norm_before_clip: 4.221749 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 02:48:28,421 - TRAIN-LOGGER - INFO - Epoch 455 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.883972 weight_norm_u: 25.222990 loss: 0.968974 +RANK_0 - 2026-01-29 02:48:33,812 - TRAIN-LOGGER - INFO - Epoch 456 - TRAIN - Minibatch 0: weight_norm_model: 143.883972 loss: 0.968974 grad_norm_before_clip: 3.848922 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 02:48:34,958 - TRAIN-LOGGER - INFO - Epoch 456 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.883972 weight_norm_u: 25.218954 loss: 0.968974 grad_norm_before_clip: 3.848922 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 02:48:34,959 - TRAIN-LOGGER - INFO - Epoch 456 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.883972 weight_norm_u: 25.222990 loss: 0.969647 +RANK_0 - 2026-01-29 02:48:39,512 - TRAIN-LOGGER - INFO - Epoch 457 - TRAIN - Minibatch 0: weight_norm_model: 143.883972 loss: 0.969647 grad_norm_before_clip: 3.997488 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 02:48:40,680 - TRAIN-LOGGER - INFO - Epoch 457 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.883972 weight_norm_u: 25.218954 loss: 0.969647 grad_norm_before_clip: 3.997488 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 02:48:40,680 - TRAIN-LOGGER - INFO - Epoch 457 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.883972 weight_norm_u: 25.222990 loss: 0.971517 +RANK_0 - 2026-01-29 02:48:45,588 - TRAIN-LOGGER - INFO - Epoch 458 - TRAIN - Minibatch 0: weight_norm_model: 143.883972 loss: 0.971517 grad_norm_before_clip: 4.380434 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 02:48:46,813 - TRAIN-LOGGER - INFO - Epoch 458 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.883972 weight_norm_u: 25.218954 loss: 0.971517 grad_norm_before_clip: 4.380434 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 02:48:46,813 - TRAIN-LOGGER - INFO - Epoch 458 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.883987 weight_norm_u: 25.222990 loss: 0.968919 +RANK_0 - 2026-01-29 02:48:51,163 - TRAIN-LOGGER - INFO - Epoch 459 - TRAIN - Minibatch 0: weight_norm_model: 143.883987 loss: 0.968919 grad_norm_before_clip: 2.981204 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 02:48:52,314 - TRAIN-LOGGER - INFO - Epoch 459 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.883987 weight_norm_u: 25.218954 loss: 0.968919 grad_norm_before_clip: 2.981204 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 02:48:52,314 - TRAIN-LOGGER - INFO - Epoch 459 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.884018 weight_norm_u: 25.222990 loss: 0.968318 +RANK_0 - 2026-01-29 02:48:56,902 - TRAIN-LOGGER - INFO - Epoch 460 - TRAIN - Minibatch 0: weight_norm_model: 143.884018 loss: 0.968318 grad_norm_before_clip: 3.590041 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 02:48:58,037 - TRAIN-LOGGER - INFO - Epoch 460 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.884018 weight_norm_u: 25.218954 loss: 0.968318 grad_norm_before_clip: 3.590041 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 02:48:58,037 - TRAIN-LOGGER - INFO - Epoch 460 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.884033 weight_norm_u: 25.222990 loss: 0.968314 +RANK_0 - 2026-01-29 02:49:02,715 - TRAIN-LOGGER - INFO - Epoch 461 - TRAIN - Minibatch 0: weight_norm_model: 143.884033 loss: 0.968314 grad_norm_before_clip: 4.222985 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 02:49:03,942 - TRAIN-LOGGER - INFO - Epoch 461 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.884033 weight_norm_u: 25.218954 loss: 0.968314 grad_norm_before_clip: 4.222985 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 02:49:03,942 - TRAIN-LOGGER - INFO - Epoch 461 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.884033 weight_norm_u: 25.222990 loss: 0.967196 +RANK_0 - 2026-01-29 02:49:08,315 - TRAIN-LOGGER - INFO - Epoch 462 - TRAIN - Minibatch 0: weight_norm_model: 143.884033 loss: 0.967196 grad_norm_before_clip: 4.339072 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 02:49:09,478 - TRAIN-LOGGER - INFO - Epoch 462 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.884033 weight_norm_u: 25.218954 loss: 0.967196 grad_norm_before_clip: 4.339072 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 02:49:09,478 - TRAIN-LOGGER - INFO - Epoch 462 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.884048 weight_norm_u: 25.222990 loss: 0.968227 +RANK_0 - 2026-01-29 02:49:14,005 - TRAIN-LOGGER - INFO - Epoch 463 - TRAIN - Minibatch 0: weight_norm_model: 143.884048 loss: 0.968227 grad_norm_before_clip: 3.622480 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 02:49:15,321 - TRAIN-LOGGER - INFO - Epoch 463 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.884048 weight_norm_u: 25.218954 loss: 0.968227 grad_norm_before_clip: 3.622480 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 02:49:15,321 - TRAIN-LOGGER - INFO - Epoch 463 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.884064 weight_norm_u: 25.222990 loss: 0.968899 +RANK_0 - 2026-01-29 02:49:19,718 - TRAIN-LOGGER - INFO - Epoch 464 - TRAIN - Minibatch 0: weight_norm_model: 143.884064 loss: 0.968899 grad_norm_before_clip: 5.163156 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 02:49:20,867 - TRAIN-LOGGER - INFO - Epoch 464 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.884064 weight_norm_u: 25.218954 loss: 0.968899 grad_norm_before_clip: 5.163156 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 02:49:20,868 - TRAIN-LOGGER - INFO - Epoch 464 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.884064 weight_norm_u: 25.222990 loss: 0.969654 +RANK_0 - 2026-01-29 02:49:25,371 - TRAIN-LOGGER - INFO - Epoch 465 - TRAIN - Minibatch 0: weight_norm_model: 143.884064 loss: 0.969654 grad_norm_before_clip: 5.020462 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 02:49:26,545 - TRAIN-LOGGER - INFO - Epoch 465 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.884064 weight_norm_u: 25.218954 loss: 0.969654 grad_norm_before_clip: 5.020462 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 02:49:26,545 - TRAIN-LOGGER - INFO - Epoch 465 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.884079 weight_norm_u: 25.222990 loss: 0.965662 +RANK_0 - 2026-01-29 02:49:31,324 - TRAIN-LOGGER - INFO - Epoch 466 - TRAIN - Minibatch 0: weight_norm_model: 143.884079 loss: 0.965662 grad_norm_before_clip: 1.198421 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 02:49:32,512 - TRAIN-LOGGER - INFO - Epoch 466 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.884079 weight_norm_u: 25.218954 loss: 0.965662 grad_norm_before_clip: 1.198421 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 02:49:32,513 - TRAIN-LOGGER - INFO - Epoch 466 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.884094 weight_norm_u: 25.222990 loss: 0.970578 +RANK_0 - 2026-01-29 02:49:37,216 - TRAIN-LOGGER - INFO - Epoch 467 - TRAIN - Minibatch 0: weight_norm_model: 143.884094 loss: 0.970578 grad_norm_before_clip: 6.867290 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 02:49:38,467 - TRAIN-LOGGER - INFO - Epoch 467 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.884094 weight_norm_u: 25.218954 loss: 0.970578 grad_norm_before_clip: 6.867290 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 02:49:38,468 - TRAIN-LOGGER - INFO - Epoch 467 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.884094 weight_norm_u: 25.222990 loss: 0.969409 +RANK_0 - 2026-01-29 02:49:42,967 - TRAIN-LOGGER - INFO - Epoch 468 - TRAIN - Minibatch 0: weight_norm_model: 143.884094 loss: 0.969409 grad_norm_before_clip: 6.218024 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 02:49:44,151 - TRAIN-LOGGER - INFO - Epoch 468 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.884094 weight_norm_u: 25.218954 loss: 0.969409 grad_norm_before_clip: 6.218024 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 02:49:44,151 - TRAIN-LOGGER - INFO - Epoch 468 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.884109 weight_norm_u: 25.222990 loss: 0.967777 +RANK_0 - 2026-01-29 02:49:49,815 - TRAIN-LOGGER - INFO - Epoch 469 - TRAIN - Minibatch 0: weight_norm_model: 143.884109 loss: 0.967777 grad_norm_before_clip: 1.717936 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 02:49:51,040 - TRAIN-LOGGER - INFO - Epoch 469 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.884109 weight_norm_u: 25.218954 loss: 0.967777 grad_norm_before_clip: 1.717936 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 02:49:51,040 - TRAIN-LOGGER - INFO - Epoch 469 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.884109 weight_norm_u: 25.222990 loss: 0.968215 +RANK_0 - 2026-01-29 02:49:56,047 - TRAIN-LOGGER - INFO - Epoch 470 - TRAIN - Minibatch 0: weight_norm_model: 143.884109 loss: 0.968215 grad_norm_before_clip: 1.639461 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 02:49:57,247 - TRAIN-LOGGER - INFO - Epoch 470 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.884109 weight_norm_u: 25.218954 loss: 0.968215 grad_norm_before_clip: 1.639461 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 02:49:57,247 - TRAIN-LOGGER - INFO - Epoch 470 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.884109 weight_norm_u: 25.222990 loss: 0.968468 +RANK_0 - 2026-01-29 02:50:02,527 - TRAIN-LOGGER - INFO - Epoch 471 - TRAIN - Minibatch 0: weight_norm_model: 143.884109 loss: 0.968468 grad_norm_before_clip: 2.697631 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 02:50:03,785 - TRAIN-LOGGER - INFO - Epoch 471 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.884109 weight_norm_u: 25.218954 loss: 0.968468 grad_norm_before_clip: 2.697631 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 02:50:03,785 - TRAIN-LOGGER - INFO - Epoch 471 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.884109 weight_norm_u: 25.222990 loss: 0.966095 +RANK_0 - 2026-01-29 02:50:08,557 - TRAIN-LOGGER - INFO - Epoch 472 - TRAIN - Minibatch 0: weight_norm_model: 143.884109 loss: 0.966095 grad_norm_before_clip: 4.139463 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 02:50:09,719 - TRAIN-LOGGER - INFO - Epoch 472 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.884109 weight_norm_u: 25.218954 loss: 0.966095 grad_norm_before_clip: 4.139463 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 02:50:09,720 - TRAIN-LOGGER - INFO - Epoch 472 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.884125 weight_norm_u: 25.222990 loss: 0.967014 +RANK_0 - 2026-01-29 02:50:15,006 - TRAIN-LOGGER - INFO - Epoch 473 - TRAIN - Minibatch 0: weight_norm_model: 143.884125 loss: 0.967014 grad_norm_before_clip: 4.108366 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 02:50:16,279 - TRAIN-LOGGER - INFO - Epoch 473 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.884125 weight_norm_u: 25.218954 loss: 0.967014 grad_norm_before_clip: 4.108366 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 02:50:16,279 - TRAIN-LOGGER - INFO - Epoch 473 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.884125 weight_norm_u: 25.222990 loss: 0.968725 +RANK_0 - 2026-01-29 02:50:20,599 - TRAIN-LOGGER - INFO - Epoch 474 - TRAIN - Minibatch 0: weight_norm_model: 143.884125 loss: 0.968725 grad_norm_before_clip: 3.810528 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 02:50:21,858 - TRAIN-LOGGER - INFO - Epoch 474 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.884125 weight_norm_u: 25.218954 loss: 0.968725 grad_norm_before_clip: 3.810528 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 02:50:21,859 - TRAIN-LOGGER - INFO - Epoch 474 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.884140 weight_norm_u: 25.222990 loss: 0.968297 +RANK_0 - 2026-01-29 02:50:26,653 - TRAIN-LOGGER - INFO - Epoch 475 - TRAIN - Minibatch 0: weight_norm_model: 143.884140 loss: 0.968297 grad_norm_before_clip: 3.335962 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 02:50:27,899 - TRAIN-LOGGER - INFO - Epoch 475 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.884140 weight_norm_u: 25.218954 loss: 0.968297 grad_norm_before_clip: 3.335962 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 02:50:27,899 - TRAIN-LOGGER - INFO - Epoch 475 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.884140 weight_norm_u: 25.222990 loss: 0.966450 +RANK_0 - 2026-01-29 02:50:31,994 - TRAIN-LOGGER - INFO - Epoch 476 - TRAIN - Minibatch 0: weight_norm_model: 143.884140 loss: 0.966450 grad_norm_before_clip: 3.005776 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 02:50:33,142 - TRAIN-LOGGER - INFO - Epoch 476 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.884140 weight_norm_u: 25.218954 loss: 0.966450 grad_norm_before_clip: 3.005776 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 02:50:33,142 - TRAIN-LOGGER - INFO - Epoch 476 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.884155 weight_norm_u: 25.222990 loss: 0.967273 +RANK_0 - 2026-01-29 02:50:38,134 - TRAIN-LOGGER - INFO - Epoch 477 - TRAIN - Minibatch 0: weight_norm_model: 143.884155 loss: 0.967273 grad_norm_before_clip: 4.941348 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 02:50:39,308 - TRAIN-LOGGER - INFO - Epoch 477 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.884155 weight_norm_u: 25.218954 loss: 0.967273 grad_norm_before_clip: 4.941348 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 02:50:39,308 - TRAIN-LOGGER - INFO - Epoch 477 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.884171 weight_norm_u: 25.222990 loss: 0.969042 +RANK_0 - 2026-01-29 02:50:43,597 - TRAIN-LOGGER - INFO - Epoch 478 - TRAIN - Minibatch 0: weight_norm_model: 143.884171 loss: 0.969042 grad_norm_before_clip: 2.774868 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 02:50:44,742 - TRAIN-LOGGER - INFO - Epoch 478 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.884171 weight_norm_u: 25.218954 loss: 0.969042 grad_norm_before_clip: 2.774868 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 02:50:44,742 - TRAIN-LOGGER - INFO - Epoch 478 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.884186 weight_norm_u: 25.222990 loss: 0.967771 +RANK_0 - 2026-01-29 02:50:49,393 - TRAIN-LOGGER - INFO - Epoch 479 - TRAIN - Minibatch 0: weight_norm_model: 143.884186 loss: 0.967771 grad_norm_before_clip: 2.601717 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 02:50:50,631 - TRAIN-LOGGER - INFO - Epoch 479 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.884186 weight_norm_u: 25.218954 loss: 0.967771 grad_norm_before_clip: 2.601717 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 02:50:50,632 - TRAIN-LOGGER - INFO - Epoch 479 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.884186 weight_norm_u: 25.222990 loss: 0.965999 +RANK_0 - 2026-01-29 02:50:54,865 - TRAIN-LOGGER - INFO - Epoch 480 - TRAIN - Minibatch 0: weight_norm_model: 143.884186 loss: 0.965999 grad_norm_before_clip: 3.009996 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 02:50:56,437 - TRAIN-LOGGER - INFO - Epoch 480 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.884186 weight_norm_u: 25.218954 loss: 0.965999 grad_norm_before_clip: 3.009996 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 02:50:56,437 - TRAIN-LOGGER - INFO - Epoch 480 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.884201 weight_norm_u: 25.222990 loss: 0.966846 +RANK_0 - 2026-01-29 02:51:01,008 - TRAIN-LOGGER - INFO - Epoch 481 - TRAIN - Minibatch 0: weight_norm_model: 143.884201 loss: 0.966846 grad_norm_before_clip: 3.351151 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 02:51:02,162 - TRAIN-LOGGER - INFO - Epoch 481 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.884201 weight_norm_u: 25.218954 loss: 0.966846 grad_norm_before_clip: 3.351151 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 02:51:02,162 - TRAIN-LOGGER - INFO - Epoch 481 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.884201 weight_norm_u: 25.222990 loss: 0.967181 +RANK_0 - 2026-01-29 02:51:08,038 - TRAIN-LOGGER - INFO - Epoch 482 - TRAIN - Minibatch 0: weight_norm_model: 143.884201 loss: 0.967181 grad_norm_before_clip: 4.652812 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 02:51:09,307 - TRAIN-LOGGER - INFO - Epoch 482 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.884201 weight_norm_u: 25.218954 loss: 0.967181 grad_norm_before_clip: 4.652812 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 02:51:09,308 - TRAIN-LOGGER - INFO - Epoch 482 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.884216 weight_norm_u: 25.222990 loss: 0.965104 +RANK_0 - 2026-01-29 02:51:14,377 - TRAIN-LOGGER - INFO - Epoch 483 - TRAIN - Minibatch 0: weight_norm_model: 143.884216 loss: 0.965104 grad_norm_before_clip: 2.851196 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 02:51:15,878 - TRAIN-LOGGER - INFO - Epoch 483 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.884216 weight_norm_u: 25.218954 loss: 0.965104 grad_norm_before_clip: 2.851196 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 02:51:15,878 - TRAIN-LOGGER - INFO - Epoch 483 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.884247 weight_norm_u: 25.222990 loss: 0.969043 +RANK_0 - 2026-01-29 02:51:20,190 - TRAIN-LOGGER - INFO - Epoch 484 - TRAIN - Minibatch 0: weight_norm_model: 143.884247 loss: 0.969043 grad_norm_before_clip: 5.209727 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 02:51:21,340 - TRAIN-LOGGER - INFO - Epoch 484 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.884247 weight_norm_u: 25.218954 loss: 0.969043 grad_norm_before_clip: 5.209727 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 02:51:21,340 - TRAIN-LOGGER - INFO - Epoch 484 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.884262 weight_norm_u: 25.222990 loss: 0.970092 +RANK_0 - 2026-01-29 02:51:27,080 - TRAIN-LOGGER - INFO - Epoch 485 - TRAIN - Minibatch 0: weight_norm_model: 143.884262 loss: 0.970092 grad_norm_before_clip: 5.433434 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 02:51:28,236 - TRAIN-LOGGER - INFO - Epoch 485 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.884262 weight_norm_u: 25.218954 loss: 0.970092 grad_norm_before_clip: 5.433434 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 02:51:28,237 - TRAIN-LOGGER - INFO - Epoch 485 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.884277 weight_norm_u: 25.222990 loss: 0.968603 +RANK_0 - 2026-01-29 02:51:32,711 - TRAIN-LOGGER - INFO - Epoch 486 - TRAIN - Minibatch 0: weight_norm_model: 143.884277 loss: 0.968603 grad_norm_before_clip: 2.665214 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 02:51:33,879 - TRAIN-LOGGER - INFO - Epoch 486 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.884277 weight_norm_u: 25.218954 loss: 0.968603 grad_norm_before_clip: 2.665214 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 02:51:33,879 - TRAIN-LOGGER - INFO - Epoch 486 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.884277 weight_norm_u: 25.222990 loss: 0.965721 +RANK_0 - 2026-01-29 02:51:38,534 - TRAIN-LOGGER - INFO - Epoch 487 - TRAIN - Minibatch 0: weight_norm_model: 143.884277 loss: 0.965721 grad_norm_before_clip: 2.281358 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 02:51:39,758 - TRAIN-LOGGER - INFO - Epoch 487 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.884277 weight_norm_u: 25.218954 loss: 0.965721 grad_norm_before_clip: 2.281358 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 02:51:39,759 - TRAIN-LOGGER - INFO - Epoch 487 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.884277 weight_norm_u: 25.222990 loss: 0.966746 +RANK_0 - 2026-01-29 02:51:43,847 - TRAIN-LOGGER - INFO - Epoch 488 - TRAIN - Minibatch 0: weight_norm_model: 143.884277 loss: 0.966746 grad_norm_before_clip: 3.796048 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 02:51:45,019 - TRAIN-LOGGER - INFO - Epoch 488 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.884277 weight_norm_u: 25.218954 loss: 0.966746 grad_norm_before_clip: 3.796048 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 02:51:45,020 - TRAIN-LOGGER - INFO - Epoch 488 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.884277 weight_norm_u: 25.222990 loss: 0.968157 +RANK_0 - 2026-01-29 02:51:50,069 - TRAIN-LOGGER - INFO - Epoch 489 - TRAIN - Minibatch 0: weight_norm_model: 143.884277 loss: 0.968157 grad_norm_before_clip: 3.698536 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 02:51:51,299 - TRAIN-LOGGER - INFO - Epoch 489 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.884277 weight_norm_u: 25.218954 loss: 0.968157 grad_norm_before_clip: 3.698536 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 02:51:51,299 - TRAIN-LOGGER - INFO - Epoch 489 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.884293 weight_norm_u: 25.222990 loss: 0.966632 +RANK_0 - 2026-01-29 02:51:55,776 - TRAIN-LOGGER - INFO - Epoch 490 - TRAIN - Minibatch 0: weight_norm_model: 143.884293 loss: 0.966632 grad_norm_before_clip: 2.925557 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 02:51:56,916 - TRAIN-LOGGER - INFO - Epoch 490 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.884293 weight_norm_u: 25.218954 loss: 0.966632 grad_norm_before_clip: 2.925557 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 02:51:56,916 - TRAIN-LOGGER - INFO - Epoch 490 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.884308 weight_norm_u: 25.222990 loss: 0.966583 +RANK_0 - 2026-01-29 02:52:01,771 - TRAIN-LOGGER - INFO - Epoch 491 - TRAIN - Minibatch 0: weight_norm_model: 143.884308 loss: 0.966583 grad_norm_before_clip: 4.252655 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 02:52:03,017 - TRAIN-LOGGER - INFO - Epoch 491 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.884308 weight_norm_u: 25.218954 loss: 0.966583 grad_norm_before_clip: 4.252655 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 02:52:03,017 - TRAIN-LOGGER - INFO - Epoch 491 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.884323 weight_norm_u: 25.222990 loss: 0.968253 +RANK_0 - 2026-01-29 02:52:07,991 - TRAIN-LOGGER - INFO - Epoch 492 - TRAIN - Minibatch 0: weight_norm_model: 143.884323 loss: 0.968253 grad_norm_before_clip: 3.596443 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 02:52:09,237 - TRAIN-LOGGER - INFO - Epoch 492 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.884323 weight_norm_u: 25.218954 loss: 0.968253 grad_norm_before_clip: 3.596443 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 02:52:09,237 - TRAIN-LOGGER - INFO - Epoch 492 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.884338 weight_norm_u: 25.222990 loss: 0.965870 +RANK_0 - 2026-01-29 02:52:14,182 - TRAIN-LOGGER - INFO - Epoch 493 - TRAIN - Minibatch 0: weight_norm_model: 143.884338 loss: 0.965870 grad_norm_before_clip: 2.169584 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 02:52:15,339 - TRAIN-LOGGER - INFO - Epoch 493 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.884338 weight_norm_u: 25.218954 loss: 0.965870 grad_norm_before_clip: 2.169584 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 02:52:15,339 - TRAIN-LOGGER - INFO - Epoch 493 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.884354 weight_norm_u: 25.222990 loss: 0.966287 +RANK_0 - 2026-01-29 02:52:19,955 - TRAIN-LOGGER - INFO - Epoch 494 - TRAIN - Minibatch 0: weight_norm_model: 143.884354 loss: 0.966287 grad_norm_before_clip: 3.480747 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 02:52:21,284 - TRAIN-LOGGER - INFO - Epoch 494 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.884354 weight_norm_u: 25.218954 loss: 0.966287 grad_norm_before_clip: 3.480747 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 02:52:21,285 - TRAIN-LOGGER - INFO - Epoch 494 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.884354 weight_norm_u: 25.222990 loss: 0.966938 +RANK_0 - 2026-01-29 02:52:26,015 - TRAIN-LOGGER - INFO - Epoch 495 - TRAIN - Minibatch 0: weight_norm_model: 143.884354 loss: 0.966938 grad_norm_before_clip: 4.755659 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 02:52:27,308 - TRAIN-LOGGER - INFO - Epoch 495 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.884354 weight_norm_u: 25.218954 loss: 0.966938 grad_norm_before_clip: 4.755659 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 02:52:27,308 - TRAIN-LOGGER - INFO - Epoch 495 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.884354 weight_norm_u: 25.222990 loss: 0.966574 +RANK_0 - 2026-01-29 02:52:32,087 - TRAIN-LOGGER - INFO - Epoch 496 - TRAIN - Minibatch 0: weight_norm_model: 143.884354 loss: 0.966574 grad_norm_before_clip: 3.413510 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 02:52:33,485 - TRAIN-LOGGER - INFO - Epoch 496 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.884354 weight_norm_u: 25.218954 loss: 0.966574 grad_norm_before_clip: 3.413510 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 02:52:33,485 - TRAIN-LOGGER - INFO - Epoch 496 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.884354 weight_norm_u: 25.222990 loss: 0.967943 +RANK_0 - 2026-01-29 02:52:38,024 - TRAIN-LOGGER - INFO - Epoch 497 - TRAIN - Minibatch 0: weight_norm_model: 143.884354 loss: 0.967943 grad_norm_before_clip: 4.565260 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 02:52:39,197 - TRAIN-LOGGER - INFO - Epoch 497 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.884354 weight_norm_u: 25.218954 loss: 0.967943 grad_norm_before_clip: 4.565260 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 02:52:39,197 - TRAIN-LOGGER - INFO - Epoch 497 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.884369 weight_norm_u: 25.222990 loss: 0.967547 +RANK_0 - 2026-01-29 02:52:44,512 - TRAIN-LOGGER - INFO - Epoch 498 - TRAIN - Minibatch 0: weight_norm_model: 143.884369 loss: 0.967547 grad_norm_before_clip: 5.176290 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 02:52:45,769 - TRAIN-LOGGER - INFO - Epoch 498 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.884369 weight_norm_u: 25.218954 loss: 0.967547 grad_norm_before_clip: 5.176290 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 02:52:45,770 - TRAIN-LOGGER - INFO - Epoch 498 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.884384 weight_norm_u: 25.222990 loss: 0.965442 +RANK_0 - 2026-01-29 02:52:50,136 - TRAIN-LOGGER - INFO - Epoch 499 - TRAIN - Minibatch 0: weight_norm_model: 143.884384 loss: 0.965442 grad_norm_before_clip: 2.654788 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 02:52:51,313 - TRAIN-LOGGER - INFO - Epoch 499 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.884384 weight_norm_u: 25.218954 loss: 0.965442 grad_norm_before_clip: 2.654788 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 02:52:51,314 - TRAIN-LOGGER - INFO - Epoch 499 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.884384 weight_norm_u: 25.222990 loss: 0.965269 +RANK_0 - 2026-01-29 02:52:56,035 - TRAIN-LOGGER - INFO - Epoch 500 - TRAIN - Minibatch 0: weight_norm_model: 143.884384 loss: 0.965269 grad_norm_before_clip: 2.281070 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 02:52:57,364 - TRAIN-LOGGER - INFO - Epoch 500 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.884384 weight_norm_u: 25.218954 loss: 0.965269 grad_norm_before_clip: 2.281070 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 02:52:57,364 - TRAIN-LOGGER - INFO - Epoch 500 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.884415 weight_norm_u: 25.222990 loss: 0.968872 +RANK_0 - 2026-01-29 02:53:02,051 - TRAIN-LOGGER - INFO - Epoch 501 - TRAIN - Minibatch 0: weight_norm_model: 143.884415 loss: 0.968872 grad_norm_before_clip: 4.208962 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 02:53:03,296 - TRAIN-LOGGER - INFO - Epoch 501 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.884415 weight_norm_u: 25.218954 loss: 0.968872 grad_norm_before_clip: 4.208962 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 02:53:03,296 - TRAIN-LOGGER - INFO - Epoch 501 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.884415 weight_norm_u: 25.222990 loss: 0.969074 +RANK_0 - 2026-01-29 02:53:08,325 - TRAIN-LOGGER - INFO - Epoch 502 - TRAIN - Minibatch 0: weight_norm_model: 143.884415 loss: 0.969074 grad_norm_before_clip: 4.012725 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 02:53:09,467 - TRAIN-LOGGER - INFO - Epoch 502 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.884415 weight_norm_u: 25.218954 loss: 0.969074 grad_norm_before_clip: 4.012725 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 02:53:09,467 - TRAIN-LOGGER - INFO - Epoch 502 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.884415 weight_norm_u: 25.222990 loss: 0.965448 +RANK_0 - 2026-01-29 02:53:13,925 - TRAIN-LOGGER - INFO - Epoch 503 - TRAIN - Minibatch 0: weight_norm_model: 143.884415 loss: 0.965448 grad_norm_before_clip: 2.546676 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 02:53:15,163 - TRAIN-LOGGER - INFO - Epoch 503 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.884415 weight_norm_u: 25.218954 loss: 0.965448 grad_norm_before_clip: 2.546676 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 02:53:15,163 - TRAIN-LOGGER - INFO - Epoch 503 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.884415 weight_norm_u: 25.222990 loss: 0.972831 +RANK_0 - 2026-01-29 02:53:20,361 - TRAIN-LOGGER - INFO - Epoch 504 - TRAIN - Minibatch 0: weight_norm_model: 143.884415 loss: 0.972831 grad_norm_before_clip: 7.095038 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 02:53:21,632 - TRAIN-LOGGER - INFO - Epoch 504 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.884415 weight_norm_u: 25.218954 loss: 0.972831 grad_norm_before_clip: 7.095038 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 02:53:21,632 - TRAIN-LOGGER - INFO - Epoch 504 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.884415 weight_norm_u: 25.222990 loss: 0.976621 +RANK_0 - 2026-01-29 02:53:26,237 - TRAIN-LOGGER - INFO - Epoch 505 - TRAIN - Minibatch 0: weight_norm_model: 143.884415 loss: 0.976621 grad_norm_before_clip: 7.970500 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 02:53:27,437 - TRAIN-LOGGER - INFO - Epoch 505 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.884415 weight_norm_u: 25.218954 loss: 0.976621 grad_norm_before_clip: 7.970500 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 02:53:27,437 - TRAIN-LOGGER - INFO - Epoch 505 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.884415 weight_norm_u: 25.222990 loss: 0.973021 +RANK_0 - 2026-01-29 02:53:31,746 - TRAIN-LOGGER - INFO - Epoch 506 - TRAIN - Minibatch 0: weight_norm_model: 143.884415 loss: 0.973021 grad_norm_before_clip: 5.328810 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 02:53:33,147 - TRAIN-LOGGER - INFO - Epoch 506 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.884415 weight_norm_u: 25.218954 loss: 0.973021 grad_norm_before_clip: 5.328810 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 02:53:33,147 - TRAIN-LOGGER - INFO - Epoch 506 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.884430 weight_norm_u: 25.222990 loss: 0.970907 +RANK_0 - 2026-01-29 02:53:38,081 - TRAIN-LOGGER - INFO - Epoch 507 - TRAIN - Minibatch 0: weight_norm_model: 143.884430 loss: 0.970907 grad_norm_before_clip: 3.722515 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 02:53:39,414 - TRAIN-LOGGER - INFO - Epoch 507 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.884430 weight_norm_u: 25.218954 loss: 0.970907 grad_norm_before_clip: 3.722515 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 02:53:39,415 - TRAIN-LOGGER - INFO - Epoch 507 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.884445 weight_norm_u: 25.222990 loss: 0.971149 +RANK_0 - 2026-01-29 02:53:44,019 - TRAIN-LOGGER - INFO - Epoch 508 - TRAIN - Minibatch 0: weight_norm_model: 143.884445 loss: 0.971149 grad_norm_before_clip: 5.074970 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 02:53:45,462 - TRAIN-LOGGER - INFO - Epoch 508 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.884445 weight_norm_u: 25.218954 loss: 0.971149 grad_norm_before_clip: 5.074970 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 02:53:45,462 - TRAIN-LOGGER - INFO - Epoch 508 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.884445 weight_norm_u: 25.222990 loss: 0.973791 +RANK_0 - 2026-01-29 02:53:49,804 - TRAIN-LOGGER - INFO - Epoch 509 - TRAIN - Minibatch 0: weight_norm_model: 143.884445 loss: 0.973791 grad_norm_before_clip: 5.525651 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 02:53:51,031 - TRAIN-LOGGER - INFO - Epoch 509 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.884445 weight_norm_u: 25.218954 loss: 0.973791 grad_norm_before_clip: 5.525651 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 02:53:51,031 - TRAIN-LOGGER - INFO - Epoch 509 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.884445 weight_norm_u: 25.222990 loss: 0.971808 +RANK_0 - 2026-01-29 02:53:55,315 - TRAIN-LOGGER - INFO - Epoch 510 - TRAIN - Minibatch 0: weight_norm_model: 143.884445 loss: 0.971808 grad_norm_before_clip: 4.924091 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 02:53:56,877 - TRAIN-LOGGER - INFO - Epoch 510 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.884445 weight_norm_u: 25.218954 loss: 0.971808 grad_norm_before_clip: 4.924091 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 02:53:56,877 - TRAIN-LOGGER - INFO - Epoch 510 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.884430 weight_norm_u: 25.222990 loss: 0.967100 +RANK_0 - 2026-01-29 02:54:01,006 - TRAIN-LOGGER - INFO - Epoch 511 - TRAIN - Minibatch 0: weight_norm_model: 143.884430 loss: 0.967100 grad_norm_before_clip: 2.626322 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 02:54:02,144 - TRAIN-LOGGER - INFO - Epoch 511 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.884430 weight_norm_u: 25.218954 loss: 0.967100 grad_norm_before_clip: 2.626322 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 02:54:02,144 - TRAIN-LOGGER - INFO - Epoch 511 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.884415 weight_norm_u: 25.222990 loss: 0.970586 +RANK_0 - 2026-01-29 02:54:07,305 - TRAIN-LOGGER - INFO - Epoch 512 - TRAIN - Minibatch 0: weight_norm_model: 143.884415 loss: 0.970586 grad_norm_before_clip: 6.091989 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 02:54:08,538 - TRAIN-LOGGER - INFO - Epoch 512 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.884415 weight_norm_u: 25.218954 loss: 0.970586 grad_norm_before_clip: 6.091989 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 02:54:08,538 - TRAIN-LOGGER - INFO - Epoch 512 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.884415 weight_norm_u: 25.222990 loss: 0.972857 +RANK_0 - 2026-01-29 02:54:13,587 - TRAIN-LOGGER - INFO - Epoch 513 - TRAIN - Minibatch 0: weight_norm_model: 143.884415 loss: 0.972857 grad_norm_before_clip: 6.626473 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 02:54:14,899 - TRAIN-LOGGER - INFO - Epoch 513 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.884415 weight_norm_u: 25.218954 loss: 0.972857 grad_norm_before_clip: 6.626473 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 02:54:14,899 - TRAIN-LOGGER - INFO - Epoch 513 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.884430 weight_norm_u: 25.222990 loss: 0.970152 +RANK_0 - 2026-01-29 02:54:19,655 - TRAIN-LOGGER - INFO - Epoch 514 - TRAIN - Minibatch 0: weight_norm_model: 143.884430 loss: 0.970152 grad_norm_before_clip: 4.430711 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 02:54:20,887 - TRAIN-LOGGER - INFO - Epoch 514 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.884430 weight_norm_u: 25.218954 loss: 0.970152 grad_norm_before_clip: 4.430711 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 02:54:20,888 - TRAIN-LOGGER - INFO - Epoch 514 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.884445 weight_norm_u: 25.222990 loss: 0.966754 +RANK_0 - 2026-01-29 02:54:25,940 - TRAIN-LOGGER - INFO - Epoch 515 - TRAIN - Minibatch 0: weight_norm_model: 143.884445 loss: 0.966754 grad_norm_before_clip: 1.803872 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 02:54:27,096 - TRAIN-LOGGER - INFO - Epoch 515 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.884445 weight_norm_u: 25.218954 loss: 0.966754 grad_norm_before_clip: 1.803872 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 02:54:27,096 - TRAIN-LOGGER - INFO - Epoch 515 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.884491 weight_norm_u: 25.222990 loss: 0.968961 +RANK_0 - 2026-01-29 02:54:31,370 - TRAIN-LOGGER - INFO - Epoch 516 - TRAIN - Minibatch 0: weight_norm_model: 143.884491 loss: 0.968961 grad_norm_before_clip: 3.510994 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 02:54:32,645 - TRAIN-LOGGER - INFO - Epoch 516 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.884491 weight_norm_u: 25.218954 loss: 0.968961 grad_norm_before_clip: 3.510994 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 02:54:32,646 - TRAIN-LOGGER - INFO - Epoch 516 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.884506 weight_norm_u: 25.222990 loss: 0.970270 +RANK_0 - 2026-01-29 02:54:37,525 - TRAIN-LOGGER - INFO - Epoch 517 - TRAIN - Minibatch 0: weight_norm_model: 143.884506 loss: 0.970270 grad_norm_before_clip: 4.209049 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 02:54:38,738 - TRAIN-LOGGER - INFO - Epoch 517 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.884506 weight_norm_u: 25.218954 loss: 0.970270 grad_norm_before_clip: 4.209049 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 02:54:38,739 - TRAIN-LOGGER - INFO - Epoch 517 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.884506 weight_norm_u: 25.222990 loss: 0.968401 +RANK_0 - 2026-01-29 02:54:43,009 - TRAIN-LOGGER - INFO - Epoch 518 - TRAIN - Minibatch 0: weight_norm_model: 143.884506 loss: 0.968401 grad_norm_before_clip: 2.672274 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 02:54:44,257 - TRAIN-LOGGER - INFO - Epoch 518 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.884506 weight_norm_u: 25.218954 loss: 0.968401 grad_norm_before_clip: 2.672274 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 02:54:44,257 - TRAIN-LOGGER - INFO - Epoch 518 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.884506 weight_norm_u: 25.222990 loss: 0.969819 +RANK_0 - 2026-01-29 02:54:49,192 - TRAIN-LOGGER - INFO - Epoch 519 - TRAIN - Minibatch 0: weight_norm_model: 143.884506 loss: 0.969819 grad_norm_before_clip: 3.646050 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 02:54:50,543 - TRAIN-LOGGER - INFO - Epoch 519 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.884506 weight_norm_u: 25.218954 loss: 0.969819 grad_norm_before_clip: 3.646050 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 02:54:50,543 - TRAIN-LOGGER - INFO - Epoch 519 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.884506 weight_norm_u: 25.222990 loss: 0.971745 +RANK_0 - 2026-01-29 02:54:54,847 - TRAIN-LOGGER - INFO - Epoch 520 - TRAIN - Minibatch 0: weight_norm_model: 143.884506 loss: 0.971745 grad_norm_before_clip: 5.035012 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 02:54:55,991 - TRAIN-LOGGER - INFO - Epoch 520 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.884506 weight_norm_u: 25.218954 loss: 0.971745 grad_norm_before_clip: 5.035012 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 02:54:55,991 - TRAIN-LOGGER - INFO - Epoch 520 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.884506 weight_norm_u: 25.222990 loss: 0.969219 +RANK_0 - 2026-01-29 02:55:00,911 - TRAIN-LOGGER - INFO - Epoch 521 - TRAIN - Minibatch 0: weight_norm_model: 143.884506 loss: 0.969219 grad_norm_before_clip: 5.445171 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 02:55:02,069 - TRAIN-LOGGER - INFO - Epoch 521 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.884506 weight_norm_u: 25.218954 loss: 0.969219 grad_norm_before_clip: 5.445171 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 02:55:02,069 - TRAIN-LOGGER - INFO - Epoch 521 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.884521 weight_norm_u: 25.222990 loss: 0.968195 +RANK_0 - 2026-01-29 02:55:07,021 - TRAIN-LOGGER - INFO - Epoch 522 - TRAIN - Minibatch 0: weight_norm_model: 143.884521 loss: 0.968195 grad_norm_before_clip: 4.782985 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 02:55:08,222 - TRAIN-LOGGER - INFO - Epoch 522 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.884521 weight_norm_u: 25.218954 loss: 0.968195 grad_norm_before_clip: 4.782985 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 02:55:08,223 - TRAIN-LOGGER - INFO - Epoch 522 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.884537 weight_norm_u: 25.222990 loss: 0.968651 +RANK_0 - 2026-01-29 02:55:12,897 - TRAIN-LOGGER - INFO - Epoch 523 - TRAIN - Minibatch 0: weight_norm_model: 143.884537 loss: 0.968651 grad_norm_before_clip: 4.901904 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 02:55:14,074 - TRAIN-LOGGER - INFO - Epoch 523 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.884537 weight_norm_u: 25.218954 loss: 0.968651 grad_norm_before_clip: 4.901904 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 02:55:14,074 - TRAIN-LOGGER - INFO - Epoch 523 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.884537 weight_norm_u: 25.222990 loss: 0.966825 +RANK_0 - 2026-01-29 02:55:18,740 - TRAIN-LOGGER - INFO - Epoch 524 - TRAIN - Minibatch 0: weight_norm_model: 143.884537 loss: 0.966825 grad_norm_before_clip: 2.692423 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 02:55:20,124 - TRAIN-LOGGER - INFO - Epoch 524 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.884537 weight_norm_u: 25.218954 loss: 0.966825 grad_norm_before_clip: 2.692423 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 02:55:20,125 - TRAIN-LOGGER - INFO - Epoch 524 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.884537 weight_norm_u: 25.222990 loss: 0.966101 +RANK_0 - 2026-01-29 02:55:24,727 - TRAIN-LOGGER - INFO - Epoch 525 - TRAIN - Minibatch 0: weight_norm_model: 143.884537 loss: 0.966101 grad_norm_before_clip: 1.352556 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 02:55:25,971 - TRAIN-LOGGER - INFO - Epoch 525 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.884537 weight_norm_u: 25.218954 loss: 0.966101 grad_norm_before_clip: 1.352556 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 02:55:25,971 - TRAIN-LOGGER - INFO - Epoch 525 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.884537 weight_norm_u: 25.222990 loss: 0.965729 +RANK_0 - 2026-01-29 02:55:30,494 - TRAIN-LOGGER - INFO - Epoch 526 - TRAIN - Minibatch 0: weight_norm_model: 143.884537 loss: 0.965729 grad_norm_before_clip: 1.558308 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 02:55:31,626 - TRAIN-LOGGER - INFO - Epoch 526 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.884537 weight_norm_u: 25.218954 loss: 0.965729 grad_norm_before_clip: 1.558308 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 02:55:31,626 - TRAIN-LOGGER - INFO - Epoch 526 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.884537 weight_norm_u: 25.222990 loss: 0.966850 +RANK_0 - 2026-01-29 02:55:35,891 - TRAIN-LOGGER - INFO - Epoch 527 - TRAIN - Minibatch 0: weight_norm_model: 143.884537 loss: 0.966850 grad_norm_before_clip: 2.719628 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 02:55:37,021 - TRAIN-LOGGER - INFO - Epoch 527 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.884537 weight_norm_u: 25.218954 loss: 0.966850 grad_norm_before_clip: 2.719628 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 02:55:37,022 - TRAIN-LOGGER - INFO - Epoch 527 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.884552 weight_norm_u: 25.222990 loss: 0.967357 +RANK_0 - 2026-01-29 02:55:41,299 - TRAIN-LOGGER - INFO - Epoch 528 - TRAIN - Minibatch 0: weight_norm_model: 143.884552 loss: 0.967357 grad_norm_before_clip: 2.915319 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 02:55:42,482 - TRAIN-LOGGER - INFO - Epoch 528 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.884552 weight_norm_u: 25.218954 loss: 0.967357 grad_norm_before_clip: 2.915319 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 02:55:42,482 - TRAIN-LOGGER - INFO - Epoch 528 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.884583 weight_norm_u: 25.222990 loss: 0.965200 +RANK_0 - 2026-01-29 02:55:47,021 - TRAIN-LOGGER - INFO - Epoch 529 - TRAIN - Minibatch 0: weight_norm_model: 143.884583 loss: 0.965200 grad_norm_before_clip: 2.782871 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 02:55:48,258 - TRAIN-LOGGER - INFO - Epoch 529 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.884583 weight_norm_u: 25.218954 loss: 0.965200 grad_norm_before_clip: 2.782871 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 02:55:48,258 - TRAIN-LOGGER - INFO - Epoch 529 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.884583 weight_norm_u: 25.222990 loss: 0.967640 +RANK_0 - 2026-01-29 02:55:52,513 - TRAIN-LOGGER - INFO - Epoch 530 - TRAIN - Minibatch 0: weight_norm_model: 143.884583 loss: 0.967640 grad_norm_before_clip: 4.784361 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 02:55:53,694 - TRAIN-LOGGER - INFO - Epoch 530 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.884583 weight_norm_u: 25.218954 loss: 0.967640 grad_norm_before_clip: 4.784361 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 02:55:53,695 - TRAIN-LOGGER - INFO - Epoch 530 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.884583 weight_norm_u: 25.222990 loss: 0.969558 +RANK_0 - 2026-01-29 02:55:58,684 - TRAIN-LOGGER - INFO - Epoch 531 - TRAIN - Minibatch 0: weight_norm_model: 143.884583 loss: 0.969558 grad_norm_before_clip: 4.158884 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 02:55:59,871 - TRAIN-LOGGER - INFO - Epoch 531 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.884583 weight_norm_u: 25.218954 loss: 0.969558 grad_norm_before_clip: 4.158884 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 02:55:59,871 - TRAIN-LOGGER - INFO - Epoch 531 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.884598 weight_norm_u: 25.222990 loss: 0.969417 +RANK_0 - 2026-01-29 02:56:04,633 - TRAIN-LOGGER - INFO - Epoch 532 - TRAIN - Minibatch 0: weight_norm_model: 143.884598 loss: 0.969417 grad_norm_before_clip: 3.422467 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 02:56:05,806 - TRAIN-LOGGER - INFO - Epoch 532 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.884598 weight_norm_u: 25.218954 loss: 0.969417 grad_norm_before_clip: 3.422467 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 02:56:05,806 - TRAIN-LOGGER - INFO - Epoch 532 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.884598 weight_norm_u: 25.222990 loss: 0.968463 +RANK_0 - 2026-01-29 02:56:11,230 - TRAIN-LOGGER - INFO - Epoch 533 - TRAIN - Minibatch 0: weight_norm_model: 143.884598 loss: 0.968463 grad_norm_before_clip: 4.216517 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 02:56:12,447 - TRAIN-LOGGER - INFO - Epoch 533 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.884598 weight_norm_u: 25.218954 loss: 0.968463 grad_norm_before_clip: 4.216517 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 02:56:12,447 - TRAIN-LOGGER - INFO - Epoch 533 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.884613 weight_norm_u: 25.222990 loss: 0.967065 +RANK_0 - 2026-01-29 02:56:17,509 - TRAIN-LOGGER - INFO - Epoch 534 - TRAIN - Minibatch 0: weight_norm_model: 143.884613 loss: 0.967065 grad_norm_before_clip: 3.949319 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 02:56:18,712 - TRAIN-LOGGER - INFO - Epoch 534 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.884613 weight_norm_u: 25.218954 loss: 0.967065 grad_norm_before_clip: 3.949319 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 02:56:18,713 - TRAIN-LOGGER - INFO - Epoch 534 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.884628 weight_norm_u: 25.222990 loss: 0.964748 +RANK_0 - 2026-01-29 02:56:24,502 - TRAIN-LOGGER - INFO - Epoch 535 - TRAIN - Minibatch 0: weight_norm_model: 143.884628 loss: 0.964748 grad_norm_before_clip: 2.262285 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 02:56:25,676 - TRAIN-LOGGER - INFO - Epoch 535 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.884628 weight_norm_u: 25.218954 loss: 0.964748 grad_norm_before_clip: 2.262285 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 02:56:25,676 - TRAIN-LOGGER - INFO - Epoch 535 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.884644 weight_norm_u: 25.222990 loss: 0.967783 +RANK_0 - 2026-01-29 02:56:30,397 - TRAIN-LOGGER - INFO - Epoch 536 - TRAIN - Minibatch 0: weight_norm_model: 143.884644 loss: 0.967783 grad_norm_before_clip: 5.066208 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 02:56:31,508 - TRAIN-LOGGER - INFO - Epoch 536 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.884644 weight_norm_u: 25.218954 loss: 0.967783 grad_norm_before_clip: 5.066208 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 02:56:31,508 - TRAIN-LOGGER - INFO - Epoch 536 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.884644 weight_norm_u: 25.222990 loss: 0.966130 +RANK_0 - 2026-01-29 02:56:36,430 - TRAIN-LOGGER - INFO - Epoch 537 - TRAIN - Minibatch 0: weight_norm_model: 143.884644 loss: 0.966130 grad_norm_before_clip: 3.337029 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 02:56:37,585 - TRAIN-LOGGER - INFO - Epoch 537 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.884644 weight_norm_u: 25.218954 loss: 0.966130 grad_norm_before_clip: 3.337029 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 02:56:37,586 - TRAIN-LOGGER - INFO - Epoch 537 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.884644 weight_norm_u: 25.222990 loss: 0.965066 +RANK_0 - 2026-01-29 02:56:42,295 - TRAIN-LOGGER - INFO - Epoch 538 - TRAIN - Minibatch 0: weight_norm_model: 143.884644 loss: 0.965066 grad_norm_before_clip: 2.582021 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 02:56:43,442 - TRAIN-LOGGER - INFO - Epoch 538 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.884644 weight_norm_u: 25.218954 loss: 0.965066 grad_norm_before_clip: 2.582021 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 02:56:43,442 - TRAIN-LOGGER - INFO - Epoch 538 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.884659 weight_norm_u: 25.222990 loss: 0.966402 +RANK_0 - 2026-01-29 02:56:48,187 - TRAIN-LOGGER - INFO - Epoch 539 - TRAIN - Minibatch 0: weight_norm_model: 143.884659 loss: 0.966402 grad_norm_before_clip: 4.733712 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 02:56:49,409 - TRAIN-LOGGER - INFO - Epoch 539 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.884659 weight_norm_u: 25.218954 loss: 0.966402 grad_norm_before_clip: 4.733712 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 02:56:49,409 - TRAIN-LOGGER - INFO - Epoch 539 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.884674 weight_norm_u: 25.222990 loss: 0.965134 +RANK_0 - 2026-01-29 02:56:53,718 - TRAIN-LOGGER - INFO - Epoch 540 - TRAIN - Minibatch 0: weight_norm_model: 143.884674 loss: 0.965134 grad_norm_before_clip: 1.045252 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 02:56:54,952 - TRAIN-LOGGER - INFO - Epoch 540 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.884674 weight_norm_u: 25.218954 loss: 0.965134 grad_norm_before_clip: 1.045252 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 02:56:54,952 - TRAIN-LOGGER - INFO - Epoch 540 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.884674 weight_norm_u: 25.222990 loss: 0.965217 +RANK_0 - 2026-01-29 02:56:59,281 - TRAIN-LOGGER - INFO - Epoch 541 - TRAIN - Minibatch 0: weight_norm_model: 143.884674 loss: 0.965217 grad_norm_before_clip: 2.156436 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 02:57:00,796 - TRAIN-LOGGER - INFO - Epoch 541 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.884674 weight_norm_u: 25.218954 loss: 0.965217 grad_norm_before_clip: 2.156436 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 02:57:00,796 - TRAIN-LOGGER - INFO - Epoch 541 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.884674 weight_norm_u: 25.222990 loss: 0.968766 +RANK_0 - 2026-01-29 02:57:04,999 - TRAIN-LOGGER - INFO - Epoch 542 - TRAIN - Minibatch 0: weight_norm_model: 143.884674 loss: 0.968766 grad_norm_before_clip: 5.444310 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 02:57:06,177 - TRAIN-LOGGER - INFO - Epoch 542 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.884674 weight_norm_u: 25.218954 loss: 0.968766 grad_norm_before_clip: 5.444310 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 02:57:06,178 - TRAIN-LOGGER - INFO - Epoch 542 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.884689 weight_norm_u: 25.222990 loss: 0.969791 +RANK_0 - 2026-01-29 02:57:10,759 - TRAIN-LOGGER - INFO - Epoch 543 - TRAIN - Minibatch 0: weight_norm_model: 143.884689 loss: 0.969791 grad_norm_before_clip: 6.138813 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 02:57:11,924 - TRAIN-LOGGER - INFO - Epoch 543 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.884689 weight_norm_u: 25.218954 loss: 0.969791 grad_norm_before_clip: 6.138813 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 02:57:11,924 - TRAIN-LOGGER - INFO - Epoch 543 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.884689 weight_norm_u: 25.222990 loss: 0.966273 +RANK_0 - 2026-01-29 02:57:16,971 - TRAIN-LOGGER - INFO - Epoch 544 - TRAIN - Minibatch 0: weight_norm_model: 143.884689 loss: 0.966273 grad_norm_before_clip: 3.121668 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 02:57:18,177 - TRAIN-LOGGER - INFO - Epoch 544 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.884689 weight_norm_u: 25.218954 loss: 0.966273 grad_norm_before_clip: 3.121668 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 02:57:18,177 - TRAIN-LOGGER - INFO - Epoch 544 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.884705 weight_norm_u: 25.222990 loss: 0.966770 +RANK_0 - 2026-01-29 02:57:22,802 - TRAIN-LOGGER - INFO - Epoch 545 - TRAIN - Minibatch 0: weight_norm_model: 143.884705 loss: 0.966770 grad_norm_before_clip: 4.140317 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 02:57:23,998 - TRAIN-LOGGER - INFO - Epoch 545 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.884705 weight_norm_u: 25.218954 loss: 0.966770 grad_norm_before_clip: 4.140317 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 02:57:23,998 - TRAIN-LOGGER - INFO - Epoch 545 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.884720 weight_norm_u: 25.222990 loss: 0.969236 +RANK_0 - 2026-01-29 02:57:28,976 - TRAIN-LOGGER - INFO - Epoch 546 - TRAIN - Minibatch 0: weight_norm_model: 143.884720 loss: 0.969236 grad_norm_before_clip: 4.433846 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 02:57:30,113 - TRAIN-LOGGER - INFO - Epoch 546 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.884720 weight_norm_u: 25.218954 loss: 0.969236 grad_norm_before_clip: 4.433846 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 02:57:30,113 - TRAIN-LOGGER - INFO - Epoch 546 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.884720 weight_norm_u: 25.222990 loss: 0.965803 +RANK_0 - 2026-01-29 02:57:34,955 - TRAIN-LOGGER - INFO - Epoch 547 - TRAIN - Minibatch 0: weight_norm_model: 143.884720 loss: 0.965803 grad_norm_before_clip: 3.120809 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 02:57:36,047 - TRAIN-LOGGER - INFO - Epoch 547 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.884720 weight_norm_u: 25.218954 loss: 0.965803 grad_norm_before_clip: 3.120809 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 02:57:36,048 - TRAIN-LOGGER - INFO - Epoch 547 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.884735 weight_norm_u: 25.222990 loss: 0.967952 +RANK_0 - 2026-01-29 02:57:41,057 - TRAIN-LOGGER - INFO - Epoch 548 - TRAIN - Minibatch 0: weight_norm_model: 143.884735 loss: 0.967952 grad_norm_before_clip: 4.162572 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 02:57:42,175 - TRAIN-LOGGER - INFO - Epoch 548 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.884735 weight_norm_u: 25.218954 loss: 0.967952 grad_norm_before_clip: 4.162572 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 02:57:42,175 - TRAIN-LOGGER - INFO - Epoch 548 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.884735 weight_norm_u: 25.222990 loss: 0.967103 +RANK_0 - 2026-01-29 02:57:47,677 - TRAIN-LOGGER - INFO - Epoch 549 - TRAIN - Minibatch 0: weight_norm_model: 143.884735 loss: 0.967103 grad_norm_before_clip: 5.023091 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 02:57:48,808 - TRAIN-LOGGER - INFO - Epoch 549 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.884735 weight_norm_u: 25.218954 loss: 0.967103 grad_norm_before_clip: 5.023091 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 02:57:48,808 - TRAIN-LOGGER - INFO - Epoch 549 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.884750 weight_norm_u: 25.222990 loss: 0.964886 +RANK_0 - 2026-01-29 02:57:53,913 - TRAIN-LOGGER - INFO - Epoch 550 - TRAIN - Minibatch 0: weight_norm_model: 143.884750 loss: 0.964886 grad_norm_before_clip: 2.695353 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 02:57:55,129 - TRAIN-LOGGER - INFO - Epoch 550 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.884750 weight_norm_u: 25.218954 loss: 0.964886 grad_norm_before_clip: 2.695353 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 02:57:55,130 - TRAIN-LOGGER - INFO - Epoch 550 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.884766 weight_norm_u: 25.222990 loss: 0.968761 +RANK_0 - 2026-01-29 02:57:59,487 - TRAIN-LOGGER - INFO - Epoch 551 - TRAIN - Minibatch 0: weight_norm_model: 143.884766 loss: 0.968761 grad_norm_before_clip: 4.786022 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 02:58:00,618 - TRAIN-LOGGER - INFO - Epoch 551 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.884766 weight_norm_u: 25.218954 loss: 0.968761 grad_norm_before_clip: 4.786022 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 02:58:00,618 - TRAIN-LOGGER - INFO - Epoch 551 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.884781 weight_norm_u: 25.222990 loss: 0.971519 +RANK_0 - 2026-01-29 02:58:05,770 - TRAIN-LOGGER - INFO - Epoch 552 - TRAIN - Minibatch 0: weight_norm_model: 143.884781 loss: 0.971519 grad_norm_before_clip: 5.018137 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 02:58:06,930 - TRAIN-LOGGER - INFO - Epoch 552 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.884781 weight_norm_u: 25.218954 loss: 0.971519 grad_norm_before_clip: 5.018137 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 02:58:06,931 - TRAIN-LOGGER - INFO - Epoch 552 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.884781 weight_norm_u: 25.222990 loss: 0.968775 +RANK_0 - 2026-01-29 02:58:11,642 - TRAIN-LOGGER - INFO - Epoch 553 - TRAIN - Minibatch 0: weight_norm_model: 143.884781 loss: 0.968775 grad_norm_before_clip: 4.889678 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 02:58:12,840 - TRAIN-LOGGER - INFO - Epoch 553 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.884781 weight_norm_u: 25.218954 loss: 0.968775 grad_norm_before_clip: 4.889678 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 02:58:12,840 - TRAIN-LOGGER - INFO - Epoch 553 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.884781 weight_norm_u: 25.222990 loss: 0.964896 +RANK_0 - 2026-01-29 02:58:17,547 - TRAIN-LOGGER - INFO - Epoch 554 - TRAIN - Minibatch 0: weight_norm_model: 143.884781 loss: 0.964896 grad_norm_before_clip: 4.478159 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 02:58:18,745 - TRAIN-LOGGER - INFO - Epoch 554 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.884781 weight_norm_u: 25.218954 loss: 0.964896 grad_norm_before_clip: 4.478159 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 02:58:18,745 - TRAIN-LOGGER - INFO - Epoch 554 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.884781 weight_norm_u: 25.222990 loss: 0.967374 +RANK_0 - 2026-01-29 02:58:23,083 - TRAIN-LOGGER - INFO - Epoch 555 - TRAIN - Minibatch 0: weight_norm_model: 143.884781 loss: 0.967374 grad_norm_before_clip: 5.418555 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 02:58:24,308 - TRAIN-LOGGER - INFO - Epoch 555 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.884781 weight_norm_u: 25.218954 loss: 0.967374 grad_norm_before_clip: 5.418555 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 02:58:24,309 - TRAIN-LOGGER - INFO - Epoch 555 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.884796 weight_norm_u: 25.222990 loss: 0.964957 +RANK_0 - 2026-01-29 02:58:29,347 - TRAIN-LOGGER - INFO - Epoch 556 - TRAIN - Minibatch 0: weight_norm_model: 143.884796 loss: 0.964957 grad_norm_before_clip: 1.816116 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 02:58:30,537 - TRAIN-LOGGER - INFO - Epoch 556 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.884796 weight_norm_u: 25.218954 loss: 0.964957 grad_norm_before_clip: 1.816116 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 02:58:30,537 - TRAIN-LOGGER - INFO - Epoch 556 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.884796 weight_norm_u: 25.222990 loss: 0.965757 +RANK_0 - 2026-01-29 02:58:35,053 - TRAIN-LOGGER - INFO - Epoch 557 - TRAIN - Minibatch 0: weight_norm_model: 143.884796 loss: 0.965757 grad_norm_before_clip: 3.436115 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 02:58:36,237 - TRAIN-LOGGER - INFO - Epoch 557 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.884796 weight_norm_u: 25.218954 loss: 0.965757 grad_norm_before_clip: 3.436115 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 02:58:36,237 - TRAIN-LOGGER - INFO - Epoch 557 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.884796 weight_norm_u: 25.222990 loss: 0.965521 +RANK_0 - 2026-01-29 02:58:41,084 - TRAIN-LOGGER - INFO - Epoch 558 - TRAIN - Minibatch 0: weight_norm_model: 143.884796 loss: 0.965521 grad_norm_before_clip: 2.772805 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 02:58:42,318 - TRAIN-LOGGER - INFO - Epoch 558 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.884796 weight_norm_u: 25.218954 loss: 0.965521 grad_norm_before_clip: 2.772805 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 02:58:42,318 - TRAIN-LOGGER - INFO - Epoch 558 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.884796 weight_norm_u: 25.222990 loss: 0.965182 +RANK_0 - 2026-01-29 02:58:47,117 - TRAIN-LOGGER - INFO - Epoch 559 - TRAIN - Minibatch 0: weight_norm_model: 143.884796 loss: 0.965182 grad_norm_before_clip: 3.163972 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 02:58:48,257 - TRAIN-LOGGER - INFO - Epoch 559 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.884796 weight_norm_u: 25.218954 loss: 0.965182 grad_norm_before_clip: 3.163972 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 02:58:48,257 - TRAIN-LOGGER - INFO - Epoch 559 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.884811 weight_norm_u: 25.222990 loss: 0.965753 +RANK_0 - 2026-01-29 02:58:53,017 - TRAIN-LOGGER - INFO - Epoch 560 - TRAIN - Minibatch 0: weight_norm_model: 143.884811 loss: 0.965753 grad_norm_before_clip: 3.559381 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 02:58:54,256 - TRAIN-LOGGER - INFO - Epoch 560 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.884811 weight_norm_u: 25.218954 loss: 0.965753 grad_norm_before_clip: 3.559381 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 02:58:54,257 - TRAIN-LOGGER - INFO - Epoch 560 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.884827 weight_norm_u: 25.222990 loss: 0.965539 +RANK_0 - 2026-01-29 02:58:59,218 - TRAIN-LOGGER - INFO - Epoch 561 - TRAIN - Minibatch 0: weight_norm_model: 143.884827 loss: 0.965539 grad_norm_before_clip: 3.096956 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 02:59:00,378 - TRAIN-LOGGER - INFO - Epoch 561 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.884827 weight_norm_u: 25.218954 loss: 0.965539 grad_norm_before_clip: 3.096956 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 02:59:00,378 - TRAIN-LOGGER - INFO - Epoch 561 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.884842 weight_norm_u: 25.222990 loss: 0.965867 +RANK_0 - 2026-01-29 02:59:05,451 - TRAIN-LOGGER - INFO - Epoch 562 - TRAIN - Minibatch 0: weight_norm_model: 143.884842 loss: 0.965867 grad_norm_before_clip: 4.601649 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 02:59:06,887 - TRAIN-LOGGER - INFO - Epoch 562 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.884842 weight_norm_u: 25.218954 loss: 0.965867 grad_norm_before_clip: 4.601649 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 02:59:06,888 - TRAIN-LOGGER - INFO - Epoch 562 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.884842 weight_norm_u: 25.222990 loss: 0.963417 +RANK_0 - 2026-01-29 02:59:12,434 - TRAIN-LOGGER - INFO - Epoch 563 - TRAIN - Minibatch 0: weight_norm_model: 143.884842 loss: 0.963417 grad_norm_before_clip: 1.106500 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 02:59:13,585 - TRAIN-LOGGER - INFO - Epoch 563 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.884842 weight_norm_u: 25.218954 loss: 0.963417 grad_norm_before_clip: 1.106500 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 02:59:13,585 - TRAIN-LOGGER - INFO - Epoch 563 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.884857 weight_norm_u: 25.222990 loss: 0.964920 +RANK_0 - 2026-01-29 02:59:18,749 - TRAIN-LOGGER - INFO - Epoch 564 - TRAIN - Minibatch 0: weight_norm_model: 143.884857 loss: 0.964920 grad_norm_before_clip: 3.245806 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 02:59:19,920 - TRAIN-LOGGER - INFO - Epoch 564 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.884857 weight_norm_u: 25.218954 loss: 0.964920 grad_norm_before_clip: 3.245806 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 02:59:19,920 - TRAIN-LOGGER - INFO - Epoch 564 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.884872 weight_norm_u: 25.222990 loss: 0.965226 +RANK_0 - 2026-01-29 02:59:24,811 - TRAIN-LOGGER - INFO - Epoch 565 - TRAIN - Minibatch 0: weight_norm_model: 143.884872 loss: 0.965226 grad_norm_before_clip: 3.661525 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 02:59:26,037 - TRAIN-LOGGER - INFO - Epoch 565 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.884872 weight_norm_u: 25.218954 loss: 0.965226 grad_norm_before_clip: 3.661525 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 02:59:26,037 - TRAIN-LOGGER - INFO - Epoch 565 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.884903 weight_norm_u: 25.222990 loss: 0.963867 +RANK_0 - 2026-01-29 02:59:30,656 - TRAIN-LOGGER - INFO - Epoch 566 - TRAIN - Minibatch 0: weight_norm_model: 143.884903 loss: 0.963867 grad_norm_before_clip: 1.937802 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 02:59:31,948 - TRAIN-LOGGER - INFO - Epoch 566 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.884903 weight_norm_u: 25.218954 loss: 0.963867 grad_norm_before_clip: 1.937802 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 02:59:31,948 - TRAIN-LOGGER - INFO - Epoch 566 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.884918 weight_norm_u: 25.222990 loss: 0.966979 +RANK_0 - 2026-01-29 02:59:36,233 - TRAIN-LOGGER - INFO - Epoch 567 - TRAIN - Minibatch 0: weight_norm_model: 143.884918 loss: 0.966979 grad_norm_before_clip: 4.541801 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 02:59:37,505 - TRAIN-LOGGER - INFO - Epoch 567 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.884918 weight_norm_u: 25.218954 loss: 0.966979 grad_norm_before_clip: 4.541801 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 02:59:37,505 - TRAIN-LOGGER - INFO - Epoch 567 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.884933 weight_norm_u: 25.222990 loss: 0.965389 +RANK_0 - 2026-01-29 02:59:41,908 - TRAIN-LOGGER - INFO - Epoch 568 - TRAIN - Minibatch 0: weight_norm_model: 143.884933 loss: 0.965389 grad_norm_before_clip: 2.709078 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 02:59:43,326 - TRAIN-LOGGER - INFO - Epoch 568 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.884933 weight_norm_u: 25.218954 loss: 0.965389 grad_norm_before_clip: 2.709078 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 02:59:43,327 - TRAIN-LOGGER - INFO - Epoch 568 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.884918 weight_norm_u: 25.222990 loss: 0.963689 +RANK_0 - 2026-01-29 02:59:47,512 - TRAIN-LOGGER - INFO - Epoch 569 - TRAIN - Minibatch 0: weight_norm_model: 143.884918 loss: 0.963689 grad_norm_before_clip: 1.656553 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 02:59:48,737 - TRAIN-LOGGER - INFO - Epoch 569 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.884918 weight_norm_u: 25.218954 loss: 0.963689 grad_norm_before_clip: 1.656553 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 02:59:48,738 - TRAIN-LOGGER - INFO - Epoch 569 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.884903 weight_norm_u: 25.222990 loss: 0.964440 +RANK_0 - 2026-01-29 02:59:53,486 - TRAIN-LOGGER - INFO - Epoch 570 - TRAIN - Minibatch 0: weight_norm_model: 143.884903 loss: 0.964440 grad_norm_before_clip: 2.347895 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 02:59:54,986 - TRAIN-LOGGER - INFO - Epoch 570 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.884903 weight_norm_u: 25.218954 loss: 0.964440 grad_norm_before_clip: 2.347895 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 02:59:54,987 - TRAIN-LOGGER - INFO - Epoch 570 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.884918 weight_norm_u: 25.222990 loss: 0.965626 +RANK_0 - 2026-01-29 02:59:59,418 - TRAIN-LOGGER - INFO - Epoch 571 - TRAIN - Minibatch 0: weight_norm_model: 143.884918 loss: 0.965626 grad_norm_before_clip: 3.885992 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 03:00:00,654 - TRAIN-LOGGER - INFO - Epoch 571 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.884918 weight_norm_u: 25.218954 loss: 0.965626 grad_norm_before_clip: 3.885992 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 03:00:00,654 - TRAIN-LOGGER - INFO - Epoch 571 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.884918 weight_norm_u: 25.222990 loss: 0.965304 +RANK_0 - 2026-01-29 03:00:05,032 - TRAIN-LOGGER - INFO - Epoch 572 - TRAIN - Minibatch 0: weight_norm_model: 143.884918 loss: 0.965304 grad_norm_before_clip: 3.214391 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 03:00:06,420 - TRAIN-LOGGER - INFO - Epoch 572 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.884918 weight_norm_u: 25.218954 loss: 0.965304 grad_norm_before_clip: 3.214391 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 03:00:06,421 - TRAIN-LOGGER - INFO - Epoch 572 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.884933 weight_norm_u: 25.222990 loss: 0.964190 +RANK_0 - 2026-01-29 03:00:10,662 - TRAIN-LOGGER - INFO - Epoch 573 - TRAIN - Minibatch 0: weight_norm_model: 143.884933 loss: 0.964190 grad_norm_before_clip: 3.194554 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 03:00:11,871 - TRAIN-LOGGER - INFO - Epoch 573 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.884933 weight_norm_u: 25.218954 loss: 0.964190 grad_norm_before_clip: 3.194554 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 03:00:11,871 - TRAIN-LOGGER - INFO - Epoch 573 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.884933 weight_norm_u: 25.222990 loss: 0.964730 +RANK_0 - 2026-01-29 03:00:16,671 - TRAIN-LOGGER - INFO - Epoch 574 - TRAIN - Minibatch 0: weight_norm_model: 143.884933 loss: 0.964730 grad_norm_before_clip: 2.132138 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 03:00:17,834 - TRAIN-LOGGER - INFO - Epoch 574 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.884933 weight_norm_u: 25.218954 loss: 0.964730 grad_norm_before_clip: 2.132138 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 03:00:17,834 - TRAIN-LOGGER - INFO - Epoch 574 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.884933 weight_norm_u: 25.222990 loss: 0.966331 +RANK_0 - 2026-01-29 03:00:23,474 - TRAIN-LOGGER - INFO - Epoch 575 - TRAIN - Minibatch 0: weight_norm_model: 143.884933 loss: 0.966331 grad_norm_before_clip: 3.558288 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 03:00:24,757 - TRAIN-LOGGER - INFO - Epoch 575 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.884933 weight_norm_u: 25.218954 loss: 0.966331 grad_norm_before_clip: 3.558288 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 03:00:24,758 - TRAIN-LOGGER - INFO - Epoch 575 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.884949 weight_norm_u: 25.222990 loss: 0.965868 +RANK_0 - 2026-01-29 03:00:29,696 - TRAIN-LOGGER - INFO - Epoch 576 - TRAIN - Minibatch 0: weight_norm_model: 143.884949 loss: 0.965868 grad_norm_before_clip: 1.960653 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 03:00:31,265 - TRAIN-LOGGER - INFO - Epoch 576 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.884949 weight_norm_u: 25.218954 loss: 0.965868 grad_norm_before_clip: 1.960653 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 03:00:31,265 - TRAIN-LOGGER - INFO - Epoch 576 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.884964 weight_norm_u: 25.222990 loss: 0.966753 +RANK_0 - 2026-01-29 03:00:36,456 - TRAIN-LOGGER - INFO - Epoch 577 - TRAIN - Minibatch 0: weight_norm_model: 143.884964 loss: 0.966753 grad_norm_before_clip: 4.339009 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 03:00:37,681 - TRAIN-LOGGER - INFO - Epoch 577 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.884964 weight_norm_u: 25.218954 loss: 0.966753 grad_norm_before_clip: 4.339009 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 03:00:37,681 - TRAIN-LOGGER - INFO - Epoch 577 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.884964 weight_norm_u: 25.222990 loss: 0.964329 +RANK_0 - 2026-01-29 03:00:42,458 - TRAIN-LOGGER - INFO - Epoch 578 - TRAIN - Minibatch 0: weight_norm_model: 143.884964 loss: 0.964329 grad_norm_before_clip: 2.136075 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 03:00:43,895 - TRAIN-LOGGER - INFO - Epoch 578 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.884964 weight_norm_u: 25.218954 loss: 0.964329 grad_norm_before_clip: 2.136075 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 03:00:43,896 - TRAIN-LOGGER - INFO - Epoch 578 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.884979 weight_norm_u: 25.222990 loss: 0.963554 +RANK_0 - 2026-01-29 03:00:48,512 - TRAIN-LOGGER - INFO - Epoch 579 - TRAIN - Minibatch 0: weight_norm_model: 143.884979 loss: 0.963554 grad_norm_before_clip: 1.767629 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 03:00:49,710 - TRAIN-LOGGER - INFO - Epoch 579 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.884979 weight_norm_u: 25.218954 loss: 0.963554 grad_norm_before_clip: 1.767629 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 03:00:49,711 - TRAIN-LOGGER - INFO - Epoch 579 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.884979 weight_norm_u: 25.222990 loss: 0.964940 +RANK_0 - 2026-01-29 03:00:53,853 - TRAIN-LOGGER - INFO - Epoch 580 - TRAIN - Minibatch 0: weight_norm_model: 143.884979 loss: 0.964940 grad_norm_before_clip: 3.136748 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 03:00:55,010 - TRAIN-LOGGER - INFO - Epoch 580 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.884979 weight_norm_u: 25.218954 loss: 0.964940 grad_norm_before_clip: 3.136748 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 03:00:55,010 - TRAIN-LOGGER - INFO - Epoch 580 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.884979 weight_norm_u: 25.222990 loss: 0.964797 +RANK_0 - 2026-01-29 03:00:59,414 - TRAIN-LOGGER - INFO - Epoch 581 - TRAIN - Minibatch 0: weight_norm_model: 143.884979 loss: 0.964797 grad_norm_before_clip: 2.465601 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 03:01:00,551 - TRAIN-LOGGER - INFO - Epoch 581 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.884979 weight_norm_u: 25.218954 loss: 0.964797 grad_norm_before_clip: 2.465601 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 03:01:00,552 - TRAIN-LOGGER - INFO - Epoch 581 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.885010 weight_norm_u: 25.222990 loss: 0.964269 +RANK_0 - 2026-01-29 03:01:05,261 - TRAIN-LOGGER - INFO - Epoch 582 - TRAIN - Minibatch 0: weight_norm_model: 143.885010 loss: 0.964269 grad_norm_before_clip: 2.940828 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 03:01:06,401 - TRAIN-LOGGER - INFO - Epoch 582 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.885010 weight_norm_u: 25.218954 loss: 0.964269 grad_norm_before_clip: 2.940828 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 03:01:06,402 - TRAIN-LOGGER - INFO - Epoch 582 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.885010 weight_norm_u: 25.222990 loss: 0.963527 +RANK_0 - 2026-01-29 03:01:10,803 - TRAIN-LOGGER - INFO - Epoch 583 - TRAIN - Minibatch 0: weight_norm_model: 143.885010 loss: 0.963527 grad_norm_before_clip: 3.559259 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 03:01:11,981 - TRAIN-LOGGER - INFO - Epoch 583 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.885010 weight_norm_u: 25.218954 loss: 0.963527 grad_norm_before_clip: 3.559259 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 03:01:11,981 - TRAIN-LOGGER - INFO - Epoch 583 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.885025 weight_norm_u: 25.222990 loss: 0.966343 +RANK_0 - 2026-01-29 03:01:16,724 - TRAIN-LOGGER - INFO - Epoch 584 - TRAIN - Minibatch 0: weight_norm_model: 143.885025 loss: 0.966343 grad_norm_before_clip: 4.947016 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 03:01:17,884 - TRAIN-LOGGER - INFO - Epoch 584 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.885025 weight_norm_u: 25.218954 loss: 0.966343 grad_norm_before_clip: 4.947016 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 03:01:17,885 - TRAIN-LOGGER - INFO - Epoch 584 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.885025 weight_norm_u: 25.222990 loss: 0.968292 +RANK_0 - 2026-01-29 03:01:23,125 - TRAIN-LOGGER - INFO - Epoch 585 - TRAIN - Minibatch 0: weight_norm_model: 143.885025 loss: 0.968292 grad_norm_before_clip: 5.439017 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 03:01:24,330 - TRAIN-LOGGER - INFO - Epoch 585 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.885025 weight_norm_u: 25.218954 loss: 0.968292 grad_norm_before_clip: 5.439017 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 03:01:24,331 - TRAIN-LOGGER - INFO - Epoch 585 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.885040 weight_norm_u: 25.222990 loss: 0.964558 +RANK_0 - 2026-01-29 03:01:29,299 - TRAIN-LOGGER - INFO - Epoch 586 - TRAIN - Minibatch 0: weight_norm_model: 143.885040 loss: 0.964558 grad_norm_before_clip: 3.426365 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 03:01:30,439 - TRAIN-LOGGER - INFO - Epoch 586 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.885040 weight_norm_u: 25.218954 loss: 0.964558 grad_norm_before_clip: 3.426365 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 03:01:30,439 - TRAIN-LOGGER - INFO - Epoch 586 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.885071 weight_norm_u: 25.222990 loss: 0.963952 +RANK_0 - 2026-01-29 03:01:35,984 - TRAIN-LOGGER - INFO - Epoch 587 - TRAIN - Minibatch 0: weight_norm_model: 143.885071 loss: 0.963952 grad_norm_before_clip: 2.103439 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 03:01:37,099 - TRAIN-LOGGER - INFO - Epoch 587 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.885071 weight_norm_u: 25.218954 loss: 0.963952 grad_norm_before_clip: 2.103439 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 03:01:37,099 - TRAIN-LOGGER - INFO - Epoch 587 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.885086 weight_norm_u: 25.222990 loss: 0.964905 +RANK_0 - 2026-01-29 03:01:41,617 - TRAIN-LOGGER - INFO - Epoch 588 - TRAIN - Minibatch 0: weight_norm_model: 143.885086 loss: 0.964905 grad_norm_before_clip: 3.026767 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 03:01:42,764 - TRAIN-LOGGER - INFO - Epoch 588 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.885086 weight_norm_u: 25.218954 loss: 0.964905 grad_norm_before_clip: 3.026767 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 03:01:42,764 - TRAIN-LOGGER - INFO - Epoch 588 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.885086 weight_norm_u: 25.222990 loss: 0.966328 +RANK_0 - 2026-01-29 03:01:48,103 - TRAIN-LOGGER - INFO - Epoch 589 - TRAIN - Minibatch 0: weight_norm_model: 143.885086 loss: 0.966328 grad_norm_before_clip: 5.263725 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 03:01:49,288 - TRAIN-LOGGER - INFO - Epoch 589 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.885086 weight_norm_u: 25.218954 loss: 0.966328 grad_norm_before_clip: 5.263725 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 03:01:49,288 - TRAIN-LOGGER - INFO - Epoch 589 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.885086 weight_norm_u: 25.222990 loss: 0.969606 +RANK_0 - 2026-01-29 03:01:55,325 - TRAIN-LOGGER - INFO - Epoch 590 - TRAIN - Minibatch 0: weight_norm_model: 143.885086 loss: 0.969606 grad_norm_before_clip: 7.260219 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 03:01:56,519 - TRAIN-LOGGER - INFO - Epoch 590 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.885086 weight_norm_u: 25.218954 loss: 0.969606 grad_norm_before_clip: 7.260219 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 03:01:56,520 - TRAIN-LOGGER - INFO - Epoch 590 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.885086 weight_norm_u: 25.222990 loss: 0.964702 +RANK_0 - 2026-01-29 03:02:01,698 - TRAIN-LOGGER - INFO - Epoch 591 - TRAIN - Minibatch 0: weight_norm_model: 143.885086 loss: 0.964702 grad_norm_before_clip: 2.316998 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 03:02:02,862 - TRAIN-LOGGER - INFO - Epoch 591 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.885086 weight_norm_u: 25.218954 loss: 0.964702 grad_norm_before_clip: 2.316998 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 03:02:02,862 - TRAIN-LOGGER - INFO - Epoch 591 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.885086 weight_norm_u: 25.222990 loss: 0.966668 +RANK_0 - 2026-01-29 03:02:07,791 - TRAIN-LOGGER - INFO - Epoch 592 - TRAIN - Minibatch 0: weight_norm_model: 143.885086 loss: 0.966668 grad_norm_before_clip: 4.301847 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 03:02:08,981 - TRAIN-LOGGER - INFO - Epoch 592 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.885086 weight_norm_u: 25.218954 loss: 0.966668 grad_norm_before_clip: 4.301847 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 03:02:08,981 - TRAIN-LOGGER - INFO - Epoch 592 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.885086 weight_norm_u: 25.222990 loss: 0.968870 +RANK_0 - 2026-01-29 03:02:13,450 - TRAIN-LOGGER - INFO - Epoch 593 - TRAIN - Minibatch 0: weight_norm_model: 143.885086 loss: 0.968870 grad_norm_before_clip: 4.754157 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 03:02:14,660 - TRAIN-LOGGER - INFO - Epoch 593 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.885086 weight_norm_u: 25.218954 loss: 0.968870 grad_norm_before_clip: 4.754157 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 03:02:14,660 - TRAIN-LOGGER - INFO - Epoch 593 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.885086 weight_norm_u: 25.222990 loss: 0.965581 +RANK_0 - 2026-01-29 03:02:18,857 - TRAIN-LOGGER - INFO - Epoch 594 - TRAIN - Minibatch 0: weight_norm_model: 143.885086 loss: 0.965581 grad_norm_before_clip: 2.562081 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 03:02:20,043 - TRAIN-LOGGER - INFO - Epoch 594 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.885086 weight_norm_u: 25.218954 loss: 0.965581 grad_norm_before_clip: 2.562081 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 03:02:20,043 - TRAIN-LOGGER - INFO - Epoch 594 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.885071 weight_norm_u: 25.222990 loss: 0.966063 +RANK_0 - 2026-01-29 03:02:24,513 - TRAIN-LOGGER - INFO - Epoch 595 - TRAIN - Minibatch 0: weight_norm_model: 143.885071 loss: 0.966063 grad_norm_before_clip: 4.058980 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 03:02:25,735 - TRAIN-LOGGER - INFO - Epoch 595 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.885071 weight_norm_u: 25.218954 loss: 0.966063 grad_norm_before_clip: 4.058980 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 03:02:25,735 - TRAIN-LOGGER - INFO - Epoch 595 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.885086 weight_norm_u: 25.222990 loss: 0.966661 +RANK_0 - 2026-01-29 03:02:30,240 - TRAIN-LOGGER - INFO - Epoch 596 - TRAIN - Minibatch 0: weight_norm_model: 143.885086 loss: 0.966661 grad_norm_before_clip: 5.484640 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 03:02:31,379 - TRAIN-LOGGER - INFO - Epoch 596 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.885086 weight_norm_u: 25.218954 loss: 0.966661 grad_norm_before_clip: 5.484640 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 03:02:31,379 - TRAIN-LOGGER - INFO - Epoch 596 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.885086 weight_norm_u: 25.222990 loss: 0.965341 +RANK_0 - 2026-01-29 03:02:36,407 - TRAIN-LOGGER - INFO - Epoch 597 - TRAIN - Minibatch 0: weight_norm_model: 143.885086 loss: 0.965341 grad_norm_before_clip: 1.844000 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 03:02:37,577 - TRAIN-LOGGER - INFO - Epoch 597 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.885086 weight_norm_u: 25.218954 loss: 0.965341 grad_norm_before_clip: 1.844000 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 03:02:37,578 - TRAIN-LOGGER - INFO - Epoch 597 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.885117 weight_norm_u: 25.222990 loss: 0.965751 +RANK_0 - 2026-01-29 03:02:42,270 - TRAIN-LOGGER - INFO - Epoch 598 - TRAIN - Minibatch 0: weight_norm_model: 143.885117 loss: 0.965751 grad_norm_before_clip: 4.486014 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 03:02:43,505 - TRAIN-LOGGER - INFO - Epoch 598 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.885117 weight_norm_u: 25.218954 loss: 0.965751 grad_norm_before_clip: 4.486014 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 03:02:43,506 - TRAIN-LOGGER - INFO - Epoch 598 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.885132 weight_norm_u: 25.222990 loss: 0.966119 +RANK_0 - 2026-01-29 03:02:48,526 - TRAIN-LOGGER - INFO - Epoch 599 - TRAIN - Minibatch 0: weight_norm_model: 143.885132 loss: 0.966119 grad_norm_before_clip: 4.523272 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 03:02:49,739 - TRAIN-LOGGER - INFO - Epoch 599 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.885132 weight_norm_u: 25.218954 loss: 0.966119 grad_norm_before_clip: 4.523272 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 03:02:49,740 - TRAIN-LOGGER - INFO - Epoch 599 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.885147 weight_norm_u: 25.222990 loss: 0.963808 +RANK_0 - 2026-01-29 03:02:54,249 - TRAIN-LOGGER - INFO - Epoch 600 - TRAIN - Minibatch 0: weight_norm_model: 143.885147 loss: 0.963808 grad_norm_before_clip: 1.441362 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 03:02:55,478 - TRAIN-LOGGER - INFO - Epoch 600 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.885147 weight_norm_u: 25.218954 loss: 0.963808 grad_norm_before_clip: 1.441362 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 03:02:55,478 - TRAIN-LOGGER - INFO - Epoch 600 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.885162 weight_norm_u: 25.222990 loss: 0.965458 +RANK_0 - 2026-01-29 03:03:00,410 - TRAIN-LOGGER - INFO - Epoch 601 - TRAIN - Minibatch 0: weight_norm_model: 143.885162 loss: 0.965458 grad_norm_before_clip: 4.417763 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 03:03:01,617 - TRAIN-LOGGER - INFO - Epoch 601 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.885162 weight_norm_u: 25.218954 loss: 0.965458 grad_norm_before_clip: 4.417763 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 03:03:01,617 - TRAIN-LOGGER - INFO - Epoch 601 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.885178 weight_norm_u: 25.222990 loss: 0.965555 +RANK_0 - 2026-01-29 03:03:06,054 - TRAIN-LOGGER - INFO - Epoch 602 - TRAIN - Minibatch 0: weight_norm_model: 143.885178 loss: 0.965555 grad_norm_before_clip: 4.288884 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 03:03:07,165 - TRAIN-LOGGER - INFO - Epoch 602 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.885178 weight_norm_u: 25.218954 loss: 0.965555 grad_norm_before_clip: 4.288884 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 03:03:07,165 - TRAIN-LOGGER - INFO - Epoch 602 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.885193 weight_norm_u: 25.222990 loss: 0.965831 +RANK_0 - 2026-01-29 03:03:11,741 - TRAIN-LOGGER - INFO - Epoch 603 - TRAIN - Minibatch 0: weight_norm_model: 143.885193 loss: 0.965831 grad_norm_before_clip: 4.028219 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 03:03:12,977 - TRAIN-LOGGER - INFO - Epoch 603 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.885193 weight_norm_u: 25.218954 loss: 0.965831 grad_norm_before_clip: 4.028219 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 03:03:12,978 - TRAIN-LOGGER - INFO - Epoch 603 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.885208 weight_norm_u: 25.222990 loss: 0.964967 +RANK_0 - 2026-01-29 03:03:18,147 - TRAIN-LOGGER - INFO - Epoch 604 - TRAIN - Minibatch 0: weight_norm_model: 143.885208 loss: 0.964967 grad_norm_before_clip: 4.062179 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 03:03:19,346 - TRAIN-LOGGER - INFO - Epoch 604 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.885208 weight_norm_u: 25.218954 loss: 0.964967 grad_norm_before_clip: 4.062179 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 03:03:19,346 - TRAIN-LOGGER - INFO - Epoch 604 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.885208 weight_norm_u: 25.222990 loss: 0.964515 +RANK_0 - 2026-01-29 03:03:24,020 - TRAIN-LOGGER - INFO - Epoch 605 - TRAIN - Minibatch 0: weight_norm_model: 143.885208 loss: 0.964515 grad_norm_before_clip: 4.413228 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 03:03:25,213 - TRAIN-LOGGER - INFO - Epoch 605 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.885208 weight_norm_u: 25.218954 loss: 0.964515 grad_norm_before_clip: 4.413228 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 03:03:25,213 - TRAIN-LOGGER - INFO - Epoch 605 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.885223 weight_norm_u: 25.222990 loss: 0.965035 +RANK_0 - 2026-01-29 03:03:30,156 - TRAIN-LOGGER - INFO - Epoch 606 - TRAIN - Minibatch 0: weight_norm_model: 143.885223 loss: 0.965035 grad_norm_before_clip: 4.015016 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 03:03:31,303 - TRAIN-LOGGER - INFO - Epoch 606 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.885223 weight_norm_u: 25.218954 loss: 0.965035 grad_norm_before_clip: 4.015016 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 03:03:31,303 - TRAIN-LOGGER - INFO - Epoch 606 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.885239 weight_norm_u: 25.222990 loss: 0.964728 +RANK_0 - 2026-01-29 03:03:35,851 - TRAIN-LOGGER - INFO - Epoch 607 - TRAIN - Minibatch 0: weight_norm_model: 143.885239 loss: 0.964728 grad_norm_before_clip: 1.955615 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 03:03:37,104 - TRAIN-LOGGER - INFO - Epoch 607 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.885239 weight_norm_u: 25.218954 loss: 0.964728 grad_norm_before_clip: 1.955615 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 03:03:37,105 - TRAIN-LOGGER - INFO - Epoch 607 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.885239 weight_norm_u: 25.222990 loss: 0.964776 +RANK_0 - 2026-01-29 03:03:42,163 - TRAIN-LOGGER - INFO - Epoch 608 - TRAIN - Minibatch 0: weight_norm_model: 143.885239 loss: 0.964776 grad_norm_before_clip: 4.444043 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 03:03:43,318 - TRAIN-LOGGER - INFO - Epoch 608 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.885239 weight_norm_u: 25.218954 loss: 0.964776 grad_norm_before_clip: 4.444043 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 03:03:43,318 - TRAIN-LOGGER - INFO - Epoch 608 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.885239 weight_norm_u: 25.222990 loss: 0.963795 +RANK_0 - 2026-01-29 03:03:52,133 - TRAIN-LOGGER - INFO - Epoch 609 - TRAIN - Minibatch 0: weight_norm_model: 143.885239 loss: 0.963795 grad_norm_before_clip: 2.111020 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 03:03:53,618 - TRAIN-LOGGER - INFO - Epoch 609 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.885239 weight_norm_u: 25.218954 loss: 0.963795 grad_norm_before_clip: 2.111020 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 03:03:53,619 - TRAIN-LOGGER - INFO - Epoch 609 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.885223 weight_norm_u: 25.222990 loss: 0.965280 +RANK_0 - 2026-01-29 03:03:58,156 - TRAIN-LOGGER - INFO - Epoch 610 - TRAIN - Minibatch 0: weight_norm_model: 143.885223 loss: 0.965280 grad_norm_before_clip: 3.887912 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 03:03:59,340 - TRAIN-LOGGER - INFO - Epoch 610 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.885223 weight_norm_u: 25.218954 loss: 0.965280 grad_norm_before_clip: 3.887912 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 03:03:59,341 - TRAIN-LOGGER - INFO - Epoch 610 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.885223 weight_norm_u: 25.222990 loss: 0.962836 +RANK_0 - 2026-01-29 03:04:03,959 - TRAIN-LOGGER - INFO - Epoch 611 - TRAIN - Minibatch 0: weight_norm_model: 143.885223 loss: 0.962836 grad_norm_before_clip: 2.186158 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 03:04:05,432 - TRAIN-LOGGER - INFO - Epoch 611 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.885223 weight_norm_u: 25.218954 loss: 0.962836 grad_norm_before_clip: 2.186158 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 03:04:05,432 - TRAIN-LOGGER - INFO - Epoch 611 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.885223 weight_norm_u: 25.222990 loss: 0.966499 +RANK_0 - 2026-01-29 03:04:09,982 - TRAIN-LOGGER - INFO - Epoch 612 - TRAIN - Minibatch 0: weight_norm_model: 143.885223 loss: 0.966499 grad_norm_before_clip: 4.473986 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 03:04:11,088 - TRAIN-LOGGER - INFO - Epoch 612 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.885223 weight_norm_u: 25.218954 loss: 0.966499 grad_norm_before_clip: 4.473986 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 03:04:11,088 - TRAIN-LOGGER - INFO - Epoch 612 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.885239 weight_norm_u: 25.222990 loss: 0.967622 +RANK_0 - 2026-01-29 03:04:15,473 - TRAIN-LOGGER - INFO - Epoch 613 - TRAIN - Minibatch 0: weight_norm_model: 143.885239 loss: 0.967622 grad_norm_before_clip: 4.674344 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 03:04:16,725 - TRAIN-LOGGER - INFO - Epoch 613 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.885239 weight_norm_u: 25.218954 loss: 0.967622 grad_norm_before_clip: 4.674344 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 03:04:16,725 - TRAIN-LOGGER - INFO - Epoch 613 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.885239 weight_norm_u: 25.222990 loss: 0.964205 +RANK_0 - 2026-01-29 03:04:21,580 - TRAIN-LOGGER - INFO - Epoch 614 - TRAIN - Minibatch 0: weight_norm_model: 143.885239 loss: 0.964205 grad_norm_before_clip: 4.216247 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 03:04:22,725 - TRAIN-LOGGER - INFO - Epoch 614 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.885239 weight_norm_u: 25.218954 loss: 0.964205 grad_norm_before_clip: 4.216247 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 03:04:22,725 - TRAIN-LOGGER - INFO - Epoch 614 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.885239 weight_norm_u: 25.222990 loss: 0.965968 +RANK_0 - 2026-01-29 03:04:26,957 - TRAIN-LOGGER - INFO - Epoch 615 - TRAIN - Minibatch 0: weight_norm_model: 143.885239 loss: 0.965968 grad_norm_before_clip: 5.066421 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 03:04:28,181 - TRAIN-LOGGER - INFO - Epoch 615 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.885239 weight_norm_u: 25.218954 loss: 0.965968 grad_norm_before_clip: 5.066421 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 03:04:28,181 - TRAIN-LOGGER - INFO - Epoch 615 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.885239 weight_norm_u: 25.222990 loss: 0.968040 +RANK_0 - 2026-01-29 03:04:33,100 - TRAIN-LOGGER - INFO - Epoch 616 - TRAIN - Minibatch 0: weight_norm_model: 143.885239 loss: 0.968040 grad_norm_before_clip: 6.721235 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 03:04:34,208 - TRAIN-LOGGER - INFO - Epoch 616 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.885239 weight_norm_u: 25.218954 loss: 0.968040 grad_norm_before_clip: 6.721235 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 03:04:34,208 - TRAIN-LOGGER - INFO - Epoch 616 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.885239 weight_norm_u: 25.222990 loss: 0.964232 +RANK_0 - 2026-01-29 03:04:38,254 - TRAIN-LOGGER - INFO - Epoch 617 - TRAIN - Minibatch 0: weight_norm_model: 143.885239 loss: 0.964232 grad_norm_before_clip: 1.997753 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 03:04:39,377 - TRAIN-LOGGER - INFO - Epoch 617 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.885239 weight_norm_u: 25.218954 loss: 0.964232 grad_norm_before_clip: 1.997753 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 03:04:39,377 - TRAIN-LOGGER - INFO - Epoch 617 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.885254 weight_norm_u: 25.222990 loss: 0.964134 +RANK_0 - 2026-01-29 03:04:44,007 - TRAIN-LOGGER - INFO - Epoch 618 - TRAIN - Minibatch 0: weight_norm_model: 143.885254 loss: 0.964134 grad_norm_before_clip: 3.050411 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 03:04:45,212 - TRAIN-LOGGER - INFO - Epoch 618 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.885254 weight_norm_u: 25.218954 loss: 0.964134 grad_norm_before_clip: 3.050411 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 03:04:45,212 - TRAIN-LOGGER - INFO - Epoch 618 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.885254 weight_norm_u: 25.222990 loss: 0.964873 +RANK_0 - 2026-01-29 03:04:50,264 - TRAIN-LOGGER - INFO - Epoch 619 - TRAIN - Minibatch 0: weight_norm_model: 143.885254 loss: 0.964873 grad_norm_before_clip: 4.030063 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 03:04:51,481 - TRAIN-LOGGER - INFO - Epoch 619 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.885254 weight_norm_u: 25.218954 loss: 0.964873 grad_norm_before_clip: 4.030063 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 03:04:51,481 - TRAIN-LOGGER - INFO - Epoch 619 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.885254 weight_norm_u: 25.222990 loss: 0.963668 +RANK_0 - 2026-01-29 03:04:56,531 - TRAIN-LOGGER - INFO - Epoch 620 - TRAIN - Minibatch 0: weight_norm_model: 143.885254 loss: 0.963668 grad_norm_before_clip: 1.569847 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 03:04:57,679 - TRAIN-LOGGER - INFO - Epoch 620 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.885254 weight_norm_u: 25.218954 loss: 0.963668 grad_norm_before_clip: 1.569847 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 03:04:57,679 - TRAIN-LOGGER - INFO - Epoch 620 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.885269 weight_norm_u: 25.222990 loss: 0.963303 +RANK_0 - 2026-01-29 03:05:02,519 - TRAIN-LOGGER - INFO - Epoch 621 - TRAIN - Minibatch 0: weight_norm_model: 143.885269 loss: 0.963303 grad_norm_before_clip: 1.616497 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 03:05:03,650 - TRAIN-LOGGER - INFO - Epoch 621 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.885269 weight_norm_u: 25.218954 loss: 0.963303 grad_norm_before_clip: 1.616497 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 03:05:03,650 - TRAIN-LOGGER - INFO - Epoch 621 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.885269 weight_norm_u: 25.222990 loss: 0.962862 +RANK_0 - 2026-01-29 03:05:07,957 - TRAIN-LOGGER - INFO - Epoch 622 - TRAIN - Minibatch 0: weight_norm_model: 143.885269 loss: 0.962862 grad_norm_before_clip: 2.734397 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 03:05:09,375 - TRAIN-LOGGER - INFO - Epoch 622 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.885269 weight_norm_u: 25.218954 loss: 0.962862 grad_norm_before_clip: 2.734397 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 03:05:09,375 - TRAIN-LOGGER - INFO - Epoch 622 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.885300 weight_norm_u: 25.222990 loss: 0.964807 +RANK_0 - 2026-01-29 03:05:14,199 - TRAIN-LOGGER - INFO - Epoch 623 - TRAIN - Minibatch 0: weight_norm_model: 143.885300 loss: 0.964807 grad_norm_before_clip: 4.386588 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 03:05:15,446 - TRAIN-LOGGER - INFO - Epoch 623 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.885300 weight_norm_u: 25.218954 loss: 0.964807 grad_norm_before_clip: 4.386588 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 03:05:15,446 - TRAIN-LOGGER - INFO - Epoch 623 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.885300 weight_norm_u: 25.222990 loss: 0.964029 +RANK_0 - 2026-01-29 03:05:19,928 - TRAIN-LOGGER - INFO - Epoch 624 - TRAIN - Minibatch 0: weight_norm_model: 143.885300 loss: 0.964029 grad_norm_before_clip: 3.658406 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 03:05:21,229 - TRAIN-LOGGER - INFO - Epoch 624 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.885300 weight_norm_u: 25.218954 loss: 0.964029 grad_norm_before_clip: 3.658406 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 03:05:21,229 - TRAIN-LOGGER - INFO - Epoch 624 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.885330 weight_norm_u: 25.222990 loss: 0.965060 +RANK_0 - 2026-01-29 03:05:26,101 - TRAIN-LOGGER - INFO - Epoch 625 - TRAIN - Minibatch 0: weight_norm_model: 143.885330 loss: 0.965060 grad_norm_before_clip: 3.482693 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 03:05:27,376 - TRAIN-LOGGER - INFO - Epoch 625 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.885330 weight_norm_u: 25.218954 loss: 0.965060 grad_norm_before_clip: 3.482693 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 03:05:27,377 - TRAIN-LOGGER - INFO - Epoch 625 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.885345 weight_norm_u: 25.222990 loss: 0.964675 +RANK_0 - 2026-01-29 03:05:31,980 - TRAIN-LOGGER - INFO - Epoch 626 - TRAIN - Minibatch 0: weight_norm_model: 143.885345 loss: 0.964675 grad_norm_before_clip: 2.205721 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 03:05:33,135 - TRAIN-LOGGER - INFO - Epoch 626 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.885345 weight_norm_u: 25.218954 loss: 0.964675 grad_norm_before_clip: 2.205721 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 03:05:33,136 - TRAIN-LOGGER - INFO - Epoch 626 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.885361 weight_norm_u: 25.222990 loss: 0.963804 +RANK_0 - 2026-01-29 03:05:38,140 - TRAIN-LOGGER - INFO - Epoch 627 - TRAIN - Minibatch 0: weight_norm_model: 143.885361 loss: 0.963804 grad_norm_before_clip: 2.872704 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 03:05:39,329 - TRAIN-LOGGER - INFO - Epoch 627 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.885361 weight_norm_u: 25.218954 loss: 0.963804 grad_norm_before_clip: 2.872704 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 03:05:39,330 - TRAIN-LOGGER - INFO - Epoch 627 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.885361 weight_norm_u: 25.222990 loss: 0.965005 +RANK_0 - 2026-01-29 03:05:43,643 - TRAIN-LOGGER - INFO - Epoch 628 - TRAIN - Minibatch 0: weight_norm_model: 143.885361 loss: 0.965005 grad_norm_before_clip: 3.963518 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 03:05:44,953 - TRAIN-LOGGER - INFO - Epoch 628 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.885361 weight_norm_u: 25.218954 loss: 0.965005 grad_norm_before_clip: 3.963518 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 03:05:44,954 - TRAIN-LOGGER - INFO - Epoch 628 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.885345 weight_norm_u: 25.222990 loss: 0.964726 +RANK_0 - 2026-01-29 03:05:49,760 - TRAIN-LOGGER - INFO - Epoch 629 - TRAIN - Minibatch 0: weight_norm_model: 143.885345 loss: 0.964726 grad_norm_before_clip: 5.122533 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 03:05:50,904 - TRAIN-LOGGER - INFO - Epoch 629 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.885345 weight_norm_u: 25.218954 loss: 0.964726 grad_norm_before_clip: 5.122533 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 03:05:50,904 - TRAIN-LOGGER - INFO - Epoch 629 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.885361 weight_norm_u: 25.222990 loss: 0.964178 +RANK_0 - 2026-01-29 03:05:55,299 - TRAIN-LOGGER - INFO - Epoch 630 - TRAIN - Minibatch 0: weight_norm_model: 143.885361 loss: 0.964178 grad_norm_before_clip: 2.988241 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 03:05:56,478 - TRAIN-LOGGER - INFO - Epoch 630 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.885361 weight_norm_u: 25.218954 loss: 0.964178 grad_norm_before_clip: 2.988241 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 03:05:56,478 - TRAIN-LOGGER - INFO - Epoch 630 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.885361 weight_norm_u: 25.222990 loss: 0.963496 +RANK_0 - 2026-01-29 03:06:00,922 - TRAIN-LOGGER - INFO - Epoch 631 - TRAIN - Minibatch 0: weight_norm_model: 143.885361 loss: 0.963496 grad_norm_before_clip: 2.956492 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 03:06:02,067 - TRAIN-LOGGER - INFO - Epoch 631 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.885361 weight_norm_u: 25.218954 loss: 0.963496 grad_norm_before_clip: 2.956492 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 03:06:02,067 - TRAIN-LOGGER - INFO - Epoch 631 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.885376 weight_norm_u: 25.222990 loss: 0.962977 +RANK_0 - 2026-01-29 03:06:06,244 - TRAIN-LOGGER - INFO - Epoch 632 - TRAIN - Minibatch 0: weight_norm_model: 143.885376 loss: 0.962977 grad_norm_before_clip: 1.991159 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 03:06:07,382 - TRAIN-LOGGER - INFO - Epoch 632 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.885376 weight_norm_u: 25.218954 loss: 0.962977 grad_norm_before_clip: 1.991159 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 03:06:07,383 - TRAIN-LOGGER - INFO - Epoch 632 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.885391 weight_norm_u: 25.222990 loss: 0.962098 +RANK_0 - 2026-01-29 03:06:11,878 - TRAIN-LOGGER - INFO - Epoch 633 - TRAIN - Minibatch 0: weight_norm_model: 143.885391 loss: 0.962098 grad_norm_before_clip: 1.773060 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 03:06:13,065 - TRAIN-LOGGER - INFO - Epoch 633 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.885391 weight_norm_u: 25.218954 loss: 0.962098 grad_norm_before_clip: 1.773060 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 03:06:13,066 - TRAIN-LOGGER - INFO - Epoch 633 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.885391 weight_norm_u: 25.222990 loss: 0.964225 +RANK_0 - 2026-01-29 03:06:17,931 - TRAIN-LOGGER - INFO - Epoch 634 - TRAIN - Minibatch 0: weight_norm_model: 143.885391 loss: 0.964225 grad_norm_before_clip: 4.259346 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 03:06:19,136 - TRAIN-LOGGER - INFO - Epoch 634 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.885391 weight_norm_u: 25.218954 loss: 0.964225 grad_norm_before_clip: 4.259346 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 03:06:19,136 - TRAIN-LOGGER - INFO - Epoch 634 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.885406 weight_norm_u: 25.222990 loss: 0.964925 +RANK_0 - 2026-01-29 03:06:23,512 - TRAIN-LOGGER - INFO - Epoch 635 - TRAIN - Minibatch 0: weight_norm_model: 143.885406 loss: 0.964925 grad_norm_before_clip: 4.729537 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 03:06:24,625 - TRAIN-LOGGER - INFO - Epoch 635 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.885406 weight_norm_u: 25.218954 loss: 0.964925 grad_norm_before_clip: 4.729537 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 03:06:24,626 - TRAIN-LOGGER - INFO - Epoch 635 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.885422 weight_norm_u: 25.222990 loss: 0.963500 +RANK_0 - 2026-01-29 03:06:29,394 - TRAIN-LOGGER - INFO - Epoch 636 - TRAIN - Minibatch 0: weight_norm_model: 143.885422 loss: 0.963500 grad_norm_before_clip: 2.271981 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 03:06:30,538 - TRAIN-LOGGER - INFO - Epoch 636 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.885422 weight_norm_u: 25.218954 loss: 0.963500 grad_norm_before_clip: 2.271981 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 03:06:30,539 - TRAIN-LOGGER - INFO - Epoch 636 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.885452 weight_norm_u: 25.222990 loss: 0.966230 +RANK_0 - 2026-01-29 03:06:35,321 - TRAIN-LOGGER - INFO - Epoch 637 - TRAIN - Minibatch 0: weight_norm_model: 143.885452 loss: 0.966230 grad_norm_before_clip: 4.021260 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 03:06:36,569 - TRAIN-LOGGER - INFO - Epoch 637 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.885452 weight_norm_u: 25.218954 loss: 0.966230 grad_norm_before_clip: 4.021260 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 03:06:36,570 - TRAIN-LOGGER - INFO - Epoch 637 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.885452 weight_norm_u: 25.222990 loss: 0.966995 +RANK_0 - 2026-01-29 03:06:41,709 - TRAIN-LOGGER - INFO - Epoch 638 - TRAIN - Minibatch 0: weight_norm_model: 143.885452 loss: 0.966995 grad_norm_before_clip: 4.405296 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 03:06:42,915 - TRAIN-LOGGER - INFO - Epoch 638 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.885452 weight_norm_u: 25.218954 loss: 0.966995 grad_norm_before_clip: 4.405296 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 03:06:42,915 - TRAIN-LOGGER - INFO - Epoch 638 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.885452 weight_norm_u: 25.222990 loss: 0.962076 +RANK_0 - 2026-01-29 03:06:48,147 - TRAIN-LOGGER - INFO - Epoch 639 - TRAIN - Minibatch 0: weight_norm_model: 143.885452 loss: 0.962076 grad_norm_before_clip: 1.942698 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 03:06:49,348 - TRAIN-LOGGER - INFO - Epoch 639 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.885452 weight_norm_u: 25.218954 loss: 0.962076 grad_norm_before_clip: 1.942698 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 03:06:49,349 - TRAIN-LOGGER - INFO - Epoch 639 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.885437 weight_norm_u: 25.222990 loss: 0.965153 +RANK_0 - 2026-01-29 03:06:54,617 - TRAIN-LOGGER - INFO - Epoch 640 - TRAIN - Minibatch 0: weight_norm_model: 143.885437 loss: 0.965153 grad_norm_before_clip: 4.849922 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 03:06:55,860 - TRAIN-LOGGER - INFO - Epoch 640 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.885437 weight_norm_u: 25.218954 loss: 0.965153 grad_norm_before_clip: 4.849922 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 03:06:55,861 - TRAIN-LOGGER - INFO - Epoch 640 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.885437 weight_norm_u: 25.222990 loss: 0.969787 +RANK_0 - 2026-01-29 03:07:00,607 - TRAIN-LOGGER - INFO - Epoch 641 - TRAIN - Minibatch 0: weight_norm_model: 143.885437 loss: 0.969787 grad_norm_before_clip: 5.984418 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 03:07:01,737 - TRAIN-LOGGER - INFO - Epoch 641 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.885437 weight_norm_u: 25.218954 loss: 0.969787 grad_norm_before_clip: 5.984418 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 03:07:01,738 - TRAIN-LOGGER - INFO - Epoch 641 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.885437 weight_norm_u: 25.222990 loss: 0.965355 +RANK_0 - 2026-01-29 03:07:06,955 - TRAIN-LOGGER - INFO - Epoch 642 - TRAIN - Minibatch 0: weight_norm_model: 143.885437 loss: 0.965355 grad_norm_before_clip: 5.141895 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 03:07:08,093 - TRAIN-LOGGER - INFO - Epoch 642 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.885437 weight_norm_u: 25.218954 loss: 0.965355 grad_norm_before_clip: 5.141895 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 03:07:08,094 - TRAIN-LOGGER - INFO - Epoch 642 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.885468 weight_norm_u: 25.222990 loss: 0.964288 +RANK_0 - 2026-01-29 03:07:12,675 - TRAIN-LOGGER - INFO - Epoch 643 - TRAIN - Minibatch 0: weight_norm_model: 143.885468 loss: 0.964288 grad_norm_before_clip: 4.323022 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 03:07:13,808 - TRAIN-LOGGER - INFO - Epoch 643 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.885468 weight_norm_u: 25.218954 loss: 0.964288 grad_norm_before_clip: 4.323022 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 03:07:13,809 - TRAIN-LOGGER - INFO - Epoch 643 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.885483 weight_norm_u: 25.222990 loss: 0.966834 +RANK_0 - 2026-01-29 03:07:18,489 - TRAIN-LOGGER - INFO - Epoch 644 - TRAIN - Minibatch 0: weight_norm_model: 143.885483 loss: 0.966834 grad_norm_before_clip: 4.119863 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 03:07:19,948 - TRAIN-LOGGER - INFO - Epoch 644 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.885483 weight_norm_u: 25.218954 loss: 0.966834 grad_norm_before_clip: 4.119863 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 03:07:19,948 - TRAIN-LOGGER - INFO - Epoch 644 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.885483 weight_norm_u: 25.222990 loss: 0.965475 +RANK_0 - 2026-01-29 03:07:24,676 - TRAIN-LOGGER - INFO - Epoch 645 - TRAIN - Minibatch 0: weight_norm_model: 143.885483 loss: 0.965475 grad_norm_before_clip: 3.458381 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 03:07:25,880 - TRAIN-LOGGER - INFO - Epoch 645 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.885483 weight_norm_u: 25.218954 loss: 0.965475 grad_norm_before_clip: 3.458381 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 03:07:25,880 - TRAIN-LOGGER - INFO - Epoch 645 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.885483 weight_norm_u: 25.222990 loss: 0.962698 +RANK_0 - 2026-01-29 03:07:30,415 - TRAIN-LOGGER - INFO - Epoch 646 - TRAIN - Minibatch 0: weight_norm_model: 143.885483 loss: 0.962698 grad_norm_before_clip: 3.765989 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 03:07:31,645 - TRAIN-LOGGER - INFO - Epoch 646 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.885483 weight_norm_u: 25.218954 loss: 0.962698 grad_norm_before_clip: 3.765989 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 03:07:31,645 - TRAIN-LOGGER - INFO - Epoch 646 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.885468 weight_norm_u: 25.222990 loss: 0.968046 +RANK_0 - 2026-01-29 03:07:36,348 - TRAIN-LOGGER - INFO - Epoch 647 - TRAIN - Minibatch 0: weight_norm_model: 143.885468 loss: 0.968046 grad_norm_before_clip: 7.206350 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 03:07:37,586 - TRAIN-LOGGER - INFO - Epoch 647 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.885468 weight_norm_u: 25.218954 loss: 0.968046 grad_norm_before_clip: 7.206350 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 03:07:37,587 - TRAIN-LOGGER - INFO - Epoch 647 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.885468 weight_norm_u: 25.222990 loss: 0.972566 +RANK_0 - 2026-01-29 03:07:41,978 - TRAIN-LOGGER - INFO - Epoch 648 - TRAIN - Minibatch 0: weight_norm_model: 143.885468 loss: 0.972566 grad_norm_before_clip: 13.509171 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 03:07:43,144 - TRAIN-LOGGER - INFO - Epoch 648 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.885468 weight_norm_u: 25.218954 loss: 0.972566 grad_norm_before_clip: 13.509171 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 03:07:43,144 - TRAIN-LOGGER - INFO - Epoch 648 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.885483 weight_norm_u: 25.222990 loss: 0.967112 +RANK_0 - 2026-01-29 03:07:48,315 - TRAIN-LOGGER - INFO - Epoch 649 - TRAIN - Minibatch 0: weight_norm_model: 143.885483 loss: 0.967112 grad_norm_before_clip: 3.988383 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 03:07:49,574 - TRAIN-LOGGER - INFO - Epoch 649 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.885483 weight_norm_u: 25.218954 loss: 0.967112 grad_norm_before_clip: 3.988383 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 03:07:49,574 - TRAIN-LOGGER - INFO - Epoch 649 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.885513 weight_norm_u: 25.222990 loss: 0.964183 +RANK_0 - 2026-01-29 03:07:54,139 - TRAIN-LOGGER - INFO - Epoch 650 - TRAIN - Minibatch 0: weight_norm_model: 143.885513 loss: 0.964183 grad_norm_before_clip: 2.221922 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 03:07:55,298 - TRAIN-LOGGER - INFO - Epoch 650 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.885513 weight_norm_u: 25.218954 loss: 0.964183 grad_norm_before_clip: 2.221922 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 03:07:55,299 - TRAIN-LOGGER - INFO - Epoch 650 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.885529 weight_norm_u: 25.222990 loss: 0.968597 +RANK_0 - 2026-01-29 03:08:00,180 - TRAIN-LOGGER - INFO - Epoch 651 - TRAIN - Minibatch 0: weight_norm_model: 143.885529 loss: 0.968597 grad_norm_before_clip: 4.274971 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 03:08:01,491 - TRAIN-LOGGER - INFO - Epoch 651 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.885529 weight_norm_u: 25.218954 loss: 0.968597 grad_norm_before_clip: 4.274971 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 03:08:01,491 - TRAIN-LOGGER - INFO - Epoch 651 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.885529 weight_norm_u: 25.222990 loss: 0.972537 +RANK_0 - 2026-01-29 03:08:07,109 - TRAIN-LOGGER - INFO - Epoch 652 - TRAIN - Minibatch 0: weight_norm_model: 143.885529 loss: 0.972537 grad_norm_before_clip: 5.596288 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 03:08:08,308 - TRAIN-LOGGER - INFO - Epoch 652 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.885529 weight_norm_u: 25.218954 loss: 0.972537 grad_norm_before_clip: 5.596288 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 03:08:08,308 - TRAIN-LOGGER - INFO - Epoch 652 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.885544 weight_norm_u: 25.222990 loss: 0.970079 +RANK_0 - 2026-01-29 03:08:14,378 - TRAIN-LOGGER - INFO - Epoch 653 - TRAIN - Minibatch 0: weight_norm_model: 143.885544 loss: 0.970079 grad_norm_before_clip: 3.750140 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 03:08:15,671 - TRAIN-LOGGER - INFO - Epoch 653 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.885544 weight_norm_u: 25.218954 loss: 0.970079 grad_norm_before_clip: 3.750140 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 03:08:15,671 - TRAIN-LOGGER - INFO - Epoch 653 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.885529 weight_norm_u: 25.222990 loss: 0.966373 +RANK_0 - 2026-01-29 03:08:21,959 - TRAIN-LOGGER - INFO - Epoch 654 - TRAIN - Minibatch 0: weight_norm_model: 143.885529 loss: 0.966373 grad_norm_before_clip: 4.635406 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 03:08:23,333 - TRAIN-LOGGER - INFO - Epoch 654 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.885529 weight_norm_u: 25.218954 loss: 0.966373 grad_norm_before_clip: 4.635406 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 03:08:23,333 - TRAIN-LOGGER - INFO - Epoch 654 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.885513 weight_norm_u: 25.222990 loss: 0.963363 +RANK_0 - 2026-01-29 03:08:29,727 - TRAIN-LOGGER - INFO - Epoch 655 - TRAIN - Minibatch 0: weight_norm_model: 143.885513 loss: 0.963363 grad_norm_before_clip: 2.245308 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 03:08:30,996 - TRAIN-LOGGER - INFO - Epoch 655 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.885513 weight_norm_u: 25.218954 loss: 0.963363 grad_norm_before_clip: 2.245308 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 03:08:30,996 - TRAIN-LOGGER - INFO - Epoch 655 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.885513 weight_norm_u: 25.222990 loss: 0.969242 +RANK_0 - 2026-01-29 03:08:36,638 - TRAIN-LOGGER - INFO - Epoch 656 - TRAIN - Minibatch 0: weight_norm_model: 143.885513 loss: 0.969242 grad_norm_before_clip: 4.143558 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 03:08:37,966 - TRAIN-LOGGER - INFO - Epoch 656 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.885513 weight_norm_u: 25.218954 loss: 0.969242 grad_norm_before_clip: 4.143558 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 03:08:37,966 - TRAIN-LOGGER - INFO - Epoch 656 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.885513 weight_norm_u: 25.222990 loss: 0.969971 +RANK_0 - 2026-01-29 03:08:42,586 - TRAIN-LOGGER - INFO - Epoch 657 - TRAIN - Minibatch 0: weight_norm_model: 143.885513 loss: 0.969971 grad_norm_before_clip: 4.541309 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 03:08:43,730 - TRAIN-LOGGER - INFO - Epoch 657 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.885513 weight_norm_u: 25.218954 loss: 0.969971 grad_norm_before_clip: 4.541309 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 03:08:43,731 - TRAIN-LOGGER - INFO - Epoch 657 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.885544 weight_norm_u: 25.222990 loss: 0.965428 +RANK_0 - 2026-01-29 03:08:48,249 - TRAIN-LOGGER - INFO - Epoch 658 - TRAIN - Minibatch 0: weight_norm_model: 143.885544 loss: 0.965428 grad_norm_before_clip: 3.527947 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 03:08:49,406 - TRAIN-LOGGER - INFO - Epoch 658 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.885544 weight_norm_u: 25.218954 loss: 0.965428 grad_norm_before_clip: 3.527947 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 03:08:49,407 - TRAIN-LOGGER - INFO - Epoch 658 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.885559 weight_norm_u: 25.222990 loss: 0.963369 +RANK_0 - 2026-01-29 03:08:54,306 - TRAIN-LOGGER - INFO - Epoch 659 - TRAIN - Minibatch 0: weight_norm_model: 143.885559 loss: 0.963369 grad_norm_before_clip: 1.469943 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 03:08:55,460 - TRAIN-LOGGER - INFO - Epoch 659 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.885559 weight_norm_u: 25.218954 loss: 0.963369 grad_norm_before_clip: 1.469943 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 03:08:55,461 - TRAIN-LOGGER - INFO - Epoch 659 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.885574 weight_norm_u: 25.222990 loss: 0.966674 +RANK_0 - 2026-01-29 03:08:59,890 - TRAIN-LOGGER - INFO - Epoch 660 - TRAIN - Minibatch 0: weight_norm_model: 143.885574 loss: 0.966674 grad_norm_before_clip: 4.345855 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 03:09:01,070 - TRAIN-LOGGER - INFO - Epoch 660 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.885574 weight_norm_u: 25.218954 loss: 0.966674 grad_norm_before_clip: 4.345855 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 03:09:01,070 - TRAIN-LOGGER - INFO - Epoch 660 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.885574 weight_norm_u: 25.222990 loss: 0.968517 +RANK_0 - 2026-01-29 03:09:05,986 - TRAIN-LOGGER - INFO - Epoch 661 - TRAIN - Minibatch 0: weight_norm_model: 143.885574 loss: 0.968517 grad_norm_before_clip: 3.836508 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 03:09:07,191 - TRAIN-LOGGER - INFO - Epoch 661 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.885574 weight_norm_u: 25.218954 loss: 0.968517 grad_norm_before_clip: 3.836508 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 03:09:07,191 - TRAIN-LOGGER - INFO - Epoch 661 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.885559 weight_norm_u: 25.222990 loss: 0.965079 +RANK_0 - 2026-01-29 03:09:11,937 - TRAIN-LOGGER - INFO - Epoch 662 - TRAIN - Minibatch 0: weight_norm_model: 143.885559 loss: 0.965079 grad_norm_before_clip: 3.326371 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 03:09:13,281 - TRAIN-LOGGER - INFO - Epoch 662 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.885559 weight_norm_u: 25.218954 loss: 0.965079 grad_norm_before_clip: 3.326371 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 03:09:13,281 - TRAIN-LOGGER - INFO - Epoch 662 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.885529 weight_norm_u: 25.222990 loss: 0.962613 +RANK_0 - 2026-01-29 03:09:17,471 - TRAIN-LOGGER - INFO - Epoch 663 - TRAIN - Minibatch 0: weight_norm_model: 143.885529 loss: 0.962613 grad_norm_before_clip: 2.179836 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 03:09:18,588 - TRAIN-LOGGER - INFO - Epoch 663 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.885529 weight_norm_u: 25.218954 loss: 0.962613 grad_norm_before_clip: 2.179836 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 03:09:18,588 - TRAIN-LOGGER - INFO - Epoch 663 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.885513 weight_norm_u: 25.222990 loss: 0.964266 +RANK_0 - 2026-01-29 03:09:23,490 - TRAIN-LOGGER - INFO - Epoch 664 - TRAIN - Minibatch 0: weight_norm_model: 143.885513 loss: 0.964266 grad_norm_before_clip: 2.197404 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 03:09:24,691 - TRAIN-LOGGER - INFO - Epoch 664 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.885513 weight_norm_u: 25.218954 loss: 0.964266 grad_norm_before_clip: 2.197404 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 03:09:24,691 - TRAIN-LOGGER - INFO - Epoch 664 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.885513 weight_norm_u: 25.222990 loss: 0.964891 +RANK_0 - 2026-01-29 03:09:29,172 - TRAIN-LOGGER - INFO - Epoch 665 - TRAIN - Minibatch 0: weight_norm_model: 143.885513 loss: 0.964891 grad_norm_before_clip: 2.198852 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 03:09:30,703 - TRAIN-LOGGER - INFO - Epoch 665 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.885513 weight_norm_u: 25.218954 loss: 0.964891 grad_norm_before_clip: 2.198852 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 03:09:30,704 - TRAIN-LOGGER - INFO - Epoch 665 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.885513 weight_norm_u: 25.222990 loss: 0.963954 +RANK_0 - 2026-01-29 03:09:35,917 - TRAIN-LOGGER - INFO - Epoch 666 - TRAIN - Minibatch 0: weight_norm_model: 143.885513 loss: 0.963954 grad_norm_before_clip: 1.435383 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 03:09:37,089 - TRAIN-LOGGER - INFO - Epoch 666 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.885513 weight_norm_u: 25.218954 loss: 0.963954 grad_norm_before_clip: 1.435383 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 03:09:37,090 - TRAIN-LOGGER - INFO - Epoch 666 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.885513 weight_norm_u: 25.222990 loss: 0.963112 +RANK_0 - 2026-01-29 03:09:42,332 - TRAIN-LOGGER - INFO - Epoch 667 - TRAIN - Minibatch 0: weight_norm_model: 143.885513 loss: 0.963112 grad_norm_before_clip: 3.812502 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 03:09:43,539 - TRAIN-LOGGER - INFO - Epoch 667 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.885513 weight_norm_u: 25.218954 loss: 0.963112 grad_norm_before_clip: 3.812502 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 03:09:43,539 - TRAIN-LOGGER - INFO - Epoch 667 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.885529 weight_norm_u: 25.222990 loss: 0.962538 +RANK_0 - 2026-01-29 03:09:49,355 - TRAIN-LOGGER - INFO - Epoch 668 - TRAIN - Minibatch 0: weight_norm_model: 143.885529 loss: 0.962538 grad_norm_before_clip: 1.812491 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 03:09:50,505 - TRAIN-LOGGER - INFO - Epoch 668 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.885529 weight_norm_u: 25.218954 loss: 0.962538 grad_norm_before_clip: 1.812491 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 03:09:50,505 - TRAIN-LOGGER - INFO - Epoch 668 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.885544 weight_norm_u: 25.222990 loss: 0.962936 +RANK_0 - 2026-01-29 03:09:55,324 - TRAIN-LOGGER - INFO - Epoch 669 - TRAIN - Minibatch 0: weight_norm_model: 143.885544 loss: 0.962936 grad_norm_before_clip: 2.971566 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 03:09:56,583 - TRAIN-LOGGER - INFO - Epoch 669 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.885544 weight_norm_u: 25.218954 loss: 0.962936 grad_norm_before_clip: 2.971566 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 03:09:56,583 - TRAIN-LOGGER - INFO - Epoch 669 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.885544 weight_norm_u: 25.222990 loss: 0.962819 +RANK_0 - 2026-01-29 03:10:01,543 - TRAIN-LOGGER - INFO - Epoch 670 - TRAIN - Minibatch 0: weight_norm_model: 143.885544 loss: 0.962819 grad_norm_before_clip: 2.457800 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 03:10:02,719 - TRAIN-LOGGER - INFO - Epoch 670 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.885544 weight_norm_u: 25.218954 loss: 0.962819 grad_norm_before_clip: 2.457800 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 03:10:02,720 - TRAIN-LOGGER - INFO - Epoch 670 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.885544 weight_norm_u: 25.222990 loss: 0.961666 +RANK_0 - 2026-01-29 03:10:07,092 - TRAIN-LOGGER - INFO - Epoch 671 - TRAIN - Minibatch 0: weight_norm_model: 143.885544 loss: 0.961666 grad_norm_before_clip: 1.594655 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 03:10:08,401 - TRAIN-LOGGER - INFO - Epoch 671 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.885544 weight_norm_u: 25.218954 loss: 0.961666 grad_norm_before_clip: 1.594655 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 03:10:08,401 - TRAIN-LOGGER - INFO - Epoch 671 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.885544 weight_norm_u: 25.222990 loss: 0.961834 +RANK_0 - 2026-01-29 03:10:12,839 - TRAIN-LOGGER - INFO - Epoch 672 - TRAIN - Minibatch 0: weight_norm_model: 143.885544 loss: 0.961834 grad_norm_before_clip: 1.440598 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 03:10:13,982 - TRAIN-LOGGER - INFO - Epoch 672 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.885544 weight_norm_u: 25.218954 loss: 0.961834 grad_norm_before_clip: 1.440598 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 03:10:13,982 - TRAIN-LOGGER - INFO - Epoch 672 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.885559 weight_norm_u: 25.222990 loss: 0.962781 +RANK_0 - 2026-01-29 03:10:18,095 - TRAIN-LOGGER - INFO - Epoch 673 - TRAIN - Minibatch 0: weight_norm_model: 143.885559 loss: 0.962781 grad_norm_before_clip: 2.861608 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 03:10:19,563 - TRAIN-LOGGER - INFO - Epoch 673 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.885559 weight_norm_u: 25.218954 loss: 0.962781 grad_norm_before_clip: 2.861608 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 03:10:19,563 - TRAIN-LOGGER - INFO - Epoch 673 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.885544 weight_norm_u: 25.222990 loss: 0.963473 +RANK_0 - 2026-01-29 03:10:23,930 - TRAIN-LOGGER - INFO - Epoch 674 - TRAIN - Minibatch 0: weight_norm_model: 143.885544 loss: 0.963473 grad_norm_before_clip: 3.178847 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 03:10:25,072 - TRAIN-LOGGER - INFO - Epoch 674 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.885544 weight_norm_u: 25.218954 loss: 0.963473 grad_norm_before_clip: 3.178847 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 03:10:25,072 - TRAIN-LOGGER - INFO - Epoch 674 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.885559 weight_norm_u: 25.222990 loss: 0.963361 +RANK_0 - 2026-01-29 03:10:29,300 - TRAIN-LOGGER - INFO - Epoch 675 - TRAIN - Minibatch 0: weight_norm_model: 143.885559 loss: 0.963361 grad_norm_before_clip: 2.566229 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 03:10:30,836 - TRAIN-LOGGER - INFO - Epoch 675 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.885559 weight_norm_u: 25.218954 loss: 0.963361 grad_norm_before_clip: 2.566229 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 03:10:30,836 - TRAIN-LOGGER - INFO - Epoch 675 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.885574 weight_norm_u: 25.222990 loss: 0.962153 +RANK_0 - 2026-01-29 03:10:35,378 - TRAIN-LOGGER - INFO - Epoch 676 - TRAIN - Minibatch 0: weight_norm_model: 143.885574 loss: 0.962153 grad_norm_before_clip: 1.598189 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 03:10:36,626 - TRAIN-LOGGER - INFO - Epoch 676 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.885574 weight_norm_u: 25.218954 loss: 0.962153 grad_norm_before_clip: 1.598189 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 03:10:36,626 - TRAIN-LOGGER - INFO - Epoch 676 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.885605 weight_norm_u: 25.222990 loss: 0.963762 +RANK_0 - 2026-01-29 03:10:41,615 - TRAIN-LOGGER - INFO - Epoch 677 - TRAIN - Minibatch 0: weight_norm_model: 143.885605 loss: 0.963762 grad_norm_before_clip: 4.143868 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 03:10:42,809 - TRAIN-LOGGER - INFO - Epoch 677 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.885605 weight_norm_u: 25.218954 loss: 0.963762 grad_norm_before_clip: 4.143868 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 03:10:42,809 - TRAIN-LOGGER - INFO - Epoch 677 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.885635 weight_norm_u: 25.222990 loss: 0.961639 +RANK_0 - 2026-01-29 03:10:47,238 - TRAIN-LOGGER - INFO - Epoch 678 - TRAIN - Minibatch 0: weight_norm_model: 143.885635 loss: 0.961639 grad_norm_before_clip: 2.494168 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 03:10:48,378 - TRAIN-LOGGER - INFO - Epoch 678 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.885635 weight_norm_u: 25.218954 loss: 0.961639 grad_norm_before_clip: 2.494168 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 03:10:48,378 - TRAIN-LOGGER - INFO - Epoch 678 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.885635 weight_norm_u: 25.222990 loss: 0.963088 +RANK_0 - 2026-01-29 03:10:53,180 - TRAIN-LOGGER - INFO - Epoch 679 - TRAIN - Minibatch 0: weight_norm_model: 143.885635 loss: 0.963088 grad_norm_before_clip: 1.632785 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 03:10:54,303 - TRAIN-LOGGER - INFO - Epoch 679 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.885635 weight_norm_u: 25.218954 loss: 0.963088 grad_norm_before_clip: 1.632785 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 03:10:54,303 - TRAIN-LOGGER - INFO - Epoch 679 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.885635 weight_norm_u: 25.222990 loss: 0.965155 +RANK_0 - 2026-01-29 03:10:59,129 - TRAIN-LOGGER - INFO - Epoch 680 - TRAIN - Minibatch 0: weight_norm_model: 143.885635 loss: 0.965155 grad_norm_before_clip: 3.866305 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 03:11:00,301 - TRAIN-LOGGER - INFO - Epoch 680 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.885635 weight_norm_u: 25.218954 loss: 0.965155 grad_norm_before_clip: 3.866305 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 03:11:00,301 - TRAIN-LOGGER - INFO - Epoch 680 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.885651 weight_norm_u: 25.222990 loss: 0.962791 +RANK_0 - 2026-01-29 03:11:05,642 - TRAIN-LOGGER - INFO - Epoch 681 - TRAIN - Minibatch 0: weight_norm_model: 143.885651 loss: 0.962791 grad_norm_before_clip: 2.178435 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 03:11:06,816 - TRAIN-LOGGER - INFO - Epoch 681 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.885651 weight_norm_u: 25.218954 loss: 0.962791 grad_norm_before_clip: 2.178435 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 03:11:06,816 - TRAIN-LOGGER - INFO - Epoch 681 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.885666 weight_norm_u: 25.222990 loss: 0.963701 +RANK_0 - 2026-01-29 03:11:12,355 - TRAIN-LOGGER - INFO - Epoch 682 - TRAIN - Minibatch 0: weight_norm_model: 143.885666 loss: 0.963701 grad_norm_before_clip: 4.803771 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 03:11:13,864 - TRAIN-LOGGER - INFO - Epoch 682 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.885666 weight_norm_u: 25.218954 loss: 0.963701 grad_norm_before_clip: 4.803771 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 03:11:13,865 - TRAIN-LOGGER - INFO - Epoch 682 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.885681 weight_norm_u: 25.222990 loss: 0.963840 +RANK_0 - 2026-01-29 03:11:18,910 - TRAIN-LOGGER - INFO - Epoch 683 - TRAIN - Minibatch 0: weight_norm_model: 143.885681 loss: 0.963840 grad_norm_before_clip: 3.151392 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 03:11:20,181 - TRAIN-LOGGER - INFO - Epoch 683 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.885681 weight_norm_u: 25.218954 loss: 0.963840 grad_norm_before_clip: 3.151392 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 03:11:20,182 - TRAIN-LOGGER - INFO - Epoch 683 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.885681 weight_norm_u: 25.222990 loss: 0.963647 +RANK_0 - 2026-01-29 03:11:25,492 - TRAIN-LOGGER - INFO - Epoch 684 - TRAIN - Minibatch 0: weight_norm_model: 143.885681 loss: 0.963647 grad_norm_before_clip: 3.492518 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 03:11:26,795 - TRAIN-LOGGER - INFO - Epoch 684 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.885681 weight_norm_u: 25.218954 loss: 0.963647 grad_norm_before_clip: 3.492518 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 03:11:26,795 - TRAIN-LOGGER - INFO - Epoch 684 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.885666 weight_norm_u: 25.222990 loss: 0.966314 +RANK_0 - 2026-01-29 03:11:31,084 - TRAIN-LOGGER - INFO - Epoch 685 - TRAIN - Minibatch 0: weight_norm_model: 143.885666 loss: 0.966314 grad_norm_before_clip: 5.104378 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 03:11:32,329 - TRAIN-LOGGER - INFO - Epoch 685 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.885666 weight_norm_u: 25.218954 loss: 0.966314 grad_norm_before_clip: 5.104378 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 03:11:32,330 - TRAIN-LOGGER - INFO - Epoch 685 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.885666 weight_norm_u: 25.222990 loss: 0.968997 +RANK_0 - 2026-01-29 03:11:36,755 - TRAIN-LOGGER - INFO - Epoch 686 - TRAIN - Minibatch 0: weight_norm_model: 143.885666 loss: 0.968997 grad_norm_before_clip: 5.442566 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 03:11:37,925 - TRAIN-LOGGER - INFO - Epoch 686 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.885666 weight_norm_u: 25.218954 loss: 0.968997 grad_norm_before_clip: 5.442566 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 03:11:37,926 - TRAIN-LOGGER - INFO - Epoch 686 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.885681 weight_norm_u: 25.222990 loss: 0.965043 +RANK_0 - 2026-01-29 03:11:42,147 - TRAIN-LOGGER - INFO - Epoch 687 - TRAIN - Minibatch 0: weight_norm_model: 143.885681 loss: 0.965043 grad_norm_before_clip: 4.266061 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 03:11:43,413 - TRAIN-LOGGER - INFO - Epoch 687 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.885681 weight_norm_u: 25.218954 loss: 0.965043 grad_norm_before_clip: 4.266061 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 03:11:43,413 - TRAIN-LOGGER - INFO - Epoch 687 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.885696 weight_norm_u: 25.222990 loss: 0.964024 +RANK_0 - 2026-01-29 03:11:47,963 - TRAIN-LOGGER - INFO - Epoch 688 - TRAIN - Minibatch 0: weight_norm_model: 143.885696 loss: 0.964024 grad_norm_before_clip: 3.410780 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 03:11:49,215 - TRAIN-LOGGER - INFO - Epoch 688 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.885696 weight_norm_u: 25.218954 loss: 0.964024 grad_norm_before_clip: 3.410780 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 03:11:49,216 - TRAIN-LOGGER - INFO - Epoch 688 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.885712 weight_norm_u: 25.222990 loss: 0.966041 +RANK_0 - 2026-01-29 03:11:53,402 - TRAIN-LOGGER - INFO - Epoch 689 - TRAIN - Minibatch 0: weight_norm_model: 143.885712 loss: 0.966041 grad_norm_before_clip: 4.330722 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 03:11:54,527 - TRAIN-LOGGER - INFO - Epoch 689 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.885712 weight_norm_u: 25.218954 loss: 0.966041 grad_norm_before_clip: 4.330722 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 03:11:54,527 - TRAIN-LOGGER - INFO - Epoch 689 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.885712 weight_norm_u: 25.222990 loss: 0.965929 +RANK_0 - 2026-01-29 03:11:59,874 - TRAIN-LOGGER - INFO - Epoch 690 - TRAIN - Minibatch 0: weight_norm_model: 143.885712 loss: 0.965929 grad_norm_before_clip: 3.201551 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 03:12:01,460 - TRAIN-LOGGER - INFO - Epoch 690 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.885712 weight_norm_u: 25.218954 loss: 0.965929 grad_norm_before_clip: 3.201551 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 03:12:01,460 - TRAIN-LOGGER - INFO - Epoch 690 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.885712 weight_norm_u: 25.222990 loss: 0.965191 +RANK_0 - 2026-01-29 03:12:06,202 - TRAIN-LOGGER - INFO - Epoch 691 - TRAIN - Minibatch 0: weight_norm_model: 143.885712 loss: 0.965191 grad_norm_before_clip: 3.762902 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 03:12:07,784 - TRAIN-LOGGER - INFO - Epoch 691 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.885712 weight_norm_u: 25.218954 loss: 0.965191 grad_norm_before_clip: 3.762902 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 03:12:07,784 - TRAIN-LOGGER - INFO - Epoch 691 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.885696 weight_norm_u: 25.222990 loss: 0.966393 +RANK_0 - 2026-01-29 03:12:11,946 - TRAIN-LOGGER - INFO - Epoch 692 - TRAIN - Minibatch 0: weight_norm_model: 143.885696 loss: 0.966393 grad_norm_before_clip: 3.917274 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 03:12:13,146 - TRAIN-LOGGER - INFO - Epoch 692 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.885696 weight_norm_u: 25.218954 loss: 0.966393 grad_norm_before_clip: 3.917274 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 03:12:13,146 - TRAIN-LOGGER - INFO - Epoch 692 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.885696 weight_norm_u: 25.222990 loss: 0.966512 +RANK_0 - 2026-01-29 03:12:17,420 - TRAIN-LOGGER - INFO - Epoch 693 - TRAIN - Minibatch 0: weight_norm_model: 143.885696 loss: 0.966512 grad_norm_before_clip: 3.571727 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 03:12:18,653 - TRAIN-LOGGER - INFO - Epoch 693 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.885696 weight_norm_u: 25.218954 loss: 0.966512 grad_norm_before_clip: 3.571727 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 03:12:18,654 - TRAIN-LOGGER - INFO - Epoch 693 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.885696 weight_norm_u: 25.222990 loss: 0.964863 +RANK_0 - 2026-01-29 03:12:23,740 - TRAIN-LOGGER - INFO - Epoch 694 - TRAIN - Minibatch 0: weight_norm_model: 143.885696 loss: 0.964863 grad_norm_before_clip: 2.253874 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 03:12:24,964 - TRAIN-LOGGER - INFO - Epoch 694 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.885696 weight_norm_u: 25.218954 loss: 0.964863 grad_norm_before_clip: 2.253874 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 03:12:24,964 - TRAIN-LOGGER - INFO - Epoch 694 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.885696 weight_norm_u: 25.222990 loss: 0.963517 +RANK_0 - 2026-01-29 03:12:29,828 - TRAIN-LOGGER - INFO - Epoch 695 - TRAIN - Minibatch 0: weight_norm_model: 143.885696 loss: 0.963517 grad_norm_before_clip: 2.124617 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 03:12:31,353 - TRAIN-LOGGER - INFO - Epoch 695 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.885696 weight_norm_u: 25.218954 loss: 0.963517 grad_norm_before_clip: 2.124617 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 03:12:31,353 - TRAIN-LOGGER - INFO - Epoch 695 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.885727 weight_norm_u: 25.222990 loss: 0.964644 +RANK_0 - 2026-01-29 03:12:35,750 - TRAIN-LOGGER - INFO - Epoch 696 - TRAIN - Minibatch 0: weight_norm_model: 143.885727 loss: 0.964644 grad_norm_before_clip: 2.766526 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 03:12:36,922 - TRAIN-LOGGER - INFO - Epoch 696 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.885727 weight_norm_u: 25.218954 loss: 0.964644 grad_norm_before_clip: 2.766526 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 03:12:36,922 - TRAIN-LOGGER - INFO - Epoch 696 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.885727 weight_norm_u: 25.222990 loss: 0.963592 +RANK_0 - 2026-01-29 03:12:42,822 - TRAIN-LOGGER - INFO - Epoch 697 - TRAIN - Minibatch 0: weight_norm_model: 143.885727 loss: 0.963592 grad_norm_before_clip: 3.765746 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 03:12:43,963 - TRAIN-LOGGER - INFO - Epoch 697 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.885727 weight_norm_u: 25.218954 loss: 0.963592 grad_norm_before_clip: 3.765746 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 03:12:43,963 - TRAIN-LOGGER - INFO - Epoch 697 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.885727 weight_norm_u: 25.222990 loss: 0.962537 +RANK_0 - 2026-01-29 03:12:48,692 - TRAIN-LOGGER - INFO - Epoch 698 - TRAIN - Minibatch 0: weight_norm_model: 143.885727 loss: 0.962537 grad_norm_before_clip: 3.464380 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 03:12:49,984 - TRAIN-LOGGER - INFO - Epoch 698 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.885727 weight_norm_u: 25.218954 loss: 0.962537 grad_norm_before_clip: 3.464380 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 03:12:49,984 - TRAIN-LOGGER - INFO - Epoch 698 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.885727 weight_norm_u: 25.222990 loss: 0.963557 +RANK_0 - 2026-01-29 03:12:54,529 - TRAIN-LOGGER - INFO - Epoch 699 - TRAIN - Minibatch 0: weight_norm_model: 143.885727 loss: 0.963557 grad_norm_before_clip: 4.538889 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 03:12:55,827 - TRAIN-LOGGER - INFO - Epoch 699 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.885727 weight_norm_u: 25.218954 loss: 0.963557 grad_norm_before_clip: 4.538889 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 03:12:55,827 - TRAIN-LOGGER - INFO - Epoch 699 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.885727 weight_norm_u: 25.222990 loss: 0.964884 +RANK_0 - 2026-01-29 03:13:00,301 - TRAIN-LOGGER - INFO - Epoch 700 - TRAIN - Minibatch 0: weight_norm_model: 143.885727 loss: 0.964884 grad_norm_before_clip: 5.065580 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 03:13:01,473 - TRAIN-LOGGER - INFO - Epoch 700 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.885727 weight_norm_u: 25.218954 loss: 0.964884 grad_norm_before_clip: 5.065580 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 03:13:01,473 - TRAIN-LOGGER - INFO - Epoch 700 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.885742 weight_norm_u: 25.222990 loss: 0.962554 +RANK_0 - 2026-01-29 03:13:06,414 - TRAIN-LOGGER - INFO - Epoch 701 - TRAIN - Minibatch 0: weight_norm_model: 143.885742 loss: 0.962554 grad_norm_before_clip: 2.963479 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 03:13:07,561 - TRAIN-LOGGER - INFO - Epoch 701 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.885742 weight_norm_u: 25.218954 loss: 0.962554 grad_norm_before_clip: 2.963479 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 03:13:07,561 - TRAIN-LOGGER - INFO - Epoch 701 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.885757 weight_norm_u: 25.222990 loss: 0.961838 +RANK_0 - 2026-01-29 03:13:12,181 - TRAIN-LOGGER - INFO - Epoch 702 - TRAIN - Minibatch 0: weight_norm_model: 143.885757 loss: 0.961838 grad_norm_before_clip: 1.927572 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 03:13:13,449 - TRAIN-LOGGER - INFO - Epoch 702 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.885757 weight_norm_u: 25.218954 loss: 0.961838 grad_norm_before_clip: 1.927572 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 03:13:13,449 - TRAIN-LOGGER - INFO - Epoch 702 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.885757 weight_norm_u: 25.222990 loss: 0.961253 +RANK_0 - 2026-01-29 03:13:18,372 - TRAIN-LOGGER - INFO - Epoch 703 - TRAIN - Minibatch 0: weight_norm_model: 143.885757 loss: 0.961253 grad_norm_before_clip: 1.557075 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 03:13:19,479 - TRAIN-LOGGER - INFO - Epoch 703 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.885757 weight_norm_u: 25.218954 loss: 0.961253 grad_norm_before_clip: 1.557075 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 03:13:19,479 - TRAIN-LOGGER - INFO - Epoch 703 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.885773 weight_norm_u: 25.222990 loss: 0.961555 +RANK_0 - 2026-01-29 03:13:24,036 - TRAIN-LOGGER - INFO - Epoch 704 - TRAIN - Minibatch 0: weight_norm_model: 143.885773 loss: 0.961555 grad_norm_before_clip: 1.518224 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 03:13:25,270 - TRAIN-LOGGER - INFO - Epoch 704 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.885773 weight_norm_u: 25.218954 loss: 0.961555 grad_norm_before_clip: 1.518224 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 03:13:25,271 - TRAIN-LOGGER - INFO - Epoch 704 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.885773 weight_norm_u: 25.222990 loss: 0.966295 +RANK_0 - 2026-01-29 03:13:30,162 - TRAIN-LOGGER - INFO - Epoch 705 - TRAIN - Minibatch 0: weight_norm_model: 143.885773 loss: 0.966295 grad_norm_before_clip: 4.375960 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 03:13:31,354 - TRAIN-LOGGER - INFO - Epoch 705 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.885773 weight_norm_u: 25.218954 loss: 0.966295 grad_norm_before_clip: 4.375960 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 03:13:31,355 - TRAIN-LOGGER - INFO - Epoch 705 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.885773 weight_norm_u: 25.222990 loss: 0.965310 +RANK_0 - 2026-01-29 03:13:35,804 - TRAIN-LOGGER - INFO - Epoch 706 - TRAIN - Minibatch 0: weight_norm_model: 143.885773 loss: 0.965310 grad_norm_before_clip: 4.226652 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 03:13:36,988 - TRAIN-LOGGER - INFO - Epoch 706 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.885773 weight_norm_u: 25.218954 loss: 0.965310 grad_norm_before_clip: 4.226652 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 03:13:36,988 - TRAIN-LOGGER - INFO - Epoch 706 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.885773 weight_norm_u: 25.222990 loss: 0.964803 +RANK_0 - 2026-01-29 03:13:42,078 - TRAIN-LOGGER - INFO - Epoch 707 - TRAIN - Minibatch 0: weight_norm_model: 143.885773 loss: 0.964803 grad_norm_before_clip: 4.448423 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 03:13:43,208 - TRAIN-LOGGER - INFO - Epoch 707 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.885773 weight_norm_u: 25.218954 loss: 0.964803 grad_norm_before_clip: 4.448423 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 03:13:43,208 - TRAIN-LOGGER - INFO - Epoch 707 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.885788 weight_norm_u: 25.222990 loss: 0.963649 +RANK_0 - 2026-01-29 03:13:47,728 - TRAIN-LOGGER - INFO - Epoch 708 - TRAIN - Minibatch 0: weight_norm_model: 143.885788 loss: 0.963649 grad_norm_before_clip: 4.416857 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 03:13:48,912 - TRAIN-LOGGER - INFO - Epoch 708 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.885788 weight_norm_u: 25.218954 loss: 0.963649 grad_norm_before_clip: 4.416857 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 03:13:48,912 - TRAIN-LOGGER - INFO - Epoch 708 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.885818 weight_norm_u: 25.222990 loss: 0.962198 +RANK_0 - 2026-01-29 03:13:53,990 - TRAIN-LOGGER - INFO - Epoch 709 - TRAIN - Minibatch 0: weight_norm_model: 143.885818 loss: 0.962198 grad_norm_before_clip: 2.438526 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 03:13:55,149 - TRAIN-LOGGER - INFO - Epoch 709 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.885818 weight_norm_u: 25.218954 loss: 0.962198 grad_norm_before_clip: 2.438526 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 03:13:55,149 - TRAIN-LOGGER - INFO - Epoch 709 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.885818 weight_norm_u: 25.222990 loss: 0.962348 +RANK_0 - 2026-01-29 03:13:59,722 - TRAIN-LOGGER - INFO - Epoch 710 - TRAIN - Minibatch 0: weight_norm_model: 143.885818 loss: 0.962348 grad_norm_before_clip: 2.495780 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 03:14:01,261 - TRAIN-LOGGER - INFO - Epoch 710 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.885818 weight_norm_u: 25.218954 loss: 0.962348 grad_norm_before_clip: 2.495780 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 03:14:01,261 - TRAIN-LOGGER - INFO - Epoch 710 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.885803 weight_norm_u: 25.222990 loss: 0.962263 +RANK_0 - 2026-01-29 03:14:06,079 - TRAIN-LOGGER - INFO - Epoch 711 - TRAIN - Minibatch 0: weight_norm_model: 143.885803 loss: 0.962263 grad_norm_before_clip: 3.615631 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 03:14:07,235 - TRAIN-LOGGER - INFO - Epoch 711 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.885803 weight_norm_u: 25.218954 loss: 0.962263 grad_norm_before_clip: 3.615631 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 03:14:07,235 - TRAIN-LOGGER - INFO - Epoch 711 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.885788 weight_norm_u: 25.222990 loss: 0.965363 +RANK_0 - 2026-01-29 03:14:12,679 - TRAIN-LOGGER - INFO - Epoch 712 - TRAIN - Minibatch 0: weight_norm_model: 143.885788 loss: 0.965363 grad_norm_before_clip: 5.068146 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 03:14:13,950 - TRAIN-LOGGER - INFO - Epoch 712 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.885788 weight_norm_u: 25.218954 loss: 0.965363 grad_norm_before_clip: 5.068146 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 03:14:13,951 - TRAIN-LOGGER - INFO - Epoch 712 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.885788 weight_norm_u: 25.222990 loss: 0.964147 +RANK_0 - 2026-01-29 03:14:18,409 - TRAIN-LOGGER - INFO - Epoch 713 - TRAIN - Minibatch 0: weight_norm_model: 143.885788 loss: 0.964147 grad_norm_before_clip: 3.273848 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 03:14:19,673 - TRAIN-LOGGER - INFO - Epoch 713 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.885788 weight_norm_u: 25.218954 loss: 0.964147 grad_norm_before_clip: 3.273848 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 03:14:19,673 - TRAIN-LOGGER - INFO - Epoch 713 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.885803 weight_norm_u: 25.222990 loss: 0.964454 +RANK_0 - 2026-01-29 03:14:24,746 - TRAIN-LOGGER - INFO - Epoch 714 - TRAIN - Minibatch 0: weight_norm_model: 143.885803 loss: 0.964454 grad_norm_before_clip: 3.431954 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 03:14:25,985 - TRAIN-LOGGER - INFO - Epoch 714 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.885803 weight_norm_u: 25.218954 loss: 0.964454 grad_norm_before_clip: 3.431954 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 03:14:25,986 - TRAIN-LOGGER - INFO - Epoch 714 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.885818 weight_norm_u: 25.222990 loss: 0.963678 +RANK_0 - 2026-01-29 03:14:30,557 - TRAIN-LOGGER - INFO - Epoch 715 - TRAIN - Minibatch 0: weight_norm_model: 143.885818 loss: 0.963678 grad_norm_before_clip: 3.776446 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 03:14:31,735 - TRAIN-LOGGER - INFO - Epoch 715 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.885818 weight_norm_u: 25.218954 loss: 0.963678 grad_norm_before_clip: 3.776446 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 03:14:31,735 - TRAIN-LOGGER - INFO - Epoch 715 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.885834 weight_norm_u: 25.222990 loss: 0.963965 +RANK_0 - 2026-01-29 03:14:37,264 - TRAIN-LOGGER - INFO - Epoch 716 - TRAIN - Minibatch 0: weight_norm_model: 143.885834 loss: 0.963965 grad_norm_before_clip: 2.388425 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 03:14:38,567 - TRAIN-LOGGER - INFO - Epoch 716 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.885834 weight_norm_u: 25.218954 loss: 0.963965 grad_norm_before_clip: 2.388425 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 03:14:38,567 - TRAIN-LOGGER - INFO - Epoch 716 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.885818 weight_norm_u: 25.222990 loss: 0.964112 +RANK_0 - 2026-01-29 03:14:43,354 - TRAIN-LOGGER - INFO - Epoch 717 - TRAIN - Minibatch 0: weight_norm_model: 143.885818 loss: 0.964112 grad_norm_before_clip: 3.293166 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 03:14:44,521 - TRAIN-LOGGER - INFO - Epoch 717 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.885818 weight_norm_u: 25.218954 loss: 0.964112 grad_norm_before_clip: 3.293166 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 03:14:44,521 - TRAIN-LOGGER - INFO - Epoch 717 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.885818 weight_norm_u: 25.222990 loss: 0.962428 +RANK_0 - 2026-01-29 03:14:49,509 - TRAIN-LOGGER - INFO - Epoch 718 - TRAIN - Minibatch 0: weight_norm_model: 143.885818 loss: 0.962428 grad_norm_before_clip: 1.788147 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 03:14:50,679 - TRAIN-LOGGER - INFO - Epoch 718 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.885818 weight_norm_u: 25.218954 loss: 0.962428 grad_norm_before_clip: 1.788147 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 03:14:50,680 - TRAIN-LOGGER - INFO - Epoch 718 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.885803 weight_norm_u: 25.222990 loss: 0.964383 +RANK_0 - 2026-01-29 03:14:55,327 - TRAIN-LOGGER - INFO - Epoch 719 - TRAIN - Minibatch 0: weight_norm_model: 143.885803 loss: 0.964383 grad_norm_before_clip: 6.016691 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 03:14:56,617 - TRAIN-LOGGER - INFO - Epoch 719 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.885803 weight_norm_u: 25.218954 loss: 0.964383 grad_norm_before_clip: 6.016691 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 03:14:56,617 - TRAIN-LOGGER - INFO - Epoch 719 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.885818 weight_norm_u: 25.222990 loss: 0.966290 +RANK_0 - 2026-01-29 03:15:01,756 - TRAIN-LOGGER - INFO - Epoch 720 - TRAIN - Minibatch 0: weight_norm_model: 143.885818 loss: 0.966290 grad_norm_before_clip: 5.959801 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 03:15:02,982 - TRAIN-LOGGER - INFO - Epoch 720 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.885818 weight_norm_u: 25.218954 loss: 0.966290 grad_norm_before_clip: 5.959801 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 03:15:02,982 - TRAIN-LOGGER - INFO - Epoch 720 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.885818 weight_norm_u: 25.222990 loss: 0.963001 +RANK_0 - 2026-01-29 03:15:07,852 - TRAIN-LOGGER - INFO - Epoch 721 - TRAIN - Minibatch 0: weight_norm_model: 143.885818 loss: 0.963001 grad_norm_before_clip: 3.197654 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 03:15:09,145 - TRAIN-LOGGER - INFO - Epoch 721 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.885818 weight_norm_u: 25.218954 loss: 0.963001 grad_norm_before_clip: 3.197654 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 03:15:09,146 - TRAIN-LOGGER - INFO - Epoch 721 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.885834 weight_norm_u: 25.222990 loss: 0.964451 +RANK_0 - 2026-01-29 03:15:13,670 - TRAIN-LOGGER - INFO - Epoch 722 - TRAIN - Minibatch 0: weight_norm_model: 143.885834 loss: 0.964451 grad_norm_before_clip: 4.898472 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 03:15:15,024 - TRAIN-LOGGER - INFO - Epoch 722 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.885834 weight_norm_u: 25.218954 loss: 0.964451 grad_norm_before_clip: 4.898472 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 03:15:15,024 - TRAIN-LOGGER - INFO - Epoch 722 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.885849 weight_norm_u: 25.222990 loss: 0.966455 +RANK_0 - 2026-01-29 03:15:19,914 - TRAIN-LOGGER - INFO - Epoch 723 - TRAIN - Minibatch 0: weight_norm_model: 143.885849 loss: 0.966455 grad_norm_before_clip: 6.152586 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 03:15:21,341 - TRAIN-LOGGER - INFO - Epoch 723 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.885849 weight_norm_u: 25.218954 loss: 0.966455 grad_norm_before_clip: 6.152586 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 03:15:21,341 - TRAIN-LOGGER - INFO - Epoch 723 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.885864 weight_norm_u: 25.222990 loss: 0.963764 +RANK_0 - 2026-01-29 03:15:26,523 - TRAIN-LOGGER - INFO - Epoch 724 - TRAIN - Minibatch 0: weight_norm_model: 143.885864 loss: 0.963764 grad_norm_before_clip: 4.395239 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 03:15:27,698 - TRAIN-LOGGER - INFO - Epoch 724 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.885864 weight_norm_u: 25.218954 loss: 0.963764 grad_norm_before_clip: 4.395239 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 03:15:27,699 - TRAIN-LOGGER - INFO - Epoch 724 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.885864 weight_norm_u: 25.222990 loss: 0.964122 +RANK_0 - 2026-01-29 03:15:31,935 - TRAIN-LOGGER - INFO - Epoch 725 - TRAIN - Minibatch 0: weight_norm_model: 143.885864 loss: 0.964122 grad_norm_before_clip: 3.837469 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 03:15:33,085 - TRAIN-LOGGER - INFO - Epoch 725 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.885864 weight_norm_u: 25.218954 loss: 0.964122 grad_norm_before_clip: 3.837469 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 03:15:33,086 - TRAIN-LOGGER - INFO - Epoch 725 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.885864 weight_norm_u: 25.222990 loss: 0.965231 +RANK_0 - 2026-01-29 03:15:38,154 - TRAIN-LOGGER - INFO - Epoch 726 - TRAIN - Minibatch 0: weight_norm_model: 143.885864 loss: 0.965231 grad_norm_before_clip: 5.068656 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 03:15:39,323 - TRAIN-LOGGER - INFO - Epoch 726 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.885864 weight_norm_u: 25.218954 loss: 0.965231 grad_norm_before_clip: 5.068656 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 03:15:39,323 - TRAIN-LOGGER - INFO - Epoch 726 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.885880 weight_norm_u: 25.222990 loss: 0.961606 +RANK_0 - 2026-01-29 03:15:43,787 - TRAIN-LOGGER - INFO - Epoch 727 - TRAIN - Minibatch 0: weight_norm_model: 143.885880 loss: 0.961606 grad_norm_before_clip: 3.382762 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 03:15:44,987 - TRAIN-LOGGER - INFO - Epoch 727 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.885880 weight_norm_u: 25.218954 loss: 0.961606 grad_norm_before_clip: 3.382762 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 03:15:44,988 - TRAIN-LOGGER - INFO - Epoch 727 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.885880 weight_norm_u: 25.222990 loss: 0.962647 +RANK_0 - 2026-01-29 03:15:50,436 - TRAIN-LOGGER - INFO - Epoch 728 - TRAIN - Minibatch 0: weight_norm_model: 143.885880 loss: 0.962647 grad_norm_before_clip: 2.596074 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 03:15:51,802 - TRAIN-LOGGER - INFO - Epoch 728 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.885880 weight_norm_u: 25.218954 loss: 0.962647 grad_norm_before_clip: 2.596074 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 03:15:51,803 - TRAIN-LOGGER - INFO - Epoch 728 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.885880 weight_norm_u: 25.222990 loss: 0.963787 +RANK_0 - 2026-01-29 03:15:56,022 - TRAIN-LOGGER - INFO - Epoch 729 - TRAIN - Minibatch 0: weight_norm_model: 143.885880 loss: 0.963787 grad_norm_before_clip: 3.526947 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 03:15:57,208 - TRAIN-LOGGER - INFO - Epoch 729 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.885880 weight_norm_u: 25.218954 loss: 0.963787 grad_norm_before_clip: 3.526947 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 03:15:57,208 - TRAIN-LOGGER - INFO - Epoch 729 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.885880 weight_norm_u: 25.222990 loss: 0.961160 +RANK_0 - 2026-01-29 03:16:02,501 - TRAIN-LOGGER - INFO - Epoch 730 - TRAIN - Minibatch 0: weight_norm_model: 143.885880 loss: 0.961160 grad_norm_before_clip: 2.012887 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 03:16:03,797 - TRAIN-LOGGER - INFO - Epoch 730 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.885880 weight_norm_u: 25.218954 loss: 0.961160 grad_norm_before_clip: 2.012887 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 03:16:03,798 - TRAIN-LOGGER - INFO - Epoch 730 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.885895 weight_norm_u: 25.222990 loss: 0.964981 +RANK_0 - 2026-01-29 03:16:08,790 - TRAIN-LOGGER - INFO - Epoch 731 - TRAIN - Minibatch 0: weight_norm_model: 143.885895 loss: 0.964981 grad_norm_before_clip: 5.270409 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 03:16:10,057 - TRAIN-LOGGER - INFO - Epoch 731 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.885895 weight_norm_u: 25.218954 loss: 0.964981 grad_norm_before_clip: 5.270409 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 03:16:10,057 - TRAIN-LOGGER - INFO - Epoch 731 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.885895 weight_norm_u: 25.222990 loss: 0.965082 +RANK_0 - 2026-01-29 03:16:14,926 - TRAIN-LOGGER - INFO - Epoch 732 - TRAIN - Minibatch 0: weight_norm_model: 143.885895 loss: 0.965082 grad_norm_before_clip: 5.136226 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 03:16:16,200 - TRAIN-LOGGER - INFO - Epoch 732 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.885895 weight_norm_u: 25.218954 loss: 0.965082 grad_norm_before_clip: 5.136226 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 03:16:16,200 - TRAIN-LOGGER - INFO - Epoch 732 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.885910 weight_norm_u: 25.222990 loss: 0.962949 +RANK_0 - 2026-01-29 03:16:20,451 - TRAIN-LOGGER - INFO - Epoch 733 - TRAIN - Minibatch 0: weight_norm_model: 143.885910 loss: 0.962949 grad_norm_before_clip: 4.337924 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 03:16:21,689 - TRAIN-LOGGER - INFO - Epoch 733 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.885910 weight_norm_u: 25.218954 loss: 0.962949 grad_norm_before_clip: 4.337924 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 03:16:21,689 - TRAIN-LOGGER - INFO - Epoch 733 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.885910 weight_norm_u: 25.222990 loss: 0.964342 +RANK_0 - 2026-01-29 03:16:27,002 - TRAIN-LOGGER - INFO - Epoch 734 - TRAIN - Minibatch 0: weight_norm_model: 143.885910 loss: 0.964342 grad_norm_before_clip: 4.109178 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 03:16:28,303 - TRAIN-LOGGER - INFO - Epoch 734 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.885910 weight_norm_u: 25.218954 loss: 0.964342 grad_norm_before_clip: 4.109178 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 03:16:28,304 - TRAIN-LOGGER - INFO - Epoch 734 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.885910 weight_norm_u: 25.222990 loss: 0.966212 +RANK_0 - 2026-01-29 03:16:33,339 - TRAIN-LOGGER - INFO - Epoch 735 - TRAIN - Minibatch 0: weight_norm_model: 143.885910 loss: 0.966212 grad_norm_before_clip: 3.931509 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 03:16:34,737 - TRAIN-LOGGER - INFO - Epoch 735 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.885910 weight_norm_u: 25.218954 loss: 0.966212 grad_norm_before_clip: 3.931509 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 03:16:34,738 - TRAIN-LOGGER - INFO - Epoch 735 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.885910 weight_norm_u: 25.222990 loss: 0.965067 +RANK_0 - 2026-01-29 03:16:39,732 - TRAIN-LOGGER - INFO - Epoch 736 - TRAIN - Minibatch 0: weight_norm_model: 143.885910 loss: 0.965067 grad_norm_before_clip: 3.775142 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 03:16:40,857 - TRAIN-LOGGER - INFO - Epoch 736 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.885910 weight_norm_u: 25.218954 loss: 0.965067 grad_norm_before_clip: 3.775142 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 03:16:40,858 - TRAIN-LOGGER - INFO - Epoch 736 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.885910 weight_norm_u: 25.222990 loss: 0.962737 +RANK_0 - 2026-01-29 03:16:45,437 - TRAIN-LOGGER - INFO - Epoch 737 - TRAIN - Minibatch 0: weight_norm_model: 143.885910 loss: 0.962737 grad_norm_before_clip: 1.517082 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 03:16:46,652 - TRAIN-LOGGER - INFO - Epoch 737 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.885910 weight_norm_u: 25.218954 loss: 0.962737 grad_norm_before_clip: 1.517082 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 03:16:46,652 - TRAIN-LOGGER - INFO - Epoch 737 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.885925 weight_norm_u: 25.222990 loss: 0.963772 +RANK_0 - 2026-01-29 03:16:51,568 - TRAIN-LOGGER - INFO - Epoch 738 - TRAIN - Minibatch 0: weight_norm_model: 143.885925 loss: 0.963772 grad_norm_before_clip: 4.719318 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 03:16:52,826 - TRAIN-LOGGER - INFO - Epoch 738 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.885925 weight_norm_u: 25.218954 loss: 0.963772 grad_norm_before_clip: 4.719318 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 03:16:52,827 - TRAIN-LOGGER - INFO - Epoch 738 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.885941 weight_norm_u: 25.222990 loss: 0.961745 +RANK_0 - 2026-01-29 03:16:57,128 - TRAIN-LOGGER - INFO - Epoch 739 - TRAIN - Minibatch 0: weight_norm_model: 143.885941 loss: 0.961745 grad_norm_before_clip: 1.815764 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 03:16:58,267 - TRAIN-LOGGER - INFO - Epoch 739 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.885941 weight_norm_u: 25.218954 loss: 0.961745 grad_norm_before_clip: 1.815764 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 03:16:58,267 - TRAIN-LOGGER - INFO - Epoch 739 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.885925 weight_norm_u: 25.222990 loss: 0.961226 +RANK_0 - 2026-01-29 03:17:03,177 - TRAIN-LOGGER - INFO - Epoch 740 - TRAIN - Minibatch 0: weight_norm_model: 143.885925 loss: 0.961226 grad_norm_before_clip: 1.692562 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 03:17:04,374 - TRAIN-LOGGER - INFO - Epoch 740 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.885925 weight_norm_u: 25.218954 loss: 0.961226 grad_norm_before_clip: 1.692562 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 03:17:04,374 - TRAIN-LOGGER - INFO - Epoch 740 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.885941 weight_norm_u: 25.222990 loss: 0.963147 +RANK_0 - 2026-01-29 03:17:08,673 - TRAIN-LOGGER - INFO - Epoch 741 - TRAIN - Minibatch 0: weight_norm_model: 143.885941 loss: 0.963147 grad_norm_before_clip: 4.172386 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 03:17:09,897 - TRAIN-LOGGER - INFO - Epoch 741 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.885941 weight_norm_u: 25.218954 loss: 0.963147 grad_norm_before_clip: 4.172386 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 03:17:09,898 - TRAIN-LOGGER - INFO - Epoch 741 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.885941 weight_norm_u: 25.222990 loss: 0.963288 +RANK_0 - 2026-01-29 03:17:14,699 - TRAIN-LOGGER - INFO - Epoch 742 - TRAIN - Minibatch 0: weight_norm_model: 143.885941 loss: 0.963288 grad_norm_before_clip: 2.166111 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 03:17:15,899 - TRAIN-LOGGER - INFO - Epoch 742 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.885941 weight_norm_u: 25.218954 loss: 0.963288 grad_norm_before_clip: 2.166111 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 03:17:15,900 - TRAIN-LOGGER - INFO - Epoch 742 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.885971 weight_norm_u: 25.222990 loss: 0.963102 +RANK_0 - 2026-01-29 03:17:20,943 - TRAIN-LOGGER - INFO - Epoch 743 - TRAIN - Minibatch 0: weight_norm_model: 143.885971 loss: 0.963102 grad_norm_before_clip: 2.873231 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 03:17:22,203 - TRAIN-LOGGER - INFO - Epoch 743 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.885971 weight_norm_u: 25.218954 loss: 0.963102 grad_norm_before_clip: 2.873231 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 03:17:22,203 - TRAIN-LOGGER - INFO - Epoch 743 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.885986 weight_norm_u: 25.222990 loss: 0.964157 +RANK_0 - 2026-01-29 03:17:26,545 - TRAIN-LOGGER - INFO - Epoch 744 - TRAIN - Minibatch 0: weight_norm_model: 143.885986 loss: 0.964157 grad_norm_before_clip: 2.771243 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 03:17:28,091 - TRAIN-LOGGER - INFO - Epoch 744 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.885986 weight_norm_u: 25.218954 loss: 0.964157 grad_norm_before_clip: 2.771243 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 03:17:28,092 - TRAIN-LOGGER - INFO - Epoch 744 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.885986 weight_norm_u: 25.222990 loss: 0.963150 +RANK_0 - 2026-01-29 03:17:33,410 - TRAIN-LOGGER - INFO - Epoch 745 - TRAIN - Minibatch 0: weight_norm_model: 143.885986 loss: 0.963150 grad_norm_before_clip: 2.645145 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 03:17:34,584 - TRAIN-LOGGER - INFO - Epoch 745 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.885986 weight_norm_u: 25.218954 loss: 0.963150 grad_norm_before_clip: 2.645145 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 03:17:34,584 - TRAIN-LOGGER - INFO - Epoch 745 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.885971 weight_norm_u: 25.222990 loss: 0.962317 +RANK_0 - 2026-01-29 03:17:39,691 - TRAIN-LOGGER - INFO - Epoch 746 - TRAIN - Minibatch 0: weight_norm_model: 143.885971 loss: 0.962317 grad_norm_before_clip: 3.770143 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 03:17:41,514 - TRAIN-LOGGER - INFO - Epoch 746 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.885971 weight_norm_u: 25.218954 loss: 0.962317 grad_norm_before_clip: 3.770143 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 03:17:41,514 - TRAIN-LOGGER - INFO - Epoch 746 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.885971 weight_norm_u: 25.222990 loss: 0.963586 +RANK_0 - 2026-01-29 03:17:47,005 - TRAIN-LOGGER - INFO - Epoch 747 - TRAIN - Minibatch 0: weight_norm_model: 143.885971 loss: 0.963586 grad_norm_before_clip: 3.795947 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 03:17:48,223 - TRAIN-LOGGER - INFO - Epoch 747 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.885971 weight_norm_u: 25.218954 loss: 0.963586 grad_norm_before_clip: 3.795947 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 03:17:48,223 - TRAIN-LOGGER - INFO - Epoch 747 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.885986 weight_norm_u: 25.222990 loss: 0.961863 +RANK_0 - 2026-01-29 03:17:52,865 - TRAIN-LOGGER - INFO - Epoch 748 - TRAIN - Minibatch 0: weight_norm_model: 143.885986 loss: 0.961863 grad_norm_before_clip: 1.385741 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 03:17:54,405 - TRAIN-LOGGER - INFO - Epoch 748 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.885986 weight_norm_u: 25.218954 loss: 0.961863 grad_norm_before_clip: 1.385741 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 03:17:54,405 - TRAIN-LOGGER - INFO - Epoch 748 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.886002 weight_norm_u: 25.222990 loss: 0.963502 +RANK_0 - 2026-01-29 03:17:59,051 - TRAIN-LOGGER - INFO - Epoch 749 - TRAIN - Minibatch 0: weight_norm_model: 143.886002 loss: 0.963502 grad_norm_before_clip: 4.217504 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 03:18:00,172 - TRAIN-LOGGER - INFO - Epoch 749 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.886002 weight_norm_u: 25.218954 loss: 0.963502 grad_norm_before_clip: 4.217504 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 03:18:00,172 - TRAIN-LOGGER - INFO - Epoch 749 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.885986 weight_norm_u: 25.222990 loss: 0.964081 +RANK_0 - 2026-01-29 03:18:04,486 - TRAIN-LOGGER - INFO - Epoch 750 - TRAIN - Minibatch 0: weight_norm_model: 143.885986 loss: 0.964081 grad_norm_before_clip: 3.466592 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 03:18:06,043 - TRAIN-LOGGER - INFO - Epoch 750 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.885986 weight_norm_u: 25.218954 loss: 0.964081 grad_norm_before_clip: 3.466592 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 03:18:06,043 - TRAIN-LOGGER - INFO - Epoch 750 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.885986 weight_norm_u: 25.222990 loss: 0.962357 +RANK_0 - 2026-01-29 03:18:10,365 - TRAIN-LOGGER - INFO - Epoch 751 - TRAIN - Minibatch 0: weight_norm_model: 143.885986 loss: 0.962357 grad_norm_before_clip: 1.837129 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 03:18:11,479 - TRAIN-LOGGER - INFO - Epoch 751 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.885986 weight_norm_u: 25.218954 loss: 0.962357 grad_norm_before_clip: 1.837129 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 03:18:11,479 - TRAIN-LOGGER - INFO - Epoch 751 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.885986 weight_norm_u: 25.222990 loss: 0.962865 +RANK_0 - 2026-01-29 03:18:15,708 - TRAIN-LOGGER - INFO - Epoch 752 - TRAIN - Minibatch 0: weight_norm_model: 143.885986 loss: 0.962865 grad_norm_before_clip: 4.296082 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 03:18:16,876 - TRAIN-LOGGER - INFO - Epoch 752 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.885986 weight_norm_u: 25.218954 loss: 0.962865 grad_norm_before_clip: 4.296082 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 03:18:16,876 - TRAIN-LOGGER - INFO - Epoch 752 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.886002 weight_norm_u: 25.222990 loss: 0.964348 +RANK_0 - 2026-01-29 03:18:22,082 - TRAIN-LOGGER - INFO - Epoch 753 - TRAIN - Minibatch 0: weight_norm_model: 143.886002 loss: 0.964348 grad_norm_before_clip: 3.831466 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 03:18:23,207 - TRAIN-LOGGER - INFO - Epoch 753 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.886002 weight_norm_u: 25.218954 loss: 0.964348 grad_norm_before_clip: 3.831466 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 03:18:23,207 - TRAIN-LOGGER - INFO - Epoch 753 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.886002 weight_norm_u: 25.222990 loss: 0.961859 +RANK_0 - 2026-01-29 03:18:28,021 - TRAIN-LOGGER - INFO - Epoch 754 - TRAIN - Minibatch 0: weight_norm_model: 143.886002 loss: 0.961859 grad_norm_before_clip: 1.895416 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 03:18:29,804 - TRAIN-LOGGER - INFO - Epoch 754 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.886002 weight_norm_u: 25.218954 loss: 0.961859 grad_norm_before_clip: 1.895416 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 03:18:29,804 - TRAIN-LOGGER - INFO - Epoch 754 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.886032 weight_norm_u: 25.222990 loss: 0.966102 +RANK_0 - 2026-01-29 03:18:34,657 - TRAIN-LOGGER - INFO - Epoch 755 - TRAIN - Minibatch 0: weight_norm_model: 143.886032 loss: 0.966102 grad_norm_before_clip: 4.139675 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 03:18:35,875 - TRAIN-LOGGER - INFO - Epoch 755 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.886032 weight_norm_u: 25.218954 loss: 0.966102 grad_norm_before_clip: 4.139675 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 03:18:35,875 - TRAIN-LOGGER - INFO - Epoch 755 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.886032 weight_norm_u: 25.222990 loss: 0.966210 +RANK_0 - 2026-01-29 03:18:40,561 - TRAIN-LOGGER - INFO - Epoch 756 - TRAIN - Minibatch 0: weight_norm_model: 143.886032 loss: 0.966210 grad_norm_before_clip: 4.389739 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 03:18:42,099 - TRAIN-LOGGER - INFO - Epoch 756 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.886032 weight_norm_u: 25.218954 loss: 0.966210 grad_norm_before_clip: 4.389739 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 03:18:42,099 - TRAIN-LOGGER - INFO - Epoch 756 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.886047 weight_norm_u: 25.222990 loss: 0.962199 +RANK_0 - 2026-01-29 03:18:46,792 - TRAIN-LOGGER - INFO - Epoch 757 - TRAIN - Minibatch 0: weight_norm_model: 143.886047 loss: 0.962199 grad_norm_before_clip: 2.596039 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 03:18:47,946 - TRAIN-LOGGER - INFO - Epoch 757 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.886047 weight_norm_u: 25.218954 loss: 0.962199 grad_norm_before_clip: 2.596039 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 03:18:47,946 - TRAIN-LOGGER - INFO - Epoch 757 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.886032 weight_norm_u: 25.222990 loss: 0.967698 +RANK_0 - 2026-01-29 03:18:52,773 - TRAIN-LOGGER - INFO - Epoch 758 - TRAIN - Minibatch 0: weight_norm_model: 143.886032 loss: 0.967698 grad_norm_before_clip: 6.586399 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 03:18:54,413 - TRAIN-LOGGER - INFO - Epoch 758 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.886032 weight_norm_u: 25.218954 loss: 0.967698 grad_norm_before_clip: 6.586399 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 03:18:54,413 - TRAIN-LOGGER - INFO - Epoch 758 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.886032 weight_norm_u: 25.222990 loss: 0.974410 +RANK_0 - 2026-01-29 03:18:59,688 - TRAIN-LOGGER - INFO - Epoch 759 - TRAIN - Minibatch 0: weight_norm_model: 143.886032 loss: 0.974410 grad_norm_before_clip: 8.151171 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 03:19:00,846 - TRAIN-LOGGER - INFO - Epoch 759 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.886032 weight_norm_u: 25.218954 loss: 0.974410 grad_norm_before_clip: 8.151171 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 03:19:00,847 - TRAIN-LOGGER - INFO - Epoch 759 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.886032 weight_norm_u: 25.222990 loss: 0.973192 +RANK_0 - 2026-01-29 03:19:06,210 - TRAIN-LOGGER - INFO - Epoch 760 - TRAIN - Minibatch 0: weight_norm_model: 143.886032 loss: 0.973192 grad_norm_before_clip: 8.578378 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 03:19:07,357 - TRAIN-LOGGER - INFO - Epoch 760 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.886032 weight_norm_u: 25.218954 loss: 0.973192 grad_norm_before_clip: 8.578378 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 03:19:07,357 - TRAIN-LOGGER - INFO - Epoch 760 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.886063 weight_norm_u: 25.222990 loss: 0.962219 +RANK_0 - 2026-01-29 03:19:12,687 - TRAIN-LOGGER - INFO - Epoch 761 - TRAIN - Minibatch 0: weight_norm_model: 143.886063 loss: 0.962219 grad_norm_before_clip: 3.529166 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 03:19:13,927 - TRAIN-LOGGER - INFO - Epoch 761 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.886063 weight_norm_u: 25.218954 loss: 0.962219 grad_norm_before_clip: 3.529166 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 03:19:13,927 - TRAIN-LOGGER - INFO - Epoch 761 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.886093 weight_norm_u: 25.222990 loss: 0.962994 +RANK_0 - 2026-01-29 03:19:18,925 - TRAIN-LOGGER - INFO - Epoch 762 - TRAIN - Minibatch 0: weight_norm_model: 143.886093 loss: 0.962994 grad_norm_before_clip: 4.033669 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 03:19:20,058 - TRAIN-LOGGER - INFO - Epoch 762 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.886093 weight_norm_u: 25.218954 loss: 0.962994 grad_norm_before_clip: 4.033669 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 03:19:20,058 - TRAIN-LOGGER - INFO - Epoch 762 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.886108 weight_norm_u: 25.222990 loss: 0.967966 +RANK_0 - 2026-01-29 03:19:24,472 - TRAIN-LOGGER - INFO - Epoch 763 - TRAIN - Minibatch 0: weight_norm_model: 143.886108 loss: 0.967966 grad_norm_before_clip: 5.632499 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 03:19:25,602 - TRAIN-LOGGER - INFO - Epoch 763 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.886108 weight_norm_u: 25.218954 loss: 0.967966 grad_norm_before_clip: 5.632499 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 03:19:25,602 - TRAIN-LOGGER - INFO - Epoch 763 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.886124 weight_norm_u: 25.222990 loss: 0.966161 +RANK_0 - 2026-01-29 03:19:29,996 - TRAIN-LOGGER - INFO - Epoch 764 - TRAIN - Minibatch 0: weight_norm_model: 143.886124 loss: 0.966161 grad_norm_before_clip: 2.760918 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 03:19:31,227 - TRAIN-LOGGER - INFO - Epoch 764 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.886124 weight_norm_u: 25.218954 loss: 0.966161 grad_norm_before_clip: 2.760918 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 03:19:31,227 - TRAIN-LOGGER - INFO - Epoch 764 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.886108 weight_norm_u: 25.222990 loss: 0.962595 +RANK_0 - 2026-01-29 03:19:35,447 - TRAIN-LOGGER - INFO - Epoch 765 - TRAIN - Minibatch 0: weight_norm_model: 143.886108 loss: 0.962595 grad_norm_before_clip: 2.690733 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 03:19:36,632 - TRAIN-LOGGER - INFO - Epoch 765 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.886108 weight_norm_u: 25.218954 loss: 0.962595 grad_norm_before_clip: 2.690733 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 03:19:36,632 - TRAIN-LOGGER - INFO - Epoch 765 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.886093 weight_norm_u: 25.222990 loss: 0.962931 +RANK_0 - 2026-01-29 03:19:41,443 - TRAIN-LOGGER - INFO - Epoch 766 - TRAIN - Minibatch 0: weight_norm_model: 143.886093 loss: 0.962931 grad_norm_before_clip: 3.627259 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 03:19:42,572 - TRAIN-LOGGER - INFO - Epoch 766 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.886093 weight_norm_u: 25.218954 loss: 0.962931 grad_norm_before_clip: 3.627259 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 03:19:42,572 - TRAIN-LOGGER - INFO - Epoch 766 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.886093 weight_norm_u: 25.222990 loss: 0.966616 +RANK_0 - 2026-01-29 03:19:46,813 - TRAIN-LOGGER - INFO - Epoch 767 - TRAIN - Minibatch 0: weight_norm_model: 143.886093 loss: 0.966616 grad_norm_before_clip: 5.935505 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 03:19:48,010 - TRAIN-LOGGER - INFO - Epoch 767 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.886093 weight_norm_u: 25.218954 loss: 0.966616 grad_norm_before_clip: 5.935505 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 03:19:48,011 - TRAIN-LOGGER - INFO - Epoch 767 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.886108 weight_norm_u: 25.222990 loss: 0.963460 +RANK_0 - 2026-01-29 03:19:52,859 - TRAIN-LOGGER - INFO - Epoch 768 - TRAIN - Minibatch 0: weight_norm_model: 143.886108 loss: 0.963460 grad_norm_before_clip: 3.928648 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 03:19:54,152 - TRAIN-LOGGER - INFO - Epoch 768 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.886108 weight_norm_u: 25.218954 loss: 0.963460 grad_norm_before_clip: 3.928648 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 03:19:54,152 - TRAIN-LOGGER - INFO - Epoch 768 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.886124 weight_norm_u: 25.222990 loss: 0.960470 +RANK_0 - 2026-01-29 03:19:59,113 - TRAIN-LOGGER - INFO - Epoch 769 - TRAIN - Minibatch 0: weight_norm_model: 143.886124 loss: 0.960470 grad_norm_before_clip: 1.214140 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 03:20:00,236 - TRAIN-LOGGER - INFO - Epoch 769 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.886124 weight_norm_u: 25.218954 loss: 0.960470 grad_norm_before_clip: 1.214140 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 03:20:00,236 - TRAIN-LOGGER - INFO - Epoch 769 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.886139 weight_norm_u: 25.222990 loss: 0.964264 +RANK_0 - 2026-01-29 03:20:05,330 - TRAIN-LOGGER - INFO - Epoch 770 - TRAIN - Minibatch 0: weight_norm_model: 143.886139 loss: 0.964264 grad_norm_before_clip: 4.350967 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 03:20:06,475 - TRAIN-LOGGER - INFO - Epoch 770 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.886139 weight_norm_u: 25.218954 loss: 0.964264 grad_norm_before_clip: 4.350967 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 03:20:06,475 - TRAIN-LOGGER - INFO - Epoch 770 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.886139 weight_norm_u: 25.222990 loss: 0.964482 +RANK_0 - 2026-01-29 03:20:11,370 - TRAIN-LOGGER - INFO - Epoch 771 - TRAIN - Minibatch 0: weight_norm_model: 143.886139 loss: 0.964482 grad_norm_before_clip: 2.508428 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 03:20:12,537 - TRAIN-LOGGER - INFO - Epoch 771 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.886139 weight_norm_u: 25.218954 loss: 0.964482 grad_norm_before_clip: 2.508428 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 03:20:12,537 - TRAIN-LOGGER - INFO - Epoch 771 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.886124 weight_norm_u: 25.222990 loss: 0.963053 +RANK_0 - 2026-01-29 03:20:18,530 - TRAIN-LOGGER - INFO - Epoch 772 - TRAIN - Minibatch 0: weight_norm_model: 143.886124 loss: 0.963053 grad_norm_before_clip: 3.812347 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 03:20:19,699 - TRAIN-LOGGER - INFO - Epoch 772 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.886124 weight_norm_u: 25.218954 loss: 0.963053 grad_norm_before_clip: 3.812347 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 03:20:19,700 - TRAIN-LOGGER - INFO - Epoch 772 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.886124 weight_norm_u: 25.222990 loss: 0.961368 +RANK_0 - 2026-01-29 03:20:25,705 - TRAIN-LOGGER - INFO - Epoch 773 - TRAIN - Minibatch 0: weight_norm_model: 143.886124 loss: 0.961368 grad_norm_before_clip: 2.087993 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 03:20:26,864 - TRAIN-LOGGER - INFO - Epoch 773 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.886124 weight_norm_u: 25.218954 loss: 0.961368 grad_norm_before_clip: 2.087993 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 03:20:26,864 - TRAIN-LOGGER - INFO - Epoch 773 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.886108 weight_norm_u: 25.222990 loss: 0.961590 +RANK_0 - 2026-01-29 03:20:32,296 - TRAIN-LOGGER - INFO - Epoch 774 - TRAIN - Minibatch 0: weight_norm_model: 143.886108 loss: 0.961590 grad_norm_before_clip: 2.678245 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 03:20:33,435 - TRAIN-LOGGER - INFO - Epoch 774 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.886108 weight_norm_u: 25.218954 loss: 0.961590 grad_norm_before_clip: 2.678245 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 03:20:33,436 - TRAIN-LOGGER - INFO - Epoch 774 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.886124 weight_norm_u: 25.222990 loss: 0.961423 +RANK_0 - 2026-01-29 03:20:38,309 - TRAIN-LOGGER - INFO - Epoch 775 - TRAIN - Minibatch 0: weight_norm_model: 143.886124 loss: 0.961423 grad_norm_before_clip: 0.913039 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 03:20:39,465 - TRAIN-LOGGER - INFO - Epoch 775 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.886124 weight_norm_u: 25.218954 loss: 0.961423 grad_norm_before_clip: 0.913039 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 03:20:39,466 - TRAIN-LOGGER - INFO - Epoch 775 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.886124 weight_norm_u: 25.222990 loss: 0.962599 +RANK_0 - 2026-01-29 03:20:44,481 - TRAIN-LOGGER - INFO - Epoch 776 - TRAIN - Minibatch 0: weight_norm_model: 143.886124 loss: 0.962599 grad_norm_before_clip: 2.157643 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 03:20:45,647 - TRAIN-LOGGER - INFO - Epoch 776 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.886124 weight_norm_u: 25.218954 loss: 0.962599 grad_norm_before_clip: 2.157643 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 03:20:45,647 - TRAIN-LOGGER - INFO - Epoch 776 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.886124 weight_norm_u: 25.222990 loss: 0.962199 +RANK_0 - 2026-01-29 03:20:49,983 - TRAIN-LOGGER - INFO - Epoch 777 - TRAIN - Minibatch 0: weight_norm_model: 143.886124 loss: 0.962199 grad_norm_before_clip: 1.578539 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 03:20:51,205 - TRAIN-LOGGER - INFO - Epoch 777 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.886124 weight_norm_u: 25.218954 loss: 0.962199 grad_norm_before_clip: 1.578539 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 03:20:51,205 - TRAIN-LOGGER - INFO - Epoch 777 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.886124 weight_norm_u: 25.222990 loss: 0.962943 +RANK_0 - 2026-01-29 03:20:55,778 - TRAIN-LOGGER - INFO - Epoch 778 - TRAIN - Minibatch 0: weight_norm_model: 143.886124 loss: 0.962943 grad_norm_before_clip: 3.417616 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 03:20:56,979 - TRAIN-LOGGER - INFO - Epoch 778 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.886124 weight_norm_u: 25.218954 loss: 0.962943 grad_norm_before_clip: 3.417616 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 03:20:56,980 - TRAIN-LOGGER - INFO - Epoch 778 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.886139 weight_norm_u: 25.222990 loss: 0.964088 +RANK_0 - 2026-01-29 03:21:01,136 - TRAIN-LOGGER - INFO - Epoch 779 - TRAIN - Minibatch 0: weight_norm_model: 143.886139 loss: 0.964088 grad_norm_before_clip: 4.658168 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 03:21:02,296 - TRAIN-LOGGER - INFO - Epoch 779 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.886139 weight_norm_u: 25.218954 loss: 0.964088 grad_norm_before_clip: 4.658168 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 03:21:02,297 - TRAIN-LOGGER - INFO - Epoch 779 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.886139 weight_norm_u: 25.222990 loss: 0.962800 +RANK_0 - 2026-01-29 03:21:07,002 - TRAIN-LOGGER - INFO - Epoch 780 - TRAIN - Minibatch 0: weight_norm_model: 143.886139 loss: 0.962800 grad_norm_before_clip: 2.552719 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 03:21:08,176 - TRAIN-LOGGER - INFO - Epoch 780 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.886139 weight_norm_u: 25.218954 loss: 0.962800 grad_norm_before_clip: 2.552719 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 03:21:08,176 - TRAIN-LOGGER - INFO - Epoch 780 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.886154 weight_norm_u: 25.222990 loss: 0.962566 +RANK_0 - 2026-01-29 03:21:12,909 - TRAIN-LOGGER - INFO - Epoch 781 - TRAIN - Minibatch 0: weight_norm_model: 143.886154 loss: 0.962566 grad_norm_before_clip: 2.147146 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 03:21:14,097 - TRAIN-LOGGER - INFO - Epoch 781 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.886154 weight_norm_u: 25.218954 loss: 0.962566 grad_norm_before_clip: 2.147146 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 03:21:14,097 - TRAIN-LOGGER - INFO - Epoch 781 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.886169 weight_norm_u: 25.222990 loss: 0.961035 +RANK_0 - 2026-01-29 03:21:19,425 - TRAIN-LOGGER - INFO - Epoch 782 - TRAIN - Minibatch 0: weight_norm_model: 143.886169 loss: 0.961035 grad_norm_before_clip: 2.926412 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 03:21:20,706 - TRAIN-LOGGER - INFO - Epoch 782 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.886169 weight_norm_u: 25.218954 loss: 0.961035 grad_norm_before_clip: 2.926412 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 03:21:20,706 - TRAIN-LOGGER - INFO - Epoch 782 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.886169 weight_norm_u: 25.222990 loss: 0.961646 +RANK_0 - 2026-01-29 03:21:26,156 - TRAIN-LOGGER - INFO - Epoch 783 - TRAIN - Minibatch 0: weight_norm_model: 143.886169 loss: 0.961646 grad_norm_before_clip: 2.099876 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 03:21:27,350 - TRAIN-LOGGER - INFO - Epoch 783 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.886169 weight_norm_u: 25.218954 loss: 0.961646 grad_norm_before_clip: 2.099876 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 03:21:27,350 - TRAIN-LOGGER - INFO - Epoch 783 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.886154 weight_norm_u: 25.222990 loss: 0.961499 +RANK_0 - 2026-01-29 03:21:32,937 - TRAIN-LOGGER - INFO - Epoch 784 - TRAIN - Minibatch 0: weight_norm_model: 143.886154 loss: 0.961499 grad_norm_before_clip: 2.928499 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 03:21:34,373 - TRAIN-LOGGER - INFO - Epoch 784 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.886154 weight_norm_u: 25.218954 loss: 0.961499 grad_norm_before_clip: 2.928499 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 03:21:34,374 - TRAIN-LOGGER - INFO - Epoch 784 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.886154 weight_norm_u: 25.222990 loss: 0.961205 +RANK_0 - 2026-01-29 03:21:39,690 - TRAIN-LOGGER - INFO - Epoch 785 - TRAIN - Minibatch 0: weight_norm_model: 143.886154 loss: 0.961205 grad_norm_before_clip: 4.208206 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 03:21:40,948 - TRAIN-LOGGER - INFO - Epoch 785 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.886154 weight_norm_u: 25.218954 loss: 0.961205 grad_norm_before_clip: 4.208206 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 03:21:40,948 - TRAIN-LOGGER - INFO - Epoch 785 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.886169 weight_norm_u: 25.222990 loss: 0.960436 +RANK_0 - 2026-01-29 03:21:46,218 - TRAIN-LOGGER - INFO - Epoch 786 - TRAIN - Minibatch 0: weight_norm_model: 143.886169 loss: 0.960436 grad_norm_before_clip: 1.435474 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 03:21:47,344 - TRAIN-LOGGER - INFO - Epoch 786 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.886169 weight_norm_u: 25.218954 loss: 0.960436 grad_norm_before_clip: 1.435474 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 03:21:47,344 - TRAIN-LOGGER - INFO - Epoch 786 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.886169 weight_norm_u: 25.222990 loss: 0.962319 +RANK_0 - 2026-01-29 03:21:51,777 - TRAIN-LOGGER - INFO - Epoch 787 - TRAIN - Minibatch 0: weight_norm_model: 143.886169 loss: 0.962319 grad_norm_before_clip: 5.093948 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 03:21:52,924 - TRAIN-LOGGER - INFO - Epoch 787 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.886169 weight_norm_u: 25.218954 loss: 0.962319 grad_norm_before_clip: 5.093948 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 03:21:52,924 - TRAIN-LOGGER - INFO - Epoch 787 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.886169 weight_norm_u: 25.222990 loss: 0.962869 +RANK_0 - 2026-01-29 03:21:57,615 - TRAIN-LOGGER - INFO - Epoch 788 - TRAIN - Minibatch 0: weight_norm_model: 143.886169 loss: 0.962869 grad_norm_before_clip: 3.555607 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 03:21:59,107 - TRAIN-LOGGER - INFO - Epoch 788 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.886169 weight_norm_u: 25.218954 loss: 0.962869 grad_norm_before_clip: 3.555607 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 03:21:59,107 - TRAIN-LOGGER - INFO - Epoch 788 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.886169 weight_norm_u: 25.222990 loss: 0.961667 +RANK_0 - 2026-01-29 03:22:03,570 - TRAIN-LOGGER - INFO - Epoch 789 - TRAIN - Minibatch 0: weight_norm_model: 143.886169 loss: 0.961667 grad_norm_before_clip: 1.908776 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 03:22:04,704 - TRAIN-LOGGER - INFO - Epoch 789 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.886169 weight_norm_u: 25.218954 loss: 0.961667 grad_norm_before_clip: 1.908776 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 03:22:04,704 - TRAIN-LOGGER - INFO - Epoch 789 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.886154 weight_norm_u: 25.222990 loss: 0.962466 +RANK_0 - 2026-01-29 03:22:09,443 - TRAIN-LOGGER - INFO - Epoch 790 - TRAIN - Minibatch 0: weight_norm_model: 143.886154 loss: 0.962466 grad_norm_before_clip: 2.106135 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 03:22:10,861 - TRAIN-LOGGER - INFO - Epoch 790 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.886154 weight_norm_u: 25.218954 loss: 0.962466 grad_norm_before_clip: 2.106135 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 03:22:10,862 - TRAIN-LOGGER - INFO - Epoch 790 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.886169 weight_norm_u: 25.222990 loss: 0.962922 +RANK_0 - 2026-01-29 03:22:15,425 - TRAIN-LOGGER - INFO - Epoch 791 - TRAIN - Minibatch 0: weight_norm_model: 143.886169 loss: 0.962922 grad_norm_before_clip: 1.783530 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 03:22:16,696 - TRAIN-LOGGER - INFO - Epoch 791 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.886169 weight_norm_u: 25.218954 loss: 0.962922 grad_norm_before_clip: 1.783530 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 03:22:16,696 - TRAIN-LOGGER - INFO - Epoch 791 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.886200 weight_norm_u: 25.222990 loss: 0.961589 +RANK_0 - 2026-01-29 03:22:21,291 - TRAIN-LOGGER - INFO - Epoch 792 - TRAIN - Minibatch 0: weight_norm_model: 143.886200 loss: 0.961589 grad_norm_before_clip: 2.857024 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 03:22:22,543 - TRAIN-LOGGER - INFO - Epoch 792 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.886200 weight_norm_u: 25.218954 loss: 0.961589 grad_norm_before_clip: 2.857024 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 03:22:22,543 - TRAIN-LOGGER - INFO - Epoch 792 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.886230 weight_norm_u: 25.222990 loss: 0.962936 +RANK_0 - 2026-01-29 03:22:27,046 - TRAIN-LOGGER - INFO - Epoch 793 - TRAIN - Minibatch 0: weight_norm_model: 143.886230 loss: 0.962936 grad_norm_before_clip: 2.536499 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 03:22:28,359 - TRAIN-LOGGER - INFO - Epoch 793 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.886230 weight_norm_u: 25.218954 loss: 0.962936 grad_norm_before_clip: 2.536499 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 03:22:28,359 - TRAIN-LOGGER - INFO - Epoch 793 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.886230 weight_norm_u: 25.222990 loss: 0.962442 +RANK_0 - 2026-01-29 03:22:32,534 - TRAIN-LOGGER - INFO - Epoch 794 - TRAIN - Minibatch 0: weight_norm_model: 143.886230 loss: 0.962442 grad_norm_before_clip: 2.950158 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 03:22:33,785 - TRAIN-LOGGER - INFO - Epoch 794 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.886230 weight_norm_u: 25.218954 loss: 0.962442 grad_norm_before_clip: 2.950158 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 03:22:33,786 - TRAIN-LOGGER - INFO - Epoch 794 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.886230 weight_norm_u: 25.222990 loss: 0.961628 +RANK_0 - 2026-01-29 03:22:39,138 - TRAIN-LOGGER - INFO - Epoch 795 - TRAIN - Minibatch 0: weight_norm_model: 143.886230 loss: 0.961628 grad_norm_before_clip: 1.989537 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 03:22:40,338 - TRAIN-LOGGER - INFO - Epoch 795 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.886230 weight_norm_u: 25.218954 loss: 0.961628 grad_norm_before_clip: 1.989537 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 03:22:40,338 - TRAIN-LOGGER - INFO - Epoch 795 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.886230 weight_norm_u: 25.222990 loss: 0.961117 +RANK_0 - 2026-01-29 03:22:45,089 - TRAIN-LOGGER - INFO - Epoch 796 - TRAIN - Minibatch 0: weight_norm_model: 143.886230 loss: 0.961117 grad_norm_before_clip: 4.173375 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 03:22:46,277 - TRAIN-LOGGER - INFO - Epoch 796 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.886230 weight_norm_u: 25.218954 loss: 0.961117 grad_norm_before_clip: 4.173375 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 03:22:46,277 - TRAIN-LOGGER - INFO - Epoch 796 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.886230 weight_norm_u: 25.222990 loss: 0.961672 +RANK_0 - 2026-01-29 03:22:51,158 - TRAIN-LOGGER - INFO - Epoch 797 - TRAIN - Minibatch 0: weight_norm_model: 143.886230 loss: 0.961672 grad_norm_before_clip: 3.948949 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 03:22:52,291 - TRAIN-LOGGER - INFO - Epoch 797 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.886230 weight_norm_u: 25.218954 loss: 0.961672 grad_norm_before_clip: 3.948949 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 03:22:52,291 - TRAIN-LOGGER - INFO - Epoch 797 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.886261 weight_norm_u: 25.222990 loss: 0.963513 +RANK_0 - 2026-01-29 03:22:56,672 - TRAIN-LOGGER - INFO - Epoch 798 - TRAIN - Minibatch 0: weight_norm_model: 143.886261 loss: 0.963513 grad_norm_before_clip: 4.101613 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 03:22:57,868 - TRAIN-LOGGER - INFO - Epoch 798 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.886261 weight_norm_u: 25.218954 loss: 0.963513 grad_norm_before_clip: 4.101613 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 03:22:57,868 - TRAIN-LOGGER - INFO - Epoch 798 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.886261 weight_norm_u: 25.222990 loss: 0.961718 +RANK_0 - 2026-01-29 03:23:02,937 - TRAIN-LOGGER - INFO - Epoch 799 - TRAIN - Minibatch 0: weight_norm_model: 143.886261 loss: 0.961718 grad_norm_before_clip: 2.519527 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 03:23:04,102 - TRAIN-LOGGER - INFO - Epoch 799 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.886261 weight_norm_u: 25.218954 loss: 0.961718 grad_norm_before_clip: 2.519527 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 03:23:04,103 - TRAIN-LOGGER - INFO - Epoch 799 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.886276 weight_norm_u: 25.222990 loss: 0.961387 +RANK_0 - 2026-01-29 03:23:09,205 - TRAIN-LOGGER - INFO - Epoch 800 - TRAIN - Minibatch 0: weight_norm_model: 143.886276 loss: 0.961387 grad_norm_before_clip: 2.965208 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 03:23:10,344 - TRAIN-LOGGER - INFO - Epoch 800 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.886276 weight_norm_u: 25.218954 loss: 0.961387 grad_norm_before_clip: 2.965208 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 03:23:10,344 - TRAIN-LOGGER - INFO - Epoch 800 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.886276 weight_norm_u: 25.222990 loss: 0.962601 +RANK_0 - 2026-01-29 03:23:15,594 - TRAIN-LOGGER - INFO - Epoch 801 - TRAIN - Minibatch 0: weight_norm_model: 143.886276 loss: 0.962601 grad_norm_before_clip: 5.318474 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 03:23:16,749 - TRAIN-LOGGER - INFO - Epoch 801 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.886276 weight_norm_u: 25.218954 loss: 0.962601 grad_norm_before_clip: 5.318474 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 03:23:16,749 - TRAIN-LOGGER - INFO - Epoch 801 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.886276 weight_norm_u: 25.222990 loss: 0.961759 +RANK_0 - 2026-01-29 03:23:21,701 - TRAIN-LOGGER - INFO - Epoch 802 - TRAIN - Minibatch 0: weight_norm_model: 143.886276 loss: 0.961759 grad_norm_before_clip: 5.055034 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 03:23:22,942 - TRAIN-LOGGER - INFO - Epoch 802 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.886276 weight_norm_u: 25.218954 loss: 0.961759 grad_norm_before_clip: 5.055034 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 03:23:22,942 - TRAIN-LOGGER - INFO - Epoch 802 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.886292 weight_norm_u: 25.222990 loss: 0.961168 +RANK_0 - 2026-01-29 03:23:28,496 - TRAIN-LOGGER - INFO - Epoch 803 - TRAIN - Minibatch 0: weight_norm_model: 143.886292 loss: 0.961168 grad_norm_before_clip: 2.824112 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 03:23:29,730 - TRAIN-LOGGER - INFO - Epoch 803 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.886292 weight_norm_u: 25.218954 loss: 0.961168 grad_norm_before_clip: 2.824112 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 03:23:29,730 - TRAIN-LOGGER - INFO - Epoch 803 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.886292 weight_norm_u: 25.222990 loss: 0.960850 +RANK_0 - 2026-01-29 03:23:33,864 - TRAIN-LOGGER - INFO - Epoch 804 - TRAIN - Minibatch 0: weight_norm_model: 143.886292 loss: 0.960850 grad_norm_before_clip: 1.970159 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 03:23:35,109 - TRAIN-LOGGER - INFO - Epoch 804 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.886292 weight_norm_u: 25.218954 loss: 0.960850 grad_norm_before_clip: 1.970159 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 03:23:35,109 - TRAIN-LOGGER - INFO - Epoch 804 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.886307 weight_norm_u: 25.222990 loss: 0.961215 +RANK_0 - 2026-01-29 03:23:39,941 - TRAIN-LOGGER - INFO - Epoch 805 - TRAIN - Minibatch 0: weight_norm_model: 143.886307 loss: 0.961215 grad_norm_before_clip: 3.300585 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 03:23:41,122 - TRAIN-LOGGER - INFO - Epoch 805 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.886307 weight_norm_u: 25.218954 loss: 0.961215 grad_norm_before_clip: 3.300585 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 03:23:41,122 - TRAIN-LOGGER - INFO - Epoch 805 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.886322 weight_norm_u: 25.222990 loss: 0.962864 +RANK_0 - 2026-01-29 03:23:45,442 - TRAIN-LOGGER - INFO - Epoch 806 - TRAIN - Minibatch 0: weight_norm_model: 143.886322 loss: 0.962864 grad_norm_before_clip: 4.290178 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 03:23:46,584 - TRAIN-LOGGER - INFO - Epoch 806 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.886322 weight_norm_u: 25.218954 loss: 0.962864 grad_norm_before_clip: 4.290178 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 03:23:46,584 - TRAIN-LOGGER - INFO - Epoch 806 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.886322 weight_norm_u: 25.222990 loss: 0.960835 +RANK_0 - 2026-01-29 03:23:51,491 - TRAIN-LOGGER - INFO - Epoch 807 - TRAIN - Minibatch 0: weight_norm_model: 143.886322 loss: 0.960835 grad_norm_before_clip: 1.475255 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 03:23:52,679 - TRAIN-LOGGER - INFO - Epoch 807 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.886322 weight_norm_u: 25.218954 loss: 0.960835 grad_norm_before_clip: 1.475255 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 03:23:52,680 - TRAIN-LOGGER - INFO - Epoch 807 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.886322 weight_norm_u: 25.222990 loss: 0.963683 +RANK_0 - 2026-01-29 03:23:57,300 - TRAIN-LOGGER - INFO - Epoch 808 - TRAIN - Minibatch 0: weight_norm_model: 143.886322 loss: 0.963683 grad_norm_before_clip: 3.462185 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 03:23:58,442 - TRAIN-LOGGER - INFO - Epoch 808 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.886322 weight_norm_u: 25.218954 loss: 0.963683 grad_norm_before_clip: 3.462185 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 03:23:58,442 - TRAIN-LOGGER - INFO - Epoch 808 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.886322 weight_norm_u: 25.222990 loss: 0.967699 +RANK_0 - 2026-01-29 03:24:03,455 - TRAIN-LOGGER - INFO - Epoch 809 - TRAIN - Minibatch 0: weight_norm_model: 143.886322 loss: 0.967699 grad_norm_before_clip: 4.905657 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 03:24:04,612 - TRAIN-LOGGER - INFO - Epoch 809 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.886322 weight_norm_u: 25.218954 loss: 0.967699 grad_norm_before_clip: 4.905657 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 03:24:04,612 - TRAIN-LOGGER - INFO - Epoch 809 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.886322 weight_norm_u: 25.222990 loss: 0.966261 +RANK_0 - 2026-01-29 03:24:09,105 - TRAIN-LOGGER - INFO - Epoch 810 - TRAIN - Minibatch 0: weight_norm_model: 143.886322 loss: 0.966261 grad_norm_before_clip: 3.898201 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 03:24:10,328 - TRAIN-LOGGER - INFO - Epoch 810 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.886322 weight_norm_u: 25.218954 loss: 0.966261 grad_norm_before_clip: 3.898201 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 03:24:10,328 - TRAIN-LOGGER - INFO - Epoch 810 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.886337 weight_norm_u: 25.222990 loss: 0.963948 +RANK_0 - 2026-01-29 03:24:15,003 - TRAIN-LOGGER - INFO - Epoch 811 - TRAIN - Minibatch 0: weight_norm_model: 143.886337 loss: 0.963948 grad_norm_before_clip: 2.711547 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 03:24:16,234 - TRAIN-LOGGER - INFO - Epoch 811 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.886337 weight_norm_u: 25.218954 loss: 0.963948 grad_norm_before_clip: 2.711547 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 03:24:16,235 - TRAIN-LOGGER - INFO - Epoch 811 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.886353 weight_norm_u: 25.222990 loss: 0.963071 +RANK_0 - 2026-01-29 03:24:20,911 - TRAIN-LOGGER - INFO - Epoch 812 - TRAIN - Minibatch 0: weight_norm_model: 143.886353 loss: 0.963071 grad_norm_before_clip: 3.010462 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 03:24:22,132 - TRAIN-LOGGER - INFO - Epoch 812 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.886353 weight_norm_u: 25.218954 loss: 0.963071 grad_norm_before_clip: 3.010462 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 03:24:22,132 - TRAIN-LOGGER - INFO - Epoch 812 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.886353 weight_norm_u: 25.222990 loss: 0.963742 +RANK_0 - 2026-01-29 03:24:26,626 - TRAIN-LOGGER - INFO - Epoch 813 - TRAIN - Minibatch 0: weight_norm_model: 143.886353 loss: 0.963742 grad_norm_before_clip: 2.298132 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 03:24:28,101 - TRAIN-LOGGER - INFO - Epoch 813 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.886353 weight_norm_u: 25.218954 loss: 0.963742 grad_norm_before_clip: 2.298132 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 03:24:28,101 - TRAIN-LOGGER - INFO - Epoch 813 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.886353 weight_norm_u: 25.222990 loss: 0.961872 +RANK_0 - 2026-01-29 03:24:32,820 - TRAIN-LOGGER - INFO - Epoch 814 - TRAIN - Minibatch 0: weight_norm_model: 143.886353 loss: 0.961872 grad_norm_before_clip: 2.511525 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 03:24:33,974 - TRAIN-LOGGER - INFO - Epoch 814 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.886353 weight_norm_u: 25.218954 loss: 0.961872 grad_norm_before_clip: 2.511525 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 03:24:33,975 - TRAIN-LOGGER - INFO - Epoch 814 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.886337 weight_norm_u: 25.222990 loss: 0.962085 +RANK_0 - 2026-01-29 03:24:38,272 - TRAIN-LOGGER - INFO - Epoch 815 - TRAIN - Minibatch 0: weight_norm_model: 143.886337 loss: 0.962085 grad_norm_before_clip: 2.620359 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 03:24:39,465 - TRAIN-LOGGER - INFO - Epoch 815 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.886337 weight_norm_u: 25.218954 loss: 0.962085 grad_norm_before_clip: 2.620359 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 03:24:39,465 - TRAIN-LOGGER - INFO - Epoch 815 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.886353 weight_norm_u: 25.222990 loss: 0.963407 +RANK_0 - 2026-01-29 03:24:44,489 - TRAIN-LOGGER - INFO - Epoch 816 - TRAIN - Minibatch 0: weight_norm_model: 143.886353 loss: 0.963407 grad_norm_before_clip: 3.796615 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 03:24:45,813 - TRAIN-LOGGER - INFO - Epoch 816 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.886353 weight_norm_u: 25.218954 loss: 0.963407 grad_norm_before_clip: 3.796615 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 03:24:45,814 - TRAIN-LOGGER - INFO - Epoch 816 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.886383 weight_norm_u: 25.222990 loss: 0.961746 +RANK_0 - 2026-01-29 03:24:50,389 - TRAIN-LOGGER - INFO - Epoch 817 - TRAIN - Minibatch 0: weight_norm_model: 143.886383 loss: 0.961746 grad_norm_before_clip: 2.825577 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 03:24:51,609 - TRAIN-LOGGER - INFO - Epoch 817 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.886383 weight_norm_u: 25.218954 loss: 0.961746 grad_norm_before_clip: 2.825577 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 03:24:51,609 - TRAIN-LOGGER - INFO - Epoch 817 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.886414 weight_norm_u: 25.222990 loss: 0.961822 +RANK_0 - 2026-01-29 03:24:57,070 - TRAIN-LOGGER - INFO - Epoch 818 - TRAIN - Minibatch 0: weight_norm_model: 143.886414 loss: 0.961822 grad_norm_before_clip: 3.431979 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 03:24:58,243 - TRAIN-LOGGER - INFO - Epoch 818 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.886414 weight_norm_u: 25.218954 loss: 0.961822 grad_norm_before_clip: 3.431979 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 03:24:58,244 - TRAIN-LOGGER - INFO - Epoch 818 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.886429 weight_norm_u: 25.222990 loss: 0.962625 +RANK_0 - 2026-01-29 03:25:03,040 - TRAIN-LOGGER - INFO - Epoch 819 - TRAIN - Minibatch 0: weight_norm_model: 143.886429 loss: 0.962625 grad_norm_before_clip: 3.175428 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 03:25:04,257 - TRAIN-LOGGER - INFO - Epoch 819 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.886429 weight_norm_u: 25.218954 loss: 0.962625 grad_norm_before_clip: 3.175428 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 03:25:04,257 - TRAIN-LOGGER - INFO - Epoch 819 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.886444 weight_norm_u: 25.222990 loss: 0.962660 +RANK_0 - 2026-01-29 03:25:09,329 - TRAIN-LOGGER - INFO - Epoch 820 - TRAIN - Minibatch 0: weight_norm_model: 143.886444 loss: 0.962660 grad_norm_before_clip: 3.707267 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 03:25:10,497 - TRAIN-LOGGER - INFO - Epoch 820 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.886444 weight_norm_u: 25.218954 loss: 0.962660 grad_norm_before_clip: 3.707267 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 03:25:10,498 - TRAIN-LOGGER - INFO - Epoch 820 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.886429 weight_norm_u: 25.222990 loss: 0.962698 +RANK_0 - 2026-01-29 03:25:15,339 - TRAIN-LOGGER - INFO - Epoch 821 - TRAIN - Minibatch 0: weight_norm_model: 143.886429 loss: 0.962698 grad_norm_before_clip: 3.820947 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 03:25:16,550 - TRAIN-LOGGER - INFO - Epoch 821 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.886429 weight_norm_u: 25.218954 loss: 0.962698 grad_norm_before_clip: 3.820947 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 03:25:16,550 - TRAIN-LOGGER - INFO - Epoch 821 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.886429 weight_norm_u: 25.222990 loss: 0.964699 +RANK_0 - 2026-01-29 03:25:21,638 - TRAIN-LOGGER - INFO - Epoch 822 - TRAIN - Minibatch 0: weight_norm_model: 143.886429 loss: 0.964699 grad_norm_before_clip: 4.887982 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 03:25:22,908 - TRAIN-LOGGER - INFO - Epoch 822 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.886429 weight_norm_u: 25.218954 loss: 0.964699 grad_norm_before_clip: 4.887982 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 03:25:22,908 - TRAIN-LOGGER - INFO - Epoch 822 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.886429 weight_norm_u: 25.222990 loss: 0.964999 +RANK_0 - 2026-01-29 03:25:27,576 - TRAIN-LOGGER - INFO - Epoch 823 - TRAIN - Minibatch 0: weight_norm_model: 143.886429 loss: 0.964999 grad_norm_before_clip: 5.042187 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 03:25:28,692 - TRAIN-LOGGER - INFO - Epoch 823 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.886429 weight_norm_u: 25.218954 loss: 0.964999 grad_norm_before_clip: 5.042187 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 03:25:28,693 - TRAIN-LOGGER - INFO - Epoch 823 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.886444 weight_norm_u: 25.222990 loss: 0.962897 +RANK_0 - 2026-01-29 03:25:33,822 - TRAIN-LOGGER - INFO - Epoch 824 - TRAIN - Minibatch 0: weight_norm_model: 143.886444 loss: 0.962897 grad_norm_before_clip: 3.436246 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 03:25:35,036 - TRAIN-LOGGER - INFO - Epoch 824 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.886444 weight_norm_u: 25.218954 loss: 0.962897 grad_norm_before_clip: 3.436246 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 03:25:35,036 - TRAIN-LOGGER - INFO - Epoch 824 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.886444 weight_norm_u: 25.222990 loss: 0.963052 +RANK_0 - 2026-01-29 03:25:39,874 - TRAIN-LOGGER - INFO - Epoch 825 - TRAIN - Minibatch 0: weight_norm_model: 143.886444 loss: 0.963052 grad_norm_before_clip: 4.326752 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 03:25:41,078 - TRAIN-LOGGER - INFO - Epoch 825 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.886444 weight_norm_u: 25.218954 loss: 0.963052 grad_norm_before_clip: 4.326752 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 03:25:41,079 - TRAIN-LOGGER - INFO - Epoch 825 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.886444 weight_norm_u: 25.222990 loss: 0.965038 +RANK_0 - 2026-01-29 03:25:45,499 - TRAIN-LOGGER - INFO - Epoch 826 - TRAIN - Minibatch 0: weight_norm_model: 143.886444 loss: 0.965038 grad_norm_before_clip: 4.574990 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 03:25:47,009 - TRAIN-LOGGER - INFO - Epoch 826 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.886444 weight_norm_u: 25.218954 loss: 0.965038 grad_norm_before_clip: 4.574990 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 03:25:47,009 - TRAIN-LOGGER - INFO - Epoch 826 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.886429 weight_norm_u: 25.222990 loss: 0.962015 +RANK_0 - 2026-01-29 03:25:51,216 - TRAIN-LOGGER - INFO - Epoch 827 - TRAIN - Minibatch 0: weight_norm_model: 143.886429 loss: 0.962015 grad_norm_before_clip: 2.140461 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 03:25:52,354 - TRAIN-LOGGER - INFO - Epoch 827 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.886429 weight_norm_u: 25.218954 loss: 0.962015 grad_norm_before_clip: 2.140461 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 03:25:52,354 - TRAIN-LOGGER - INFO - Epoch 827 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.886429 weight_norm_u: 25.222990 loss: 0.960513 +RANK_0 - 2026-01-29 03:25:56,820 - TRAIN-LOGGER - INFO - Epoch 828 - TRAIN - Minibatch 0: weight_norm_model: 143.886429 loss: 0.960513 grad_norm_before_clip: 2.398084 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 03:25:58,077 - TRAIN-LOGGER - INFO - Epoch 828 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.886429 weight_norm_u: 25.218954 loss: 0.960513 grad_norm_before_clip: 2.398084 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 03:25:58,078 - TRAIN-LOGGER - INFO - Epoch 828 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.886414 weight_norm_u: 25.222990 loss: 0.964091 +RANK_0 - 2026-01-29 03:26:02,997 - TRAIN-LOGGER - INFO - Epoch 829 - TRAIN - Minibatch 0: weight_norm_model: 143.886414 loss: 0.964091 grad_norm_before_clip: 4.044510 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 03:26:04,159 - TRAIN-LOGGER - INFO - Epoch 829 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.886414 weight_norm_u: 25.218954 loss: 0.964091 grad_norm_before_clip: 4.044510 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 03:26:04,159 - TRAIN-LOGGER - INFO - Epoch 829 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.886414 weight_norm_u: 25.222990 loss: 0.964620 +RANK_0 - 2026-01-29 03:26:08,971 - TRAIN-LOGGER - INFO - Epoch 830 - TRAIN - Minibatch 0: weight_norm_model: 143.886414 loss: 0.964620 grad_norm_before_clip: 4.054648 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 03:26:10,095 - TRAIN-LOGGER - INFO - Epoch 830 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.886414 weight_norm_u: 25.218954 loss: 0.964620 grad_norm_before_clip: 4.054648 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 03:26:10,095 - TRAIN-LOGGER - INFO - Epoch 830 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.886429 weight_norm_u: 25.222990 loss: 0.960869 +RANK_0 - 2026-01-29 03:26:15,359 - TRAIN-LOGGER - INFO - Epoch 831 - TRAIN - Minibatch 0: weight_norm_model: 143.886429 loss: 0.960869 grad_norm_before_clip: 1.845197 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 03:26:16,553 - TRAIN-LOGGER - INFO - Epoch 831 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.886429 weight_norm_u: 25.218954 loss: 0.960869 grad_norm_before_clip: 1.845197 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 03:26:16,554 - TRAIN-LOGGER - INFO - Epoch 831 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.886459 weight_norm_u: 25.222990 loss: 0.962343 +RANK_0 - 2026-01-29 03:26:20,904 - TRAIN-LOGGER - INFO - Epoch 832 - TRAIN - Minibatch 0: weight_norm_model: 143.886459 loss: 0.962343 grad_norm_before_clip: 2.296421 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 03:26:22,035 - TRAIN-LOGGER - INFO - Epoch 832 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.886459 weight_norm_u: 25.218954 loss: 0.962343 grad_norm_before_clip: 2.296421 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 03:26:22,035 - TRAIN-LOGGER - INFO - Epoch 832 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.886475 weight_norm_u: 25.222990 loss: 0.962285 +RANK_0 - 2026-01-29 03:26:27,414 - TRAIN-LOGGER - INFO - Epoch 833 - TRAIN - Minibatch 0: weight_norm_model: 143.886475 loss: 0.962285 grad_norm_before_clip: 3.514596 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 03:26:28,567 - TRAIN-LOGGER - INFO - Epoch 833 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.886475 weight_norm_u: 25.218954 loss: 0.962285 grad_norm_before_clip: 3.514596 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 03:26:28,567 - TRAIN-LOGGER - INFO - Epoch 833 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.886459 weight_norm_u: 25.222990 loss: 0.960131 +RANK_0 - 2026-01-29 03:26:33,454 - TRAIN-LOGGER - INFO - Epoch 834 - TRAIN - Minibatch 0: weight_norm_model: 143.886459 loss: 0.960131 grad_norm_before_clip: 2.164065 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 03:26:34,699 - TRAIN-LOGGER - INFO - Epoch 834 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.886459 weight_norm_u: 25.218954 loss: 0.960131 grad_norm_before_clip: 2.164065 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 03:26:34,699 - TRAIN-LOGGER - INFO - Epoch 834 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.886444 weight_norm_u: 25.222990 loss: 0.963393 +RANK_0 - 2026-01-29 03:26:39,655 - TRAIN-LOGGER - INFO - Epoch 835 - TRAIN - Minibatch 0: weight_norm_model: 143.886444 loss: 0.963393 grad_norm_before_clip: 4.202633 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 03:26:40,814 - TRAIN-LOGGER - INFO - Epoch 835 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.886444 weight_norm_u: 25.218954 loss: 0.963393 grad_norm_before_clip: 4.202633 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 03:26:40,814 - TRAIN-LOGGER - INFO - Epoch 835 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.886459 weight_norm_u: 25.222990 loss: 0.965654 +RANK_0 - 2026-01-29 03:26:45,087 - TRAIN-LOGGER - INFO - Epoch 836 - TRAIN - Minibatch 0: weight_norm_model: 143.886459 loss: 0.965654 grad_norm_before_clip: 5.022494 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 03:26:46,250 - TRAIN-LOGGER - INFO - Epoch 836 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.886459 weight_norm_u: 25.218954 loss: 0.965654 grad_norm_before_clip: 5.022494 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 03:26:46,251 - TRAIN-LOGGER - INFO - Epoch 836 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.886475 weight_norm_u: 25.222990 loss: 0.963857 +RANK_0 - 2026-01-29 03:26:50,873 - TRAIN-LOGGER - INFO - Epoch 837 - TRAIN - Minibatch 0: weight_norm_model: 143.886475 loss: 0.963857 grad_norm_before_clip: 3.819332 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 03:26:52,318 - TRAIN-LOGGER - INFO - Epoch 837 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.886475 weight_norm_u: 25.218954 loss: 0.963857 grad_norm_before_clip: 3.819332 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 03:26:52,318 - TRAIN-LOGGER - INFO - Epoch 837 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.886505 weight_norm_u: 25.222990 loss: 0.962548 +RANK_0 - 2026-01-29 03:26:57,046 - TRAIN-LOGGER - INFO - Epoch 838 - TRAIN - Minibatch 0: weight_norm_model: 143.886505 loss: 0.962548 grad_norm_before_clip: 3.557421 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 03:26:58,233 - TRAIN-LOGGER - INFO - Epoch 838 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.886505 weight_norm_u: 25.218954 loss: 0.962548 grad_norm_before_clip: 3.557421 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 03:26:58,233 - TRAIN-LOGGER - INFO - Epoch 838 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.886520 weight_norm_u: 25.222990 loss: 0.965447 +RANK_0 - 2026-01-29 03:27:02,885 - TRAIN-LOGGER - INFO - Epoch 839 - TRAIN - Minibatch 0: weight_norm_model: 143.886520 loss: 0.965447 grad_norm_before_clip: 4.053793 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 03:27:04,211 - TRAIN-LOGGER - INFO - Epoch 839 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.886520 weight_norm_u: 25.218954 loss: 0.965447 grad_norm_before_clip: 4.053793 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 03:27:04,211 - TRAIN-LOGGER - INFO - Epoch 839 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.886536 weight_norm_u: 25.222990 loss: 0.963093 +RANK_0 - 2026-01-29 03:27:08,994 - TRAIN-LOGGER - INFO - Epoch 840 - TRAIN - Minibatch 0: weight_norm_model: 143.886536 loss: 0.963093 grad_norm_before_clip: 4.151798 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 03:27:10,223 - TRAIN-LOGGER - INFO - Epoch 840 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.886536 weight_norm_u: 25.218954 loss: 0.963093 grad_norm_before_clip: 4.151798 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 03:27:10,223 - TRAIN-LOGGER - INFO - Epoch 840 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.886536 weight_norm_u: 25.222990 loss: 0.964241 +RANK_0 - 2026-01-29 03:27:14,784 - TRAIN-LOGGER - INFO - Epoch 841 - TRAIN - Minibatch 0: weight_norm_model: 143.886536 loss: 0.964241 grad_norm_before_clip: 4.378076 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 03:27:15,946 - TRAIN-LOGGER - INFO - Epoch 841 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.886536 weight_norm_u: 25.218954 loss: 0.964241 grad_norm_before_clip: 4.378076 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 03:27:15,946 - TRAIN-LOGGER - INFO - Epoch 841 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.886536 weight_norm_u: 25.222990 loss: 0.965491 +RANK_0 - 2026-01-29 03:27:20,627 - TRAIN-LOGGER - INFO - Epoch 842 - TRAIN - Minibatch 0: weight_norm_model: 143.886536 loss: 0.965491 grad_norm_before_clip: 6.837598 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 03:27:21,754 - TRAIN-LOGGER - INFO - Epoch 842 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.886536 weight_norm_u: 25.218954 loss: 0.965491 grad_norm_before_clip: 6.837598 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 03:27:21,754 - TRAIN-LOGGER - INFO - Epoch 842 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.886536 weight_norm_u: 25.222990 loss: 0.962058 +RANK_0 - 2026-01-29 03:27:26,005 - TRAIN-LOGGER - INFO - Epoch 843 - TRAIN - Minibatch 0: weight_norm_model: 143.886536 loss: 0.962058 grad_norm_before_clip: 3.975091 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 03:27:27,177 - TRAIN-LOGGER - INFO - Epoch 843 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.886536 weight_norm_u: 25.218954 loss: 0.962058 grad_norm_before_clip: 3.975091 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 03:27:27,177 - TRAIN-LOGGER - INFO - Epoch 843 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.886536 weight_norm_u: 25.222990 loss: 0.962271 +RANK_0 - 2026-01-29 03:27:31,608 - TRAIN-LOGGER - INFO - Epoch 844 - TRAIN - Minibatch 0: weight_norm_model: 143.886536 loss: 0.962271 grad_norm_before_clip: 3.247217 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 03:27:32,751 - TRAIN-LOGGER - INFO - Epoch 844 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.886536 weight_norm_u: 25.218954 loss: 0.962271 grad_norm_before_clip: 3.247217 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 03:27:32,751 - TRAIN-LOGGER - INFO - Epoch 844 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.886551 weight_norm_u: 25.222990 loss: 0.962087 +RANK_0 - 2026-01-29 03:27:37,222 - TRAIN-LOGGER - INFO - Epoch 845 - TRAIN - Minibatch 0: weight_norm_model: 143.886551 loss: 0.962087 grad_norm_before_clip: 3.768978 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 03:27:38,456 - TRAIN-LOGGER - INFO - Epoch 845 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.886551 weight_norm_u: 25.218954 loss: 0.962087 grad_norm_before_clip: 3.768978 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 03:27:38,456 - TRAIN-LOGGER - INFO - Epoch 845 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.886551 weight_norm_u: 25.222990 loss: 0.960476 +RANK_0 - 2026-01-29 03:27:43,747 - TRAIN-LOGGER - INFO - Epoch 846 - TRAIN - Minibatch 0: weight_norm_model: 143.886551 loss: 0.960476 grad_norm_before_clip: 1.632504 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 03:27:45,014 - TRAIN-LOGGER - INFO - Epoch 846 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.886551 weight_norm_u: 25.218954 loss: 0.960476 grad_norm_before_clip: 1.632504 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 03:27:45,014 - TRAIN-LOGGER - INFO - Epoch 846 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.886551 weight_norm_u: 25.222990 loss: 0.965349 +RANK_0 - 2026-01-29 03:27:49,644 - TRAIN-LOGGER - INFO - Epoch 847 - TRAIN - Minibatch 0: weight_norm_model: 143.886551 loss: 0.965349 grad_norm_before_clip: 4.779789 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 03:27:50,780 - TRAIN-LOGGER - INFO - Epoch 847 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.886551 weight_norm_u: 25.218954 loss: 0.965349 grad_norm_before_clip: 4.779789 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 03:27:50,780 - TRAIN-LOGGER - INFO - Epoch 847 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.886551 weight_norm_u: 25.222990 loss: 0.967093 +RANK_0 - 2026-01-29 03:27:56,050 - TRAIN-LOGGER - INFO - Epoch 848 - TRAIN - Minibatch 0: weight_norm_model: 143.886551 loss: 0.967093 grad_norm_before_clip: 5.336350 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 03:27:57,189 - TRAIN-LOGGER - INFO - Epoch 848 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.886551 weight_norm_u: 25.218954 loss: 0.967093 grad_norm_before_clip: 5.336350 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 03:27:57,189 - TRAIN-LOGGER - INFO - Epoch 848 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.886551 weight_norm_u: 25.222990 loss: 0.963176 +RANK_0 - 2026-01-29 03:28:01,977 - TRAIN-LOGGER - INFO - Epoch 849 - TRAIN - Minibatch 0: weight_norm_model: 143.886551 loss: 0.963176 grad_norm_before_clip: 3.773800 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 03:28:03,134 - TRAIN-LOGGER - INFO - Epoch 849 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.886551 weight_norm_u: 25.218954 loss: 0.963176 grad_norm_before_clip: 3.773800 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 03:28:03,135 - TRAIN-LOGGER - INFO - Epoch 849 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.886551 weight_norm_u: 25.222990 loss: 0.961179 +RANK_0 - 2026-01-29 03:28:08,087 - TRAIN-LOGGER - INFO - Epoch 850 - TRAIN - Minibatch 0: weight_norm_model: 143.886551 loss: 0.961179 grad_norm_before_clip: 1.306906 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 03:28:09,256 - TRAIN-LOGGER - INFO - Epoch 850 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.886551 weight_norm_u: 25.218954 loss: 0.961179 grad_norm_before_clip: 1.306906 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 03:28:09,256 - TRAIN-LOGGER - INFO - Epoch 850 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.886566 weight_norm_u: 25.222990 loss: 0.962354 +RANK_0 - 2026-01-29 03:28:14,275 - TRAIN-LOGGER - INFO - Epoch 851 - TRAIN - Minibatch 0: weight_norm_model: 143.886566 loss: 0.962354 grad_norm_before_clip: 3.554029 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 03:28:15,464 - TRAIN-LOGGER - INFO - Epoch 851 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.886566 weight_norm_u: 25.218954 loss: 0.962354 grad_norm_before_clip: 3.554029 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 03:28:15,464 - TRAIN-LOGGER - INFO - Epoch 851 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.886566 weight_norm_u: 25.222990 loss: 0.960626 +RANK_0 - 2026-01-29 03:28:20,484 - TRAIN-LOGGER - INFO - Epoch 852 - TRAIN - Minibatch 0: weight_norm_model: 143.886566 loss: 0.960626 grad_norm_before_clip: 2.148376 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 03:28:21,831 - TRAIN-LOGGER - INFO - Epoch 852 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.886566 weight_norm_u: 25.218954 loss: 0.960626 grad_norm_before_clip: 2.148376 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 03:28:21,831 - TRAIN-LOGGER - INFO - Epoch 852 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.886566 weight_norm_u: 25.222990 loss: 0.962089 +RANK_0 - 2026-01-29 03:28:27,693 - TRAIN-LOGGER - INFO - Epoch 853 - TRAIN - Minibatch 0: weight_norm_model: 143.886566 loss: 0.962089 grad_norm_before_clip: 3.036093 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 03:28:28,922 - TRAIN-LOGGER - INFO - Epoch 853 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.886566 weight_norm_u: 25.218954 loss: 0.962089 grad_norm_before_clip: 3.036093 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 03:28:28,922 - TRAIN-LOGGER - INFO - Epoch 853 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.886566 weight_norm_u: 25.222990 loss: 0.963805 +RANK_0 - 2026-01-29 03:28:34,355 - TRAIN-LOGGER - INFO - Epoch 854 - TRAIN - Minibatch 0: weight_norm_model: 143.886566 loss: 0.963805 grad_norm_before_clip: 3.403788 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 03:28:35,678 - TRAIN-LOGGER - INFO - Epoch 854 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.886566 weight_norm_u: 25.218954 loss: 0.963805 grad_norm_before_clip: 3.403788 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 03:28:35,678 - TRAIN-LOGGER - INFO - Epoch 854 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.886581 weight_norm_u: 25.222990 loss: 0.962338 +RANK_0 - 2026-01-29 03:28:40,442 - TRAIN-LOGGER - INFO - Epoch 855 - TRAIN - Minibatch 0: weight_norm_model: 143.886581 loss: 0.962338 grad_norm_before_clip: 1.977132 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 03:28:41,579 - TRAIN-LOGGER - INFO - Epoch 855 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.886581 weight_norm_u: 25.218954 loss: 0.962338 grad_norm_before_clip: 1.977132 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 03:28:41,579 - TRAIN-LOGGER - INFO - Epoch 855 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.886597 weight_norm_u: 25.222990 loss: 0.962734 +RANK_0 - 2026-01-29 03:28:46,473 - TRAIN-LOGGER - INFO - Epoch 856 - TRAIN - Minibatch 0: weight_norm_model: 143.886597 loss: 0.962734 grad_norm_before_clip: 3.781238 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 03:28:47,707 - TRAIN-LOGGER - INFO - Epoch 856 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.886597 weight_norm_u: 25.218954 loss: 0.962734 grad_norm_before_clip: 3.781238 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 03:28:47,707 - TRAIN-LOGGER - INFO - Epoch 856 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.886612 weight_norm_u: 25.222990 loss: 0.963276 +RANK_0 - 2026-01-29 03:28:52,343 - TRAIN-LOGGER - INFO - Epoch 857 - TRAIN - Minibatch 0: weight_norm_model: 143.886612 loss: 0.963276 grad_norm_before_clip: 3.431192 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 03:28:53,472 - TRAIN-LOGGER - INFO - Epoch 857 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.886612 weight_norm_u: 25.218954 loss: 0.963276 grad_norm_before_clip: 3.431192 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 03:28:53,472 - TRAIN-LOGGER - INFO - Epoch 857 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.886627 weight_norm_u: 25.222990 loss: 0.960622 +RANK_0 - 2026-01-29 03:28:58,633 - TRAIN-LOGGER - INFO - Epoch 858 - TRAIN - Minibatch 0: weight_norm_model: 143.886627 loss: 0.960622 grad_norm_before_clip: 2.477742 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 03:29:00,062 - TRAIN-LOGGER - INFO - Epoch 858 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.886627 weight_norm_u: 25.218954 loss: 0.960622 grad_norm_before_clip: 2.477742 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 03:29:00,062 - TRAIN-LOGGER - INFO - Epoch 858 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.886612 weight_norm_u: 25.222990 loss: 0.961506 +RANK_0 - 2026-01-29 03:29:04,809 - TRAIN-LOGGER - INFO - Epoch 859 - TRAIN - Minibatch 0: weight_norm_model: 143.886612 loss: 0.961506 grad_norm_before_clip: 4.418737 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 03:29:06,212 - TRAIN-LOGGER - INFO - Epoch 859 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.886612 weight_norm_u: 25.218954 loss: 0.961506 grad_norm_before_clip: 4.418737 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 03:29:06,212 - TRAIN-LOGGER - INFO - Epoch 859 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.886612 weight_norm_u: 25.222990 loss: 0.963111 +RANK_0 - 2026-01-29 03:29:11,808 - TRAIN-LOGGER - INFO - Epoch 860 - TRAIN - Minibatch 0: weight_norm_model: 143.886612 loss: 0.963111 grad_norm_before_clip: 4.125882 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 03:29:13,207 - TRAIN-LOGGER - INFO - Epoch 860 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.886612 weight_norm_u: 25.218954 loss: 0.963111 grad_norm_before_clip: 4.125882 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 03:29:13,208 - TRAIN-LOGGER - INFO - Epoch 860 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.886627 weight_norm_u: 25.222990 loss: 0.965509 +RANK_0 - 2026-01-29 03:29:18,010 - TRAIN-LOGGER - INFO - Epoch 861 - TRAIN - Minibatch 0: weight_norm_model: 143.886627 loss: 0.965509 grad_norm_before_clip: 5.076860 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 03:29:19,202 - TRAIN-LOGGER - INFO - Epoch 861 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.886627 weight_norm_u: 25.218954 loss: 0.965509 grad_norm_before_clip: 5.076860 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 03:29:19,202 - TRAIN-LOGGER - INFO - Epoch 861 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.886642 weight_norm_u: 25.222990 loss: 0.966549 +RANK_0 - 2026-01-29 03:29:23,996 - TRAIN-LOGGER - INFO - Epoch 862 - TRAIN - Minibatch 0: weight_norm_model: 143.886642 loss: 0.966549 grad_norm_before_clip: 5.560348 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 03:29:25,186 - TRAIN-LOGGER - INFO - Epoch 862 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.886642 weight_norm_u: 25.218954 loss: 0.966549 grad_norm_before_clip: 5.560348 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 03:29:25,186 - TRAIN-LOGGER - INFO - Epoch 862 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.886658 weight_norm_u: 25.222990 loss: 0.962104 +RANK_0 - 2026-01-29 03:29:29,808 - TRAIN-LOGGER - INFO - Epoch 863 - TRAIN - Minibatch 0: weight_norm_model: 143.886658 loss: 0.962104 grad_norm_before_clip: 3.069925 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 03:29:31,002 - TRAIN-LOGGER - INFO - Epoch 863 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.886658 weight_norm_u: 25.218954 loss: 0.962104 grad_norm_before_clip: 3.069925 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 03:29:31,002 - TRAIN-LOGGER - INFO - Epoch 863 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.886673 weight_norm_u: 25.222990 loss: 0.963861 +RANK_0 - 2026-01-29 03:29:36,505 - TRAIN-LOGGER - INFO - Epoch 864 - TRAIN - Minibatch 0: weight_norm_model: 143.886673 loss: 0.963861 grad_norm_before_clip: 4.459061 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 03:29:37,744 - TRAIN-LOGGER - INFO - Epoch 864 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.886673 weight_norm_u: 25.218954 loss: 0.963861 grad_norm_before_clip: 4.459061 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 03:29:37,744 - TRAIN-LOGGER - INFO - Epoch 864 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.886673 weight_norm_u: 25.222990 loss: 0.964004 +RANK_0 - 2026-01-29 03:29:42,582 - TRAIN-LOGGER - INFO - Epoch 865 - TRAIN - Minibatch 0: weight_norm_model: 143.886673 loss: 0.964004 grad_norm_before_clip: 4.856890 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 03:29:43,779 - TRAIN-LOGGER - INFO - Epoch 865 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.886673 weight_norm_u: 25.218954 loss: 0.964004 grad_norm_before_clip: 4.856890 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 03:29:43,780 - TRAIN-LOGGER - INFO - Epoch 865 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.886658 weight_norm_u: 25.222990 loss: 0.960816 +RANK_0 - 2026-01-29 03:29:48,967 - TRAIN-LOGGER - INFO - Epoch 866 - TRAIN - Minibatch 0: weight_norm_model: 143.886658 loss: 0.960816 grad_norm_before_clip: 4.003116 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 03:29:50,190 - TRAIN-LOGGER - INFO - Epoch 866 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.886658 weight_norm_u: 25.218954 loss: 0.960816 grad_norm_before_clip: 4.003116 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 03:29:50,190 - TRAIN-LOGGER - INFO - Epoch 866 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.886658 weight_norm_u: 25.222990 loss: 0.961341 +RANK_0 - 2026-01-29 03:29:55,188 - TRAIN-LOGGER - INFO - Epoch 867 - TRAIN - Minibatch 0: weight_norm_model: 143.886658 loss: 0.961341 grad_norm_before_clip: 2.597150 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 03:29:56,300 - TRAIN-LOGGER - INFO - Epoch 867 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.886658 weight_norm_u: 25.218954 loss: 0.961341 grad_norm_before_clip: 2.597150 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 03:29:56,300 - TRAIN-LOGGER - INFO - Epoch 867 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.886658 weight_norm_u: 25.222990 loss: 0.960853 +RANK_0 - 2026-01-29 03:30:00,894 - TRAIN-LOGGER - INFO - Epoch 868 - TRAIN - Minibatch 0: weight_norm_model: 143.886658 loss: 0.960853 grad_norm_before_clip: 2.876990 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 03:30:02,063 - TRAIN-LOGGER - INFO - Epoch 868 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.886658 weight_norm_u: 25.218954 loss: 0.960853 grad_norm_before_clip: 2.876990 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 03:30:02,063 - TRAIN-LOGGER - INFO - Epoch 868 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.886658 weight_norm_u: 25.222990 loss: 0.959588 +RANK_0 - 2026-01-29 03:30:06,641 - TRAIN-LOGGER - INFO - Epoch 869 - TRAIN - Minibatch 0: weight_norm_model: 143.886658 loss: 0.959588 grad_norm_before_clip: 2.015934 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 03:30:07,842 - TRAIN-LOGGER - INFO - Epoch 869 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.886658 weight_norm_u: 25.218954 loss: 0.959588 grad_norm_before_clip: 2.015934 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 03:30:07,842 - TRAIN-LOGGER - INFO - Epoch 869 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.886673 weight_norm_u: 25.222990 loss: 0.959645 +RANK_0 - 2026-01-29 03:30:12,014 - TRAIN-LOGGER - INFO - Epoch 870 - TRAIN - Minibatch 0: weight_norm_model: 143.886673 loss: 0.959645 grad_norm_before_clip: 1.150997 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 03:30:13,164 - TRAIN-LOGGER - INFO - Epoch 870 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.886673 weight_norm_u: 25.218954 loss: 0.959645 grad_norm_before_clip: 1.150997 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 03:30:13,164 - TRAIN-LOGGER - INFO - Epoch 870 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.886688 weight_norm_u: 25.222990 loss: 0.959500 +RANK_0 - 2026-01-29 03:30:18,023 - TRAIN-LOGGER - INFO - Epoch 871 - TRAIN - Minibatch 0: weight_norm_model: 143.886688 loss: 0.959500 grad_norm_before_clip: 1.875716 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 03:30:19,284 - TRAIN-LOGGER - INFO - Epoch 871 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.886688 weight_norm_u: 25.218954 loss: 0.959500 grad_norm_before_clip: 1.875716 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 03:30:19,284 - TRAIN-LOGGER - INFO - Epoch 871 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.886688 weight_norm_u: 25.222990 loss: 0.962173 +RANK_0 - 2026-01-29 03:30:23,765 - TRAIN-LOGGER - INFO - Epoch 872 - TRAIN - Minibatch 0: weight_norm_model: 143.886688 loss: 0.962173 grad_norm_before_clip: 3.394931 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 03:30:25,035 - TRAIN-LOGGER - INFO - Epoch 872 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.886688 weight_norm_u: 25.218954 loss: 0.962173 grad_norm_before_clip: 3.394931 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 03:30:25,036 - TRAIN-LOGGER - INFO - Epoch 872 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.886703 weight_norm_u: 25.222990 loss: 0.963057 +RANK_0 - 2026-01-29 03:30:29,598 - TRAIN-LOGGER - INFO - Epoch 873 - TRAIN - Minibatch 0: weight_norm_model: 143.886703 loss: 0.963057 grad_norm_before_clip: 3.624943 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 03:30:30,818 - TRAIN-LOGGER - INFO - Epoch 873 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.886703 weight_norm_u: 25.218954 loss: 0.963057 grad_norm_before_clip: 3.624943 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 03:30:30,818 - TRAIN-LOGGER - INFO - Epoch 873 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.886719 weight_norm_u: 25.222990 loss: 0.960308 +RANK_0 - 2026-01-29 03:30:35,671 - TRAIN-LOGGER - INFO - Epoch 874 - TRAIN - Minibatch 0: weight_norm_model: 143.886719 loss: 0.960308 grad_norm_before_clip: 1.636766 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 03:30:36,898 - TRAIN-LOGGER - INFO - Epoch 874 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.886719 weight_norm_u: 25.218954 loss: 0.960308 grad_norm_before_clip: 1.636766 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 03:30:36,898 - TRAIN-LOGGER - INFO - Epoch 874 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.886734 weight_norm_u: 25.222990 loss: 0.963923 +RANK_0 - 2026-01-29 03:30:41,882 - TRAIN-LOGGER - INFO - Epoch 875 - TRAIN - Minibatch 0: weight_norm_model: 143.886734 loss: 0.963923 grad_norm_before_clip: 3.886873 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 03:30:43,025 - TRAIN-LOGGER - INFO - Epoch 875 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.886734 weight_norm_u: 25.218954 loss: 0.963923 grad_norm_before_clip: 3.886873 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 03:30:43,025 - TRAIN-LOGGER - INFO - Epoch 875 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.886749 weight_norm_u: 25.222990 loss: 0.966889 +RANK_0 - 2026-01-29 03:30:47,829 - TRAIN-LOGGER - INFO - Epoch 876 - TRAIN - Minibatch 0: weight_norm_model: 143.886749 loss: 0.966889 grad_norm_before_clip: 3.758623 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 03:30:49,024 - TRAIN-LOGGER - INFO - Epoch 876 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.886749 weight_norm_u: 25.218954 loss: 0.966889 grad_norm_before_clip: 3.758623 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 03:30:49,025 - TRAIN-LOGGER - INFO - Epoch 876 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.886749 weight_norm_u: 25.222990 loss: 0.962415 +RANK_0 - 2026-01-29 03:30:53,662 - TRAIN-LOGGER - INFO - Epoch 877 - TRAIN - Minibatch 0: weight_norm_model: 143.886749 loss: 0.962415 grad_norm_before_clip: 3.389209 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 03:30:54,813 - TRAIN-LOGGER - INFO - Epoch 877 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.886749 weight_norm_u: 25.218954 loss: 0.962415 grad_norm_before_clip: 3.389209 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 03:30:54,814 - TRAIN-LOGGER - INFO - Epoch 877 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.886749 weight_norm_u: 25.222990 loss: 0.962065 +RANK_0 - 2026-01-29 03:30:59,036 - TRAIN-LOGGER - INFO - Epoch 878 - TRAIN - Minibatch 0: weight_norm_model: 143.886749 loss: 0.962065 grad_norm_before_clip: 4.174994 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 03:31:00,424 - TRAIN-LOGGER - INFO - Epoch 878 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.886749 weight_norm_u: 25.218954 loss: 0.962065 grad_norm_before_clip: 4.174994 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 03:31:00,425 - TRAIN-LOGGER - INFO - Epoch 878 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.886765 weight_norm_u: 25.222990 loss: 0.962465 +RANK_0 - 2026-01-29 03:31:06,249 - TRAIN-LOGGER - INFO - Epoch 879 - TRAIN - Minibatch 0: weight_norm_model: 143.886765 loss: 0.962465 grad_norm_before_clip: 3.623915 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 03:31:07,425 - TRAIN-LOGGER - INFO - Epoch 879 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.886765 weight_norm_u: 25.218954 loss: 0.962465 grad_norm_before_clip: 3.623915 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 03:31:07,425 - TRAIN-LOGGER - INFO - Epoch 879 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.886780 weight_norm_u: 25.222990 loss: 0.961778 +RANK_0 - 2026-01-29 03:31:12,886 - TRAIN-LOGGER - INFO - Epoch 880 - TRAIN - Minibatch 0: weight_norm_model: 143.886780 loss: 0.961778 grad_norm_before_clip: 2.302747 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 03:31:14,100 - TRAIN-LOGGER - INFO - Epoch 880 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.886780 weight_norm_u: 25.218954 loss: 0.961778 grad_norm_before_clip: 2.302747 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 03:31:14,101 - TRAIN-LOGGER - INFO - Epoch 880 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.886780 weight_norm_u: 25.222990 loss: 0.960100 +RANK_0 - 2026-01-29 03:31:20,638 - TRAIN-LOGGER - INFO - Epoch 881 - TRAIN - Minibatch 0: weight_norm_model: 143.886780 loss: 0.960100 grad_norm_before_clip: 1.565216 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 03:31:21,878 - TRAIN-LOGGER - INFO - Epoch 881 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.886780 weight_norm_u: 25.218954 loss: 0.960100 grad_norm_before_clip: 1.565216 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 03:31:21,879 - TRAIN-LOGGER - INFO - Epoch 881 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.886795 weight_norm_u: 25.222990 loss: 0.963022 +RANK_0 - 2026-01-29 03:31:27,407 - TRAIN-LOGGER - INFO - Epoch 882 - TRAIN - Minibatch 0: weight_norm_model: 143.886795 loss: 0.963022 grad_norm_before_clip: 4.624092 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 03:31:28,734 - TRAIN-LOGGER - INFO - Epoch 882 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.886795 weight_norm_u: 25.218954 loss: 0.963022 grad_norm_before_clip: 4.624092 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 03:31:28,734 - TRAIN-LOGGER - INFO - Epoch 882 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.886795 weight_norm_u: 25.222990 loss: 0.962418 +RANK_0 - 2026-01-29 03:31:33,596 - TRAIN-LOGGER - INFO - Epoch 883 - TRAIN - Minibatch 0: weight_norm_model: 143.886795 loss: 0.962418 grad_norm_before_clip: 2.917054 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 03:31:34,999 - TRAIN-LOGGER - INFO - Epoch 883 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.886795 weight_norm_u: 25.218954 loss: 0.962418 grad_norm_before_clip: 2.917054 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 03:31:34,999 - TRAIN-LOGGER - INFO - Epoch 883 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.886795 weight_norm_u: 25.222990 loss: 0.963943 +RANK_0 - 2026-01-29 03:31:39,991 - TRAIN-LOGGER - INFO - Epoch 884 - TRAIN - Minibatch 0: weight_norm_model: 143.886795 loss: 0.963943 grad_norm_before_clip: 3.400824 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 03:31:41,256 - TRAIN-LOGGER - INFO - Epoch 884 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.886795 weight_norm_u: 25.218954 loss: 0.963943 grad_norm_before_clip: 3.400824 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 03:31:41,256 - TRAIN-LOGGER - INFO - Epoch 884 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.886795 weight_norm_u: 25.222990 loss: 0.962315 +RANK_0 - 2026-01-29 03:31:46,179 - TRAIN-LOGGER - INFO - Epoch 885 - TRAIN - Minibatch 0: weight_norm_model: 143.886795 loss: 0.962315 grad_norm_before_clip: 4.132391 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 03:31:47,368 - TRAIN-LOGGER - INFO - Epoch 885 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.886795 weight_norm_u: 25.218954 loss: 0.962315 grad_norm_before_clip: 4.132391 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 03:31:47,369 - TRAIN-LOGGER - INFO - Epoch 885 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.886795 weight_norm_u: 25.222990 loss: 0.959587 +RANK_0 - 2026-01-29 03:31:52,024 - TRAIN-LOGGER - INFO - Epoch 886 - TRAIN - Minibatch 0: weight_norm_model: 143.886795 loss: 0.959587 grad_norm_before_clip: 1.385040 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 03:31:53,499 - TRAIN-LOGGER - INFO - Epoch 886 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.886795 weight_norm_u: 25.218954 loss: 0.959587 grad_norm_before_clip: 1.385040 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 03:31:53,500 - TRAIN-LOGGER - INFO - Epoch 886 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.886810 weight_norm_u: 25.222990 loss: 0.961163 +RANK_0 - 2026-01-29 03:31:59,051 - TRAIN-LOGGER - INFO - Epoch 887 - TRAIN - Minibatch 0: weight_norm_model: 143.886810 loss: 0.961163 grad_norm_before_clip: 3.907132 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 03:32:00,269 - TRAIN-LOGGER - INFO - Epoch 887 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.886810 weight_norm_u: 25.218954 loss: 0.961163 grad_norm_before_clip: 3.907132 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 03:32:00,269 - TRAIN-LOGGER - INFO - Epoch 887 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.886826 weight_norm_u: 25.222990 loss: 0.961568 +RANK_0 - 2026-01-29 03:32:05,274 - TRAIN-LOGGER - INFO - Epoch 888 - TRAIN - Minibatch 0: weight_norm_model: 143.886826 loss: 0.961568 grad_norm_before_clip: 2.123415 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 03:32:06,537 - TRAIN-LOGGER - INFO - Epoch 888 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.886826 weight_norm_u: 25.218954 loss: 0.961568 grad_norm_before_clip: 2.123415 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 03:32:06,538 - TRAIN-LOGGER - INFO - Epoch 888 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.886841 weight_norm_u: 25.222990 loss: 0.961578 +RANK_0 - 2026-01-29 03:32:11,100 - TRAIN-LOGGER - INFO - Epoch 889 - TRAIN - Minibatch 0: weight_norm_model: 143.886841 loss: 0.961578 grad_norm_before_clip: 1.575665 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 03:32:12,557 - TRAIN-LOGGER - INFO - Epoch 889 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.886841 weight_norm_u: 25.218954 loss: 0.961578 grad_norm_before_clip: 1.575665 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 03:32:12,557 - TRAIN-LOGGER - INFO - Epoch 889 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.886826 weight_norm_u: 25.222990 loss: 0.962269 +RANK_0 - 2026-01-29 03:32:17,091 - TRAIN-LOGGER - INFO - Epoch 890 - TRAIN - Minibatch 0: weight_norm_model: 143.886826 loss: 0.962269 grad_norm_before_clip: 2.599125 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 03:32:18,379 - TRAIN-LOGGER - INFO - Epoch 890 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.886826 weight_norm_u: 25.218954 loss: 0.962269 grad_norm_before_clip: 2.599125 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 03:32:18,380 - TRAIN-LOGGER - INFO - Epoch 890 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.886841 weight_norm_u: 25.222990 loss: 0.960448 +RANK_0 - 2026-01-29 03:32:23,614 - TRAIN-LOGGER - INFO - Epoch 891 - TRAIN - Minibatch 0: weight_norm_model: 143.886841 loss: 0.960448 grad_norm_before_clip: 2.616516 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 03:32:24,786 - TRAIN-LOGGER - INFO - Epoch 891 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.886841 weight_norm_u: 25.218954 loss: 0.960448 grad_norm_before_clip: 2.616516 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 03:32:24,786 - TRAIN-LOGGER - INFO - Epoch 891 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.886856 weight_norm_u: 25.222990 loss: 0.964894 +RANK_0 - 2026-01-29 03:32:29,818 - TRAIN-LOGGER - INFO - Epoch 892 - TRAIN - Minibatch 0: weight_norm_model: 143.886856 loss: 0.964894 grad_norm_before_clip: 3.261361 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 03:32:31,031 - TRAIN-LOGGER - INFO - Epoch 892 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.886856 weight_norm_u: 25.218954 loss: 0.964894 grad_norm_before_clip: 3.261361 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 03:32:31,032 - TRAIN-LOGGER - INFO - Epoch 892 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.886856 weight_norm_u: 25.222990 loss: 0.964475 +RANK_0 - 2026-01-29 03:32:36,937 - TRAIN-LOGGER - INFO - Epoch 893 - TRAIN - Minibatch 0: weight_norm_model: 143.886856 loss: 0.964475 grad_norm_before_clip: 3.480285 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 03:32:38,422 - TRAIN-LOGGER - INFO - Epoch 893 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.886856 weight_norm_u: 25.218954 loss: 0.964475 grad_norm_before_clip: 3.480285 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 03:32:38,422 - TRAIN-LOGGER - INFO - Epoch 893 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.886871 weight_norm_u: 25.222990 loss: 0.962495 +RANK_0 - 2026-01-29 03:32:44,011 - TRAIN-LOGGER - INFO - Epoch 894 - TRAIN - Minibatch 0: weight_norm_model: 143.886871 loss: 0.962495 grad_norm_before_clip: 1.437302 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 03:32:45,256 - TRAIN-LOGGER - INFO - Epoch 894 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.886871 weight_norm_u: 25.218954 loss: 0.962495 grad_norm_before_clip: 1.437302 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 03:32:45,257 - TRAIN-LOGGER - INFO - Epoch 894 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.886871 weight_norm_u: 25.222990 loss: 0.962235 +RANK_0 - 2026-01-29 03:32:50,420 - TRAIN-LOGGER - INFO - Epoch 895 - TRAIN - Minibatch 0: weight_norm_model: 143.886871 loss: 0.962235 grad_norm_before_clip: 4.597721 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 03:32:51,551 - TRAIN-LOGGER - INFO - Epoch 895 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.886871 weight_norm_u: 25.218954 loss: 0.962235 grad_norm_before_clip: 4.597721 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 03:32:51,551 - TRAIN-LOGGER - INFO - Epoch 895 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.886871 weight_norm_u: 25.222990 loss: 0.961873 +RANK_0 - 2026-01-29 03:32:56,239 - TRAIN-LOGGER - INFO - Epoch 896 - TRAIN - Minibatch 0: weight_norm_model: 143.886871 loss: 0.961873 grad_norm_before_clip: 4.589036 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 03:32:57,449 - TRAIN-LOGGER - INFO - Epoch 896 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.886871 weight_norm_u: 25.218954 loss: 0.961873 grad_norm_before_clip: 4.589036 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 03:32:57,449 - TRAIN-LOGGER - INFO - Epoch 896 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.886871 weight_norm_u: 25.222990 loss: 0.961742 +RANK_0 - 2026-01-29 03:33:02,493 - TRAIN-LOGGER - INFO - Epoch 897 - TRAIN - Minibatch 0: weight_norm_model: 143.886871 loss: 0.961742 grad_norm_before_clip: 1.913543 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 03:33:03,635 - TRAIN-LOGGER - INFO - Epoch 897 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.886871 weight_norm_u: 25.218954 loss: 0.961742 grad_norm_before_clip: 1.913543 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 03:33:03,635 - TRAIN-LOGGER - INFO - Epoch 897 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.886887 weight_norm_u: 25.222990 loss: 0.963205 +RANK_0 - 2026-01-29 03:33:08,399 - TRAIN-LOGGER - INFO - Epoch 898 - TRAIN - Minibatch 0: weight_norm_model: 143.886887 loss: 0.963205 grad_norm_before_clip: 2.979088 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 03:33:09,659 - TRAIN-LOGGER - INFO - Epoch 898 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.886887 weight_norm_u: 25.218954 loss: 0.963205 grad_norm_before_clip: 2.979088 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 03:33:09,659 - TRAIN-LOGGER - INFO - Epoch 898 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.886902 weight_norm_u: 25.222990 loss: 0.963590 +RANK_0 - 2026-01-29 03:33:14,806 - TRAIN-LOGGER - INFO - Epoch 899 - TRAIN - Minibatch 0: weight_norm_model: 143.886902 loss: 0.963590 grad_norm_before_clip: 2.574538 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 03:33:16,199 - TRAIN-LOGGER - INFO - Epoch 899 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.886902 weight_norm_u: 25.218954 loss: 0.963590 grad_norm_before_clip: 2.574538 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 03:33:16,199 - TRAIN-LOGGER - INFO - Epoch 899 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.886902 weight_norm_u: 25.222990 loss: 0.959724 +RANK_0 - 2026-01-29 03:33:21,080 - TRAIN-LOGGER - INFO - Epoch 900 - TRAIN - Minibatch 0: weight_norm_model: 143.886902 loss: 0.959724 grad_norm_before_clip: 2.365716 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 03:33:22,217 - TRAIN-LOGGER - INFO - Epoch 900 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.886902 weight_norm_u: 25.218954 loss: 0.959724 grad_norm_before_clip: 2.365716 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 03:33:22,217 - TRAIN-LOGGER - INFO - Epoch 900 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.886871 weight_norm_u: 25.222990 loss: 0.963125 +RANK_0 - 2026-01-29 03:33:27,718 - TRAIN-LOGGER - INFO - Epoch 901 - TRAIN - Minibatch 0: weight_norm_model: 143.886871 loss: 0.963125 grad_norm_before_clip: 3.783918 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 03:33:28,888 - TRAIN-LOGGER - INFO - Epoch 901 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.886871 weight_norm_u: 25.218954 loss: 0.963125 grad_norm_before_clip: 3.783918 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 03:33:28,889 - TRAIN-LOGGER - INFO - Epoch 901 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.886871 weight_norm_u: 25.222990 loss: 0.964609 +RANK_0 - 2026-01-29 03:33:33,707 - TRAIN-LOGGER - INFO - Epoch 902 - TRAIN - Minibatch 0: weight_norm_model: 143.886871 loss: 0.964609 grad_norm_before_clip: 3.885970 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 03:33:34,889 - TRAIN-LOGGER - INFO - Epoch 902 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.886871 weight_norm_u: 25.218954 loss: 0.964609 grad_norm_before_clip: 3.885970 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 03:33:34,890 - TRAIN-LOGGER - INFO - Epoch 902 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.886871 weight_norm_u: 25.222990 loss: 0.962360 +RANK_0 - 2026-01-29 03:33:40,239 - TRAIN-LOGGER - INFO - Epoch 903 - TRAIN - Minibatch 0: weight_norm_model: 143.886871 loss: 0.962360 grad_norm_before_clip: 2.646041 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 03:33:41,394 - TRAIN-LOGGER - INFO - Epoch 903 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.886871 weight_norm_u: 25.218954 loss: 0.962360 grad_norm_before_clip: 2.646041 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 03:33:41,394 - TRAIN-LOGGER - INFO - Epoch 903 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.886902 weight_norm_u: 25.222990 loss: 0.960665 +RANK_0 - 2026-01-29 03:33:46,402 - TRAIN-LOGGER - INFO - Epoch 904 - TRAIN - Minibatch 0: weight_norm_model: 143.886902 loss: 0.960665 grad_norm_before_clip: 3.243022 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 03:33:47,581 - TRAIN-LOGGER - INFO - Epoch 904 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.886902 weight_norm_u: 25.218954 loss: 0.960665 grad_norm_before_clip: 3.243022 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 03:33:47,581 - TRAIN-LOGGER - INFO - Epoch 904 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.886917 weight_norm_u: 25.222990 loss: 0.961033 +RANK_0 - 2026-01-29 03:33:52,417 - TRAIN-LOGGER - INFO - Epoch 905 - TRAIN - Minibatch 0: weight_norm_model: 143.886917 loss: 0.961033 grad_norm_before_clip: 2.312501 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 03:33:53,563 - TRAIN-LOGGER - INFO - Epoch 905 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.886917 weight_norm_u: 25.218954 loss: 0.961033 grad_norm_before_clip: 2.312501 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 03:33:53,564 - TRAIN-LOGGER - INFO - Epoch 905 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.886932 weight_norm_u: 25.222990 loss: 0.960592 +RANK_0 - 2026-01-29 03:33:59,435 - TRAIN-LOGGER - INFO - Epoch 906 - TRAIN - Minibatch 0: weight_norm_model: 143.886932 loss: 0.960592 grad_norm_before_clip: 2.424163 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 03:34:00,608 - TRAIN-LOGGER - INFO - Epoch 906 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.886932 weight_norm_u: 25.218954 loss: 0.960592 grad_norm_before_clip: 2.424163 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 03:34:00,609 - TRAIN-LOGGER - INFO - Epoch 906 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.886917 weight_norm_u: 25.222990 loss: 0.960526 +RANK_0 - 2026-01-29 03:34:07,000 - TRAIN-LOGGER - INFO - Epoch 907 - TRAIN - Minibatch 0: weight_norm_model: 143.886917 loss: 0.960526 grad_norm_before_clip: 1.613612 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 03:34:08,293 - TRAIN-LOGGER - INFO - Epoch 907 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.886917 weight_norm_u: 25.218954 loss: 0.960526 grad_norm_before_clip: 1.613612 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 03:34:08,293 - TRAIN-LOGGER - INFO - Epoch 907 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.886917 weight_norm_u: 25.222990 loss: 0.960030 +RANK_0 - 2026-01-29 03:34:13,945 - TRAIN-LOGGER - INFO - Epoch 908 - TRAIN - Minibatch 0: weight_norm_model: 143.886917 loss: 0.960030 grad_norm_before_clip: 1.758814 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 03:34:15,184 - TRAIN-LOGGER - INFO - Epoch 908 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.886917 weight_norm_u: 25.218954 loss: 0.960030 grad_norm_before_clip: 1.758814 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 03:34:15,184 - TRAIN-LOGGER - INFO - Epoch 908 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.886917 weight_norm_u: 25.222990 loss: 0.961262 +RANK_0 - 2026-01-29 03:34:20,382 - TRAIN-LOGGER - INFO - Epoch 909 - TRAIN - Minibatch 0: weight_norm_model: 143.886917 loss: 0.961262 grad_norm_before_clip: 2.634879 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 03:34:21,545 - TRAIN-LOGGER - INFO - Epoch 909 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.886917 weight_norm_u: 25.218954 loss: 0.961262 grad_norm_before_clip: 2.634879 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 03:34:21,545 - TRAIN-LOGGER - INFO - Epoch 909 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.886932 weight_norm_u: 25.222990 loss: 0.963191 +RANK_0 - 2026-01-29 03:34:26,210 - TRAIN-LOGGER - INFO - Epoch 910 - TRAIN - Minibatch 0: weight_norm_model: 143.886932 loss: 0.963191 grad_norm_before_clip: 2.581639 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 03:34:27,359 - TRAIN-LOGGER - INFO - Epoch 910 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.886932 weight_norm_u: 25.218954 loss: 0.963191 grad_norm_before_clip: 2.581639 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 03:34:27,359 - TRAIN-LOGGER - INFO - Epoch 910 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.886917 weight_norm_u: 25.222990 loss: 0.962840 +RANK_0 - 2026-01-29 03:34:31,897 - TRAIN-LOGGER - INFO - Epoch 911 - TRAIN - Minibatch 0: weight_norm_model: 143.886917 loss: 0.962840 grad_norm_before_clip: 2.787203 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 03:34:33,047 - TRAIN-LOGGER - INFO - Epoch 911 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.886917 weight_norm_u: 25.218954 loss: 0.962840 grad_norm_before_clip: 2.787203 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 03:34:33,047 - TRAIN-LOGGER - INFO - Epoch 911 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.886917 weight_norm_u: 25.222990 loss: 0.963662 +RANK_0 - 2026-01-29 03:34:37,845 - TRAIN-LOGGER - INFO - Epoch 912 - TRAIN - Minibatch 0: weight_norm_model: 143.886917 loss: 0.963662 grad_norm_before_clip: 3.543651 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 03:34:39,014 - TRAIN-LOGGER - INFO - Epoch 912 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.886917 weight_norm_u: 25.218954 loss: 0.963662 grad_norm_before_clip: 3.543651 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 03:34:39,014 - TRAIN-LOGGER - INFO - Epoch 912 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.886917 weight_norm_u: 25.222990 loss: 0.963747 +RANK_0 - 2026-01-29 03:34:44,227 - TRAIN-LOGGER - INFO - Epoch 913 - TRAIN - Minibatch 0: weight_norm_model: 143.886917 loss: 0.963747 grad_norm_before_clip: 2.144165 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 03:34:45,451 - TRAIN-LOGGER - INFO - Epoch 913 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.886917 weight_norm_u: 25.218954 loss: 0.963747 grad_norm_before_clip: 2.144165 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 03:34:45,451 - TRAIN-LOGGER - INFO - Epoch 913 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.886932 weight_norm_u: 25.222990 loss: 0.962063 +RANK_0 - 2026-01-29 03:34:50,673 - TRAIN-LOGGER - INFO - Epoch 914 - TRAIN - Minibatch 0: weight_norm_model: 143.886932 loss: 0.962063 grad_norm_before_clip: 2.370787 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 03:34:51,939 - TRAIN-LOGGER - INFO - Epoch 914 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.886932 weight_norm_u: 25.218954 loss: 0.962063 grad_norm_before_clip: 2.370787 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 03:34:51,939 - TRAIN-LOGGER - INFO - Epoch 914 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.886932 weight_norm_u: 25.222990 loss: 0.962240 +RANK_0 - 2026-01-29 03:34:56,865 - TRAIN-LOGGER - INFO - Epoch 915 - TRAIN - Minibatch 0: weight_norm_model: 143.886932 loss: 0.962240 grad_norm_before_clip: 2.424797 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 03:34:58,070 - TRAIN-LOGGER - INFO - Epoch 915 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.886932 weight_norm_u: 25.218954 loss: 0.962240 grad_norm_before_clip: 2.424797 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 03:34:58,070 - TRAIN-LOGGER - INFO - Epoch 915 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.886948 weight_norm_u: 25.222990 loss: 0.961424 +RANK_0 - 2026-01-29 03:35:03,001 - TRAIN-LOGGER - INFO - Epoch 916 - TRAIN - Minibatch 0: weight_norm_model: 143.886948 loss: 0.961424 grad_norm_before_clip: 1.807456 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 03:35:04,127 - TRAIN-LOGGER - INFO - Epoch 916 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.886948 weight_norm_u: 25.218954 loss: 0.961424 grad_norm_before_clip: 1.807456 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 03:35:04,127 - TRAIN-LOGGER - INFO - Epoch 916 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.886948 weight_norm_u: 25.222990 loss: 0.961100 +RANK_0 - 2026-01-29 03:35:09,346 - TRAIN-LOGGER - INFO - Epoch 917 - TRAIN - Minibatch 0: weight_norm_model: 143.886948 loss: 0.961100 grad_norm_before_clip: 1.965312 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 03:35:10,586 - TRAIN-LOGGER - INFO - Epoch 917 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.886948 weight_norm_u: 25.218954 loss: 0.961100 grad_norm_before_clip: 1.965312 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 03:35:10,586 - TRAIN-LOGGER - INFO - Epoch 917 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.886948 weight_norm_u: 25.222990 loss: 0.962944 +RANK_0 - 2026-01-29 03:35:15,843 - TRAIN-LOGGER - INFO - Epoch 918 - TRAIN - Minibatch 0: weight_norm_model: 143.886948 loss: 0.962944 grad_norm_before_clip: 4.092215 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 03:35:17,116 - TRAIN-LOGGER - INFO - Epoch 918 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.886948 weight_norm_u: 25.218954 loss: 0.962944 grad_norm_before_clip: 4.092215 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 03:35:17,116 - TRAIN-LOGGER - INFO - Epoch 918 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.886963 weight_norm_u: 25.222990 loss: 0.961990 +RANK_0 - 2026-01-29 03:35:21,932 - TRAIN-LOGGER - INFO - Epoch 919 - TRAIN - Minibatch 0: weight_norm_model: 143.886963 loss: 0.961990 grad_norm_before_clip: 3.442432 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 03:35:23,182 - TRAIN-LOGGER - INFO - Epoch 919 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.886963 weight_norm_u: 25.218954 loss: 0.961990 grad_norm_before_clip: 3.442432 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 03:35:23,182 - TRAIN-LOGGER - INFO - Epoch 919 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.886978 weight_norm_u: 25.222990 loss: 0.961178 +RANK_0 - 2026-01-29 03:35:28,464 - TRAIN-LOGGER - INFO - Epoch 920 - TRAIN - Minibatch 0: weight_norm_model: 143.886978 loss: 0.961178 grad_norm_before_clip: 2.913368 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 03:35:29,596 - TRAIN-LOGGER - INFO - Epoch 920 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.886978 weight_norm_u: 25.218954 loss: 0.961178 grad_norm_before_clip: 2.913368 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 03:35:29,596 - TRAIN-LOGGER - INFO - Epoch 920 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.886993 weight_norm_u: 25.222990 loss: 0.960342 +RANK_0 - 2026-01-29 03:35:34,574 - TRAIN-LOGGER - INFO - Epoch 921 - TRAIN - Minibatch 0: weight_norm_model: 143.886993 loss: 0.960342 grad_norm_before_clip: 1.684354 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 03:35:35,810 - TRAIN-LOGGER - INFO - Epoch 921 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.886993 weight_norm_u: 25.218954 loss: 0.960342 grad_norm_before_clip: 1.684354 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 03:35:35,810 - TRAIN-LOGGER - INFO - Epoch 921 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.886993 weight_norm_u: 25.222990 loss: 0.962363 +RANK_0 - 2026-01-29 03:35:40,801 - TRAIN-LOGGER - INFO - Epoch 922 - TRAIN - Minibatch 0: weight_norm_model: 143.886993 loss: 0.962363 grad_norm_before_clip: 4.057831 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 03:35:42,007 - TRAIN-LOGGER - INFO - Epoch 922 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.886993 weight_norm_u: 25.218954 loss: 0.962363 grad_norm_before_clip: 4.057831 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 03:35:42,007 - TRAIN-LOGGER - INFO - Epoch 922 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.886978 weight_norm_u: 25.222990 loss: 0.961118 +RANK_0 - 2026-01-29 03:35:46,931 - TRAIN-LOGGER - INFO - Epoch 923 - TRAIN - Minibatch 0: weight_norm_model: 143.886978 loss: 0.961118 grad_norm_before_clip: 2.055193 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 03:35:48,117 - TRAIN-LOGGER - INFO - Epoch 923 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.886978 weight_norm_u: 25.218954 loss: 0.961118 grad_norm_before_clip: 2.055193 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 03:35:48,118 - TRAIN-LOGGER - INFO - Epoch 923 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.886993 weight_norm_u: 25.222990 loss: 0.960355 +RANK_0 - 2026-01-29 03:35:53,207 - TRAIN-LOGGER - INFO - Epoch 924 - TRAIN - Minibatch 0: weight_norm_model: 143.886993 loss: 0.960355 grad_norm_before_clip: 1.414412 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 03:35:54,410 - TRAIN-LOGGER - INFO - Epoch 924 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.886993 weight_norm_u: 25.218954 loss: 0.960355 grad_norm_before_clip: 1.414412 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 03:35:54,410 - TRAIN-LOGGER - INFO - Epoch 924 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.886993 weight_norm_u: 25.222990 loss: 0.961179 +RANK_0 - 2026-01-29 03:35:59,384 - TRAIN-LOGGER - INFO - Epoch 925 - TRAIN - Minibatch 0: weight_norm_model: 143.886993 loss: 0.961179 grad_norm_before_clip: 2.571180 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 03:36:00,782 - TRAIN-LOGGER - INFO - Epoch 925 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.886993 weight_norm_u: 25.218954 loss: 0.961179 grad_norm_before_clip: 2.571180 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 03:36:00,782 - TRAIN-LOGGER - INFO - Epoch 925 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.886993 weight_norm_u: 25.222990 loss: 0.962858 +RANK_0 - 2026-01-29 03:36:05,412 - TRAIN-LOGGER - INFO - Epoch 926 - TRAIN - Minibatch 0: weight_norm_model: 143.886993 loss: 0.962858 grad_norm_before_clip: 3.242494 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 03:36:06,767 - TRAIN-LOGGER - INFO - Epoch 926 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.886993 weight_norm_u: 25.218954 loss: 0.962858 grad_norm_before_clip: 3.242494 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 03:36:06,767 - TRAIN-LOGGER - INFO - Epoch 926 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.887024 weight_norm_u: 25.222990 loss: 0.960002 +RANK_0 - 2026-01-29 03:36:11,415 - TRAIN-LOGGER - INFO - Epoch 927 - TRAIN - Minibatch 0: weight_norm_model: 143.887024 loss: 0.960002 grad_norm_before_clip: 2.537240 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 03:36:12,762 - TRAIN-LOGGER - INFO - Epoch 927 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.887024 weight_norm_u: 25.218954 loss: 0.960002 grad_norm_before_clip: 2.537240 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 03:36:12,763 - TRAIN-LOGGER - INFO - Epoch 927 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.887054 weight_norm_u: 25.222990 loss: 0.959863 +RANK_0 - 2026-01-29 03:36:17,772 - TRAIN-LOGGER - INFO - Epoch 928 - TRAIN - Minibatch 0: weight_norm_model: 143.887054 loss: 0.959863 grad_norm_before_clip: 2.132746 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 03:36:19,162 - TRAIN-LOGGER - INFO - Epoch 928 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.887054 weight_norm_u: 25.218954 loss: 0.959863 grad_norm_before_clip: 2.132746 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 03:36:19,172 - TRAIN-LOGGER - INFO - Epoch 928 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.887054 weight_norm_u: 25.222990 loss: 0.961294 +RANK_0 - 2026-01-29 03:36:24,110 - TRAIN-LOGGER - INFO - Epoch 929 - TRAIN - Minibatch 0: weight_norm_model: 143.887054 loss: 0.961294 grad_norm_before_clip: 2.976191 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 03:36:25,603 - TRAIN-LOGGER - INFO - Epoch 929 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.887054 weight_norm_u: 25.218954 loss: 0.961294 grad_norm_before_clip: 2.976191 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 03:36:25,603 - TRAIN-LOGGER - INFO - Epoch 929 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.887070 weight_norm_u: 25.222990 loss: 0.960209 +RANK_0 - 2026-01-29 03:36:30,255 - TRAIN-LOGGER - INFO - Epoch 930 - TRAIN - Minibatch 0: weight_norm_model: 143.887070 loss: 0.960209 grad_norm_before_clip: 1.861522 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 03:36:31,888 - TRAIN-LOGGER - INFO - Epoch 930 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.887070 weight_norm_u: 25.218954 loss: 0.960209 grad_norm_before_clip: 1.861522 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 03:36:31,888 - TRAIN-LOGGER - INFO - Epoch 930 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.887070 weight_norm_u: 25.222990 loss: 0.959060 +RANK_0 - 2026-01-29 03:36:37,320 - TRAIN-LOGGER - INFO - Epoch 931 - TRAIN - Minibatch 0: weight_norm_model: 143.887070 loss: 0.959060 grad_norm_before_clip: 1.586545 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 03:36:38,549 - TRAIN-LOGGER - INFO - Epoch 931 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.887070 weight_norm_u: 25.218954 loss: 0.959060 grad_norm_before_clip: 1.586545 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 03:36:38,550 - TRAIN-LOGGER - INFO - Epoch 931 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.887070 weight_norm_u: 25.222990 loss: 0.961325 +RANK_0 - 2026-01-29 03:36:43,702 - TRAIN-LOGGER - INFO - Epoch 932 - TRAIN - Minibatch 0: weight_norm_model: 143.887070 loss: 0.961325 grad_norm_before_clip: 2.673699 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 03:36:44,874 - TRAIN-LOGGER - INFO - Epoch 932 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.887070 weight_norm_u: 25.218954 loss: 0.961325 grad_norm_before_clip: 2.673699 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 03:36:44,874 - TRAIN-LOGGER - INFO - Epoch 932 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.887085 weight_norm_u: 25.222990 loss: 0.963280 +RANK_0 - 2026-01-29 03:36:49,315 - TRAIN-LOGGER - INFO - Epoch 933 - TRAIN - Minibatch 0: weight_norm_model: 143.887085 loss: 0.963280 grad_norm_before_clip: 2.734359 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 03:36:50,762 - TRAIN-LOGGER - INFO - Epoch 933 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.887085 weight_norm_u: 25.218954 loss: 0.963280 grad_norm_before_clip: 2.734359 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 03:36:50,762 - TRAIN-LOGGER - INFO - Epoch 933 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.887085 weight_norm_u: 25.222990 loss: 0.960464 +RANK_0 - 2026-01-29 03:36:55,109 - TRAIN-LOGGER - INFO - Epoch 934 - TRAIN - Minibatch 0: weight_norm_model: 143.887085 loss: 0.960464 grad_norm_before_clip: 1.467174 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 03:36:56,643 - TRAIN-LOGGER - INFO - Epoch 934 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.887085 weight_norm_u: 25.218954 loss: 0.960464 grad_norm_before_clip: 1.467174 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 03:36:56,643 - TRAIN-LOGGER - INFO - Epoch 934 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.887100 weight_norm_u: 25.222990 loss: 0.962673 +RANK_0 - 2026-01-29 03:37:01,561 - TRAIN-LOGGER - INFO - Epoch 935 - TRAIN - Minibatch 0: weight_norm_model: 143.887100 loss: 0.962673 grad_norm_before_clip: 3.608886 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 03:37:02,969 - TRAIN-LOGGER - INFO - Epoch 935 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.887100 weight_norm_u: 25.218954 loss: 0.962673 grad_norm_before_clip: 3.608886 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 03:37:02,969 - TRAIN-LOGGER - INFO - Epoch 935 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.887100 weight_norm_u: 25.222990 loss: 0.961667 +RANK_0 - 2026-01-29 03:37:07,581 - TRAIN-LOGGER - INFO - Epoch 936 - TRAIN - Minibatch 0: weight_norm_model: 143.887100 loss: 0.961667 grad_norm_before_clip: 3.332231 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 03:37:09,059 - TRAIN-LOGGER - INFO - Epoch 936 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.887100 weight_norm_u: 25.218954 loss: 0.961667 grad_norm_before_clip: 3.332231 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 03:37:09,060 - TRAIN-LOGGER - INFO - Epoch 936 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.887115 weight_norm_u: 25.222990 loss: 0.961376 +RANK_0 - 2026-01-29 03:37:13,916 - TRAIN-LOGGER - INFO - Epoch 937 - TRAIN - Minibatch 0: weight_norm_model: 143.887115 loss: 0.961376 grad_norm_before_clip: 2.299352 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 03:37:15,365 - TRAIN-LOGGER - INFO - Epoch 937 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.887115 weight_norm_u: 25.218954 loss: 0.961376 grad_norm_before_clip: 2.299352 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 03:37:15,366 - TRAIN-LOGGER - INFO - Epoch 937 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.887115 weight_norm_u: 25.222990 loss: 0.960941 +RANK_0 - 2026-01-29 03:37:20,075 - TRAIN-LOGGER - INFO - Epoch 938 - TRAIN - Minibatch 0: weight_norm_model: 143.887115 loss: 0.960941 grad_norm_before_clip: 1.953769 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 03:37:21,631 - TRAIN-LOGGER - INFO - Epoch 938 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.887115 weight_norm_u: 25.218954 loss: 0.960941 grad_norm_before_clip: 1.953769 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 03:37:21,631 - TRAIN-LOGGER - INFO - Epoch 938 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.887131 weight_norm_u: 25.222990 loss: 0.958695 +RANK_0 - 2026-01-29 03:37:26,613 - TRAIN-LOGGER - INFO - Epoch 939 - TRAIN - Minibatch 0: weight_norm_model: 143.887131 loss: 0.958695 grad_norm_before_clip: 1.589119 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 03:37:28,050 - TRAIN-LOGGER - INFO - Epoch 939 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.887131 weight_norm_u: 25.218954 loss: 0.958695 grad_norm_before_clip: 1.589119 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 03:37:28,051 - TRAIN-LOGGER - INFO - Epoch 939 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.887146 weight_norm_u: 25.222990 loss: 0.961134 +RANK_0 - 2026-01-29 03:37:32,788 - TRAIN-LOGGER - INFO - Epoch 940 - TRAIN - Minibatch 0: weight_norm_model: 143.887146 loss: 0.961134 grad_norm_before_clip: 3.626868 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 03:37:34,209 - TRAIN-LOGGER - INFO - Epoch 940 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.887146 weight_norm_u: 25.218954 loss: 0.961134 grad_norm_before_clip: 3.626868 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 03:37:34,210 - TRAIN-LOGGER - INFO - Epoch 940 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.887146 weight_norm_u: 25.222990 loss: 0.963591 +RANK_0 - 2026-01-29 03:37:38,869 - TRAIN-LOGGER - INFO - Epoch 941 - TRAIN - Minibatch 0: weight_norm_model: 143.887146 loss: 0.963591 grad_norm_before_clip: 2.914194 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 03:37:40,132 - TRAIN-LOGGER - INFO - Epoch 941 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.887146 weight_norm_u: 25.218954 loss: 0.963591 grad_norm_before_clip: 2.914194 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 03:37:40,132 - TRAIN-LOGGER - INFO - Epoch 941 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.887161 weight_norm_u: 25.222990 loss: 0.962652 +RANK_0 - 2026-01-29 03:37:44,790 - TRAIN-LOGGER - INFO - Epoch 942 - TRAIN - Minibatch 0: weight_norm_model: 143.887161 loss: 0.962652 grad_norm_before_clip: 3.217615 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 03:37:46,034 - TRAIN-LOGGER - INFO - Epoch 942 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.887161 weight_norm_u: 25.218954 loss: 0.962652 grad_norm_before_clip: 3.217615 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 03:37:46,035 - TRAIN-LOGGER - INFO - Epoch 942 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.887177 weight_norm_u: 25.222990 loss: 0.959937 +RANK_0 - 2026-01-29 03:37:51,038 - TRAIN-LOGGER - INFO - Epoch 943 - TRAIN - Minibatch 0: weight_norm_model: 143.887177 loss: 0.959937 grad_norm_before_clip: 2.064863 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 03:37:52,272 - TRAIN-LOGGER - INFO - Epoch 943 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.887177 weight_norm_u: 25.218954 loss: 0.959937 grad_norm_before_clip: 2.064863 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 03:37:52,272 - TRAIN-LOGGER - INFO - Epoch 943 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.887192 weight_norm_u: 25.222990 loss: 0.963530 +RANK_0 - 2026-01-29 03:37:57,389 - TRAIN-LOGGER - INFO - Epoch 944 - TRAIN - Minibatch 0: weight_norm_model: 143.887192 loss: 0.963530 grad_norm_before_clip: 5.019339 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 03:37:58,520 - TRAIN-LOGGER - INFO - Epoch 944 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.887192 weight_norm_u: 25.218954 loss: 0.963530 grad_norm_before_clip: 5.019339 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 03:37:58,520 - TRAIN-LOGGER - INFO - Epoch 944 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.887222 weight_norm_u: 25.222990 loss: 0.967710 +RANK_0 - 2026-01-29 03:38:04,061 - TRAIN-LOGGER - INFO - Epoch 945 - TRAIN - Minibatch 0: weight_norm_model: 143.887222 loss: 0.967710 grad_norm_before_clip: 6.264490 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 03:38:05,306 - TRAIN-LOGGER - INFO - Epoch 945 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.887222 weight_norm_u: 25.218954 loss: 0.967710 grad_norm_before_clip: 6.264490 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 03:38:05,306 - TRAIN-LOGGER - INFO - Epoch 945 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.887238 weight_norm_u: 25.222990 loss: 0.965845 +RANK_0 - 2026-01-29 03:38:09,893 - TRAIN-LOGGER - INFO - Epoch 946 - TRAIN - Minibatch 0: weight_norm_model: 143.887238 loss: 0.965845 grad_norm_before_clip: 4.283548 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 03:38:11,038 - TRAIN-LOGGER - INFO - Epoch 946 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.887238 weight_norm_u: 25.218954 loss: 0.965845 grad_norm_before_clip: 4.283548 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 03:38:11,038 - TRAIN-LOGGER - INFO - Epoch 946 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.887238 weight_norm_u: 25.222990 loss: 0.962634 +RANK_0 - 2026-01-29 03:38:15,716 - TRAIN-LOGGER - INFO - Epoch 947 - TRAIN - Minibatch 0: weight_norm_model: 143.887238 loss: 0.962634 grad_norm_before_clip: 1.763221 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 03:38:16,863 - TRAIN-LOGGER - INFO - Epoch 947 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.887238 weight_norm_u: 25.218954 loss: 0.962634 grad_norm_before_clip: 1.763221 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 03:38:16,863 - TRAIN-LOGGER - INFO - Epoch 947 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.887238 weight_norm_u: 25.222990 loss: 0.964832 +RANK_0 - 2026-01-29 03:38:21,026 - TRAIN-LOGGER - INFO - Epoch 948 - TRAIN - Minibatch 0: weight_norm_model: 143.887238 loss: 0.964832 grad_norm_before_clip: 3.835352 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 03:38:22,458 - TRAIN-LOGGER - INFO - Epoch 948 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.887238 weight_norm_u: 25.218954 loss: 0.964832 grad_norm_before_clip: 3.835352 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 03:38:22,458 - TRAIN-LOGGER - INFO - Epoch 948 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.887238 weight_norm_u: 25.222990 loss: 0.964405 +RANK_0 - 2026-01-29 03:38:27,197 - TRAIN-LOGGER - INFO - Epoch 949 - TRAIN - Minibatch 0: weight_norm_model: 143.887238 loss: 0.964405 grad_norm_before_clip: 3.931897 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 03:38:28,541 - TRAIN-LOGGER - INFO - Epoch 949 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.887238 weight_norm_u: 25.218954 loss: 0.964405 grad_norm_before_clip: 3.931897 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 03:38:28,542 - TRAIN-LOGGER - INFO - Epoch 949 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.887238 weight_norm_u: 25.222990 loss: 0.962002 +RANK_0 - 2026-01-29 03:38:33,604 - TRAIN-LOGGER - INFO - Epoch 950 - TRAIN - Minibatch 0: weight_norm_model: 143.887238 loss: 0.962002 grad_norm_before_clip: 2.183112 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 03:38:34,837 - TRAIN-LOGGER - INFO - Epoch 950 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.887238 weight_norm_u: 25.218954 loss: 0.962002 grad_norm_before_clip: 2.183112 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 03:38:34,837 - TRAIN-LOGGER - INFO - Epoch 950 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.887268 weight_norm_u: 25.222990 loss: 0.960864 +RANK_0 - 2026-01-29 03:38:39,697 - TRAIN-LOGGER - INFO - Epoch 951 - TRAIN - Minibatch 0: weight_norm_model: 143.887268 loss: 0.960864 grad_norm_before_clip: 3.266902 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 03:38:40,961 - TRAIN-LOGGER - INFO - Epoch 951 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.887268 weight_norm_u: 25.218954 loss: 0.960864 grad_norm_before_clip: 3.266902 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 03:38:40,961 - TRAIN-LOGGER - INFO - Epoch 951 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.887283 weight_norm_u: 25.222990 loss: 0.964119 +RANK_0 - 2026-01-29 03:38:45,905 - TRAIN-LOGGER - INFO - Epoch 952 - TRAIN - Minibatch 0: weight_norm_model: 143.887283 loss: 0.964119 grad_norm_before_clip: 4.056335 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 03:38:47,091 - TRAIN-LOGGER - INFO - Epoch 952 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.887283 weight_norm_u: 25.218954 loss: 0.964119 grad_norm_before_clip: 4.056335 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 03:38:47,091 - TRAIN-LOGGER - INFO - Epoch 952 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.887299 weight_norm_u: 25.222990 loss: 0.960951 +RANK_0 - 2026-01-29 03:38:51,749 - TRAIN-LOGGER - INFO - Epoch 953 - TRAIN - Minibatch 0: weight_norm_model: 143.887299 loss: 0.960951 grad_norm_before_clip: 2.846820 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 03:38:52,993 - TRAIN-LOGGER - INFO - Epoch 953 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.887299 weight_norm_u: 25.218954 loss: 0.960951 grad_norm_before_clip: 2.846820 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 03:38:52,994 - TRAIN-LOGGER - INFO - Epoch 953 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.887299 weight_norm_u: 25.222990 loss: 0.962222 +RANK_0 - 2026-01-29 03:38:58,522 - TRAIN-LOGGER - INFO - Epoch 954 - TRAIN - Minibatch 0: weight_norm_model: 143.887299 loss: 0.962222 grad_norm_before_clip: 3.411536 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 03:38:59,704 - TRAIN-LOGGER - INFO - Epoch 954 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.887299 weight_norm_u: 25.218954 loss: 0.962222 grad_norm_before_clip: 3.411536 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 03:38:59,704 - TRAIN-LOGGER - INFO - Epoch 954 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.887283 weight_norm_u: 25.222990 loss: 0.963353 +RANK_0 - 2026-01-29 03:39:05,112 - TRAIN-LOGGER - INFO - Epoch 955 - TRAIN - Minibatch 0: weight_norm_model: 143.887283 loss: 0.963353 grad_norm_before_clip: 4.283216 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 03:39:06,390 - TRAIN-LOGGER - INFO - Epoch 955 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.887283 weight_norm_u: 25.218954 loss: 0.963353 grad_norm_before_clip: 4.283216 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 03:39:06,390 - TRAIN-LOGGER - INFO - Epoch 955 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.887283 weight_norm_u: 25.222990 loss: 0.963042 +RANK_0 - 2026-01-29 03:39:11,994 - TRAIN-LOGGER - INFO - Epoch 956 - TRAIN - Minibatch 0: weight_norm_model: 143.887283 loss: 0.963042 grad_norm_before_clip: 3.486077 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 03:39:13,225 - TRAIN-LOGGER - INFO - Epoch 956 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.887283 weight_norm_u: 25.218954 loss: 0.963042 grad_norm_before_clip: 3.486077 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 03:39:13,225 - TRAIN-LOGGER - INFO - Epoch 956 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.887283 weight_norm_u: 25.222990 loss: 0.962740 +RANK_0 - 2026-01-29 03:39:18,440 - TRAIN-LOGGER - INFO - Epoch 957 - TRAIN - Minibatch 0: weight_norm_model: 143.887283 loss: 0.962740 grad_norm_before_clip: 4.362058 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 03:39:19,684 - TRAIN-LOGGER - INFO - Epoch 957 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.887283 weight_norm_u: 25.218954 loss: 0.962740 grad_norm_before_clip: 4.362058 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 03:39:19,684 - TRAIN-LOGGER - INFO - Epoch 957 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.887299 weight_norm_u: 25.222990 loss: 0.960309 +RANK_0 - 2026-01-29 03:39:24,295 - TRAIN-LOGGER - INFO - Epoch 958 - TRAIN - Minibatch 0: weight_norm_model: 143.887299 loss: 0.960309 grad_norm_before_clip: 2.133935 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 03:39:25,770 - TRAIN-LOGGER - INFO - Epoch 958 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.887299 weight_norm_u: 25.218954 loss: 0.960309 grad_norm_before_clip: 2.133935 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 03:39:25,770 - TRAIN-LOGGER - INFO - Epoch 958 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.887299 weight_norm_u: 25.222990 loss: 0.960367 +RANK_0 - 2026-01-29 03:39:30,586 - TRAIN-LOGGER - INFO - Epoch 959 - TRAIN - Minibatch 0: weight_norm_model: 143.887299 loss: 0.960367 grad_norm_before_clip: 2.572952 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 03:39:31,923 - TRAIN-LOGGER - INFO - Epoch 959 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.887299 weight_norm_u: 25.218954 loss: 0.960367 grad_norm_before_clip: 2.572952 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 03:39:31,924 - TRAIN-LOGGER - INFO - Epoch 959 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.887299 weight_norm_u: 25.222990 loss: 0.961161 +RANK_0 - 2026-01-29 03:39:36,566 - TRAIN-LOGGER - INFO - Epoch 960 - TRAIN - Minibatch 0: weight_norm_model: 143.887299 loss: 0.961161 grad_norm_before_clip: 2.695760 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 03:39:37,737 - TRAIN-LOGGER - INFO - Epoch 960 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.887299 weight_norm_u: 25.218954 loss: 0.961161 grad_norm_before_clip: 2.695760 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 03:39:37,738 - TRAIN-LOGGER - INFO - Epoch 960 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.887268 weight_norm_u: 25.222990 loss: 0.959470 +RANK_0 - 2026-01-29 03:39:42,453 - TRAIN-LOGGER - INFO - Epoch 961 - TRAIN - Minibatch 0: weight_norm_model: 143.887268 loss: 0.959470 grad_norm_before_clip: 2.951218 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 03:39:43,579 - TRAIN-LOGGER - INFO - Epoch 961 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.887268 weight_norm_u: 25.218954 loss: 0.959470 grad_norm_before_clip: 2.951218 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 03:39:43,580 - TRAIN-LOGGER - INFO - Epoch 961 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.887268 weight_norm_u: 25.222990 loss: 0.959436 +RANK_0 - 2026-01-29 03:39:48,211 - TRAIN-LOGGER - INFO - Epoch 962 - TRAIN - Minibatch 0: weight_norm_model: 143.887268 loss: 0.959436 grad_norm_before_clip: 2.521066 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 03:39:49,358 - TRAIN-LOGGER - INFO - Epoch 962 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.887268 weight_norm_u: 25.218954 loss: 0.959436 grad_norm_before_clip: 2.521066 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 03:39:49,358 - TRAIN-LOGGER - INFO - Epoch 962 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.887283 weight_norm_u: 25.222990 loss: 0.958772 +RANK_0 - 2026-01-29 03:39:54,361 - TRAIN-LOGGER - INFO - Epoch 963 - TRAIN - Minibatch 0: weight_norm_model: 143.887283 loss: 0.958772 grad_norm_before_clip: 1.156909 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 03:39:55,584 - TRAIN-LOGGER - INFO - Epoch 963 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.887283 weight_norm_u: 25.218954 loss: 0.958772 grad_norm_before_clip: 1.156909 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 03:39:55,585 - TRAIN-LOGGER - INFO - Epoch 963 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.887299 weight_norm_u: 25.222990 loss: 0.961197 +RANK_0 - 2026-01-29 03:40:00,667 - TRAIN-LOGGER - INFO - Epoch 964 - TRAIN - Minibatch 0: weight_norm_model: 143.887299 loss: 0.961197 grad_norm_before_clip: 2.849513 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 03:40:01,832 - TRAIN-LOGGER - INFO - Epoch 964 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.887299 weight_norm_u: 25.218954 loss: 0.961197 grad_norm_before_clip: 2.849513 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 03:40:01,832 - TRAIN-LOGGER - INFO - Epoch 964 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.887314 weight_norm_u: 25.222990 loss: 0.961241 +RANK_0 - 2026-01-29 03:40:06,885 - TRAIN-LOGGER - INFO - Epoch 965 - TRAIN - Minibatch 0: weight_norm_model: 143.887314 loss: 0.961241 grad_norm_before_clip: 3.399744 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 03:40:08,039 - TRAIN-LOGGER - INFO - Epoch 965 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.887314 weight_norm_u: 25.218954 loss: 0.961241 grad_norm_before_clip: 3.399744 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 03:40:08,039 - TRAIN-LOGGER - INFO - Epoch 965 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.887314 weight_norm_u: 25.222990 loss: 0.962178 +RANK_0 - 2026-01-29 03:40:13,127 - TRAIN-LOGGER - INFO - Epoch 966 - TRAIN - Minibatch 0: weight_norm_model: 143.887314 loss: 0.962178 grad_norm_before_clip: 4.461299 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 03:40:14,358 - TRAIN-LOGGER - INFO - Epoch 966 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.887314 weight_norm_u: 25.218954 loss: 0.962178 grad_norm_before_clip: 4.461299 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 03:40:14,358 - TRAIN-LOGGER - INFO - Epoch 966 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.887314 weight_norm_u: 25.222990 loss: 0.960009 +RANK_0 - 2026-01-29 03:40:19,049 - TRAIN-LOGGER - INFO - Epoch 967 - TRAIN - Minibatch 0: weight_norm_model: 143.887314 loss: 0.960009 grad_norm_before_clip: 3.789791 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 03:40:20,460 - TRAIN-LOGGER - INFO - Epoch 967 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.887314 weight_norm_u: 25.218954 loss: 0.960009 grad_norm_before_clip: 3.789791 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 03:40:20,460 - TRAIN-LOGGER - INFO - Epoch 967 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.887329 weight_norm_u: 25.222990 loss: 0.960816 +RANK_0 - 2026-01-29 03:40:26,317 - TRAIN-LOGGER - INFO - Epoch 968 - TRAIN - Minibatch 0: weight_norm_model: 143.887329 loss: 0.960816 grad_norm_before_clip: 4.003795 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 03:40:27,719 - TRAIN-LOGGER - INFO - Epoch 968 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.887329 weight_norm_u: 25.218954 loss: 0.960816 grad_norm_before_clip: 4.003795 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 03:40:27,719 - TRAIN-LOGGER - INFO - Epoch 968 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.887344 weight_norm_u: 25.222990 loss: 0.959403 +RANK_0 - 2026-01-29 03:40:32,855 - TRAIN-LOGGER - INFO - Epoch 969 - TRAIN - Minibatch 0: weight_norm_model: 143.887344 loss: 0.959403 grad_norm_before_clip: 1.782708 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 03:40:34,244 - TRAIN-LOGGER - INFO - Epoch 969 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.887344 weight_norm_u: 25.218954 loss: 0.959403 grad_norm_before_clip: 1.782708 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 03:40:34,244 - TRAIN-LOGGER - INFO - Epoch 969 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.887360 weight_norm_u: 25.222990 loss: 0.959477 +RANK_0 - 2026-01-29 03:40:39,765 - TRAIN-LOGGER - INFO - Epoch 970 - TRAIN - Minibatch 0: weight_norm_model: 143.887360 loss: 0.959477 grad_norm_before_clip: 2.402660 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 03:40:41,281 - TRAIN-LOGGER - INFO - Epoch 970 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.887360 weight_norm_u: 25.218954 loss: 0.959477 grad_norm_before_clip: 2.402660 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 03:40:41,281 - TRAIN-LOGGER - INFO - Epoch 970 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.887360 weight_norm_u: 25.222990 loss: 0.960141 +RANK_0 - 2026-01-29 03:40:46,210 - TRAIN-LOGGER - INFO - Epoch 971 - TRAIN - Minibatch 0: weight_norm_model: 143.887360 loss: 0.960141 grad_norm_before_clip: 3.007742 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 03:40:47,690 - TRAIN-LOGGER - INFO - Epoch 971 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.887360 weight_norm_u: 25.218954 loss: 0.960141 grad_norm_before_clip: 3.007742 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 03:40:47,690 - TRAIN-LOGGER - INFO - Epoch 971 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.887360 weight_norm_u: 25.222990 loss: 0.958476 +RANK_0 - 2026-01-29 03:40:52,476 - TRAIN-LOGGER - INFO - Epoch 972 - TRAIN - Minibatch 0: weight_norm_model: 143.887360 loss: 0.958476 grad_norm_before_clip: 1.547223 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 03:40:53,869 - TRAIN-LOGGER - INFO - Epoch 972 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.887360 weight_norm_u: 25.218954 loss: 0.958476 grad_norm_before_clip: 1.547223 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 03:40:53,870 - TRAIN-LOGGER - INFO - Epoch 972 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.887360 weight_norm_u: 25.222990 loss: 0.960188 +RANK_0 - 2026-01-29 03:40:58,852 - TRAIN-LOGGER - INFO - Epoch 973 - TRAIN - Minibatch 0: weight_norm_model: 143.887360 loss: 0.960188 grad_norm_before_clip: 3.736833 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 03:41:00,039 - TRAIN-LOGGER - INFO - Epoch 973 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.887360 weight_norm_u: 25.218954 loss: 0.960188 grad_norm_before_clip: 3.736833 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 03:41:00,040 - TRAIN-LOGGER - INFO - Epoch 973 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.887360 weight_norm_u: 25.222990 loss: 0.959654 +RANK_0 - 2026-01-29 03:41:04,752 - TRAIN-LOGGER - INFO - Epoch 974 - TRAIN - Minibatch 0: weight_norm_model: 143.887360 loss: 0.959654 grad_norm_before_clip: 3.162237 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 03:41:05,992 - TRAIN-LOGGER - INFO - Epoch 974 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.887360 weight_norm_u: 25.218954 loss: 0.959654 grad_norm_before_clip: 3.162237 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 03:41:05,992 - TRAIN-LOGGER - INFO - Epoch 974 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.887390 weight_norm_u: 25.222990 loss: 0.958886 +RANK_0 - 2026-01-29 03:41:10,666 - TRAIN-LOGGER - INFO - Epoch 975 - TRAIN - Minibatch 0: weight_norm_model: 143.887390 loss: 0.958886 grad_norm_before_clip: 1.403814 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 03:41:11,917 - TRAIN-LOGGER - INFO - Epoch 975 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.887390 weight_norm_u: 25.218954 loss: 0.958886 grad_norm_before_clip: 1.403814 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 03:41:11,918 - TRAIN-LOGGER - INFO - Epoch 975 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.887421 weight_norm_u: 25.222990 loss: 0.961250 +RANK_0 - 2026-01-29 03:41:17,112 - TRAIN-LOGGER - INFO - Epoch 976 - TRAIN - Minibatch 0: weight_norm_model: 143.887421 loss: 0.961250 grad_norm_before_clip: 2.433443 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 03:41:18,243 - TRAIN-LOGGER - INFO - Epoch 976 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.887421 weight_norm_u: 25.218954 loss: 0.961250 grad_norm_before_clip: 2.433443 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 03:41:18,243 - TRAIN-LOGGER - INFO - Epoch 976 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.887421 weight_norm_u: 25.222990 loss: 0.961368 +RANK_0 - 2026-01-29 03:41:22,864 - TRAIN-LOGGER - INFO - Epoch 977 - TRAIN - Minibatch 0: weight_norm_model: 143.887421 loss: 0.961368 grad_norm_before_clip: 2.811039 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 03:41:24,053 - TRAIN-LOGGER - INFO - Epoch 977 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.887421 weight_norm_u: 25.218954 loss: 0.961368 grad_norm_before_clip: 2.811039 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 03:41:24,054 - TRAIN-LOGGER - INFO - Epoch 977 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.887421 weight_norm_u: 25.222990 loss: 0.959825 +RANK_0 - 2026-01-29 03:41:28,720 - TRAIN-LOGGER - INFO - Epoch 978 - TRAIN - Minibatch 0: weight_norm_model: 143.887421 loss: 0.959825 grad_norm_before_clip: 2.404871 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 03:41:29,916 - TRAIN-LOGGER - INFO - Epoch 978 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.887421 weight_norm_u: 25.218954 loss: 0.959825 grad_norm_before_clip: 2.404871 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 03:41:29,916 - TRAIN-LOGGER - INFO - Epoch 978 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.887405 weight_norm_u: 25.222990 loss: 0.960407 +RANK_0 - 2026-01-29 03:41:35,194 - TRAIN-LOGGER - INFO - Epoch 979 - TRAIN - Minibatch 0: weight_norm_model: 143.887405 loss: 0.960407 grad_norm_before_clip: 3.561311 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 03:41:36,316 - TRAIN-LOGGER - INFO - Epoch 979 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.887405 weight_norm_u: 25.218954 loss: 0.960407 grad_norm_before_clip: 3.561311 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 03:41:36,316 - TRAIN-LOGGER - INFO - Epoch 979 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.887405 weight_norm_u: 25.222990 loss: 0.961618 +RANK_0 - 2026-01-29 03:41:41,622 - TRAIN-LOGGER - INFO - Epoch 980 - TRAIN - Minibatch 0: weight_norm_model: 143.887405 loss: 0.961618 grad_norm_before_clip: 3.238375 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 03:41:43,049 - TRAIN-LOGGER - INFO - Epoch 980 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.887405 weight_norm_u: 25.218954 loss: 0.961618 grad_norm_before_clip: 3.238375 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 03:41:43,049 - TRAIN-LOGGER - INFO - Epoch 980 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.887421 weight_norm_u: 25.222990 loss: 0.959612 +RANK_0 - 2026-01-29 03:41:48,364 - TRAIN-LOGGER - INFO - Epoch 981 - TRAIN - Minibatch 0: weight_norm_model: 143.887421 loss: 0.959612 grad_norm_before_clip: 3.238917 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 03:41:49,602 - TRAIN-LOGGER - INFO - Epoch 981 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.887421 weight_norm_u: 25.218954 loss: 0.959612 grad_norm_before_clip: 3.238917 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 03:41:49,603 - TRAIN-LOGGER - INFO - Epoch 981 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.887436 weight_norm_u: 25.222990 loss: 0.958385 +RANK_0 - 2026-01-29 03:41:55,458 - TRAIN-LOGGER - INFO - Epoch 982 - TRAIN - Minibatch 0: weight_norm_model: 143.887436 loss: 0.958385 grad_norm_before_clip: 1.276771 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 03:41:56,851 - TRAIN-LOGGER - INFO - Epoch 982 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.887436 weight_norm_u: 25.218954 loss: 0.958385 grad_norm_before_clip: 1.276771 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 03:41:56,852 - TRAIN-LOGGER - INFO - Epoch 982 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.887466 weight_norm_u: 25.222990 loss: 0.962112 +RANK_0 - 2026-01-29 03:42:02,383 - TRAIN-LOGGER - INFO - Epoch 983 - TRAIN - Minibatch 0: weight_norm_model: 143.887466 loss: 0.962112 grad_norm_before_clip: 2.974057 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 03:42:03,626 - TRAIN-LOGGER - INFO - Epoch 983 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.887466 weight_norm_u: 25.218954 loss: 0.962112 grad_norm_before_clip: 2.974057 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 03:42:03,626 - TRAIN-LOGGER - INFO - Epoch 983 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.887482 weight_norm_u: 25.222990 loss: 0.966527 +RANK_0 - 2026-01-29 03:42:08,842 - TRAIN-LOGGER - INFO - Epoch 984 - TRAIN - Minibatch 0: weight_norm_model: 143.887482 loss: 0.966527 grad_norm_before_clip: 5.856460 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 03:42:10,056 - TRAIN-LOGGER - INFO - Epoch 984 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.887482 weight_norm_u: 25.218954 loss: 0.966527 grad_norm_before_clip: 5.856460 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 03:42:10,056 - TRAIN-LOGGER - INFO - Epoch 984 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.887466 weight_norm_u: 25.222990 loss: 0.964441 +RANK_0 - 2026-01-29 03:42:14,695 - TRAIN-LOGGER - INFO - Epoch 985 - TRAIN - Minibatch 0: weight_norm_model: 143.887466 loss: 0.964441 grad_norm_before_clip: 5.651469 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 03:42:15,987 - TRAIN-LOGGER - INFO - Epoch 985 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.887466 weight_norm_u: 25.218954 loss: 0.964441 grad_norm_before_clip: 5.651469 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 03:42:15,988 - TRAIN-LOGGER - INFO - Epoch 985 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.887451 weight_norm_u: 25.222990 loss: 0.959791 +RANK_0 - 2026-01-29 03:42:21,216 - TRAIN-LOGGER - INFO - Epoch 986 - TRAIN - Minibatch 0: weight_norm_model: 143.887451 loss: 0.959791 grad_norm_before_clip: 2.868711 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 03:42:22,456 - TRAIN-LOGGER - INFO - Epoch 986 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.887451 weight_norm_u: 25.218954 loss: 0.959791 grad_norm_before_clip: 2.868711 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 03:42:22,457 - TRAIN-LOGGER - INFO - Epoch 986 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.887421 weight_norm_u: 25.222990 loss: 0.960030 +RANK_0 - 2026-01-29 03:42:27,065 - TRAIN-LOGGER - INFO - Epoch 987 - TRAIN - Minibatch 0: weight_norm_model: 143.887421 loss: 0.960030 grad_norm_before_clip: 2.006663 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 03:42:28,284 - TRAIN-LOGGER - INFO - Epoch 987 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.887421 weight_norm_u: 25.218954 loss: 0.960030 grad_norm_before_clip: 2.006663 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 03:42:28,284 - TRAIN-LOGGER - INFO - Epoch 987 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.887421 weight_norm_u: 25.222990 loss: 0.961184 +RANK_0 - 2026-01-29 03:42:32,685 - TRAIN-LOGGER - INFO - Epoch 988 - TRAIN - Minibatch 0: weight_norm_model: 143.887421 loss: 0.961184 grad_norm_before_clip: 3.533265 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 03:42:33,820 - TRAIN-LOGGER - INFO - Epoch 988 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.887421 weight_norm_u: 25.218954 loss: 0.961184 grad_norm_before_clip: 3.533265 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 03:42:33,821 - TRAIN-LOGGER - INFO - Epoch 988 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.887421 weight_norm_u: 25.222990 loss: 0.960823 +RANK_0 - 2026-01-29 03:42:38,270 - TRAIN-LOGGER - INFO - Epoch 989 - TRAIN - Minibatch 0: weight_norm_model: 143.887421 loss: 0.960823 grad_norm_before_clip: 2.358714 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 03:42:39,514 - TRAIN-LOGGER - INFO - Epoch 989 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.887421 weight_norm_u: 25.218954 loss: 0.960823 grad_norm_before_clip: 2.358714 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 03:42:39,514 - TRAIN-LOGGER - INFO - Epoch 989 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.887436 weight_norm_u: 25.222990 loss: 0.959881 +RANK_0 - 2026-01-29 03:42:44,032 - TRAIN-LOGGER - INFO - Epoch 990 - TRAIN - Minibatch 0: weight_norm_model: 143.887436 loss: 0.959881 grad_norm_before_clip: 1.624120 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 03:42:45,424 - TRAIN-LOGGER - INFO - Epoch 990 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.887436 weight_norm_u: 25.218954 loss: 0.959881 grad_norm_before_clip: 1.624120 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 03:42:45,424 - TRAIN-LOGGER - INFO - Epoch 990 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.887451 weight_norm_u: 25.222990 loss: 0.959437 +RANK_0 - 2026-01-29 03:42:50,267 - TRAIN-LOGGER - INFO - Epoch 991 - TRAIN - Minibatch 0: weight_norm_model: 143.887451 loss: 0.959437 grad_norm_before_clip: 1.994508 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 03:42:51,719 - TRAIN-LOGGER - INFO - Epoch 991 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.887451 weight_norm_u: 25.218954 loss: 0.959437 grad_norm_before_clip: 1.994508 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 03:42:51,719 - TRAIN-LOGGER - INFO - Epoch 991 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.887451 weight_norm_u: 25.222990 loss: 0.961043 +RANK_0 - 2026-01-29 03:42:56,503 - TRAIN-LOGGER - INFO - Epoch 992 - TRAIN - Minibatch 0: weight_norm_model: 143.887451 loss: 0.961043 grad_norm_before_clip: 3.529848 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 03:42:57,718 - TRAIN-LOGGER - INFO - Epoch 992 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.887451 weight_norm_u: 25.218954 loss: 0.961043 grad_norm_before_clip: 3.529848 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 03:42:57,719 - TRAIN-LOGGER - INFO - Epoch 992 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.887436 weight_norm_u: 25.222990 loss: 0.958686 +RANK_0 - 2026-01-29 03:43:02,909 - TRAIN-LOGGER - INFO - Epoch 993 - TRAIN - Minibatch 0: weight_norm_model: 143.887436 loss: 0.958686 grad_norm_before_clip: 1.645943 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 03:43:04,019 - TRAIN-LOGGER - INFO - Epoch 993 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.887436 weight_norm_u: 25.218954 loss: 0.958686 grad_norm_before_clip: 1.645943 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 03:43:04,020 - TRAIN-LOGGER - INFO - Epoch 993 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.887436 weight_norm_u: 25.222990 loss: 0.959045 +RANK_0 - 2026-01-29 03:43:09,156 - TRAIN-LOGGER - INFO - Epoch 994 - TRAIN - Minibatch 0: weight_norm_model: 143.887436 loss: 0.959045 grad_norm_before_clip: 1.775999 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 03:43:10,364 - TRAIN-LOGGER - INFO - Epoch 994 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.887436 weight_norm_u: 25.218954 loss: 0.959045 grad_norm_before_clip: 1.775999 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 03:43:10,365 - TRAIN-LOGGER - INFO - Epoch 994 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.887466 weight_norm_u: 25.222990 loss: 0.959340 +RANK_0 - 2026-01-29 03:43:15,210 - TRAIN-LOGGER - INFO - Epoch 995 - TRAIN - Minibatch 0: weight_norm_model: 143.887466 loss: 0.959340 grad_norm_before_clip: 3.587066 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 03:43:16,748 - TRAIN-LOGGER - INFO - Epoch 995 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.887466 weight_norm_u: 25.218954 loss: 0.959340 grad_norm_before_clip: 3.587066 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 03:43:16,748 - TRAIN-LOGGER - INFO - Epoch 995 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.887482 weight_norm_u: 25.222990 loss: 0.959264 +RANK_0 - 2026-01-29 03:43:22,202 - TRAIN-LOGGER - INFO - Epoch 996 - TRAIN - Minibatch 0: weight_norm_model: 143.887482 loss: 0.959264 grad_norm_before_clip: 3.365089 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 03:43:23,366 - TRAIN-LOGGER - INFO - Epoch 996 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.887482 weight_norm_u: 25.218954 loss: 0.959264 grad_norm_before_clip: 3.365089 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 03:43:23,366 - TRAIN-LOGGER - INFO - Epoch 996 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.887497 weight_norm_u: 25.222990 loss: 0.959732 +RANK_0 - 2026-01-29 03:43:29,362 - TRAIN-LOGGER - INFO - Epoch 997 - TRAIN - Minibatch 0: weight_norm_model: 143.887497 loss: 0.959732 grad_norm_before_clip: 3.447457 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 03:43:30,534 - TRAIN-LOGGER - INFO - Epoch 997 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.887497 weight_norm_u: 25.218954 loss: 0.959732 grad_norm_before_clip: 3.447457 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 03:43:30,535 - TRAIN-LOGGER - INFO - Epoch 997 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.887512 weight_norm_u: 25.222990 loss: 0.959625 +RANK_0 - 2026-01-29 03:43:35,853 - TRAIN-LOGGER - INFO - Epoch 998 - TRAIN - Minibatch 0: weight_norm_model: 143.887512 loss: 0.959625 grad_norm_before_clip: 1.993957 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 03:43:37,105 - TRAIN-LOGGER - INFO - Epoch 998 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.887512 weight_norm_u: 25.218954 loss: 0.959625 grad_norm_before_clip: 1.993957 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 03:43:37,106 - TRAIN-LOGGER - INFO - Epoch 998 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.887527 weight_norm_u: 25.222990 loss: 0.959412 +RANK_0 - 2026-01-29 03:43:42,165 - TRAIN-LOGGER - INFO - Epoch 999 - TRAIN - Minibatch 0: weight_norm_model: 143.887527 loss: 0.959412 grad_norm_before_clip: 2.150079 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 03:43:43,563 - TRAIN-LOGGER - INFO - Epoch 999 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.887527 weight_norm_u: 25.218954 loss: 0.959412 grad_norm_before_clip: 2.150079 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 03:43:43,563 - TRAIN-LOGGER - INFO - Epoch 999 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.887527 weight_norm_u: 25.222990 loss: 0.959706 +RANK_0 - 2026-01-29 03:43:48,333 - TRAIN-LOGGER - INFO - Epoch 1000 - TRAIN - Minibatch 0: weight_norm_model: 143.887527 loss: 0.959706 grad_norm_before_clip: 2.199228 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 03:43:49,471 - TRAIN-LOGGER - INFO - Epoch 1000 - TRAIN: l1: 153.297699 uncertainty_estimate: 0.142125 weight_norm_model: 143.887527 weight_norm_u: 25.218954 loss: 0.959706 grad_norm_before_clip: 2.199228 OPT-OPTIMIZER_D-LR: 0.000010 +RANK_0 - 2026-01-29 03:43:49,471 - TRAIN-LOGGER - INFO - Epoch 1000 - VALIDATION: l1: 64.495476 uncertainty_estimate: 0.439144 weight_norm_model: 143.887527 weight_norm_u: 25.222990 loss: 0.959672