Upload training_logs/txc_bare_antidead_t3_kpos20__seed42.json with huggingface_hub

Browse files

Files changed (1) hide show

training_logs/txc_bare_antidead_t3_kpos20__seed42.json +112 -0

training_logs/txc_bare_antidead_t3_kpos20__seed42.json ADDED Viewed

	@@ -0,0 +1,112 @@

+{
+  "arch_id": "txc_bare_antidead_t3_kpos20",
+  "src_class": "TXCBareAntidead",
+  "src_module": "src.architectures.txc_bare_antidead",
+  "T": 3,
+  "T_max": null,
+  "t_sample": null,
+  "k_win": 60,
+  "k_pos": 20,
+  "shifts": null,
+  "alpha": null,
+  "gamma": null,
+  "n_scales": null,
+  "n_layers": null,
+  "mlc_layers": null,
+  "d_in": 2304,
+  "d_sae": 18432,
+  "subject_model": "google/gemma-2-2b",
+  "anchor_layer": 12,
+  "hook_name": null,
+  "seed": 42,
+  "phase": "phase7_unification",
+  "group": 2,
+  "recipe": "TXCBareAntidead at k_pos=20 (W Phase 1 sweep)",
+  "purpose": "W Phase 1 sweep cell \u2014 sparsity-matched TXC",
+  "batch_size": 4096,
+  "lr": 0.0003,
+  "max_steps": 25000,
+  "elapsed_s": 1988.125037908554,
+  "final_step": 4600,
+  "converged": true,
+  "plateau_last": 0.018206182183690075,
+  "loss": [
+    25338.6484375,
+    6515.59521484375,
+    5791.5185546875,
+    5459.94677734375,
+    5239.92822265625,
+    5088.38671875,
+    4971.3212890625,
+    4863.9306640625,
+    4865.43505859375,
+    4825.353515625,
+    4766.38037109375,
+    4717.3115234375,
+    4656.666015625,
+    4698.89599609375,
+    4653.7685546875,
+    4597.822265625,
+    4593.3125,
+    4595.89697265625,
+    4549.24951171875,
+    4528.59716796875,
+    4517.05078125,
+    4505.091796875,
+    4531.8037109375,
+    4488.9453125
+  ],
+  "l0": [
+    60.0,
+    60.0,
+    60.0,
+    60.0,
+    60.0,
+    60.0,
+    60.0,
+    60.0,
+    60.0,
+    60.0,
+    60.0,
+    60.0,
+    60.0,
+    60.0,
+    60.0,
+    60.0,
+    60.0,
+    60.0,
+    60.0,
+    60.0,
+    60.0,
+    60.0,
+    60.0,
+    60.0
+  ],
+  "steps_logged": [
+    0,
+    200,
+    400,
+    600,
+    800,
+    1000,
+    1200,
+    1400,
+    1600,
+    1800,
+    2000,
+    2200,
+    2400,
+    2600,
+    2800,
+    3000,
+    3200,
+    3400,
+    3600,
+    3800,
+    4000,
+    4200,
+    4400,
+    4600
+  ],
+  "n_train_seqs": 24000
+}