{
  "data": "training/data/tinyshakespeare.txt",
  "out_dir": "models/checkpoints",
  "run": "arb-text",
  "reset": false,
  "steps": 200,
  "batch": 1,
  "eval_batch": 0,
  "accum": 2,
  "ctx": 64,
  "eval_steps": 4,
  "eval_interval": 100,
  "save_interval": 500,
  "no_save": true,
  "seed": 42,
  "tscale_type": "T32",
  "compute_dtype": "none",
  "max_moe_iters": 2,
  "accum_threshold": 3,
  "freeze_scales": false,
  "enable_image": false,
  "enable_audio": false,
  "disable_vq": true,
  "disable_graph": false,
  "enable_memory": false,
  "disable_memory": false,
  "disable_moe": false,
  "cpu": false,
  "audit": "Ternary state audit:\n logical ternary weights: 1,246,223,808\n ternary training state: 1625.12 MB (T=237.70, E=99.47, E_accum=99.46, accum=1188.49)\n trainable float params: 0 tensors, 0.00 MB\n frozen float params: 0 tensors, 0.00 MB\n float buffers: 0 tensors, 0.00 MB"
}