File size: 1,014 Bytes
{
"data": "training/data/tinyshakespeare.txt",
"out_dir": "models/checkpoints",
"run": "smoke-graph",
"reset": true,
"steps": 1,
"batch": 1,
"eval_batch": 0,
"accum": 1,
"ctx": 6,
"eval_steps": 1,
"eval_interval": 1,
"save_interval": 0,
"no_save": true,
"seed": 42,
"lr": 0.0001,
"weight_decay": 0.0,
"grad_clip": 1.0,
"optimizer": "signsgd",
"tscale_type": "T32",
"compute_dtype": "none",
"max_moe_iters": 1,
"accum_threshold": 3,
"freeze_scales": false,
"ternary_updates": true,
"allow_float_trainables": false,
"enable_image": false,
"enable_audio": false,
"disable_vq": false,
"disable_graph": false,
"disable_memory": true,
"disable_moe": true,
"cpu": false,
"audit": "Ternary state audit:\n logical ternary weights: 145,907,520\n ternary training state: 190.22 MB (T=27.83, E=11.62, E_accum=11.62, accum=139.15)\n trainable float params: 0 tensors, 0.00 MB\n frozen float params: 0 tensors, 0.00 MB\n float buffers: 0 tensors, 0.00 MB"
}