File size: 1,014 Bytes
d8bc908
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
{
  "data": "training/data/tinyshakespeare.txt",
  "out_dir": "models/checkpoints",
  "run": "smoke-graph",
  "reset": true,
  "steps": 1,
  "batch": 1,
  "eval_batch": 0,
  "accum": 1,
  "ctx": 6,
  "eval_steps": 1,
  "eval_interval": 1,
  "save_interval": 0,
  "no_save": true,
  "seed": 42,
  "lr": 0.0001,
  "weight_decay": 0.0,
  "grad_clip": 1.0,
  "optimizer": "signsgd",
  "tscale_type": "T32",
  "compute_dtype": "none",
  "max_moe_iters": 1,
  "accum_threshold": 3,
  "freeze_scales": false,
  "ternary_updates": true,
  "allow_float_trainables": false,
  "enable_image": false,
  "enable_audio": false,
  "disable_vq": false,
  "disable_graph": false,
  "disable_memory": true,
  "disable_moe": true,
  "cpu": false,
  "audit": "Ternary state audit:\n  logical ternary weights: 145,907,520\n  ternary training state: 190.22 MB (T=27.83, E=11.62, E_accum=11.62, accum=139.15)\n  trainable float params: 0 tensors, 0.00 MB\n  frozen float params: 0 tensors, 0.00 MB\n  float buffers: 0 tensors, 0.00 MB"
}