File size: 1,018 Bytes
d8bc908
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
{
  "data": "training/data/tinyshakespeare.txt",
  "out_dir": "models/checkpoints",
  "run": "smoke-train",
  "reset": true,
  "steps": 1,
  "batch": 1,
  "eval_batch": 0,
  "accum": 1,
  "ctx": 4,
  "eval_steps": 1,
  "eval_interval": 1,
  "save_interval": 0,
  "no_save": true,
  "seed": 42,
  "lr": 0.0001,
  "weight_decay": 0.0,
  "grad_clip": 1.0,
  "optimizer": "signsgd",
  "tscale_type": "T32",
  "compute_dtype": "none",
  "max_moe_iters": 1,
  "accum_threshold": 3,
  "freeze_scales": false,
  "ternary_updates": true,
  "allow_float_trainables": false,
  "enable_image": false,
  "enable_audio": false,
  "disable_vq": true,
  "disable_graph": true,
  "disable_memory": true,
  "disable_moe": false,
  "cpu": false,
  "audit": "Ternary state audit:\n  logical ternary weights: 1,246,263,744\n  ternary training state: 1625.18 MB (T=237.71, E=99.48, E_accum=99.46, accum=1188.53)\n  trainable float params: 0 tensors, 0.00 MB\n  frozen float params: 0 tensors, 0.00 MB\n  float buffers: 0 tensors, 0.00 MB"
}