File size: 769 Bytes
de53a02
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
{
  "architecture": "HRM-Text (classification)",
  "reference": "sapientinc/HRM-Text, arXiv:2506.21734",
  "hidden_size": 768,
  "num_heads": 12,
  "head_dim": 64,
  "n_layers_H": 3,
  "n_layers_L": 3,
  "intermediate_size": 2048,
  "H_cycles": 2,
  "L_cycles": 3,
  "max_seq_len": 2048,
  "rope_base": 10000.0,
  "rope_scaling": 1.0,
  "bp_min_steps": 2,
  "bp_max_steps": 5,
  "vocab_size": 256,
  "param_count": 46206722,
  "id2label": {
    "0": "safe",
    "1": "injection"
  },
  "label2id": {
    "safe": 0,
    "injection": 1
  },
  "training": {
    "learning_rate": 0.00022,
    "epochs": 1,
    "batch_size": 32,
    "weight_decay": 0.1,
    "scheduler": "constant_with_warmup",
    "warmup_steps": 2000,
    "adam_beta2": 0.95,
    "precision": "bf16"
  }
}