| { |
| "architecture": "HRM-Text (classification)", |
| "reference": "sapientinc/HRM-Text, arXiv:2506.21734", |
| "hidden_size": 768, |
| "num_heads": 12, |
| "head_dim": 64, |
| "n_layers_H": 3, |
| "n_layers_L": 3, |
| "intermediate_size": 2048, |
| "H_cycles": 2, |
| "L_cycles": 3, |
| "max_seq_len": 2048, |
| "rope_base": 10000.0, |
| "rope_scaling": 1.0, |
| "bp_min_steps": 2, |
| "bp_max_steps": 5, |
| "vocab_size": 256, |
| "param_count": 46206722, |
| "id2label": { |
| "0": "safe", |
| "1": "injection" |
| }, |
| "label2id": { |
| "safe": 0, |
| "injection": 1 |
| }, |
| "training": { |
| "learning_rate": 0.00022, |
| "epochs": 1, |
| "batch_size": 32, |
| "weight_decay": 0.1, |
| "scheduler": "constant_with_warmup", |
| "warmup_steps": 2000, |
| "adam_beta2": 0.95, |
| "precision": "bf16" |
| } |
| } |