{
  "H_cycles": 2,
  "L_bp_cycles": [
    0,
    3
  ],
  "L_cycles": 3,
  "architectures": [
    "HrmTextForCausalLM"
  ],
  "attention_bias": false,
  "attention_dropout": 0.0,
  "auto_map": {
    "AutoConfig": "configuration_hrm_text.HrmTextConfig",
    "AutoModel": "modeling_hrm_text.HrmTextModel",
    "AutoModelForCausalLM": "modeling_hrm_text.HrmTextForCausalLM"
  },
  "bos_token_id": 6,
  "dtype": "bfloat16",
  "embedding_scale": 39.191835884530846,
  "eos_token_id": 11,
  "head_dim": 128,
  "hidden_act": "silu",
  "hidden_size": 1536,
  "initializer_range": 0.025515518153991442,
  "intermediate_size": 4096,
  "max_position_embeddings": 4096,
  "mlp_bias": false,
  "model_type": "hrm_text",
  "num_attention_heads": 12,
  "num_hidden_layers": 128,
  "num_key_value_heads": 12,
  "num_layers_per_stack": 16,
  "pad_token_id": 5,
  "prefix_lm": true,
  "quantization_config": {
    "act_bits": 4,
    "act_data_type": "mx_fp",
    "act_dynamic": true,
    "act_group_size": 32,
    "act_sym": true,
    "autoround_version": "0.12.3",
    "bits": 4,
    "data_type": "mx_fp",
    "group_size": 32,
    "iters": 0,
    "low_gpu_mem_usage": true,
    "packing_format": "auto_round:llm_compressor",
    "quant_method": "auto-round",
    "sym": true
  },
  "rms_norm_eps": 1e-06,
  "rope_parameters": {
    "rope_theta": 10000.0,
    "rope_type": "default"
  },
  "tie_word_embeddings": false,
  "transformers_version": "5.9.0",
  "use_cache": true,
  "vocab_size": 65536
}