{
  "model_type": "absolute_multihead_reward_model",
  "base_model": "./absolute-multitask-reward-model",
  "num_labels": 3,
  "label_order": [
    "style",
    "faith",
    "identifier"
  ],
  "max_length": 1024,
  "recommended_overall_formula": "style_score * (0.5 * faith_score + 0.5 * identifier_score) * (identifier_score ** 1.5)",
  "notes": [
    "Apply sigmoid to each logit to obtain the corresponding score (style_score, faith_score, identifier_score) before using it.",
    "Do not use style_score alone for reranking.",
    "Keep input formatting consistent with training.",
    "For Longformer inference, set global_attention_mask[:, 0] = 1."
  ]
}