polyguard-openenv / docs /results /planner_grpo.json
TheJackBright's picture
Deploy PolyGuard OpenEnv Space
877add7 verified
{
"avg_reward": 0.77625,
"legality_rate": 1.0,
"severe_violation_rate": 0.0,
"abstention_rate": 0.0,
"avg_episode_length": 2.0,
"success_rate": 0.0,
"avg_burden_delta": 0.0,
"avg_safety_delta": 0.5,
"avg_dosing_quality": 0.75,
"avg_process_fidelity": 0.92,
"exploit_detection_count": 4.0,
"reward_columns": {
"format_compliance_score": 0.9990000000000001,
"candidate_alignment_score": 0.9990000000000001,
"legality_score": 0.9990000000000001,
"safety_delta_score": 0.5,
"burden_improvement_score": 0.5,
"disease_stability_score": 0.9000000000000002,
"dosing_quality_score": 0.75,
"abstention_quality_score": 0.5600000000000002,
"efficiency_score": 0.73,
"process_fidelity_score": 0.92,
"explanation_grounding_score": 0.7999999999999999,
"anti_cheat_score": 0.6663333333333333,
"uncertainty_calibration_score": 0.8699999999999998
}
}