{ "status": "ok", "baseline": "outputs/reports/baselines.json", "candidate": "outputs/reports/benchmark_report.json", "deltas": { "avg_reward": -0.0025, "legality_rate": 0.0, "success_rate": 0.0, "avg_process_fidelity": 0.92, "timeout_rate": 0.0, "failure_visible_rate": 0.0 }, "gate": { "avg_reward_up": false, "legality_up": true, "success_up": true }, "improved": false }