{ "no_change": { "mode": "REGIMEN_OPT", "action_type": "KEEP_REGIMEN", "target_drug": null, "replacement_drug": null, "dose_bucket": "NA", "taper_days": null, "monitoring_plan": null, "evidence_query": null, "new_drug_name": null, "candidate_components": [], "candidate_id": "cand_01", "confidence": 0.8, "rationale_brief": "Baseline no-change policy." }, "rules_only": { "mode": "REGIMEN_OPT", "action_type": "SUBSTITUTE_WITHIN_CLASS", "target_drug": "opioid_like", "replacement_drug": "non_opioid_analgesic", "dose_bucket": "NA", "taper_days": null, "monitoring_plan": null, "evidence_query": null, "new_drug_name": null, "candidate_components": [], "candidate_id": "cand_04", "confidence": 0.75, "rationale_brief": "Rules-only selected top legal candidate." }, "greedy": { "mode": "REGIMEN_OPT", "action_type": "SUBSTITUTE_WITHIN_CLASS", "target_drug": "opioid_like", "replacement_drug": "non_opioid_analgesic", "dose_bucket": "NA", "taper_days": null, "monitoring_plan": null, "evidence_query": null, "new_drug_name": null, "candidate_components": [], "candidate_id": "cand_04", "confidence": 0.72, "rationale_brief": "Greedy safety/burden improvement baseline." }, "contextual_bandit": { "mode": "REGIMEN_OPT", "action_type": "SUBSTITUTE_WITHIN_CLASS", "target_drug": "opioid_like", "replacement_drug": "non_opioid_analgesic", "dose_bucket": "NA", "taper_days": null, "monitoring_plan": null, "evidence_query": null, "new_drug_name": null, "candidate_components": [], "candidate_id": "cand_04", "confidence": 0.68, "rationale_brief": "Contextual bandit selected candidate." }, "contextual_bandit_topk": [ { "candidate_id": "cand_09", "score": 1.1532307878304324, "exploration_bonus": 1.1532307878304324, "algorithm": "linucb" }, { "candidate_id": "cand_10", "score": 1.1489735636645433, "exploration_bonus": 1.1489735636645433, "algorithm": "linucb" }, { "candidate_id": "cand_08", "score": 1.1447401451857973, "exploration_bonus": 1.1447401451857973, "algorithm": "linucb" } ], "beam_search": { "mode": "REGIMEN_OPT", "action_type": "SUBSTITUTE_WITHIN_CLASS", "target_drug": "opioid_like", "replacement_drug": "non_opioid_analgesic", "dose_bucket": "NA", "taper_days": null, "monitoring_plan": null, "evidence_query": null, "new_drug_name": null, "candidate_components": [], "candidate_id": "cand_04", "confidence": 0.74, "rationale_brief": "Beam-search(3) top candidate." }, "policy_stack_ablations": { "bandit-only": { "avg_reward": 0.7616666666666667, "legality_rate": 1.0, "steps": 3.0 }, "llm-only": { "avg_reward": 0.7753333333333333, "legality_rate": 1.0, "steps": 3.0 }, "llm+bandit": { "avg_reward": 0.7753333333333333, "legality_rate": 1.0, "steps": 3.0 } } }