| """Tests for literature-grounded benchmark utilities.""" | |
| from training.literature_benchmark import ( | |
| run_paper_benchmark, | |
| select_literature_scenario, | |
| ) | |
| def test_select_literature_scenario_for_ipf_prompt(): | |
| scenario = select_literature_scenario( | |
| "Validate SPP1-positive macrophage findings in idiopathic pulmonary fibrosis." | |
| ) | |
| assert scenario.name == "biomarker_validation_lung" | |
| def test_select_literature_scenario_for_trajectory_prompt(): | |
| scenario = select_literature_scenario( | |
| "Recover branching hematopoietic lineages and branch point transcription factors." | |
| ) | |
| assert scenario.name == "hematopoiesis_trajectory" | |
| def test_run_paper_benchmark_matches_curated_findings(): | |
| result = run_paper_benchmark( | |
| problem_statement=( | |
| "Design a follow-up validation experiment for candidate biomarker " | |
| "SPP1 in idiopathic pulmonary fibrosis." | |
| ), | |
| scenario_name="biomarker_validation_lung", | |
| domain_randomise=False, | |
| ) | |
| assert result.total_steps >= 1 | |
| assert result.matched_papers | |
| assert result.match_ratio >= (2 / 3) | |
| assert any("SPP1" in finding for finding in result.matched_findings) | |