Spaces:

Ev3Dev
/

Bio-EnvRL

Sleeping

Bio-EnvRL / tests /test_literature_benchmark.py

Upload folder using huggingface_hub

df98fca verified about 1 month ago

1.24 kB

	"""Tests for literature-grounded benchmark utilities."""

	from training.literature_benchmark import (
	run_paper_benchmark,
	select_literature_scenario,
	)


	def test_select_literature_scenario_for_ipf_prompt():
	    """An SPP1 / idiopathic-pulmonary-fibrosis prompt selects the lung biomarker scenario."""
	    ipf_prompt = (
	        "Validate SPP1-positive macrophage findings in idiopathic pulmonary fibrosis."
	    )
	    chosen = select_literature_scenario(ipf_prompt)
	    # The selector is expected to resolve this prompt to the named scenario.
	    assert chosen.name == "biomarker_validation_lung"


	def test_select_literature_scenario_for_trajectory_prompt():
	    """A branching-hematopoiesis prompt selects the hematopoiesis trajectory scenario."""
	    trajectory_prompt = (
	        "Recover branching hematopoietic lineages and branch point transcription factors."
	    )
	    chosen = select_literature_scenario(trajectory_prompt)
	    # The selector is expected to resolve this prompt to the named scenario.
	    assert chosen.name == "hematopoiesis_trajectory"


	def test_run_paper_benchmark_matches_curated_findings():
	    """Run the lung biomarker benchmark without domain randomisation and check its matches.

	    The run must take at least one step, report a non-empty set of matched
	    papers, reach a match ratio of at least two thirds, and include at least
	    one matched finding that mentions SPP1.
	    """
	    statement = (
	        "Design a follow-up validation experiment for candidate biomarker "
	        "SPP1 in idiopathic pulmonary fibrosis."
	    )
	    outcome = run_paper_benchmark(
	        problem_statement=statement,
	        scenario_name="biomarker_validation_lung",
	        domain_randomise=False,
	    )

	    # The benchmark actually executed.
	    assert outcome.total_steps >= 1
	    # At least one paper was matched (truthiness check on the collection).
	    assert outcome.matched_papers
	    assert outcome.match_ratio >= (2 / 3)
	    # The biomarker named in the problem statement shows up in the matches.
	    assert any("SPP1" in entry for entry in outcome.matched_findings)