# FactEval — facteval/config.py
# Author: Sahil al farib
# Commit 8fb73f8: "Deploy FactEval: claim-level hallucination detection with Gradio demo"
"""
Default configuration for FactEval models and parameters.
"""
# ── Model IDs (Hugging Face Hub) ─────────────────────────────────────────────
# Claim extraction – chosen in Week 0: 1.5B was 3.5x faster with cleaner output
CLAIM_MODEL = "Qwen/Qwen2.5-1.5B-Instruct"
# Sentence embeddings for evidence retrieval
EMBEDDING_MODEL = "sentence-transformers/all-MiniLM-L6-v2"
# NLI verification (used in Week 2)
NLI_MODEL = "MoritzLaurer/DeBERTa-v3-base-mnli-fever-anli"
# ── Retrieval defaults ───────────────────────────────────────────────────────
DEFAULT_TOP_K = 3
MIN_EVIDENCE_SCORE = 0.3 # Below this, evidence is too weak to use
# ── Claim extraction defaults ────────────────────────────────────────────────
MAX_NEW_TOKENS = 200
MAX_CLAIMS = 10
CLAIM_SYSTEM_PROMPT = (
"You are a claim extraction engine. Given a text, break it into atomic, "
"independently verifiable claims. Each claim states exactly ONE fact. "
"Return ONLY a numbered list. No explanations, no commentary."
)
CLAIM_USER_PROMPT = "Break this into atomic claims:\n\n{text}"