File size: 1,378 Bytes
8fb73f8
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
"""
Default configuration for FactEval models and parameters.
"""

# ── Model IDs (Hugging Face Hub) ─────────────────────────────────────────────
# Claim extraction – chosen in Week 0: 1.5B was 3.5x faster with cleaner output
CLAIM_MODEL = "Qwen/Qwen2.5-1.5B-Instruct"

# Sentence embeddings for evidence retrieval
EMBEDDING_MODEL = "sentence-transformers/all-MiniLM-L6-v2"

# NLI verification (used in Week 2)
NLI_MODEL = "MoritzLaurer/DeBERTa-v3-base-mnli-fever-anli"

# ── Retrieval defaults ───────────────────────────────────────────────────────
DEFAULT_TOP_K = 3
MIN_EVIDENCE_SCORE = 0.3  # Below this, evidence is too weak to use

# ── Claim extraction defaults ────────────────────────────────────────────────
MAX_NEW_TOKENS = 200
MAX_CLAIMS = 10

CLAIM_SYSTEM_PROMPT = (
    "You are a claim extraction engine. Given a text, break it into atomic, "
    "independently verifiable claims. Each claim states exactly ONE fact. "
    "Return ONLY a numbered list. No explanations, no commentary."
)

CLAIM_USER_PROMPT = "Break this into atomic claims:\n\n{text}"