{ "task_id": "easy_02", "version": "1.0.0", "created_at": "2026-03-11", "metadata": { "domain": "credit_card_optimization", "difficulty": "easy", "task_number": 2, "complexity_hint": { "max_tokens": 4000, "expected_output": "single card recommendation with EV calculation" }, "requires_human_review": true }, "prompt": { "system": "", "user": "You are a financial advisor tasked with giving the user the optimal credit card advice for their situation.\n\nUser profile:\n- $4,000 rent payment\n- $10,000 in other general expenses each month, $1,000 of which is groceries\n- Values extra Bilt cash not used for unlocking points on housing at $0.25 USD per $1 of Bilt cash\n\nWhat\u2019s the user\u2019s optimal Bilt card, and which of the two housing rewards options should he choose? Explain your reasoning and show the user\u2019s expected value from the card.\n\nCard context: Bilt Blue, Bilt Obsidian, Bilt Palladium", "knowledge_base_ref": "knowledge_base.md", "kb_filter": [ "Bilt Blue", "Bilt Obsidian", "Bilt Palladium" ], "system_prompt_ref": "system_prompt_template.md" }, "scoring": { "dimensions": { "constraint_compliance": { "weight": 0.3, "type": "automated", "description": "Hard rule checks: velocity limits, eligibility, user constraints", "checks": { "velocity_rules": null, "eligibility_rules": null, "user_constraints": null, "expected_cards": [ "Bilt Palladium" ], "expected_housing_option": "flexible_bilt_cash", "key_constraints_flags": [ "housing_option_choice", "card_selection" ] }, "hard_constraint": false }, "ev_accuracy": { "weight": 0.4, "type": "automated", "description": "EV calculation accuracy vs. reference solution", "reference": { "reference_ev_usd": 7906.0, "ev_tolerance_pct": 0.05 } }, "reasoning_quality": { "weight": 0.2, "type": "human", "description": "Quality of tradeoff articulation and strategic reasoning (0-3 scale)", "rubric": { "0": "No reasoning or incorrect reasoning", "1": "Surface-level reasoning, misses key tradeoffs", "2": "Correct tradeoffs identified with clear justification", "3": "Expert-level nuance including edge cases and constraint interactions" }, "score": null }, "constraint_prioritization": { "weight": 0.1, "type": "human", "description": "Correct handling of ambiguity and conflicting constraints", "score": null } }, "passing_threshold": 0.6, "hard_constraint_failure_zeroes_dimension": true }, "reference_solution": { "_status": "EXPERT_REVIEWED", "recommended_cards": [ "Bilt Palladium" ], "total_ev_usd": 7906.0, "ev_breakdown": { "signup_bonuses_usd": 1175.0, "ongoing_rewards_usd": 6336.0, "credits_usd": 50.0, "annual_fees_usd": -495.0, "other_usd": 840.0 }, "housing_option": "flexible_bilt_cash", "key_constraints_flags": [ "housing_option_choice", "card_selection" ], "expert_notes": "Bilt Palladium + flexible Bilt Cash is optimal. Year 1 EV = $7,906. Signup: 50k pts ($1,100) + $300 Bilt Cash ($75) = $1,175. Ongoing: 2x on $10k/mo = 240k pts/yr ($5,280) + 48k housing pts/yr ($1,056) = $6,336. Credits: $200 annual Bilt Cash ($50). Excess Bilt Cash: $280/mo * 12 * $0.25 = $840. Annual fee: -$495. Year 2+ EV = $6,731 (no signup). Assumes no value for lounge/travel credits." } }