{ "task_id": "easy_05", "version": "1.0.0", "created_at": "2026-03-11", "metadata": { "domain": "credit_card_optimization", "difficulty": "easy", "task_number": 5, "complexity_hint": { "max_tokens": 4000, "expected_output": "single card recommendation with EV calculation" }, "requires_human_review": true }, "prompt": { "system": "", "user": "You are an expert financial advisor tasked with giving your customer the optimal credit card advice for their situation.\n\nYour customer asks you the following: \u201cI just purchased a home and foresee 40-50K of purchases I will be making. Wanted to get your recommendation on the credit cards I should be getting.\u201d\n\nYou can safely assume he\u2019s looking to optimize rewards on only this spending and that his personal spending is already taken care of by other cards. You can also assume credit score won\u2019t be an issue.\n\nWhich cards should he get and what is his EV from using these cards on the $50K of purchases he mentioned?", "knowledge_base_ref": "knowledge_base.md", "kb_filter": [ "Amex Green", "American Express Gold", "Chase Sapphire Preferred", "Capital One Venture X", "American Express Platinum", "Chase Sapphire Reserve", "Citi Strata Premier", "Citi Strata Elite", "Amex Business Gold", "Chase Ink Business Preferred", "Capital One Venture", "Amex Blue Business Plus", "Amex Business Platinum", "Wells Fargo Autograph", "BofA Premium Rewards" ], "system_prompt_ref": "system_prompt_template.md" }, "scoring": { "dimensions": { "constraint_compliance": { "weight": 0.3, "type": "automated", "description": "Hard rule checks: velocity limits, eligibility, user constraints", "checks": { "velocity_rules": null, "eligibility_rules": null, "user_constraints": null, "expected_cards": [ "Amex Green", "American Express Gold", "Chase Sapphire Preferred", "Capital One Venture X", "American Express Platinum" ], "expected_housing_option": null, "key_constraints_flags": [ "application_velocity", "signup_bonus_optimization" ] }, 
"hard_constraint": false }, "ev_accuracy": { "weight": 0.4, "type": "automated", "description": "EV calculation accuracy vs. reference solution", "reference": { "reference_ev_usd": 5557.5, "ev_tolerance_pct": 0.05 } }, "reasoning_quality": { "weight": 0.2, "type": "human", "description": "Quality of tradeoff articulation and strategic reasoning (0-3 scale)", "rubric": { "0": "No reasoning or incorrect reasoning", "1": "Surface-level reasoning, misses key tradeoffs", "2": "Correct tradeoffs identified with clear justification", "3": "Expert-level nuance including edge cases and constraint interactions" }, "score": null }, "constraint_prioritization": { "weight": 0.1, "type": "human", "description": "Correct handling of ambiguity and conflicting constraints", "score": null } }, "passing_threshold": 0.6, "hard_constraint_failure_zeroes_dimension": true }, "reference_solution": { "_status": "EXPERT_REVIEWED", "recommended_cards": [ "Amex Green", "American Express Gold", "Chase Sapphire Preferred", "Capital One Venture X", "American Express Platinum" ], "total_ev_usd": 5557.5, "ev_breakdown": { "signup_bonuses_usd": 6217.5, "ongoing_rewards_usd": 1000.0, "credits_usd": 0.0, "annual_fees_usd": -1660.0, "other_usd": 0.0 }, "housing_option": null, "key_constraints_flags": [ "application_velocity", "signup_bonus_optimization" ], "expert_notes": "Optimize for signup bonuses on $50k one-time spend. Order matters for issuer rules: Amex Green ($650 net), Amex Gold 1 week later ($875 net), CSP ($1,135 net), Venture X ($992.50 net), Amex Platinum 90+ days after Gold ($905 net). Total bonus net = $4,557.50. Remaining $25k on Venture X at 2x = $1,000. Total EV = $5,557.50. More than 5 cards in this timeframe risks denials/shutdowns." } }