Spaces:
Sleeping
Sleeping
File size: 4,869 Bytes
{
"task_id": "medium_05",
"version": "1.0.0",
"created_at": "2026-03-11",
"metadata": {
"domain": "credit_card_optimization",
"difficulty": "medium",
"task_number": 5,
"complexity_hint": {
"max_tokens": 6000,
"expected_output": "multi-card strategy with 2-year timeline and EV breakdown"
},
"requires_human_review": true
},
"prompt": {
"system": "",
"user": "You are a financial advisor tasked with building the following user\u2019s credit card strategy for the next 2 years in order to maximize the user\u2019s expected value while staying within their constraints, assuming all offers stay constant.\n\nUser profile:\n\n* Age 38, income $160k, excellent credit \n* Monthly spending: $6,000 total \u2014 $2,200 travel (flights/hotels, 8\u201310 domestic trips/year, values lounge access at $30 a visit and goes once per trip), $1,800 dining/groceries, $800 online shopping, $500 rideshare, rest misc \n* Rent: $5,000, hasn\u2019t decided which Bilt housing option to choose \n* Already has 4 cards (Amex Blue Cash Preferred, Amex Gold, Capital One Venture X, Bilt Obsidian) \n* Pays in full every month \n* Goal: Maximize travel rewards + lounge value over 12\u201324 months, but cap total lounge cost at $0 net (perks must offset fees) \n* Willing to have up to 5 cards\n\nWhat should the user\u2019s credit card strategy be over the next 2 years to maximize EV within these constraints?",
"knowledge_base_ref": "knowledge_base.md",
"kb_filter": [
"American Express Platinum",
"Chase Sapphire Preferred",
"Amex Blue Cash Preferred",
"American Express Gold",
"Capital One Venture X",
"Bilt Obsidian",
"Bilt Blue",
"Bilt Palladium",
"Chase Sapphire Reserve",
"Citi Strata Elite",
"Amex Green",
"Capital One Venture",
"Chase Freedom Unlimited",
"Chase Freedom Flex",
"Citi Strata Premier"
],
"system_prompt_ref": "system_prompt_template.md"
},
"scoring": {
"dimensions": {
"constraint_compliance": {
"weight": 0.3,
"type": "automated",
"description": "Hard rule checks: velocity limits, eligibility, user constraints",
"checks": {
"velocity_rules": null,
"eligibility_rules": null,
"user_constraints": null,
"expected_cards": [
"American Express Platinum",
"Chase Sapphire Preferred"
],
"expected_housing_option": "flexible_bilt_cash",
"key_constraints_flags": [
"cancel_existing_card",
"housing_option_choice",
"lounge_valuation",
"5_card_limit"
]
},
"hard_constraint": false
},
"ev_accuracy": {
"weight": 0.4,
"type": "automated",
"description": "EV calculation accuracy vs. reference solution",
"reference": {
"reference_ev_usd": 14966.0,
"ev_tolerance_pct": 0.05
}
},
"reasoning_quality": {
"weight": 0.2,
"type": "human",
"description": "Quality of tradeoff articulation and strategic reasoning (0-3 scale)",
"rubric": {
"0": "No reasoning or incorrect reasoning",
"1": "Surface-level reasoning, misses key tradeoffs",
"2": "Correct tradeoffs identified with clear justification",
"3": "Expert-level nuance including edge cases and constraint interactions"
},
"score": null
},
"constraint_prioritization": {
"weight": 0.1,
"type": "human",
"description": "Correct handling of ambiguity and conflicting constraints",
"score": null
}
},
"passing_threshold": 0.6,
"hard_constraint_failure_zeroes_dimension": true
},
"reference_solution": {
"_status": "EXPERT_REVIEWED",
"recommended_cards": [
"American Express Platinum",
"Chase Sapphire Preferred"
],
"total_ev_usd": 14966.0,
"ev_breakdown": {
"signup_bonuses_usd": 3137.5,
"ongoing_rewards_usd": 10318.5,
"credits_usd": 4470.0,
"annual_fees_usd": -2960.0,
"other_usd": 0.0
},
"housing_option": "flexible_bilt_cash",
"key_constraints_flags": [
"cancel_existing_card",
"housing_option_choice",
"lounge_valuation",
"5_card_limit"
],
"expert_notes": "Cancel Amex Gold. Choose flexible Bilt Cash for rent. Get Amex Platinum (80k bonus, 8k spend in 6mo), then Chase Sapphire Preferred (75k bonus, 5k in 3mo). Months 1-3: bonus hunting. Month 4+: Amex Platinum 5x flights ($1,100), Amex Blue Cash Preferred 6% grocery ($900), Bilt 3.3x blended on rest ($4,000-4,900). Amex credits $3,500 (resy/uber/hotel/streaming/airline). Capital One Venture X credits $970. Total ongoing spend earn $10,318.50. Fees include Amex Platinum + Capital One Venture X + Chase Sapphire Preferred + Bilt."
}
}