{
"task_id": "objective_hard_19",
"version": "2.0.0",
"created_at": "2026-03-18",
"metadata": {
"domain": "credit_card_optimization",
"difficulty": "hard",
"task_number": 19,
"complexity_hint": {
"max_tokens": 8000,
"expected_output": "multi-card portfolio with sequencing and full EV breakdown"
},
"requires_human_review": false
},
"prompt": {
"system": "",
"user": "You\u2019re an expert financial advisor. Tell the user how to change their credit card setup to maximize EV over the next 3 years.\n\n# **Credit Card Recommendation Request**\n\nCREDIT PROFILE\n\n* Current credit cards you are the primary account holder of: \n * Wells Fargo Platinum, $7,000 limit, 10+ years \n* FICO scores with source: FICO 830 (Wells Fargo) \n* Oldest credit card account age: 10+ years \n* Cards approved in the past 6 months: 0 \n* Cards approved in the past 12 months: 0 \n* Cards approved in the past 24 months: 0 \n* Annual income $: $150,000\n\nCATEGORIES\n\n* Ok with category-specific cards?: Yes \n* Ok with rotating category cards?: No \n* Estimate average monthly spend in the categories below. \n * Dining $: $250 (UberEats/DoorDash) \n * Groceries $: Sam\u2019s Club - $200 Kroger - $250 \n * Gas $: $150 (mostly Sam\u2019s Club) \n * Travel $: Approximately $5,000/year so about $420/month \n * Using abroad?: I travel internationally about once per year for about 1 week. \n * Other categories or stores: Amazon, approximately $100 per month \n * Other spend: Nothing in particular. Clothing stores here and there. \n * Pay rent by card? There\u2019s a 3% fee to pay with a credit card so I don\u2019t use this option.\n\nMEMBERSHIPS & SUBSCRIPTIONS\n\n* Amazon Prime member: Yes \n* Verizon postpaid customer: Yes \n* Costco or Sam's Club member: Sam's Club \n* Big bank customer: Wells Fargo \n* Open to business cards: Yes\n\nPURPOSE\n\n* Purpose of next card: I am largely looking for a new card because my current card has foreign transaction fees and I have an upcoming international trip. Cash back and travel rewards would be a nice bonus. \n * Travel rewards preferences: I am pretty open but I do slightly prefer Delta. \n* Cards being considered: None in particular.\n\nThanks in advance!",
"knowledge_base_ref": "knowledge_base.md",
"kb_filter": [
"American Express Gold",
"American Express Platinum",
"Amex Blue Business Plus",
"Amex Blue Cash Preferred",
"Amex Business Gold",
"Amex Business Platinum",
"Amex Delta SkyMiles Gold",
"Amex Delta SkyMiles Platinum",
"Amex Delta SkyMiles Reserve",
"Amex Green",
"Bilt Blue",
"Bilt Obsidian",
"Bilt Palladium",
"Capital One Venture",
"Capital One Venture X",
"Chase Freedom Flex",
"Chase Freedom Unlimited",
"Chase Ink Business Preferred",
"Chase Ink Business Unlimited",
"Chase Sapphire Preferred",
"Chase Sapphire Reserve",
"Citi Custom Cash",
"Citi Double Cash",
"Citi Strata Premier",
"Wells Fargo Autograph"
],
"system_prompt_ref": "system_prompt_template.md"
},
"scoring": {
"dimensions": {
"card_selection": {
"weight": 0.25,
"type": "automated",
"description": "F1 of recommended cards vs. optimal set",
"checks": {
"expected_cards": [
"Chase Sapphire Reserve",
"Amex Delta SkyMiles Gold",
"Chase Ink Business Preferred",
"American Express Platinum",
"American Express Gold"
]
},
"hard_constraint": false
},
"ev_accuracy": {
"weight": 0.3,
"type": "automated",
"description": "EV accuracy vs. computed ground truth",
"reference": {
"user_profile": {
"monthly_spend": {
"dining": 250.0,
"groceries": 450.0,
"gas": 150.0,
"travel": 420.0,
"flights": 0,
"hotels": 0,
"streaming": 0,
"online_shopping": 100.0,
"everything_else": 0
},
"lounge_visits_per_year": 0,
"delta_flights_per_year": 6,
"united_flights_per_year": 0,
"uses_uber": true,
"uses_doordash": true,
"uses_instacart": false,
"uses_streaming": false,
"has_global_entry": false,
"uses_clear": false,
"has_amazon_prime": true,
"uses_resy_restaurants": false,
"uses_hyatt_hotels": false,
"uses_marriott_hotels": false,
"uses_hilton_hotels": false,
"monthly_rent": 0,
"pays_housing_with_bilt": true,
"time_horizon_months": 36,
"existing_cards": [
"Wells Fargo Platinum"
],
"cards_opened_last_24_months": 0
},
"expected_card_ids": [
"chase_sapphire_reserve",
"amex_delta_skymiles_gold",
"chase_ink_business_preferred",
"american_express_platinum",
"american_express_gold"
],
"ev_tolerance_pct": 0.1
}
},
"factual_fidelity": {
"weight": 0.3,
"type": "automated",
"description": "Accuracy of factual claims about cards",
"reference": {
"extracted_claims": null,
"reference_ev_usd": null
}
},
"constraint_compliance": {
"weight": 0.15,
"type": "automated",
"description": "Respects user constraints and issuer rules",
"checks": {
"expected_cards": [
"Chase Sapphire Reserve",
"Amex Delta SkyMiles Gold",
"Chase Ink Business Preferred",
"American Express Platinum",
"American Express Gold"
],
"expected_housing_option": null
},
"hard_constraint": false
}
},
"passing_threshold": 0.5,
"hard_constraint_failure_zeroes_dimension": true
},
"reference_solution": {
"_status": "COMPUTED",
"recommended_cards": [
"Chase Sapphire Reserve",
"Amex Delta SkyMiles Gold",
"Chase Ink Business Preferred",
"American Express Platinum",
"American Express Gold"
],
"total_ev_usd": null,
"ev_breakdown": null,
"housing_option": null,
"key_constraints_flags": [],
"expert_notes": "Ground truth EV computed from card_database.json + user_profile at evaluation time."
}
}