{
"task_id": "objective_hard_07",
"version": "2.0.0",
"created_at": "2026-03-18",
"metadata": {
"domain": "credit_card_optimization",
"difficulty": "hard",
"task_number": 7,
"complexity_hint": {
"max_tokens": 8000,
"expected_output": "multi-card portfolio with sequencing and full EV breakdown"
},
"requires_human_review": false
},
"prompt": {
"system": "",
"user": "You\u2019re an expert financial advisor. Tell the user how to change their credit card setup to maximize EV over the next 3 years.\nCREDIT PROFILE\n\n* Current credit cards you are the primary account holder of: *Wells Fargo Autograph - $1000 limit, 2/2022 \n *Wells Fargo Platinum - $7500 limit, early 2010s? \n *Wells Fargo Active Cash - $9500 limit, 9/2023 \n *Citi Double Cash - $4500 limit, 6/2023 \n *Citi Custom Cash - $7500 limit, 6/2023 \n *AMEX Blue Cash Everyday - $4500, 2015\u2019ish? \n *Chase Freedom Unlimited - $4000, 2019\u2019ish \n *Capital One Quicksilver - $15000, 2018\u2019ish.\n\n(Currently Active Cash card is nearly maxed out to pay off HVAC system to take advantage of 0% APR through next year)\n\n(Currently Custom Cash card is nearly maxed out to pay off new home expenses to take advantage of 0% APR into next year)\n\n* FICO Scores with source (see note on FICO score sources below): 766 (Citi App) \n* Oldest credit card account age with you as primary name on the account: 11 years \n* Number of personal credit cards approved for in the past 6 months: 3 \n* Number of personal credit cards approved for in the past 12 months: 3 \n* Number of personal credit cards approved for in the past 24 months: 4 \n* Annual income $: 80k\n\nCATEGORIES\n\n* OK with category-specific cards?: YES \n* OK with rotating category cards?: NO \n* Estimate average monthly spend in the categories below. Only include what you can pay by credit card. \n* Dining $: 250 \n* Groceries $: 400 \n* Gas $: 70 \n* Travel $: 40 (maybe one flight a year; split over 12 months. Looking to travel more in near future) \n* Do you plan on using this card abroad for a significant length of time (study abroad, digital nomad, expat, extended travel)?: NO, but do travel internationally every other year or so on average. 
\n* Any other categories (examples: phone/internet, insurance) or stores (example: Amazon) with significant, regular credit card spend (the more you specify, the better): $75 Amazon. $28 Cell Phone. $70 car insurance (State Farm) \n* Any other significant, regular credit card spend you didn't include above?: $20 Ring System, $16 appliance warranty, $28 Internet. Usually $100 for stuff I forget to budget for that doesn\u2019t align with consistent categories. \n* Can you pay rent by credit card? If yes, list rent amount and if there's a fee for paying by credit card: NO\n\nMEMBERSHIPS & SUBSCRIPTIONS\n\n* Current member of Chase, US Bank or any other big bank?: Chase\n\nPURPOSE\n\n* What's the purpose of your next card (choose ONE)?: Ensure I\u2019m maximizing/optimizing cash back and potential travel card for future. \n* Do you have any cards you've been looking at? Any applicable Delta card (live in ATL near Delta hub) Chase Sapphire Reserve or Preferred Blue Cash Preferred Open to all suggestions however to ensure all possible cash back categories are maximized or if a travel card is recommended. Not opposed to AF if I can extract value.\n\nUPDATE: Current cash back set up\n\nGas - 3% AMEX Blue Cash \nGroceries - 3% AMEX Blue Cash\n\n(Groceries - 5% Custom Cash typically; however currently used for 0% APR balance).\n\nOnline Shopping - 3% AMEX Blue Cash \nDining Out - 3% Chase Freedom Unlimited \nCatch All Rest - 2% Double Cash",
"knowledge_base_ref": "knowledge_base.md",
"kb_filter": [
"American Express Gold",
"American Express Platinum",
"Amex Blue Cash Preferred",
"Amex Delta SkyMiles Gold",
"Amex Delta SkyMiles Platinum",
"Amex Delta SkyMiles Reserve",
"Amex Green",
"Bilt Blue",
"Bilt Obsidian",
"Bilt Palladium",
"Capital One Venture",
"Capital One Venture X",
"Chase Freedom Flex",
"Chase Freedom Unlimited",
"Chase Sapphire Preferred",
"Chase Sapphire Reserve",
"Citi Custom Cash",
"Citi Double Cash",
"Citi Strata Premier",
"Wells Fargo Autograph"
],
"system_prompt_ref": "system_prompt_template.md"
},
"scoring": {
"dimensions": {
"card_selection": {
"weight": 0.25,
"type": "automated",
"description": "F1 of recommended cards vs. optimal set",
"checks": {
"expected_cards": [
"American Express Gold",
"Amex Delta SkyMiles Gold",
"Capital One Venture",
"Chase Sapphire Preferred",
"Chase Sapphire Reserve"
]
},
"hard_constraint": false
},
"ev_accuracy": {
"weight": 0.3,
"type": "automated",
"description": "EV accuracy vs. computed ground truth",
"reference": {
"user_profile": {
"monthly_spend": {
"dining": 250.0,
"groceries": 400.0,
"gas": 70.0,
"travel": 40.0,
"flights": 0,
"hotels": 0,
"streaming": 0,
"online_shopping": 75.0,
"everything_else": 262.0
},
"lounge_visits_per_year": 0,
"delta_flights_per_year": 1,
"united_flights_per_year": 0,
"uses_uber": false,
"uses_doordash": false,
"uses_instacart": false,
"uses_streaming": false,
"has_global_entry": false,
"uses_clear": false,
"has_amazon_prime": false,
"uses_resy_restaurants": false,
"uses_hyatt_hotels": false,
"uses_marriott_hotels": false,
"uses_hilton_hotels": false,
"monthly_rent": 0,
"pays_housing_with_bilt": false,
"time_horizon_months": 36,
"existing_cards": [
"Chase Freedom Unlimited",
"AMEX Blue Cash Everyday",
"Capital One Quicksilver",
"Citi Double Cash",
"Citi Custom Cash",
"Wells Fargo Autograph",
"Wells Fargo Active Cash",
"Wells Fargo Platinum"
],
"cards_opened_last_24_months": 4
},
"expected_card_ids": [
"american_express_gold",
"amex_delta_skymiles_gold",
"capital_one_venture",
"chase_sapphire_preferred",
"chase_sapphire_reserve"
],
"ev_tolerance_pct": 0.1
}
},
"factual_fidelity": {
"weight": 0.3,
"type": "automated",
"description": "Accuracy of factual claims about cards",
"reference": {
"extracted_claims": null,
"reference_ev_usd": null
}
},
"constraint_compliance": {
"weight": 0.15,
"type": "automated",
"description": "Respects user constraints and issuer rules",
"checks": {
"expected_cards": [
"American Express Gold",
"Amex Delta SkyMiles Gold",
"Capital One Venture",
"Chase Sapphire Preferred",
"Chase Sapphire Reserve"
],
"expected_housing_option": null
},
"hard_constraint": false
}
},
"passing_threshold": 0.5,
"hard_constraint_failure_zeroes_dimension": true
},
"reference_solution": {
"_status": "COMPUTED",
"recommended_cards": [
"American Express Gold",
"Amex Delta SkyMiles Gold",
"Capital One Venture",
"Chase Sapphire Preferred",
"Chase Sapphire Reserve"
],
"total_ev_usd": null,
"ev_breakdown": null,
"housing_option": null,
"key_constraints_flags": [],
"expert_notes": "Ground truth EV computed from card_database.json + user_profile at evaluation time."
}
}