lexenvs-harbor / data /tasks /objective_hard_16.json
endishai's picture
Upload folder using huggingface_hub
2312199 verified
{
"task_id": "objective_hard_16",
"version": "2.0.0",
"created_at": "2026-03-18",
"metadata": {
"domain": "credit_card_optimization",
"difficulty": "hard",
"task_number": 16,
"complexity_hint": {
"max_tokens": 8000,
"expected_output": "multi-card portfolio with sequencing and full EV breakdown"
},
"requires_human_review": false
},
"prompt": {
"system": "",
"user": "You\u2019re an expert financial advisor. Tell the user how to change their credit card setup to maximize EV over the next 3 years.\nHello! Trying to figure out what credit card would supplement the ones I currently have or can be beneficial! \nCurrently prioritizing travel and/or saving. Thank you in advance to anyone who takes the time to go over this and give recommendations!\n\nCREDIT PROFILE\n\n* Current credit cards you are the primary account holder of:\n\n* *Chase Sapphire Preferred, $21,500 limit, 04/2024* \n* *Chase Freedom, $22,900 limit, 07/2022* \n* *CareCredit, $500 limit, 08/2017* \n* *Discover, $5,500 limit, 05/2016*\n\n* FICO Scores with source (see note on FICO score sources below):\n\n* *Experian: 748*\n\n* Oldest credit card account age with you as primary name on the account:\n\n* *9 years*\n\n* Number of personal credit cards approved for in the past 6 months: *None*\n\n* Number of personal credit cards approved for in the past 12 months: *None*\n\n* Number of personal credit cards approved for in the past 24 months: *1 credit card*\n\n* Annual income $: *152,000*\n\nCATEGORIES\n\n* * OK with category-specific cards?: *Yes* \n* * OK with rotating category cards?: *Yes* \n* * Estimate average monthly spend in the categories below. Only include what you can pay by credit card. \n * * Dining $: *600* \n * * Groceries $: *100-200 per week* \n * * Gas $: *120* \n * * Travel $: *Not traveling as of now* \n * * Do you plan on using this card abroad for a significant length of time (study abroad, digital nomad, expat, extended travel)?: *If possible - thinking future travel would be between 1-2 weeks at a time 2-3 times a year.* \n * * Any other categories (examples: phone/internet, insurance) or stores (example: Amazon) with significant, regular credit card spend (the more you specify, the better): *$120 for pest control every 3 months.* \n * * Any other significant, regular credit card spend you didn't include above?: *No* \n * * Can you pay rent by credit card? *Don't know - paying a mortgage*\n\nMEMBERSHIPS & SUBSCRIPTIONS (delete lines that don't apply)\n\n* * Current member of Amazon Prime?: *No* \n* * Current Verizon postpaid customer?: *No* \n* * Current member of Costco or Sam's Club?: *Add-On member* \n* * Currently paying $13.99/month or more for Disney Bundle (Disney+ / Hulu / ESPN+) or other Hulu services?: *No (Paying Netflix and Spotify only)* \n* * Current member of Chase, US Bank or any other big bank?: *Yes - Chase* \n* * Active US military?: *No* \n* * Are you open to Business Cards?: *Maybe but don't have an active business - used to sell some items on Etsy (have thought of going back to this)*\n\nPURPOSE\n\n* * What's the purpose of your next card (choose ONE)?: *Saving Money and/or Travel complement* \n* * Do you have any cards you've been looking at? *No*",
"knowledge_base_ref": "knowledge_base.md",
"kb_filter": [
"American Express Gold",
"American Express Platinum",
"Amex Blue Business Plus",
"Amex Blue Cash Preferred",
"Amex Business Gold",
"Amex Business Platinum",
"Amex Green",
"Bilt Blue",
"Bilt Obsidian",
"Bilt Palladium",
"Capital One Venture",
"Capital One Venture X",
"Chase Freedom Flex",
"Chase Freedom Unlimited",
"Chase Ink Business Preferred",
"Chase Ink Business Unlimited",
"Chase Sapphire Preferred",
"Chase Sapphire Reserve",
"Citi Custom Cash",
"Citi Double Cash",
"Citi Strata Premier",
"Wells Fargo Autograph"
],
"system_prompt_ref": "system_prompt_template.md"
},
"scoring": {
"dimensions": {
"card_selection": {
"weight": 0.25,
"type": "automated",
"description": "F1 of recommended cards vs. optimal set",
"checks": {
"expected_cards": [
"American Express Gold",
"Chase Sapphire Reserve",
"Chase Ink Business Preferred",
"American Express Platinum",
"Capital One Venture"
]
},
"hard_constraint": false
},
"ev_accuracy": {
"weight": 0.3,
"type": "automated",
"description": "EV accuracy vs. computed ground truth",
"reference": {
"user_profile": {
"monthly_spend": {
"dining": 300,
"groceries": 400,
"everything_else": 500
},
"time_horizon_months": 36
},
"expected_card_ids": [
"american_express_gold",
"chase_sapphire_reserve",
"chase_ink_business_preferred",
"american_express_platinum",
"capital_one_venture"
],
"ev_tolerance_pct": 0.1
}
},
"factual_fidelity": {
"weight": 0.3,
"type": "automated",
"description": "Accuracy of factual claims about cards",
"reference": {
"extracted_claims": null,
"reference_ev_usd": null
}
},
"constraint_compliance": {
"weight": 0.15,
"type": "automated",
"description": "Respects user constraints and issuer rules",
"checks": {
"expected_cards": [
"American Express Gold",
"Chase Sapphire Reserve",
"Chase Ink Business Preferred",
"American Express Platinum",
"Capital One Venture"
],
"expected_housing_option": null
},
"hard_constraint": false
}
},
"passing_threshold": 0.5,
"hard_constraint_failure_zeroes_dimension": true
},
"reference_solution": {
"_status": "COMPUTED",
"recommended_cards": [
"American Express Gold",
"Chase Sapphire Reserve",
"Chase Ink Business Preferred",
"American Express Platinum",
"Capital One Venture"
],
"total_ev_usd": null,
"ev_breakdown": null,
"housing_option": null,
"key_constraints_flags": [],
"expert_notes": "Ground truth EV computed from card_database.json + user_profile at evaluation time."
}
}