lexenvs-harbor / data /tasks /medium_03.json
endishai's picture
Upload folder using huggingface_hub
2312199 verified
{
"task_id": "medium_03",
"version": "1.0.0",
"created_at": "2026-03-11",
"metadata": {
"domain": "credit_card_optimization",
"difficulty": "medium",
"task_number": 3,
"complexity_hint": {
"max_tokens": 6000,
"expected_output": "multi-card strategy with 2-year timeline and EV breakdown"
},
"requires_human_review": true
},
"prompt": {
"system": "",
"user": "You are a financial advisor tasked with building the following user\u2019s credit card strategy for the next 2 years in order to maximize the user\u2019s expected value while staying within their constraints, assuming all offers stay constant.\n\nUser profile:\n\n* Age 40, income $500k+, excellent credit score \n* Monthly spending: $20,000 total \u2014 $5,000 domestic business travel/hotels, $2,000 dining, $2,000 online/ads, $2,000 utilities/office, $2,000 groceries, $500 gas, $500 rideshare, $500 food delivery, and the rest misc \n* Already has the following cards: Amex Platinum, Chase Sapphire Preferred \n* Values luxurious perks, especially when traveling \n* Pays in full every month \n* Doesn\u2019t have much time to optimize every little thing, so annual fee for new cards must pay for itself twice over\n\nMap out which credit cards he should get and when over the next 2 years in order to optimize his EV. Feel free to cancel any existing cards if needed.",
"knowledge_base_ref": "knowledge_base.md",
"kb_filter": [
"Chase Ink Business Unlimited",
"Chase Ink Business Preferred",
"Chase Ink Business Premier",
"Capital One Venture X",
"Capital One Venture X Business",
"Amex Business Gold",
"Amex Business Platinum",
"Capital One Business Spark 2X Cash",
"Citi Strata",
"Citi Strata Premier",
"BofA Premium Rewards",
"BofA Premium Rewards Elite",
"American Express Platinum",
"Chase Sapphire Preferred",
"Chase Sapphire Reserve",
"Amex Blue Business Plus",
"Amex Blue Business Cash",
"Chase Business Sapphire Reserve",
"Capital One Business Spark 2X Miles",
"Citi Strata Elite"
],
"system_prompt_ref": "system_prompt_template.md"
},
"scoring": {
"dimensions": {
"constraint_compliance": {
"weight": 0.3,
"type": "automated",
"description": "Hard rule checks: velocity limits, eligibility, user constraints",
"checks": {
"velocity_rules": null,
"eligibility_rules": null,
"user_constraints": null,
"expected_cards": [
"Chase Ink Business Unlimited",
"Chase Ink Business Preferred",
"Chase Ink Business Premier",
"Capital One Venture X",
"Capital One Venture X Business",
"Amex Business Gold",
"Amex Business Platinum",
"Capital One Business Spark 2X Cash",
"Citi Strata",
"Citi Strata Premier",
"BofA Premium Rewards",
"BofA Premium Rewards Elite"
],
"expected_housing_option": null,
"key_constraints_flags": [
"high_spend",
"business_cards",
"signup_bonus_churn",
"shutdown_risk"
]
},
"hard_constraint": false
},
"ev_accuracy": {
"weight": 0.4,
"type": "automated",
"description": "EV calculation accuracy vs. reference solution",
"reference": {
"reference_ev_usd": 24995.0,
"ev_tolerance_pct": 0.05
}
},
"reasoning_quality": {
"weight": 0.2,
"type": "human",
"description": "Quality of tradeoff articulation and strategic reasoning (0-3 scale)",
"rubric": {
"0": "No reasoning or incorrect reasoning",
"1": "Surface-level reasoning, misses key tradeoffs",
"2": "Correct tradeoffs identified with clear justification",
"3": "Expert-level nuance including edge cases and constraint interactions"
},
"score": null
},
"constraint_prioritization": {
"weight": 0.1,
"type": "human",
"description": "Correct handling of ambiguity and conflicting constraints",
"score": null
}
},
"passing_threshold": 0.6,
"hard_constraint_failure_zeroes_dimension": true
},
"reference_solution": {
"_status": "EXPERT_REVIEWED",
"recommended_cards": [
"Chase Ink Business Unlimited",
"Chase Ink Business Preferred",
"Chase Ink Business Premier",
"Capital One Venture X",
"Capital One Venture X Business",
"Amex Business Gold",
"Amex Business Platinum",
"Capital One Business Spark 2X Cash",
"Citi Strata",
"Citi Strata Premier",
"BofA Premium Rewards",
"BofA Premium Rewards Elite"
],
"total_ev_usd": 24995.0,
"ev_breakdown": {
"signup_bonuses_usd": 25340.0,
"ongoing_rewards_usd": 4980.0,
"credits_usd": 0.0,
"annual_fees_usd": -5325.0,
"other_usd": 0.0
},
"housing_option": null,
"key_constraints_flags": [
"high_spend",
"business_cards",
"signup_bonus_churn",
"shutdown_risk"
],
"expert_notes": "High-spend bonus churn strategy. $20k/mo spend over 2 years = $480k total. Chase business cards first (5/24), then Cap1, Amex, Citi, BofA. Cancel/downgrade after year 1 except Venture X and Amex Platinum (keeper cards). Venture X for remaining spend after bonuses at 2x ($249k * 2 * 1.85cpp = $4,980). Total bonuses $30,320 minus fees $5,325 = $24,995."
}
}