lexenvs-harbor / data /tasks /hard_03.json
endishai's picture
Upload folder using huggingface_hub
2312199 verified
{
"task_id": "hard_03",
"version": "1.0.0",
"created_at": "2026-03-11",
"metadata": {
"domain": "credit_card_optimization",
"difficulty": "hard",
"task_number": 3,
"complexity_hint": {
"max_tokens": 8000,
"expected_output": "complex strategy with contingency plans, stochastic elements, detailed EV"
},
"requires_human_review": true
},
"prompt": {
"system": "",
"user": "You are a financial advisor tasked with building the following user\u2019s credit card strategy for the next 2 years to maximize Hyatt points for the honeymoon, but only if that path stays within 20% of the absolute optimal expected net value (factoring in interest savings, fees, and realistic redemptions). Assume all public offers remain constant.\n\nUser profile:\n\n* Credit score: 600 (due to missed payments 6 years ago + $10,000 credit card debt at 50% utilization growing at 20% APR) \n* Monthly spend: $5,000 (split equally dining/groceries/side-hustle expenses/miscellaneous) \n* Rent: $3,000 \n* Savings: $2,000 per month available \n* Current cards: Chase Sapphire Preferred (opened 42 months ago), Chase Freedom Flex (opened 8 months ago), Amex Platinum (opened 5 months ago), Citi Double Cash (opened last week) \n* Goal: Maximize transferable Hyatt points earned over next 24 months for one expensive honeymoon redemption\n\nProvide a precise quarter-by-quarter 24-month roadmap for the user\u2019s credit card strategy optimizing for EV, and also optimizing for Hyatt points. If maximizing Hyatt points would cost >20% in net value, explicitly recommend the higher-EV path and explain the trade-off.\n\nOutput the full sequenced strategy with exact cards, timing, optimal expected value, maximum potential Hyatt points earned, a recommendation on whether to optimize for the Hyatt or non-Hyatt path, and 2 contingency cards if approvals are denied or score improves slower than expected.",
"knowledge_base_ref": "knowledge_base.md",
"kb_filter": [
"Chase Ink Business Unlimited",
"Chase Ink Business Preferred",
"Chase Ink Business Premier",
"Capital One Venture X",
"Capital One Venture X Business",
"Amex Business Gold",
"Amex Business Platinum",
"Capital One Business Spark 2X Cash",
"Citi Strata",
"Citi Strata Premier",
"BofA Premium Rewards",
"BofA Premium Rewards Elite",
"Chase Sapphire Preferred",
"Chase Freedom Flex",
"American Express Platinum",
"Citi Double Cash",
"Chase World of Hyatt",
"Chase Business World of Hyatt",
"Chase Sapphire Reserve",
"Amex Blue Business Plus"
],
"system_prompt_ref": "system_prompt_template.md"
},
"scoring": {
"dimensions": {
"constraint_compliance": {
"weight": 0.3,
"type": "automated",
"description": "Hard rule checks: velocity limits, eligibility, user constraints",
"checks": {
"velocity_rules": null,
"eligibility_rules": null,
"user_constraints": null,
"expected_cards": [
"Chase Ink Business Unlimited",
"Chase Ink Business Preferred",
"Chase Ink Business Premier",
"Capital One Venture X",
"Capital One Venture X Business",
"Amex Business Gold",
"Amex Business Platinum",
"Capital One Business Spark 2X Cash",
"Citi Strata",
"Citi Strata Premier",
"BofA Premium Rewards",
"BofA Premium Rewards Elite"
],
"expected_housing_option": null,
"key_constraints_flags": [
"low_credit_score",
"debt_payoff_priority",
"credit_rehabilitation",
"hyatt_goal_tradeoff",
"cancel_fee_cards"
]
},
"hard_constraint": false
},
"ev_accuracy": {
"weight": 0.4,
"type": "automated",
"description": "EV calculation accuracy vs. reference solution",
"reference": {
"reference_ev_usd": 12026.0,
"ev_tolerance_pct": 0.05
}
},
"reasoning_quality": {
"weight": 0.2,
"type": "human",
"description": "Quality of tradeoff articulation and strategic reasoning (0-3 scale)",
"rubric": {
"0": "No reasoning or incorrect reasoning",
"1": "Surface-level reasoning, misses key tradeoffs",
"2": "Correct tradeoffs identified with clear justification",
"3": "Expert-level nuance including edge cases and constraint interactions"
},
"score": null
},
"constraint_prioritization": {
"weight": 0.1,
"type": "human",
"description": "Correct handling of ambiguity and conflicting constraints",
"score": null
}
},
"passing_threshold": 0.6,
"hard_constraint_failure_zeroes_dimension": true
},
"reference_solution": {
"_status": "EXPERT_REVIEWED",
"recommended_cards": [
"Chase Ink Business Unlimited",
"Chase Ink Business Preferred",
"Chase Ink Business Premier",
"Capital One Venture X",
"Capital One Venture X Business",
"Amex Business Gold",
"Amex Business Platinum",
"Capital One Business Spark 2X Cash",
"Citi Strata",
"Citi Strata Premier",
"BofA Premium Rewards",
"BofA Premium Rewards Elite"
],
"total_ev_usd": 12026.0,
"ev_breakdown": {
"signup_bonuses_usd": 10046.0,
"ongoing_rewards_usd": 0.0,
"credits_usd": 0.0,
"annual_fees_usd": -1551.5,
"other_usd": 3531.5
},
"housing_option": null,
"key_constraints_flags": [
"low_credit_score",
"debt_payoff_priority",
"credit_rehabilitation",
"hyatt_goal_tradeoff",
"cancel_fee_cards"
],
"expert_notes": "Credit score 600 requires 1 year rehab before good card approvals. Cancel Amex Platinum and CSP to save fees ($1,980 saved). Pay $2k/mo toward $10k debt, ~$531.37 interest accrued. Year 1: all spend on Citi Double Cash (2%). Year 2: apply for cards from bonus list. ~6.5 expected bonuses from $60k yr2 spend. Avg bonus EV $1,803. Hyatt-only path clearly >20% worse than optimal bonus-churn path. Other_usd includes $1,980 fee savings and -$531.37 interest = net positive. Contingency cards if denied: move to next on list across issuers."
}
}