Spaces:
Sleeping
Sleeping
| { | |
| "task_id": "hard_03", | |
| "version": "1.0.0", | |
| "created_at": "2026-03-11", | |
| "metadata": { | |
| "domain": "credit_card_optimization", | |
| "difficulty": "hard", | |
| "task_number": 3, | |
| "complexity_hint": { | |
| "max_tokens": 8000, | |
| "expected_output": "complex strategy with contingency plans, stochastic elements, detailed EV" | |
| }, | |
| "requires_human_review": true | |
| }, | |
| "prompt": { | |
| "system": "", | |
| "user": "You are a financial advisor tasked with building the following user\u2019s credit card strategy for the next 2 years to maximize Hyatt points for the honeymoon, but only if that path stays within 20% of the absolute optimal expected net value (factoring in interest savings, fees, and realistic redemptions). Assume all public offers remain constant.\n\nUser profile:\n\n* Credit score: 600 (due to missed payments 6 years ago + $10,000 credit card debt at 50% utilization growing at 20% APR)\n* Monthly spend: $5,000 (split equally dining/groceries/side-hustle expenses/miscellaneous)\n* Rent: $3,000\n* Savings: $2,000 per month available\n* Current cards: Chase Sapphire Preferred (opened 42 months ago), Chase Freedom Flex (opened 8 months ago), Amex Platinum (opened 5 months ago), Citi Double Cash (opened last week)\n* Goal: Maximize transferable Hyatt points earned over the next 24 months for one expensive honeymoon redemption\n\nProvide a precise quarter-by-quarter 24-month roadmap for the user\u2019s credit card strategy optimizing for EV, and also optimizing for Hyatt points. If maximizing Hyatt points would cost more than 20% in net value, explicitly recommend the higher-EV path and explain the trade-off.\n\nOutput the full sequenced strategy with exact cards, timing, optimal expected value, maximum potential Hyatt points earned, a recommendation on whether to optimize for the Hyatt or the non-Hyatt path, and 2 contingency cards if approvals are denied or the score improves more slowly than expected.", | |
| "knowledge_base_ref": "knowledge_base.md", | |
| "kb_filter": [ | |
| "Chase Ink Business Unlimited", | |
| "Chase Ink Business Preferred", | |
| "Chase Ink Business Premier", | |
| "Capital One Venture X", | |
| "Capital One Venture X Business", | |
| "Amex Business Gold", | |
| "Amex Business Platinum", | |
| "Capital One Business Spark 2X Cash", | |
| "Citi Strata", | |
| "Citi Strata Premier", | |
| "BofA Premium Rewards", | |
| "BofA Premium Rewards Elite", | |
| "Chase Sapphire Preferred", | |
| "Chase Freedom Flex", | |
| "American Express Platinum", | |
| "Citi Double Cash", | |
| "Chase World of Hyatt", | |
| "Chase Business World of Hyatt", | |
| "Chase Sapphire Reserve", | |
| "Amex Blue Business Plus" | |
| ], | |
| "system_prompt_ref": "system_prompt_template.md" | |
| }, | |
| "scoring": { | |
| "dimensions": { | |
| "constraint_compliance": { | |
| "weight": 0.3, | |
| "type": "automated", | |
| "description": "Hard rule checks: velocity limits, eligibility, user constraints", | |
| "checks": { | |
| "velocity_rules": null, | |
| "eligibility_rules": null, | |
| "user_constraints": null, | |
| "expected_cards": [ | |
| "Chase Ink Business Unlimited", | |
| "Chase Ink Business Preferred", | |
| "Chase Ink Business Premier", | |
| "Capital One Venture X", | |
| "Capital One Venture X Business", | |
| "Amex Business Gold", | |
| "Amex Business Platinum", | |
| "Capital One Business Spark 2X Cash", | |
| "Citi Strata", | |
| "Citi Strata Premier", | |
| "BofA Premium Rewards", | |
| "BofA Premium Rewards Elite" | |
| ], | |
| "expected_housing_option": null, | |
| "key_constraints_flags": [ | |
| "low_credit_score", | |
| "debt_payoff_priority", | |
| "credit_rehabilitation", | |
| "hyatt_goal_tradeoff", | |
| "cancel_fee_cards" | |
| ] | |
| }, | |
| "hard_constraint": false | |
| }, | |
| "ev_accuracy": { | |
| "weight": 0.4, | |
| "type": "automated", | |
| "description": "EV calculation accuracy vs. reference solution", | |
| "reference": { | |
| "reference_ev_usd": 12026.0, | |
| "ev_tolerance_pct": 0.05 | |
| } | |
| }, | |
| "reasoning_quality": { | |
| "weight": 0.2, | |
| "type": "human", | |
| "description": "Quality of tradeoff articulation and strategic reasoning (0-3 scale)", | |
| "rubric": { | |
| "0": "No reasoning or incorrect reasoning", | |
| "1": "Surface-level reasoning, misses key tradeoffs", | |
| "2": "Correct tradeoffs identified with clear justification", | |
| "3": "Expert-level nuance including edge cases and constraint interactions" | |
| }, | |
| "score": null | |
| }, | |
| "constraint_prioritization": { | |
| "weight": 0.1, | |
| "type": "human", | |
| "description": "Correct handling of ambiguity and conflicting constraints", | |
| "score": null | |
| } | |
| }, | |
| "passing_threshold": 0.6, | |
| "hard_constraint_failure_zeroes_dimension": true | |
| }, | |
| "reference_solution": { | |
| "_status": "EXPERT_REVIEWED", | |
| "recommended_cards": [ | |
| "Chase Ink Business Unlimited", | |
| "Chase Ink Business Preferred", | |
| "Chase Ink Business Premier", | |
| "Capital One Venture X", | |
| "Capital One Venture X Business", | |
| "Amex Business Gold", | |
| "Amex Business Platinum", | |
| "Capital One Business Spark 2X Cash", | |
| "Citi Strata", | |
| "Citi Strata Premier", | |
| "BofA Premium Rewards", | |
| "BofA Premium Rewards Elite" | |
| ], | |
| "total_ev_usd": 12026.0, | |
| "ev_breakdown": { | |
| "signup_bonuses_usd": 10046.0, | |
| "ongoing_rewards_usd": 0.0, | |
| "credits_usd": 0.0, | |
| "annual_fees_usd": -1551.5, | |
| "other_usd": 3531.5 | |
| }, | |
| "housing_option": null, | |
| "key_constraints_flags": [ | |
| "low_credit_score", | |
| "debt_payoff_priority", | |
| "credit_rehabilitation", | |
| "hyatt_goal_tradeoff", | |
| "cancel_fee_cards" | |
| ], | |
| "expert_notes": "A credit score of 600 requires about 1 year of credit rehabilitation before approvals for good cards are likely. Cancel Amex Platinum and Chase Sapphire Preferred (CSP) to save annual fees ($1,980 saved). Pay $2k/mo toward the $10k debt, with ~$531.37 of interest accrued. Year 1: put all spend on Citi Double Cash (2%). Year 2: apply for cards from the bonus list; ~6.5 expected bonuses from $60k of year-2 spend, with an average bonus EV of $1,803. The Hyatt-only path is clearly >20% worse than the optimal bonus-churn path. other_usd includes the $1,980 fee savings and the -$531.37 interest, for a net positive. Contingency cards if denied: move to the next card on the list, across issuers." | |
| } | |
| } | |