{
"task_id": "hard_01",
"version": "1.0.0",
"created_at": "2026-03-11",
"metadata": {
"domain": "credit_card_optimization",
"difficulty": "hard",
"task_number": 1,
"complexity_hint": {
"max_tokens": 8000,
"expected_output": "complex strategy with contingency plans, stochastic elements, detailed EV"
},
"requires_human_review": true
},
"prompt": {
"system": "",
"user": "You are a financial advisor tasked with building the following user\u2019s credit card strategy for the next 2 years.\n\nUser profile:\n\n* Age 29, income $92k (gig + buying group/manufactured spend side hustle), excellent credit\n* Monthly spending: $18,000 manufactured (1/3 each in gift cards, buying groups, eBay flips) + $2,200 personal monthly expenses.\n* Must stay under every issuer\u2019s velocity radar for manufactured spend to avoid risk of account shutdown (Chase < $8k/mo, Amex < $15k/mo, Citi strict)\n* Already has 11 cards opened in 22 months (all major personal Amex cards)\n* Prefers zero new annual fees and high sign-up bonuses, since he won\u2019t have to close those cards, yet he earns the most from high sign-up bonuses\n* Will only add an annual fee if it\u2019s a \u201ckeeper card\u201d or has an EV of over $500 net of the annual fee in year 1 of card membership\n\nWhat should the user\u2019s credit card strategy be over the next 2 years given their entire situation in order to optimize EV without compromising on their concerns or constraints? Include a detailed expected value calculation for that strategy.",
"knowledge_base_ref": "knowledge_base.md",
"kb_filter": [
"Chase Ink Business Unlimited",
"Chase Ink Business Preferred",
"Chase Ink Business Premier",
"Capital One Venture X",
"Capital One Venture X Business",
"Amex Business Gold",
"Amex Business Platinum",
"Capital One Business Spark 2X Cash",
"Citi Strata",
"Citi Strata Premier",
"BofA Premium Rewards",
"BofA Premium Rewards Elite",
"Amex Blue Business Plus",
"Amex Blue Business Cash",
"Chase Business Sapphire Reserve",
"Capital One Business Spark 2X Miles",
"Citi Strata Elite",
"Citi Business AAdvantage"
],
"system_prompt_ref": "system_prompt_template.md"
},
"scoring": {
"dimensions": {
"constraint_compliance": {
"weight": 0.3,
"type": "automated",
"description": "Hard rule checks: velocity limits, eligibility, user constraints",
"checks": {
"velocity_rules": null,
"eligibility_rules": null,
"user_constraints": null,
"expected_cards": [
"Chase Ink Business Unlimited",
"Chase Ink Business Preferred",
"Chase Ink Business Premier",
"Capital One Venture X",
"Capital One Venture X Business",
"Amex Business Gold",
"Amex Business Platinum",
"Capital One Business Spark 2X Cash",
"Citi Strata",
"Citi Strata Premier",
"BofA Premium Rewards",
"BofA Premium Rewards Elite"
],
"expected_housing_option": null,
"key_constraints_flags": [
"manufactured_spend",
"velocity_limits",
"11_existing_cards",
"no_new_annual_fees_preference",
"business_cards_only"
]
},
"hard_constraint": false
},
"ev_accuracy": {
"weight": 0.4,
"type": "automated",
"description": "EV calculation accuracy vs. reference solution",
"reference": {
"reference_ev_usd": 24291.0,
"ev_tolerance_pct": 0.05
}
},
"reasoning_quality": {
"weight": 0.2,
"type": "human",
"description": "Quality of tradeoff articulation and strategic reasoning (0-3 scale)",
"rubric": {
"0": "No reasoning or incorrect reasoning",
"1": "Surface-level reasoning, misses key tradeoffs",
"2": "Correct tradeoffs identified with clear justification",
"3": "Expert-level nuance including edge cases and constraint interactions"
},
"score": null
},
"constraint_prioritization": {
"weight": 0.1,
"type": "human",
"description": "Correct handling of ambiguity and conflicting constraints",
"score": null
}
},
"passing_threshold": 0.6,
"hard_constraint_failure_zeroes_dimension": true
},
"reference_solution": {
"_status": "EXPERT_REVIEWED",
"recommended_cards": [
"Chase Ink Business Unlimited",
"Chase Ink Business Preferred",
"Chase Ink Business Premier",
"Capital One Venture X",
"Capital One Venture X Business",
"Amex Business Gold",
"Amex Business Platinum",
"Capital One Business Spark 2X Cash",
"Citi Strata",
"Citi Strata Premier",
"BofA Premium Rewards",
"BofA Premium Rewards Elite"
],
"total_ev_usd": 24291.0,
"ev_breakdown": {
"signup_bonuses_usd": 24940.0,
"ongoing_rewards_usd": 4276.0,
"credits_usd": 0.0,
"annual_fees_usd": -5325.0,
"other_usd": 400.0
},
"housing_option": null,
"key_constraints_flags": [
"manufactured_spend",
"velocity_limits",
"11_existing_cards",
"no_new_annual_fees_preference",
"business_cards_only"
],
"expert_notes": "Similar to medium_03 but with manufactured spend constraints. $18k MS + $2.2k personal = $20.2k/mo, $484.8k over 2 years. Chase <$8k/mo, Amex <$15k/mo limits respected. Already has all personal Amex cards \u2192 business cards only for Amex. Venture X for remaining spend after bonuses ($213.8k * 2x = 427.6k miles, valued at 1.0cpp = $4,276). Gross value $29,616 (sign-up bonuses $24,940 + ongoing rewards $4,276 + other $400) minus fees $5,325 = $24,291."
}
}