Spaces:
Sleeping
Sleeping
| { | |
| "task_id": "objective_hard_01", | |
| "version": "2.0.0", | |
| "created_at": "2026-03-12", | |
| "metadata": { | |
| "domain": "credit_card_optimization", | |
| "difficulty": "hard", | |
| "task_number": 1, | |
| "complexity_hint": { | |
| "max_tokens": 8000, | |
| "expected_output": "5-card portfolio with sequencing, constraint analysis, and full EV breakdown over 24 months" | |
| }, | |
| "requires_human_review": false | |
| }, | |
| "prompt": { | |
| "system": "", | |
| "user": "You are a financial advisor. Build an optimal 5-card credit card portfolio for this user over a 24-month horizon. This user is sophisticated and wants to maximize total expected value.\n\nUser profile:\n- Monthly spending: $1200 dining, $800 groceries, $400 travel, $600 flights (books direct), $500 hotels (books direct), $250 gas, $80 streaming, $200 transit, $100 office supplies, $150 shipping, $1500 everything else\n- Takes 20 trips per year (frequent business traveler, highly values lounge access at $30/visit)\n- Uses Uber ($200/yr Uber Cash easily), Instacart, DoorDash\n- Uses streaming services heavily\n- Dines at Resy restaurants 2x/week\n- Has Global Entry, uses CLEAR\n- Currently holds: Chase Freedom Flex (opened 6 months ago). That's it — 1/24.\n- Time horizon: 24 months\n- Willing to pay high annual fees if math works out\n- Has a business (can apply for business cards)\n- Monthly rent: $2,500 (currently pays by check)\n\nConstraints:\n- Must stay under 5/24 for Chase cards\n- Must respect Amex card sequences (Platinum before Gold)\n- Provide card application ordering/timing\n- Calculate EV for the full portfolio including all signup bonuses, ongoing rewards, credits, perks, and fees\n\nRecommend exactly 5 cards with application order and detailed per-card EV.", | |
| "knowledge_base_ref": "knowledge_base.md", | |
| "kb_filter": [ | |
| "American Express Platinum", | |
| "American Express Gold", | |
| "Amex Business Platinum", | |
| "Amex Business Gold", | |
| "Amex Blue Business Plus", | |
| "Chase Sapphire Reserve", | |
| "Chase Sapphire Preferred", | |
| "Chase Ink Business Preferred", | |
| "Chase Freedom Unlimited", | |
| "Capital One Venture X", | |
| "Bilt Palladium", | |
| "Bilt Obsidian", | |
| "Bilt Blue", | |
| "Citi Strata Elite", | |
| "Citi Strata Premier" | |
| ], | |
| "system_prompt_ref": "system_prompt_template.md" | |
| }, | |
| "scoring": { | |
| "dimensions": { | |
| "card_selection": { | |
| "weight": 0.25, | |
| "type": "automated", | |
| "description": "F1 of recommended cards vs. computed optimal set", | |
| "checks": { | |
| "expected_cards": [ | |
| "American Express Platinum", | |
| "American Express Gold", | |
| "Amex Business Platinum", | |
| "Chase Sapphire Reserve", | |
| "Bilt Palladium" | |
| ] | |
| }, | |
| "hard_constraint": false | |
| }, | |
| "ev_accuracy": { | |
| "weight": 0.30, | |
| "type": "automated", | |
| "description": "EV accuracy vs. computed ground truth", | |
| "reference": { | |
| "user_profile": { | |
| "monthly_spend": { | |
| "dining": 1200, | |
| "groceries": 800, | |
| "travel": 400, | |
| "flights": 600, | |
| "hotels": 500, | |
| "gas": 250, | |
| "streaming": 80, | |
| "transit": 200, | |
| "office_supply": 100, | |
| "shipping": 150, | |
| "everything_else": 1500 | |
| }, | |
| "lounge_visits_per_year": 20, | |
| "delta_flights_per_year": 0, | |
| "united_flights_per_year": 0, | |
| "uses_uber": true, | |
| "uses_instacart": true, | |
| "uses_doordash": true, | |
| "uses_streaming": true, | |
| "uses_resy_restaurants": true, | |
| "uses_rideshare": true, | |
| "uses_clear": true, | |
| "has_global_entry": true, | |
| "monthly_rent": 2500, | |
| "pays_housing_with_bilt": true, | |
| "time_horizon_months": 24, | |
| "existing_cards": ["Chase Freedom Flex"], | |
| "cards_opened_last_24_months": 1 | |
| }, | |
| "expected_card_ids": [ | |
| "american_express_platinum", | |
| "american_express_gold", | |
| "amex_business_platinum", | |
| "chase_sapphire_reserve", | |
| "bilt_palladium" | |
| ], | |
| "ev_tolerance_pct": 0.10 | |
| } | |
| }, | |
| "factual_fidelity": { | |
| "weight": 0.30, | |
| "type": "automated", | |
| "description": "Accuracy of factual claims about cards", | |
| "reference": { | |
| "extracted_claims": null, | |
| "reference_ev_usd": null | |
| } | |
| }, | |
| "constraint_compliance": { | |
| "weight": 0.15, | |
| "type": "automated", | |
| "description": "Respects 5/24, Amex sequences, 5-card limit, timing", | |
| "checks": { | |
| "expected_cards": [ | |
| "American Express Platinum", | |
| "American Express Gold", | |
| "Amex Business Platinum", | |
| "Chase Sapphire Reserve", | |
| "Bilt Palladium" | |
| ], | |
| "expected_housing_option": null | |
| }, | |
| "hard_constraint": false | |
| } | |
| }, | |
| "passing_threshold": 0.5, | |
| "hard_constraint_failure_zeroes_dimension": false | |
| }, | |
| "reference_solution": { | |
| "_status": "COMPUTED", | |
| "recommended_cards": [ | |
| "American Express Platinum", | |
| "American Express Gold", | |
| "Amex Business Platinum", | |
| "Chase Sapphire Reserve", | |
| "Bilt Palladium" | |
| ], | |
| "total_ev_usd": null, | |
| "ev_breakdown": null, | |
| "housing_option": null, | |
| "key_constraints_flags": [ | |
| "5_24_rule", | |
| "amex_card_sequence", | |
| "5_card_limit", | |
| "business_cards", | |
| "housing_optimization" | |
| ], | |
| "expert_notes": "Ground truth EV computed from card_database.json + solver. Optimal 5-card set: Amex Plat (SUB $3500 + lounge + credits), Amex Gold (4x dining/groceries), Amex Biz Plat (SUB $4000 + credits), CSR (SUB $2562 + hotels at 3x UR), Bilt Palladium (1x on $2500/mo rent + 2x catch-all at 2.2cpp + Priority Pass). Total portfolio EV ~$23,451 over 24 months." | |
| } | |
| } | |