agent-cost-optimizer / eval /ablation_results.json
narcolepticchicken's picture
Upload eval/ablation_results.json with huggingface_hub
946830d verified
{
"full_v10": {
"success": 0.718,
"avg_cost": 0.016932746258400005,
"costRed": 94.65337977316072
},
"no_feedback": {
"success": 0.632,
"avg_cost": 0.014239461958399993,
"costRed": 95.50380108670666
},
"no_cascade": {
"success": 0.632,
"avg_cost": 0.014239461958399993,
"costRed": 95.50380108670666
},
"heuristic": {
"success": 0.57,
"avg_cost": 0.04103160790880004,
"costRed": 87.04401392207134
},
"always_frontier": {
"success": 0.782,
"avg_cost": 0.3166872804999999,
"costRed": 0.004016261446193603
},
"always_cheap": {
"success": 0.632,
"avg_cost": 0.014239461958399993,
"costRed": 95.50380108670666
}
}