Spaces:
Paused
Paused
rb125 commited on
Commit ·
2a83009
1
Parent(s): 6a61d72
fix: override bad AS scores from EECT API, fallback to defaults
Browse files- server/api.py +1 -1
- server/live_runner.py +13 -4
server/api.py
CHANGED
|
@@ -60,7 +60,7 @@ def _run_economy(num_rounds: int, initial_balance: float):
|
|
| 60 |
config = LiveSimConfig(
|
| 61 |
num_rounds=num_rounds,
|
| 62 |
initial_balance=initial_balance,
|
| 63 |
-
run_live_audit=
|
| 64 |
self_verify=True,
|
| 65 |
max_retries=1,
|
| 66 |
test_eth_top_up_threshold=0.05,
|
|
|
|
| 60 |
config = LiveSimConfig(
|
| 61 |
num_rounds=num_rounds,
|
| 62 |
initial_balance=initial_balance,
|
| 63 |
+
run_live_audit=False,
|
| 64 |
self_verify=True,
|
| 65 |
max_retries=1,
|
| 66 |
test_eth_top_up_threshold=0.05,
|
server/live_runner.py
CHANGED
|
@@ -465,6 +465,10 @@ class LiveSimulationRunner:
|
|
| 465 |
# --- Step 2: Framework API scores (fallback) -------------------------
|
| 466 |
pre = self._load_precomputed(model_name, agent_id)
|
| 467 |
if pre is not None:
|
|
|
|
|
|
|
|
|
|
|
|
|
| 468 |
self._audit_quality[model_name] = {
|
| 469 |
"source": "framework_api",
|
| 470 |
"dims_real": ["cc", "er", "as", "ih"],
|
|
@@ -472,11 +476,16 @@ class LiveSimulationRunner:
|
|
| 472 |
}
|
| 473 |
return pre
|
| 474 |
|
| 475 |
-
# --- Step 3: No data available —
|
| 476 |
-
|
| 477 |
-
f"{model_name}: No audit data
|
| 478 |
-
f"Ensure CDCT/DDFT/EECT APIs are running."
|
| 479 |
)
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 480 |
|
| 481 |
def _load_precomputed(
|
| 482 |
self, model_name: str, agent_id: str
|
|
|
|
| 465 |
# --- Step 2: Framework API scores (fallback) -------------------------
|
| 466 |
pre = self._load_precomputed(model_name, agent_id)
|
| 467 |
if pre is not None:
|
| 468 |
+
# If AS from framework API is suspiciously low, override with default
|
| 469 |
+
if pre.as_ < 0.30 and fallback.as_ > pre.as_:
|
| 470 |
+
pre = RobustnessVector(cc=pre.cc, er=pre.er, as_=fallback.as_, ih=pre.ih)
|
| 471 |
+
logger.info(f" {model_name}: AS overridden with default ({fallback.as_:.3f}) — framework API returned < 0.30")
|
| 472 |
self._audit_quality[model_name] = {
|
| 473 |
"source": "framework_api",
|
| 474 |
"dims_real": ["cc", "er", "as", "ih"],
|
|
|
|
| 476 |
}
|
| 477 |
return pre
|
| 478 |
|
| 479 |
+
# --- Step 3: No data available — use DEFAULT_ROBUSTNESS ---------------
|
| 480 |
+
logger.warning(
|
| 481 |
+
f"{model_name}: No audit data from APIs. Using DEFAULT_ROBUSTNESS."
|
|
|
|
| 482 |
)
|
| 483 |
+
self._audit_quality[model_name] = {
|
| 484 |
+
"source": "default",
|
| 485 |
+
"dims_real": [],
|
| 486 |
+
"dims_defaulted": ["cc", "er", "as", "ih"],
|
| 487 |
+
}
|
| 488 |
+
return fallback
|
| 489 |
|
| 490 |
def _load_precomputed(
|
| 491 |
self, model_name: str, agent_id: str
|