Spaces:

krishuggingface
/

CyberAttack-PLL

Sleeping

App Files Files Community

krishuggingface committed 12 days ago

Commit

4c2a495

1 Parent(s): 82e7138

Restore 500 steps, LLM every step with circuit breaker, use requests.Session for speed

Browse files

Files changed (3) hide show

inference.py +18 -10
openenv.yaml +4 -4
src/env.py +1 -1

inference.py CHANGED Viewed

@@ -32,6 +32,9 @@ ENV_URL      = os.environ.get("ENV_URL",      "http://localhost:7860")
 # OpenAI client pointed at the proxy — never bypass this
 client = OpenAI(base_url=API_BASE_URL, api_key=API_KEY)
 # ── Task metadata ─────────────────────────────────────────────────────────────
 TASK_NAMES = {
     0: "Sinusoidal FDI Detection (Easy)",
@@ -295,11 +298,19 @@ def format_observation(obs: dict) -> str:
         f"raw_voltages: {[round(v, 6) for v in obs['raw_voltages']]}",
     ])
 def llm_agent(obs: dict) -> dict:
     """Primary agent — calls the LLM through the injected proxy.
     Falls back to heuristic only if the API call itself raises an exception.
     """
     try:
         completion = client.chat.completions.create(
             model=MODEL_NAME,
@@ -313,7 +324,8 @@ def llm_agent(obs: dict) -> dict:
         )
         return parse_llm_response(completion.choices[0].message.content or "")
     except Exception as e:
-        print(f"[DEBUG] LLM error ({type(e).__name__}: {e}), falling back to heuristic", file=sys.stderr, flush=True)
         return heuristic_agent(obs)
 # ── Episode runner ────────────────────────────────────────────────────────────
@@ -333,7 +345,7 @@ def run_episode(task_id: int) -> float:
     success      = False
     try:
-        reset_resp = requests.post(
             f"{ENV_URL}/reset",
             json={"task_id": task_id},
             timeout=60,
@@ -346,14 +358,10 @@ def run_episode(task_id: int) -> float:
         info         = {}
         while not done:
-            # Frame skipping: only invoke the LLM every 10 steps to prevent 30-min evaluation timeouts.
-            # Step skips use the heuristics to keep episode run-time blazing fast.
-            if step_count % 10 == 0:
-                action = llm_agent(obs)
-            else:
-                action = heuristic_agent(obs)
-            step_resp = requests.post(
                 f"{ENV_URL}/step",
                 json=action,
                 timeout=60,
@@ -404,7 +412,7 @@ def wait_for_server(env_url: str, timeout: int = 60) -> bool:
     start_t = time.time()
     while time.time() - start_t < timeout:
         try:
-            resp = requests.get(f"{env_url}/health", timeout=2)
             if resp.status_code == 200:
                 print("[DEBUG] Environment server is up!", file=sys.stderr, flush=True)
                 return True

 # OpenAI client pointed at the proxy — never bypass this
 client = OpenAI(base_url=API_BASE_URL, api_key=API_KEY)
+# Persistent HTTP session for env calls — avoids TCP handshake per step
+_session = requests.Session()
 # ── Task metadata ─────────────────────────────────────────────────────────────
 TASK_NAMES = {
     0: "Sinusoidal FDI Detection (Easy)",
         f"raw_voltages: {[round(v, 6) for v in obs['raw_voltages']]}",
     ])
+_llm_disabled = False  # circuit breaker — flips True after first LLM failure
 def llm_agent(obs: dict) -> dict:
     """Primary agent — calls the LLM through the injected proxy.
     Falls back to heuristic only if the API call itself raises an exception.
+    Uses a circuit breaker: after the first failure, all future calls skip the
+    network request and go straight to heuristic (restoring ~10s runtime).
     """
+    global _llm_disabled
+    if _llm_disabled:
+        return heuristic_agent(obs)
     try:
         completion = client.chat.completions.create(
             model=MODEL_NAME,
         )
         return parse_llm_response(completion.choices[0].message.content or "")
     except Exception as e:
+        print(f"[DEBUG] LLM error ({type(e).__name__}: {e}), disabling LLM for remaining steps", file=sys.stderr, flush=True)
+        _llm_disabled = True
         return heuristic_agent(obs)
 # ── Episode runner ────────────────────────────────────────────────────────────
     success      = False
     try:
+        reset_resp = _session.post(
             f"{ENV_URL}/reset",
             json={"task_id": task_id},
             timeout=60,
         info         = {}
         while not done:
+            # LLM is primary; circuit breaker auto-disables after first failure
+            action = llm_agent(obs)
+            step_resp = _session.post(
                 f"{ENV_URL}/step",
                 json=action,
                 timeout=60,
     start_t = time.time()
     while time.time() - start_t < timeout:
         try:
+            resp = _session.get(f"{env_url}/health", timeout=2)
             if resp.status_code == 200:
                 print("[DEBUG] Environment server is up!", file=sys.stderr, flush=True)
                 return True

openenv.yaml CHANGED Viewed

@@ -46,20 +46,20 @@ tasks:
     numeric_id: 0
     grader: time_to_detection
     max_score: 1.0
-    episode_length: 250
     description: Detect sinusoidal FDI attack within 100 steps of attack start
   - id: multi_attack_classification
     difficulty: medium
     numeric_id: 1
     grader: classification_accuracy
     max_score: 1.0
-    episode_length: 250
     description: Classify attack type from observation window
   - id: stealthy_attack_detection
     difficulty: hard
     numeric_id: 2
     grader: pre_lock_loss_detection
     max_score: 1.0
-    episode_length: 250
     description: Detect stealthy low-amplitude attack before PLL loss-of-lock
-episode_length: 250

     numeric_id: 0
     grader: time_to_detection
     max_score: 1.0
+    episode_length: 500
     description: Detect sinusoidal FDI attack within 100 steps of attack start
   - id: multi_attack_classification
     difficulty: medium
     numeric_id: 1
     grader: classification_accuracy
     max_score: 1.0
+    episode_length: 500
     description: Classify attack type from observation window
   - id: stealthy_attack_detection
     difficulty: hard
     numeric_id: 2
     grader: pre_lock_loss_detection
     max_score: 1.0
+    episode_length: 500
     description: Detect stealthy low-amplitude attack before PLL loss-of-lock
+episode_length: 500

src/env.py CHANGED Viewed

@@ -27,7 +27,7 @@ from src.detector import AdaptiveDetector
 WINDOW_SIZE = 20
-MAX_STEPS = 250
 LOCK_LOSS_THRESHOLD = 0.0873  # 5 degrees in radians
 DETECTION_THRESHOLD = 2.0

 WINDOW_SIZE = 20
+MAX_STEPS = 500
 LOCK_LOSS_THRESHOLD = 0.0873  # 5 degrees in radians
 DETECTION_THRESHOLD = 2.0