Spaces:

Codex47
/

SmartContractAudit

Running

App Files Files Community

ajaxwin committed on 12 days ago

Commit

45bd962

1 Parent(s): 17ed3a7

fix: Update file paths and ensure model loading in PropertyRetriever

Browse files

Files changed (5) hide show

README.md +1 -1
server/app.py +3 -3
server/index.html +3 -7
server/tasks/task2/actions.py +2 -1
utils/propertyretriever.py +14 -5

README.md CHANGED Viewed

@@ -297,7 +297,7 @@ curl http://localhost:7860/health
 ```bash
 pip install -r requirements.txt
-uvicorn api.app:app --host 0.0.0.0 --port 7860 --reload
 ```
 ### Validate OpenEnv Compliance

 ```bash
 pip install -r requirements.txt
+uvicorn server.app:app --host 0.0.0.0 --port 7860 --reload
 ```
 ### Validate OpenEnv Compliance

server/app.py CHANGED Viewed

@@ -17,7 +17,7 @@ If omitted, "default" is used (fine for sequential single-agent runs).
 """
 from typing import Dict, Optional, Union
-from zipfile import Path
 from fastapi import FastAPI, HTTPException, Query, Request
 from fastapi.responses import FileResponse, JSONResponse
@@ -117,8 +117,8 @@ def root(request: Request):
     - API clients (Accept: */*)     → JSON summary
     """
     accept = request.headers.get("accept", "")
-    if "text/html" in accept and Path("./index.html").is_file():
-        return FileResponse("./index.html", media_type="text/html", status_code=200)
     return JSONResponse(content=_ROOT_JSON, status_code=200)
 @app.get("/health")

 """
 from typing import Dict, Optional, Union
+from pathlib import Path
 from fastapi import FastAPI, HTTPException, Query, Request
 from fastapi.responses import FileResponse, JSONResponse
     - API clients (Accept: */*)     → JSON summary
     """
     accept = request.headers.get("accept", "")
+    if "text/html" in accept and Path("server/index.html").is_file():
+        return FileResponse("server/index.html", media_type="text/html", status_code=200)
     return JSONResponse(content=_ROOT_JSON, status_code=200)
 @app.get("/health")

server/index.html CHANGED Viewed

@@ -1,9 +1,4 @@
-# ─────────────────────────────────────────────────────────────────────────────
-# Landing page HTML
-# ─────────────────────────────────────────────────────────────────────────────
-LANDING_HTML = """<!DOCTYPE html>
 <html lang="en">
 <head>
   <meta charset="UTF-8" />
@@ -11,6 +6,7 @@ LANDING_HTML = """<!DOCTYPE html>
   <title>SC Audit RL Environment</title>
   <link rel="preconnect" href="https://fonts.googleapis.com" />
   <link href="https://fonts.googleapis.com/css2?family=Space+Mono:wght@400;700&family=DM+Sans:wght@300;400;500&display=swap" rel="stylesheet" />
   <style>
     *, *::before, *::after { box-sizing: border-box; margin: 0; padding: 0; }
@@ -705,4 +701,4 @@ LANDING_HTML = """<!DOCTYPE html>
   }
 </script>
 </body>
-</html>"""

+<!DOCTYPE html>
 <html lang="en">
 <head>
   <meta charset="UTF-8" />
   <title>SC Audit RL Environment</title>
   <link rel="preconnect" href="https://fonts.googleapis.com" />
   <link href="https://fonts.googleapis.com/css2?family=Space+Mono:wght@400;700&family=DM+Sans:wght@300;400;500&display=swap" rel="stylesheet" />
+  <link rel="icon" type="image/svg+xml" href="data:image/svg+xml,%3Csvg xmlns='http://www.w3.org/2000/svg' viewBox='0 0 24 24'%3E%3Cpath d='M12 2L4.5 5.5V10.5C4.5 15.14 7.7 19.46 12 20.5C16.3 19.46 19.5 15.14 19.5 10.5V5.5L12 2Z' fill='none' stroke='%2300ff88' stroke-width='2'/%3E%3Crect x='10.5' y='9.5' width='3' height='3' rx='0.5' fill='%2300ff88'/%3E%3C/svg%3E">
   <style>
     *, *::before, *::after { box-sizing: border-box; margin: 0; padding: 0; }
   }
 </script>
 </body>
+</html>

server/tasks/task2/actions.py CHANGED Viewed

@@ -93,7 +93,8 @@ def get_similar_rule_action(ctx: Any, qkey: str, params: Dict) -> Tuple[str, Rew
     """Handle GET_SIMILAR_RULE action."""
     if ctx._is_repeated(qkey):
         return "Repeated query.", Reward(value=-0.40, reason="Repeated query")
     similar_rule = PropertyRetrieverInstance.get_similar_property(ctx._target_fn["code"])
     if similar_rule is None:
         return (

     """Handle GET_SIMILAR_RULE action."""
     if ctx._is_repeated(qkey):
         return "Repeated query.", Reward(value=-0.40, reason="Repeated query")
+    PropertyRetrieverInstance.load_model()  # Ensure model is loaded before querying
     similar_rule = PropertyRetrieverInstance.get_similar_property(ctx._target_fn["code"])
     if similar_rule is None:
         return (

utils/propertyretriever.py CHANGED Viewed

@@ -8,9 +8,9 @@ and provides a method to retrieve the most similar property given a new code sni
 import pandas as pd
 import numpy as np
-from sentence_transformers import SentenceTransformer
 from sklearn.preprocessing import normalize
 from data.data_loader import DEFAULT_CSV_PATH
 SIMILARITY_THRESHOLD = 0.8  # Adjust as needed based on validation
@@ -30,9 +30,17 @@ class PropertyRetriever:
         """
         self.df = pd.read_csv(DEFAULT_CSV_PATH)
         self.threshold = SIMILARITY_THRESHOLD
-        # Use a lightweight, open‑source embedding model
-        self.embedder = SentenceTransformer('all-MiniLM-L6-v2')
         # Extract "critical code" from each property (use FunctionBodies)
         # Fallback to RelatedFunctions or RuleContent if FunctionBodies is missing
@@ -47,9 +55,10 @@ class PropertyRetriever:
             self.critical_codes.append(str(code))
         # Compute embeddings for all critical codes
-        self.embeddings = self.embedder.encode(self.critical_codes, show_progress_bar=True)
         # Normalize for dot product = cosine similarity
         self.embeddings = normalize(self.embeddings, norm='l2')
     def get_similar_property(self, input_code: str) -> str:
         """
@@ -60,7 +69,7 @@ class PropertyRetriever:
             return ""
         # Step ②: Embed the subject code
-        query_emb = self.embedder.encode([input_code])
         query_emb = normalize(query_emb, norm='l2')
         # Step ③: Compute dot products with all database vectors

 import pandas as pd
 import numpy as np
 from sklearn.preprocessing import normalize
 from data.data_loader import DEFAULT_CSV_PATH
+from dotenv import dotenv_values
 SIMILARITY_THRESHOLD = 0.8  # Adjust as needed based on validation
         """
         self.df = pd.read_csv(DEFAULT_CSV_PATH)
         self.threshold = SIMILARITY_THRESHOLD
+        self.embedder = None
+    def load_model(self):
+        """Use a lightweight, open‑source embedding model."""
+        if self.embedder is not None:
+            from sentence_transformers import SentenceTransformer
+            self.embedder = SentenceTransformer(
+                'all-MiniLM-L6-v2',
+                use_auth_token=dotenv_values(".env").get('HF_TOKEN', '')
+            )
         # Extract "critical code" from each property (use FunctionBodies)
         # Fallback to RelatedFunctions or RuleContent if FunctionBodies is missing
             self.critical_codes.append(str(code))
         # Compute embeddings for all critical codes
+        self.embeddings = self.embedder.encode(self.critical_codes, show_progress_bar=True) #type: ignore
         # Normalize for dot product = cosine similarity
         self.embeddings = normalize(self.embeddings, norm='l2')
     def get_similar_property(self, input_code: str) -> str:
         """
             return ""
         # Step ②: Embed the subject code
+        query_emb = self.embedder.encode([input_code]) #type: ignore
         query_emb = normalize(query_emb, norm='l2')
         # Step ③: Compute dot products with all database vectors