Spaces:
Sleeping
Sleeping
v4.3 perf: Update chatbot.py
Browse files- chatbot.py +9 -5
chatbot.py
CHANGED
|
@@ -52,7 +52,9 @@ except ImportError:
|
|
| 52 |
_chatbot_status = {"embedder": "not_loaded", "llm": "not_loaded"}
|
| 53 |
|
| 54 |
def _load_embedder():
|
| 55 |
-
"""Load sentence-transformers embedding model (lazy)."""
|
|
|
|
|
|
|
| 56 |
global _embedder, _chatbot_status
|
| 57 |
if _embedder is not None:
|
| 58 |
return _embedder
|
|
@@ -60,10 +62,10 @@ def _load_embedder():
|
|
| 60 |
_chatbot_status["embedder"] = "unavailable"
|
| 61 |
return None
|
| 62 |
try:
|
| 63 |
-
print("[ClauseGuard Chat] Loading embedding model: all-MiniLM-L6-v2...")
|
| 64 |
-
_embedder = SentenceTransformer("all-MiniLM-L6-v2")
|
| 65 |
_chatbot_status["embedder"] = "loaded"
|
| 66 |
-
print("[ClauseGuard Chat] Embedding model loaded")
|
| 67 |
return _embedder
|
| 68 |
except Exception as e:
|
| 69 |
_chatbot_status["embedder"] = f"failed: {e}"
|
|
@@ -194,7 +196,9 @@ def retrieve_chunks(query, chunks, embeddings, top_k=5):
|
|
| 194 |
return []
|
| 195 |
|
| 196 |
try:
|
| 197 |
-
|
|
|
|
|
|
|
| 198 |
scores = (q_emb @ embeddings.T)[0]
|
| 199 |
top_indices = np.argsort(scores)[::-1][:top_k]
|
| 200 |
|
|
|
|
| 52 |
_chatbot_status = {"embedder": "not_loaded", "llm": "not_loaded"}
|
| 53 |
|
| 54 |
def _load_embedder():
|
| 55 |
+
"""Load sentence-transformers embedding model (lazy).
|
| 56 |
+
PERF v4.3: Upgraded from all-MiniLM-L6-v2 to BAAI/bge-small-en-v1.5
|
| 57 |
+
(+21% MTEB retrieval accuracy, same 384-dim, same latency)."""
|
| 58 |
global _embedder, _chatbot_status
|
| 59 |
if _embedder is not None:
|
| 60 |
return _embedder
|
|
|
|
| 62 |
_chatbot_status["embedder"] = "unavailable"
|
| 63 |
return None
|
| 64 |
try:
|
| 65 |
+
print("[ClauseGuard Chat] Loading embedding model: BAAI/bge-small-en-v1.5...")
|
| 66 |
+
_embedder = SentenceTransformer("BAAI/bge-small-en-v1.5")
|
| 67 |
_chatbot_status["embedder"] = "loaded"
|
| 68 |
+
print("[ClauseGuard Chat] Embedding model loaded (BGE-small, 384-dim)")
|
| 69 |
return _embedder
|
| 70 |
except Exception as e:
|
| 71 |
_chatbot_status["embedder"] = f"failed: {e}"
|
|
|
|
| 196 |
return []
|
| 197 |
|
| 198 |
try:
|
| 199 |
+
# PERF v4.3: BGE models require query instruction prefix for retrieval
|
| 200 |
+
_BGE_QUERY_PREFIX = "Represent this sentence for searching relevant passages: "
|
| 201 |
+
q_emb = embedder.encode([_BGE_QUERY_PREFIX + query], normalize_embeddings=True)
|
| 202 |
scores = (q_emb @ embeddings.T)[0]
|
| 203 |
top_indices = np.argsort(scores)[::-1][:top_k]
|
| 204 |
|