gaurv007 commited on
Commit
21788a8
·
verified ·
1 Parent(s): 2035652

v4.3 perf: Update chatbot.py

Browse files
Files changed (1) hide show
  1. chatbot.py +9 -5
chatbot.py CHANGED
@@ -52,7 +52,9 @@ except ImportError:
52
  _chatbot_status = {"embedder": "not_loaded", "llm": "not_loaded"}
53
 
54
  def _load_embedder():
55
- """Load sentence-transformers embedding model (lazy)."""
 
 
56
  global _embedder, _chatbot_status
57
  if _embedder is not None:
58
  return _embedder
@@ -60,10 +62,10 @@ def _load_embedder():
60
  _chatbot_status["embedder"] = "unavailable"
61
  return None
62
  try:
63
- print("[ClauseGuard Chat] Loading embedding model: all-MiniLM-L6-v2...")
64
- _embedder = SentenceTransformer("sentence-transformers/all-MiniLM-L6-v2")
65
  _chatbot_status["embedder"] = "loaded"
66
- print("[ClauseGuard Chat] Embedding model loaded")
67
  return _embedder
68
  except Exception as e:
69
  _chatbot_status["embedder"] = f"failed: {e}"
@@ -194,7 +196,9 @@ def retrieve_chunks(query, chunks, embeddings, top_k=5):
194
  return []
195
 
196
  try:
197
- q_emb = embedder.encode([query], normalize_embeddings=True)
 
 
198
  scores = (q_emb @ embeddings.T)[0]
199
  top_indices = np.argsort(scores)[::-1][:top_k]
200
 
 
52
  _chatbot_status = {"embedder": "not_loaded", "llm": "not_loaded"}
53
 
54
  def _load_embedder():
55
+ """Load sentence-transformers embedding model (lazy).
56
+ PERF v4.3: Upgraded from all-MiniLM-L6-v2 to BAAI/bge-small-en-v1.5
57
+ (+21% MTEB retrieval accuracy, same 384-dim, same latency)."""
58
  global _embedder, _chatbot_status
59
  if _embedder is not None:
60
  return _embedder
 
62
  _chatbot_status["embedder"] = "unavailable"
63
  return None
64
  try:
65
+ print("[ClauseGuard Chat] Loading embedding model: BAAI/bge-small-en-v1.5...")
66
+ _embedder = SentenceTransformer("BAAI/bge-small-en-v1.5")
67
  _chatbot_status["embedder"] = "loaded"
68
+ print("[ClauseGuard Chat] Embedding model loaded (BGE-small, 384-dim)")
69
  return _embedder
70
  except Exception as e:
71
  _chatbot_status["embedder"] = f"failed: {e}"
 
196
  return []
197
 
198
  try:
199
+ # PERF v4.3: BGE models require query instruction prefix for retrieval
200
+ _BGE_QUERY_PREFIX = "Represent this sentence for searching relevant passages: "
201
+ q_emb = embedder.encode([_BGE_QUERY_PREFIX + query], normalize_embeddings=True)
202
  scores = (q_emb @ embeddings.T)[0]
203
  top_indices = np.argsort(scores)[::-1][:top_k]
204