feat(rag): add fastembed/faiss-cpu/pypdf for retrieval layer
Browse files
- .gitignore +7 -0
- requirements.txt +5 -0
.gitignore
CHANGED
|
@@ -34,3 +34,10 @@ mlartifacts/
|
|
| 34 |
.idea/
|
| 35 |
.vscode/
|
| 36 |
.DS_Store
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 34 |
.idea/
|
| 35 |
.vscode/
|
| 36 |
.DS_Store
|
| 37 |
+
|
| 38 |
+
# RAG knowledge base (user-supplied PDFs/MD; not source-controlled)
|
| 39 |
+
data/knowledge_base/*.pdf
|
| 40 |
+
data/knowledge_base/*.PDF
|
| 41 |
+
|
| 42 |
+
# RAG built artifacts
|
| 43 |
+
data/processed/faiss_index/
|
requirements.txt
CHANGED
|
@@ -37,6 +37,11 @@ pytest==8.3.3
|
|
| 37 |
pytest-cov==5.0.0
|
| 38 |
httpx==0.27.2 # FastAPI test client
|
| 39 |
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 40 |
# --- Frontend (B2B dashboard) ---
|
| 41 |
streamlit==1.39.0
|
| 42 |
|
|
|
|
| 37 |
pytest-cov==5.0.0
|
| 38 |
httpx==0.27.2 # FastAPI test client
|
| 39 |
|
| 40 |
+
# --- RAG (knowledge retrieval for agent feedback loop) ---
|
| 41 |
+
fastembed==0.4.2 # ONNX-based embeddings, no torch dep
|
| 42 |
+
faiss-cpu==1.8.0 # vector store
|
| 43 |
+
pypdf==5.0.1 # PDF text extraction
|
| 44 |
+
|
| 45 |
# --- Frontend (B2B dashboard) ---
|
| 46 |
streamlit==1.39.0
|
| 47 |
|