Sazzz02 committed on
Commit
69f23de
·
verified ·
1 Parent(s): 80a7c7d

Update app.py

Browse files
Files changed (1) hide show
  1. app.py +3 -10
app.py CHANGED
@@ -3,7 +3,7 @@ import os
3
  import PyPDF2
4
  import docx
5
  from langchain.text_splitter import RecursiveCharacterTextSplitter
6
- from langchain_cohere import CohereEmbeddings
7
  from langchain_community.vectorstores import Chroma
8
  from groq import Groq
9
  from langchain_core.prompts import PromptTemplate
@@ -18,15 +18,8 @@ from datetime import datetime
18
 
19
  class DocumentProcessor:
20
  def __init__(self):
21
- # Using CohereEmbeddings for document processing.
22
- # Ensure 'COHERE_API_KEY' and 'GROQ_API_KEY' are set as secrets in Hugging Face.
23
- if "COHERE_API_KEY" not in os.environ:
24
- st.error("Cohere API key is required for document processing.")
25
- st.stop()
26
- self.embeddings = CohereEmbeddings(
27
- cohere_api_key=os.environ["COHERE_API_KEY"],
28
- model="embed-english-v3.0" # Specify the Cohere embedding model
29
- )
30
  self.text_splitter = RecursiveCharacterTextSplitter(
31
  chunk_size=1000,
32
  chunk_overlap=200
 
3
  import PyPDF2
4
  import docx
5
  from langchain.text_splitter import RecursiveCharacterTextSplitter
6
+ from langchain_community.embeddings import HuggingFaceEmbeddings # Use HuggingFaceEmbeddings
7
  from langchain_community.vectorstores import Chroma
8
  from groq import Groq
9
  from langchain_core.prompts import PromptTemplate
 
18
 
19
  class DocumentProcessor:
20
  def __init__(self):
21
+ # Use a free Hugging Face model for embeddings
22
+ self.embeddings = HuggingFaceEmbeddings(model_name="sentence-transformers/all-MiniLM-L6-v2")
 
 
 
 
 
 
 
23
  self.text_splitter = RecursiveCharacterTextSplitter(
24
  chunk_size=1000,
25
  chunk_overlap=200