Spaces:

httpdaniel
/

TalkToDocuments

Sleeping

App Files Files Community

httpdaniel committed on Aug 27, 2024

Commit

90231c1

1 Parent(s): 3a8a9b9

Updating UI

Browse files

Files changed (1) hide show

app.py +22 -58

app.py CHANGED Viewed

@@ -8,7 +8,7 @@ from langchain_core.prompts import ChatPromptTemplate
 from langchain.chains.combine_documents import create_stuff_documents_chain
 from langchain.chains import create_retrieval_chain
-def initialise_vectorstore(pdf, progress=gr.Progress()):
     progress(0, desc="Reading PDF")
     loader = PyPDFLoader(pdf.name)
@@ -16,27 +16,21 @@ def initialise_vectorstore(pdf, progress=gr.Progress()):
     text_splitter = RecursiveCharacterTextSplitter(chunk_size=1000, chunk_overlap=200)
     splits = text_splitter.split_documents(pages)
-    progress(0.5, desc="Initialising Vectorstore")
     vectorstore = Chroma.from_documents(
         splits,
         embedding=HuggingFaceEmbeddings()
     )
-    progress(1, desc="Complete")
-    return vectorstore, progress
-def initialise_chain(llm, vectorstore, progress=gr.Progress()):
-    progress(0, desc="Initialising LLM")
     llm = HuggingFaceEndpoint(
         repo_id=llm,
         task="text-generation",
         max_new_tokens=512,
         top_k=4,
-        temperature=0.1
     )
     chat = ChatHuggingFace(
@@ -44,16 +38,14 @@ def initialise_chain(llm, vectorstore, progress=gr.Progress()):
         verbose=True
     )
-    progress(0.5, desc="Initialising RAG Chain")
-    retriever = vectorstore.as_retriever()
     system_prompt = (
         "You are an assistant for question-answering tasks. "
         "Use the following pieces of retrieved context to answer "
         "the question. If you don't know the answer, say that you "
-        "don't know. Use three sentences maximum and keep the "
-        "answer concise."
         "\n\n"
         "{context}"
     )
@@ -68,9 +60,7 @@ def initialise_chain(llm, vectorstore, progress=gr.Progress()):
     question_answer_chain = create_stuff_documents_chain(chat, prompt)
     rag_chain = create_retrieval_chain(retriever, question_answer_chain)
-    progress(0.9, desc="Complete")
-    return rag_chain, progress
 def send(message, rag_chain, chat_history):
     response = rag_chain.invoke({"input": message})
@@ -87,46 +77,20 @@ with gr.Blocks() as demo:
     gr.Markdown("<H3>Upload and ask questions about your PDF files</H3>")
     gr.Markdown("<H6>Note: This project uses LangChain to perform RAG (Retrieval Augmented Generation) on PDF files, allowing users to ask any questions related to their contents. When a PDF file is uploaded, it is embedded and stored in an in-memory Chroma vectorstore, which the chatbot uses as a source of knowledge when aswering user questions.</H6>")
-    with gr.Tab("Vectorstore"):
-        with gr.Row():
-            input_pdf = gr.File()
-        with gr.Row():
-            with gr.Column(scale=1, min_width=0):
-                pass
-            with gr.Column(scale=2, min_width=0):
-                initialise_vectorstore_btn = gr.Button(
-                    "Initialise Vectorstore",
-                    variant='primary'
-                )
-            with gr.Column(scale=1, min_width=0):
-                pass
-        with gr.Row():
-            vectorstore_initialisation_progress = gr.Textbox(value="None", label="Initialization")
-    with gr.Tab("RAG Chain"):
-        with gr.Row():
-            language_model = gr.Radio(["microsoft/Phi-3-mini-4k-instruct", "mistralai/Mistral-7B-Instruct-v0.2", "HuggingFaceH4/zephyr-7b-beta", "mistralai/Mixtral-8x7B-Instruct-v0.1"])
-        with gr.Row():
-            with gr.Column(scale=1, min_width=0):
-                pass
-            with gr.Column(scale=2, min_width=0):
-                initialise_chain_btn = gr.Button(
-                    "Initialise RAG Chain",
-                    variant='primary'
-                )
-            with gr.Column(scale=1, min_width=0):
-                pass
-        with gr.Row():
-            chain_initialisation_progress = gr.Textbox(value="None", label="Initialization")
-    with gr.Tab("Chatbot"):
-        with gr.Row():
-            chatbot = gr.Chatbot()
-        with gr.Row():
-            message = gr.Textbox()
-    initialise_vectorstore_btn.click(fn=initialise_vectorstore, inputs=input_pdf, outputs=[vectorstore, vectorstore_initialisation_progress])
-    initialise_chain_btn.click(fn=initialise_chain, inputs=[language_model, vectorstore], outputs=[rag_chain, chain_initialisation_progress])
     message.submit(fn=send, inputs=[message, rag_chain, chatbot], outputs=[message, chatbot])
 demo.launch()

 from langchain.chains.combine_documents import create_stuff_documents_chain
 from langchain.chains import create_retrieval_chain
+def initialise_chatbot(pdf, llm, progress=gr.Progress()):
     progress(0, desc="Reading PDF")
     loader = PyPDFLoader(pdf.name)
     text_splitter = RecursiveCharacterTextSplitter(chunk_size=1000, chunk_overlap=200)
     splits = text_splitter.split_documents(pages)
+    progress(0.25, desc="Initialising Vectorstore")
     vectorstore = Chroma.from_documents(
         splits,
         embedding=HuggingFaceEmbeddings()
     )
+    progress(0.85, desc="Initialising LLM")
     llm = HuggingFaceEndpoint(
         repo_id=llm,
         task="text-generation",
         max_new_tokens=512,
         top_k=4,
+        temperature=0.05
     )
     chat = ChatHuggingFace(
         verbose=True
     )
+    retriever = vectorstore.as_retriever(search_kwargs={"k": 8})
     system_prompt = (
         "You are an assistant for question-answering tasks. "
         "Use the following pieces of retrieved context to answer "
         "the question. If you don't know the answer, say that you "
+        "don't know. Use two sentences maximum and keep the "
+        "answer concise and to the point."
         "\n\n"
         "{context}"
     )
     question_answer_chain = create_stuff_documents_chain(chat, prompt)
     rag_chain = create_retrieval_chain(retriever, question_answer_chain)
+    return rag_chain, "Complete!"
 def send(message, rag_chain, chat_history):
     response = rag_chain.invoke({"input": message})
     gr.Markdown("<H3>Upload and ask questions about your PDF files</H3>")
     gr.Markdown("<H6>Note: This project uses LangChain to perform RAG (Retrieval Augmented Generation) on PDF files, allowing users to ask any questions related to their contents. When a PDF file is uploaded, it is embedded and stored in an in-memory Chroma vectorstore, which the chatbot uses as a source of knowledge when aswering user questions.</H6>")
+    with gr.Row():
+        with gr.Column(scale=1):
+            input_pdf = gr.File(label="1. Upload PDF")
+            language_model = gr.Radio(label="2. Choose LLM", choices=["microsoft/Phi-3-mini-4k-instruct", "mistralai/Mistral-7B-Instruct-v0.2", "HuggingFaceH4/zephyr-7b-beta", "mistralai/Mixtral-8x7B-Instruct-v0.1"])
+            initialise_chatbot_btn = gr.Button(value="3. Initialise Chatbot", variant='primary')
+            chatbot_initialisation_progress = gr.Textbox(value="Not Started", label="Initialization Progress")
+        with gr.Column(scale=4):
+            chatbot = gr.Chatbot(scale=1)
+            message = gr.Textbox(label="4. Ask questions about your PDF")
+    initialise_chatbot_btn.click(
+        fn=initialise_chatbot, inputs=[input_pdf, language_model], outputs=[rag_chain, chatbot_initialisation_progress]
+    )
     message.submit(fn=send, inputs=[message, rag_chain, chatbot], outputs=[message, chatbot])
 demo.launch()