Luis Vizcaya committed on
Commit
b95f82b
·
1 Parent(s): 27827fb

requirements.txt updated

Browse files
Files changed (2) hide show
  1. app.py +36 -29
  2. requirements.txt +160 -9
app.py CHANGED
@@ -6,6 +6,15 @@ import time
6
  from typing import List, Dict, Generator
7
  from dotenv import load_dotenv
8
 
 
 
 
 
 
 
 
 
 
9
  # Import our agents from the src directory
10
  from src.clarifier import Clarifier
11
  from src.planner import Planner
@@ -18,7 +27,8 @@ load_dotenv()
18
 
19
  def get_secret(key):
20
  val = os.getenv(key)
21
- return val if val is not None else ""
 
22
 
23
  HF_KEY = get_secret("HF_KEY")
24
  TAVILY_API_KEY = get_secret("TAVILY_API_KEY")
@@ -28,8 +38,8 @@ logging.basicConfig(level=logging.INFO, format='%(asctime)s - %(levelname)s - %(
28
  logger = logging.getLogger(__name__)
29
 
30
  # --- MODELS ---
31
- # Using the most stable serverless models to avoid 401 router issues
32
- CLARIFIER_MODEL = 'Qwen/Qwen2.5-7B-Instruct'
33
  PLANNER_MODEL = 'Qwen/Qwen2.5-7B-Instruct'
34
  SPLITTER_MODEL = 'Qwen/Qwen2.5-7B-Instruct'
35
  COORDINATOR_MODEL = 'Qwen/Qwen2.5-7B-Instruct'
@@ -47,17 +57,19 @@ theme = gr.themes.Soft(
47
  def start_clarification(topic, hf_key, state):
48
  if not topic:
49
  return gr.update(), "### ⚠️ Warning\nPlease enter a topic.", state, gr.update()
50
- if not hf_key or hf_key.strip() == "":
51
- return gr.update(), "### ⚠️ Warning\nPlease provide a valid Hugging Face Token in the configuration panel.", state, gr.update()
 
 
52
 
53
  state["initial_topic"] = topic
54
- clarifier = Clarifier(model_name=CLARIFIER_MODEL, hf_key=hf_key.strip())
55
  try:
56
  suggestions = clarifier.get_suggestions(topic)
57
  state["suggestions"] = suggestions
58
 
59
  if not suggestions:
60
- return gr.update(), "### ❌ Error\nNo suggestions received. Please check if your HF Token has access to the models.", state, gr.update()
61
 
62
  suggestion_md = "### 💡 Refine Your Topic\n\nChoose one of the suggested directions or enter a custom one below:\n\n"
63
  for i, s in enumerate(suggestions):
@@ -67,7 +79,7 @@ def start_clarification(topic, hf_key, state):
67
  except Exception as e:
68
  error_msg = str(e)
69
  if "401" in error_msg:
70
- error_msg = "401 Unauthorized: Your Hugging Face Token is invalid or doesn't have permissions for the Inference API."
71
  return gr.update(), f"### ❌ Error\n{error_msg}", state, gr.update()
72
 
73
  def select_suggestion(index, custom_topic, state):
@@ -77,17 +89,16 @@ def select_suggestion(index, custom_topic, state):
77
  sug = state["suggestions"][int(index)-1]
78
  state["final_topic"] = f"{sug['title']}: {sug['description']}"
79
  else:
80
- # ENSURE 4 ITEMS ARE RETURNED
81
  return gr.update(), "### ⚠️ Warning\nPlease select an option or enter a custom topic.", state, gr.update()
82
 
83
  return gr.update(visible=True), f"### 🎯 Target Topic\n**{state['final_topic']}**", state, gr.update(visible=False)
84
 
85
  def generate_strategy(hf_key, state):
86
- hf_key = hf_key.strip()
87
- if not hf_key:
88
  return "### ⚠️ Warning\nHF Key missing.", state, gr.update()
89
 
90
- planner = Planner(model_name=PLANNER_MODEL, hf_key=hf_key)
91
  try:
92
  plan = planner.plan(state["final_topic"])
93
  state["research_plan"] = plan
@@ -96,11 +107,11 @@ def generate_strategy(hf_key, state):
96
  return f"### ❌ Error\n{str(e)}", state, gr.update()
97
 
98
  def decompose_tasks(hf_key, state):
99
- hf_key = hf_key.strip()
100
- if not hf_key:
101
  return "### ⚠️ Warning\nHF Key missing.", state, gr.update()
102
 
103
- splitter = Splitter(model_name=SPLITTER_MODEL, hf_key=hf_key)
104
  try:
105
  subtasks = splitter.split(state["research_plan"])
106
  state["subtasks"] = subtasks
@@ -118,23 +129,22 @@ def run_research(hf_key, tavily_key, state):
118
  from src.prompts import SUBAGENT_DIRECTION, COORDINATOR_DIRECTION
119
  from tavily import TavilyClient
120
 
121
- hf_key = hf_key.strip()
122
- tavily_key = tavily_key.strip()
123
 
124
- if not hf_key:
125
  yield "### ❌ Error\nHF Token missing.", state, gr.update(), ""
126
  return
127
- if not tavily_key:
128
  yield "### ❌ Error\nTavily API Key missing.", state, gr.update(), ""
129
  return
130
 
131
- tavily_client = TavilyClient(api_key=tavily_key)
132
 
133
  @tool
134
  def web_search(query: str) -> str:
135
  """
136
  Search the web for real-time information using Tavily.
137
-
138
  Args:
139
  query: The search query to look up.
140
  """
@@ -146,8 +156,8 @@ def run_research(hf_key, tavily_key, state):
146
  except Exception as e:
147
  return f"Search failed: {e}"
148
 
149
- coordinator_model = InferenceClientModel(model_id=COORDINATOR_MODEL, api_key=hf_key)
150
- subagent_model = InferenceClientModel(model_id=SUBAGENT_MODEL, api_key=hf_key)
151
 
152
  current_findings = []
153
  log_content = "### 🔍 Agentic Research Progress\n\n"
@@ -162,7 +172,7 @@ def run_research(hf_key, tavily_key, state):
162
  t_title = task['title']
163
  t_desc = task['description']
164
 
165
- log_content += f"**Agent working on:** {t_title}...\n"
166
  yield log_content, state, gr.update(), ""
167
 
168
  subagent = CodeAgent(
@@ -206,14 +216,11 @@ def run_research(hf_key, tavily_key, state):
206
  final_report = response.content
207
  if "<think>" in final_report and "</think>" in final_report:
208
  final_report = final_report.split("</think>")[-1].strip()
209
- elif "<think>" in final_report:
210
- final_report = final_report.split("<think>")[-1].strip()
211
- if "\n\n" in final_report: final_report = final_report.split("\n\n", 1)[-1]
212
 
213
  log_content += "### 🖋️ Review: Polishing and Finalizing...\n"
214
  yield log_content, state, gr.update(), ""
215
 
216
- reviewer = Reviewer(model_name=REVIEWER_MODEL, hf_key=hf_key)
217
  polished_report = reviewer.review(final_report)
218
  state["final_report"] = polished_report
219
 
@@ -265,7 +272,7 @@ with gr.Blocks(theme=theme, title="Deep Research Agent") as demo:
265
  # STEP 1: Introduction
266
  with gr.Column(visible=True) as step1_col:
267
  gr.Markdown("## 1️⃣ What are you researching?")
268
- topic_input = gr.Textbox(label="Enter a broad topic or research question:", placeholder="e.g., Future of Fusion Energy")
269
  start_btn = gr.Button("Clarify Topic ➡️", variant="primary")
270
 
271
  # STEP 2: Refinement
 
6
  from typing import List, Dict, Generator
7
  from dotenv import load_dotenv
8
 
9
+ # Try to use truststore for corporate network compatibility (local only)
10
+ if not os.getenv("SPACE_ID"):
11
+ try:
12
+ import truststore
13
+ truststore.inject_into_ssl()
14
+ print("💡 Truststore injected (Corporate SSL mode)")
15
+ except ImportError:
16
+ pass
17
+
18
  # Import our agents from the src directory
19
  from src.clarifier import Clarifier
20
  from src.planner import Planner
 
27
 
28
  def get_secret(key):
29
  val = os.getenv(key)
30
+ # Strip spaces in case the .env has "KEY = VALUE"
31
+ return val.strip() if val is not None else ""
32
 
33
  HF_KEY = get_secret("HF_KEY")
34
  TAVILY_API_KEY = get_secret("TAVILY_API_KEY")
 
38
  logger = logging.getLogger(__name__)
39
 
40
  # --- MODELS ---
41
+ # Using highly stable serverless models
42
+ CLARIFIER_MODEL = 'HuggingFaceH4/zephyr-7b-beta'
43
  PLANNER_MODEL = 'Qwen/Qwen2.5-7B-Instruct'
44
  SPLITTER_MODEL = 'Qwen/Qwen2.5-7B-Instruct'
45
  COORDINATOR_MODEL = 'Qwen/Qwen2.5-7B-Instruct'
 
57
  def start_clarification(topic, hf_key, state):
58
  if not topic:
59
  return gr.update(), "### ⚠️ Warning\nPlease enter a topic.", state, gr.update()
60
+
61
+ clean_key = hf_key.strip() if hf_key else ""
62
+ if not clean_key:
63
+ return gr.update(), "### ⚠️ Warning\nPlease provide a valid Hugging Face Token.", state, gr.update()
64
 
65
  state["initial_topic"] = topic
66
+ clarifier = Clarifier(model_name=CLARIFIER_MODEL, hf_key=clean_key)
67
  try:
68
  suggestions = clarifier.get_suggestions(topic)
69
  state["suggestions"] = suggestions
70
 
71
  if not suggestions:
72
+ return gr.update(), "### ❌ Error\nNo suggestions received. This usually means the HF Token is invalid or the model is overloaded.", state, gr.update()
73
 
74
  suggestion_md = "### 💡 Refine Your Topic\n\nChoose one of the suggested directions or enter a custom one below:\n\n"
75
  for i, s in enumerate(suggestions):
 
79
  except Exception as e:
80
  error_msg = str(e)
81
  if "401" in error_msg:
82
+ error_msg = "401 Unauthorized: Your Hugging Face Token is invalid for the Inference API. Please generate a new 'Write' token at hf.co/settings/tokens"
83
  return gr.update(), f"### ❌ Error\n{error_msg}", state, gr.update()
84
 
85
  def select_suggestion(index, custom_topic, state):
 
89
  sug = state["suggestions"][int(index)-1]
90
  state["final_topic"] = f"{sug['title']}: {sug['description']}"
91
  else:
 
92
  return gr.update(), "### ⚠️ Warning\nPlease select an option or enter a custom topic.", state, gr.update()
93
 
94
  return gr.update(visible=True), f"### 🎯 Target Topic\n**{state['final_topic']}**", state, gr.update(visible=False)
95
 
96
  def generate_strategy(hf_key, state):
97
+ clean_key = hf_key.strip() if hf_key else ""
98
+ if not clean_key:
99
  return "### ⚠️ Warning\nHF Key missing.", state, gr.update()
100
 
101
+ planner = Planner(model_name=PLANNER_MODEL, hf_key=clean_key)
102
  try:
103
  plan = planner.plan(state["final_topic"])
104
  state["research_plan"] = plan
 
107
  return f"### ❌ Error\n{str(e)}", state, gr.update()
108
 
109
  def decompose_tasks(hf_key, state):
110
+ clean_key = hf_key.strip() if hf_key else ""
111
+ if not clean_key:
112
  return "### ⚠️ Warning\nHF Key missing.", state, gr.update()
113
 
114
+ splitter = Splitter(model_name=SPLITTER_MODEL, hf_key=clean_key)
115
  try:
116
  subtasks = splitter.split(state["research_plan"])
117
  state["subtasks"] = subtasks
 
129
  from src.prompts import SUBAGENT_DIRECTION, COORDINATOR_DIRECTION
130
  from tavily import TavilyClient
131
 
132
+ clean_hf = hf_key.strip() if hf_key else ""
133
+ clean_tavily = tavily_key.strip() if tavily_key else ""
134
 
135
+ if not clean_hf:
136
  yield "### ❌ Error\nHF Token missing.", state, gr.update(), ""
137
  return
138
+ if not clean_tavily:
139
  yield "### ❌ Error\nTavily API Key missing.", state, gr.update(), ""
140
  return
141
 
142
+ tavily_client = TavilyClient(api_key=clean_tavily)
143
 
144
  @tool
145
  def web_search(query: str) -> str:
146
  """
147
  Search the web for real-time information using Tavily.
 
148
  Args:
149
  query: The search query to look up.
150
  """
 
156
  except Exception as e:
157
  return f"Search failed: {e}"
158
 
159
+ coordinator_model = InferenceClientModel(model_id=COORDINATOR_MODEL, api_key=clean_hf)
160
+ subagent_model = InferenceClientModel(model_id=SUBAGENT_MODEL, api_key=clean_hf)
161
 
162
  current_findings = []
163
  log_content = "### 🔍 Agentic Research Progress\n\n"
 
172
  t_title = task['title']
173
  t_desc = task['description']
174
 
175
+ log_content += f"**Agent {i+1} working on:** {t_title}...\n"
176
  yield log_content, state, gr.update(), ""
177
 
178
  subagent = CodeAgent(
 
216
  final_report = response.content
217
  if "<think>" in final_report and "</think>" in final_report:
218
  final_report = final_report.split("</think>")[-1].strip()
 
 
 
219
 
220
  log_content += "### 🖋️ Review: Polishing and Finalizing...\n"
221
  yield log_content, state, gr.update(), ""
222
 
223
+ reviewer = Reviewer(model_name=REVIEWER_MODEL, hf_key=clean_hf)
224
  polished_report = reviewer.review(final_report)
225
  state["final_report"] = polished_report
226
 
 
272
  # STEP 1: Introduction
273
  with gr.Column(visible=True) as step1_col:
274
  gr.Markdown("## 1️⃣ What are you researching?")
275
+ topic_input = gr.Textbox(label="Enter a broad topic or research question:", placeholder="e.g., Target market for sustainable polymers in Europe")
276
  start_btn = gr.Button("Clarify Topic ➡️", variant="primary")
277
 
278
  # STEP 2: Refinement
requirements.txt CHANGED
@@ -1,9 +1,160 @@
1
- huggingface_hub
2
- gradio
3
- python-dotenv
4
- pydantic
5
- smolagents
6
- tavily-python
7
- requests
8
- certifi
9
- fpdf2
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ aiofiles==24.1.0
2
+ altair==5.5.0
3
+ altgraph==0.17.5
4
+ annotated-doc==0.0.4
5
+ annotated-types==0.7.0
6
+ anyio==4.9.0
7
+ asttokens==3.0.0
8
+ attrs==25.3.0
9
+ audioop-lts==0.2.2
10
+ azure-core==1.35.0
11
+ azure-identity==1.23.0
12
+ blinker==1.9.0
13
+ brotli==1.2.0
14
+ cachetools==6.1.0
15
+ certifi==2025.8.3
16
+ cffi==1.17.1
17
+ charset-normalizer==3.4.2
18
+ click==8.2.1
19
+ cloudpickle==3.1.1
20
+ colorama==0.4.6
21
+ comm==0.2.3
22
+ contourpy==1.3.2
23
+ cryptography==45.0.5
24
+ cycler==0.12.1
25
+ debugpy==1.8.16
26
+ decorator==5.2.1
27
+ distlib==0.4.0
28
+ distro==1.9.0
29
+ exceptiongroup==1.3.0
30
+ executing==2.2.0
31
+ Farama-Notifications==0.0.4
32
+ fastapi==0.128.0
33
+ fastjsonschema==2.21.2
34
+ ffmpy==1.0.0
35
+ filelock==3.19.1
36
+ fonttools==4.59.0
37
+ fsspec==2025.12.0
38
+ gitdb==4.0.12
39
+ GitPython==3.1.44
40
+ gradio==6.2.0
41
+ gradio_client==2.0.2
42
+ greenlet==3.3.0
43
+ groovy==0.1.2
44
+ gymnasium==1.1.1
45
+ h11==0.16.0
46
+ hf-xet==1.2.0
47
+ holidays==0.78
48
+ httpcore==1.0.9
49
+ httpx==0.28.1
50
+ httpx-sse==0.4.1
51
+ huggingface_hub==1.2.3
52
+ idna==3.10
53
+ ipykernel==6.30.1
54
+ ipython==8.37.0
55
+ ipython_pygments_lexers==1.1.1
56
+ jedi==0.19.2
57
+ Jinja2==3.1.6
58
+ jiter==0.10.0
59
+ joblib==1.5.1
60
+ jsonschema==4.25.1
61
+ jsonschema-specifications==2025.9.1
62
+ jupyter_client==8.6.3
63
+ jupyter_core==5.8.1
64
+ kiwisolver==1.4.8
65
+ llvmlite==0.44.0
66
+ logging==0.4.9.6
67
+ markdown-it-py==3.0.0
68
+ MarkupSafe==3.0.2
69
+ matplotlib==3.10.5
70
+ matplotlib-inline==0.1.7
71
+ mcp==1.11.0
72
+ mdurl==0.1.2
73
+ msal==1.32.3
74
+ msal-extensions==1.3.1
75
+ narwhals==2.4.0
76
+ nbformat==5.10.4
77
+ nest-asyncio==1.6.0
78
+ networkx==3.4.2
79
+ numba==0.61.2
80
+ numpy==2.2.6
81
+ openai==1.90.0
82
+ orjson==3.11.5
83
+ packaging==25.0
84
+ pandas==2.3.1
85
+ parso==0.8.5
86
+ patsy==1.0.1
87
+ pefile==2024.8.26
88
+ pillow==11.3.0
89
+ platformdirs==4.3.8
90
+ plotly==6.3.0
91
+ prompt_toolkit==3.0.51
92
+ protobuf==6.31.1
93
+ psutil==7.0.0
94
+ PuLP==3.2.2
95
+ pure_eval==0.2.3
96
+ pyarrow==20.0.0
97
+ pycparser==2.22
98
+ pydantic==2.11.7
99
+ pydantic-settings==2.10.1
100
+ pydantic_core==2.33.2
101
+ pydeck==0.9.1
102
+ pydub==0.25.1
103
+ pyenv-win==3.1.1
104
+ Pygments==2.19.2
105
+ pyinstaller==6.17.0
106
+ pyinstaller-hooks-contrib==2025.11
107
+ PyJWT==2.10.1
108
+ pyodbc==5.2.0
109
+ pyparsing==3.2.3
110
+ python-dateutil==2.9.0.post0
111
+ python-dotenv==1.1.1
112
+ python-multipart==0.0.20
113
+ pytz==2025.2
114
+ pywin32==311
115
+ pywin32-ctypes==0.2.3
116
+ PyYAML==6.0.3
117
+ pyzmq==27.0.2
118
+ referencing==0.36.2
119
+ requests==2.32.4
120
+ rich==14.1.0
121
+ rpds-py==0.27.1
122
+ safehttpx==0.1.7
123
+ scikit-learn==1.7.1
124
+ scipy==1.15.3
125
+ semantic-version==2.10.0
126
+ setuptools==80.9.0
127
+ shap==0.48.0
128
+ shellingham==1.5.4
129
+ six==1.17.0
130
+ slicer==0.0.8
131
+ smmap==5.0.2
132
+ sniffio==1.3.1
133
+ SQLAlchemy==2.0.45
134
+ sse-starlette==2.4.1
135
+ stack-data==0.6.3
136
+ starlette==0.47.1
137
+ statsmodels==0.14.5
138
+ streamlit==1.46.0
139
+ tabulate==0.9.0
140
+ tenacity==9.1.2
141
+ termcolor==3.1.0
142
+ threadpoolctl==3.6.0
143
+ toml==0.10.2
144
+ tomlkit==0.13.3
145
+ tornado==6.5.2
146
+ tqdm==4.67.1
147
+ traitlets==5.14.3
148
+ truststore==0.10.4
149
+ typer==0.21.0
150
+ typer-slim==0.21.0
151
+ typing-inspection==0.4.1
152
+ typing_extensions==4.14.1
153
+ tzdata==2025.2
154
+ urllib3==2.5.0
155
+ uv==0.7.20
156
+ uvicorn==0.35.0
157
+ virtualenv==20.34.0
158
+ watchdog==6.0.0
159
+ wcwidth==0.2.13
160
+ xgboost==3.0.4