mohantest commited on
Commit
a2f1bed
·
verified ·
1 Parent(s): 4de1201

Update app.py

Browse files
Files changed (1) hide show
  1. app.py +184 -105
app.py CHANGED
@@ -1,115 +1,194 @@
1
- import logging
2
- import hashlib
3
- import json
4
  import os
5
- from smolagents import CodeAgent, tool
6
- from huggingface_hub import InferenceClient
7
-
8
- logging.basicConfig(level=logging.INFO)
9
- logger = logging.getLogger(__name__)
10
-
11
- # Cache for answers
12
- CACHE_FILE = "answer_cache.json"
13
- if os.path.exists(CACHE_FILE):
14
- with open(CACHE_FILE) as f:
15
- answer_cache = json.load(f)
16
- else:
17
- answer_cache = {}
18
-
19
- def save_cache():
20
- with open(CACHE_FILE, "w") as f:
21
- json.dump(answer_cache, f)
22
-
23
- # ---------- Tools ----------
24
- @tool
25
- def calculator(expression: str) -> str:
26
  """
27
- Safely evaluate a mathematical expression.
28
-
29
- Args:
30
- expression: A string containing a simple arithmetic expression (e.g., '2 + 2').
31
-
32
- Returns:
33
- The result as a string, or an error message if the expression is invalid.
34
  """
35
- allowed_chars = set("0123456789+-*/(). ")
36
- if not all(c in allowed_chars for c in expression):
37
- return "Error: Expression contains disallowed characters."
38
- try:
39
- result = eval(expression, {"__builtins__": {}}, {})
40
- return str(result)
41
- except Exception as e:
42
- return f"Error: {e}"
43
 
44
- @tool
45
- def web_search(query: str) -> str:
46
- """
47
- Search the web for up-to-date information.
 
 
48
 
49
- Args:
50
- query: The search query string.
 
51
 
52
- Returns:
53
- A string containing up to three search result snippets with titles and URLs,
54
- or an error message if the search fails.
55
- """
56
  try:
57
- from duckduckgo_search import DDGS
58
- with DDGS() as ddgs:
59
- results = list(ddgs.text(query, max_results=3))
60
- if not results:
61
- return "No results found."
62
- snippets = []
63
- for r in results:
64
- snippets.append(f"Title: {r['title']}\nBody: {r['body']}\nURL: {r['href']}")
65
- return "\n\n".join(snippets)
66
- except ImportError:
67
- return "Web search tool not available: install duckduckgo-search"
68
  except Exception as e:
69
- return f"Search error: {e}"
70
-
71
- # ---------- Custom model ----------
72
- class CustomHFModel:
73
- def __init__(self, model_id="HuggingFaceH4/zephyr-7b-beta"):
74
- self.client = InferenceClient(model=model_id, token=os.getenv("HF_TOKEN"))
75
- self.model_id = model_id
76
-
77
- def __call__(self, messages, **kwargs):
78
- response = self.client.chat_completion(
79
- messages=messages,
80
- max_tokens=500,
81
- temperature=0.7,
82
- **kwargs
83
- )
84
- return response.choices[0].message.content
85
-
86
- # ---------- Assemble agent ----------
87
- tools = [calculator]
88
- try:
89
- import duckduckgo_search
90
- tools.append(web_search)
91
- logger.info("Web search tool enabled.")
92
- except ImportError:
93
- logger.warning("duckduckgo-search not installed, web_search disabled.")
94
-
95
- model = CustomHFModel()
96
- agent = CodeAgent(tools=tools, model=model)
97
-
98
- # ---------- Main entry point (called by app.py) ----------
99
- def solve(question: str) -> str:
100
- """This function must be named 'solve' because app.py imports it."""
101
- q_hash = hashlib.md5(question.encode()).hexdigest()
102
- if q_hash in answer_cache:
103
- logger.info(f"Cache hit for question: {question[:50]}...")
104
- return answer_cache[q_hash]
105
-
106
- logger.info(f"Processing question: {question[:50]}...")
107
  try:
108
- answer = agent.run(question)
 
 
 
 
 
 
 
 
 
 
 
 
 
109
  except Exception as e:
110
- logger.error(f"Agent error: {e}")
111
- answer = f"Error: {e}"
112
-
113
- answer_cache[q_hash] = answer
114
- save_cache()
115
- return answer
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
  import os
2
+ import gradio as gr
3
+ import requests
4
+ import inspect
5
+ import pandas as pd
6
+
7
+ # (Keep Constants as is)
8
+ # --- Constants ---
9
+ DEFAULT_API_URL = "https://agents-course-unit4-scoring.hf.space"
10
+
11
+ # --- Basic Agent Definition ---
12
+ # ----- THIS IS WERE YOU CAN BUILD WHAT YOU WANT ------
13
+ class BasicAgent:
14
+ def __init__(self):
15
+ print("BasicAgent initialized.")
16
+ def __call__(self, question: str) -> str:
17
+ print(f"Agent received question (first 50 chars): {question[:50]}...")
18
+ fixed_answer = "This is a default answer."
19
+ print(f"Agent returning fixed answer: {fixed_answer}")
20
+ return fixed_answer
21
+
22
+ def run_and_submit_all( profile: gr.OAuthProfile | None):
23
  """
24
+ Fetches all questions, runs the BasicAgent on them, submits all answers,
25
+ and displays the results.
 
 
 
 
 
26
  """
27
+ # --- Determine HF Space Runtime URL and Repo URL ---
28
+ space_id = os.getenv("SPACE_ID") # Get the SPACE_ID for sending link to the code
 
 
 
 
 
 
29
 
30
+ if profile:
31
+ username= f"{profile.username}"
32
+ print(f"User logged in: {username}")
33
+ else:
34
+ print("User not logged in.")
35
+ return "Please Login to Hugging Face with the button.", None
36
 
37
+ api_url = DEFAULT_API_URL
38
+ questions_url = f"{api_url}/questions"
39
+ submit_url = f"{api_url}/submit"
40
 
41
+ # 1. Instantiate Agent ( modify this part to create your agent)
 
 
 
42
  try:
43
+ agent = BasicAgent()
 
 
 
 
 
 
 
 
 
 
44
  except Exception as e:
45
+ print(f"Error instantiating agent: {e}")
46
+ return f"Error initializing agent: {e}", None
47
+ # In the case of an app running as a hugging Face space, this link points toward your codebase ( usefull for others so please keep it public)
48
+ agent_code = f"https://huggingface.co/spaces/{space_id}/tree/main"
49
+ print(agent_code)
50
+
51
+ # 2. Fetch Questions
52
+ print(f"Fetching questions from: {questions_url}")
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
53
  try:
54
+ response = requests.get(questions_url, timeout=15)
55
+ response.raise_for_status()
56
+ questions_data = response.json()
57
+ if not questions_data:
58
+ print("Fetched questions list is empty.")
59
+ return "Fetched questions list is empty or invalid format.", None
60
+ print(f"Fetched {len(questions_data)} questions.")
61
+ except requests.exceptions.RequestException as e:
62
+ print(f"Error fetching questions: {e}")
63
+ return f"Error fetching questions: {e}", None
64
+ except requests.exceptions.JSONDecodeError as e:
65
+ print(f"Error decoding JSON response from questions endpoint: {e}")
66
+ print(f"Response text: {response.text[:500]}")
67
+ return f"Error decoding server response for questions: {e}", None
68
  except Exception as e:
69
+ print(f"An unexpected error occurred fetching questions: {e}")
70
+ return f"An unexpected error occurred fetching questions: {e}", None
71
+
72
+ # 3. Run your Agent
73
+ results_log = []
74
+ answers_payload = []
75
+ print(f"Running agent on {len(questions_data)} questions...")
76
+ for item in questions_data:
77
+ task_id = item.get("task_id")
78
+ question_text = item.get("question")
79
+ if not task_id or question_text is None:
80
+ print(f"Skipping item with missing task_id or question: {item}")
81
+ continue
82
+ try:
83
+ submitted_answer = agent(question_text)
84
+ answers_payload.append({"task_id": task_id, "submitted_answer": submitted_answer})
85
+ results_log.append({"Task ID": task_id, "Question": question_text, "Submitted Answer": submitted_answer})
86
+ except Exception as e:
87
+ print(f"Error running agent on task {task_id}: {e}")
88
+ results_log.append({"Task ID": task_id, "Question": question_text, "Submitted Answer": f"AGENT ERROR: {e}"})
89
+
90
+ if not answers_payload:
91
+ print("Agent did not produce any answers to submit.")
92
+ return "Agent did not produce any answers to submit.", pd.DataFrame(results_log)
93
+
94
+ # 4. Prepare Submission
95
+ submission_data = {"username": username.strip(), "agent_code": agent_code, "answers": answers_payload}
96
+ status_update = f"Agent finished. Submitting {len(answers_payload)} answers for user '{username}'..."
97
+ print(status_update)
98
+
99
+ # 5. Submit
100
+ print(f"Submitting {len(answers_payload)} answers to: {submit_url}")
101
+ try:
102
+ response = requests.post(submit_url, json=submission_data, timeout=60)
103
+ response.raise_for_status()
104
+ result_data = response.json()
105
+ final_status = (
106
+ f"Submission Successful!\n"
107
+ f"User: {result_data.get('username')}\n"
108
+ f"Overall Score: {result_data.get('score', 'N/A')}% "
109
+ f"({result_data.get('correct_count', '?')}/{result_data.get('total_attempted', '?')} correct)\n"
110
+ f"Message: {result_data.get('message', 'No message received.')}"
111
+ )
112
+ print("Submission successful.")
113
+ results_df = pd.DataFrame(results_log)
114
+ return final_status, results_df
115
+ except requests.exceptions.HTTPError as e:
116
+ error_detail = f"Server responded with status {e.response.status_code}."
117
+ try:
118
+ error_json = e.response.json()
119
+ error_detail += f" Detail: {error_json.get('detail', e.response.text)}"
120
+ except requests.exceptions.JSONDecodeError:
121
+ error_detail += f" Response: {e.response.text[:500]}"
122
+ status_message = f"Submission Failed: {error_detail}"
123
+ print(status_message)
124
+ results_df = pd.DataFrame(results_log)
125
+ return status_message, results_df
126
+ except requests.exceptions.Timeout:
127
+ status_message = "Submission Failed: The request timed out."
128
+ print(status_message)
129
+ results_df = pd.DataFrame(results_log)
130
+ return status_message, results_df
131
+ except requests.exceptions.RequestException as e:
132
+ status_message = f"Submission Failed: Network error - {e}"
133
+ print(status_message)
134
+ results_df = pd.DataFrame(results_log)
135
+ return status_message, results_df
136
+ except Exception as e:
137
+ status_message = f"An unexpected error occurred during submission: {e}"
138
+ print(status_message)
139
+ results_df = pd.DataFrame(results_log)
140
+ return status_message, results_df
141
+
142
+
143
+ # --- Build Gradio Interface using Blocks ---
144
+ with gr.Blocks() as demo:
145
+ gr.Markdown("# Basic Agent Evaluation Runner")
146
+ gr.Markdown(
147
+ """
148
+ **Instructions:**
149
+ 1. Please clone this space, then modify the code to define your agent's logic, the tools, the necessary packages, etc ...
150
+ 2. Log in to your Hugging Face account using the button below. This uses your HF username for submission.
151
+ 3. Click 'Run Evaluation & Submit All Answers' to fetch questions, run your agent, submit answers, and see the score.
152
+ ---
153
+ **Disclaimers:**
154
+ Once clicking on the "submit button, it can take quite some time ( this is the time for the agent to go through all the questions).
155
+ This space provides a basic setup and is intentionally sub-optimal to encourage you to develop your own, more robust solution. For instance for the delay process of the submit button, a solution could be to cache the answers and submit in a seperate action or even to answer the questions in async.
156
+ """
157
+ )
158
+
159
+ gr.LoginButton()
160
+
161
+ run_button = gr.Button("Run Evaluation & Submit All Answers")
162
+
163
+ status_output = gr.Textbox(label="Run Status / Submission Result", lines=5, interactive=False)
164
+ # Removed max_rows=10 from DataFrame constructor
165
+ results_table = gr.DataFrame(label="Questions and Agent Answers", wrap=True)
166
+
167
+ run_button.click(
168
+ fn=run_and_submit_all,
169
+ outputs=[status_output, results_table]
170
+ )
171
+
172
+ if __name__ == "__main__":
173
+ print("\n" + "-"*30 + " App Starting " + "-"*30)
174
+ # Check for SPACE_HOST and SPACE_ID at startup for information
175
+ space_host_startup = os.getenv("SPACE_HOST")
176
+ space_id_startup = os.getenv("SPACE_ID") # Get SPACE_ID at startup
177
+
178
+ if space_host_startup:
179
+ print(f"✅ SPACE_HOST found: {space_host_startup}")
180
+ print(f" Runtime URL should be: https://{space_host_startup}.hf.space")
181
+ else:
182
+ print("ℹ️ SPACE_HOST environment variable not found (running locally?).")
183
+
184
+ if space_id_startup: # Print repo URLs if SPACE_ID is found
185
+ print(f"✅ SPACE_ID found: {space_id_startup}")
186
+ print(f" Repo URL: https://huggingface.co/spaces/{space_id_startup}")
187
+ print(f" Repo Tree URL: https://huggingface.co/spaces/{space_id_startup}/tree/main")
188
+ else:
189
+ print("ℹ️ SPACE_ID environment variable not found (running locally?). Repo URL cannot be determined.")
190
+
191
+ print("-"*(60 + len(" App Starting ")) + "\n")
192
+
193
+ print("Launching Gradio Interface for Basic Agent Evaluation...")
194
+ demo.launch(debug=True, share=False)