Spaces:

smolagents
/

ml-intern

Running on CPU Upgrade

App Files Files Community

akseljoonas HF Staff committed on Jan 7

Commit

89b1b00

1 Parent(s): 54196ee

removing extra prints

Browse files

Files changed (2) hide show

agent/core/tools.py +17 -10
agent/tools/docs_tools.py +0 -49

agent/core/tools.py CHANGED Viewed

@@ -132,11 +132,13 @@ class ToolRouter:
     async def register_mcp_tools(self) -> None:
         tools = await self.mcp_client.list_tools()
         for tool in tools:
             if tool.name in NOT_ALLOWED_TOOL_NAMES:
-                print(f"Skipping not MCP allowed tool: {tool.name}")
                 continue
-            print(f"MCP Tool: {tool.name}")
             self.register_tool(
                 ToolSpec(
                     name=tool.name,
@@ -145,6 +147,9 @@ class ToolRouter:
                     handler=None,
                 )
             )
     async def register_openapi_tool(self) -> None:
         """Register the OpenAPI search tool (requires async initialization)"""
@@ -153,8 +158,6 @@ class ToolRouter:
             search_openapi_handler,
         )
-        print("Registering OpenAPI search tool...")
         # Register search_hf_api_endpoints with dynamic spec
         openapi_spec = await _get_api_search_tool_spec()
         self.register_tool(
@@ -165,7 +168,7 @@ class ToolRouter:
                 handler=search_openapi_handler,
             )
         )
-        print(f"Registered: {openapi_spec['name']}")
     def get_tool_specs_for_llm(self) -> list[dict[str, Any]]:
         """Get tool specifications in OpenAI format"""
@@ -189,11 +192,13 @@ class ToolRouter:
             await self.mcp_client.initialize()
             await self.register_mcp_tools()
             self._mcp_initialized = True
-        print(f"MCP initialized: {self._mcp_initialized}")
         # Register OpenAPI tool (requires async initialization)
         await self.register_openapi_tool()
         return self
     async def __aexit__(self, exc_type, exc, tb) -> None:
@@ -237,11 +242,8 @@ class ToolRouter:
 def create_builtin_tools() -> list[ToolSpec]:
     """Create built-in tool specifications"""
-    print(
-        f"Creating built-in tools: {EXPLORE_HF_DOCS_TOOL_SPEC['name']}, {HF_DOCS_FETCH_TOOL_SPEC['name']}, {PLAN_TOOL_SPEC['name']}, {HF_JOBS_TOOL_SPEC['name']}, {PRIVATE_HF_REPO_TOOL_SPEC['name']}, {GITHUB_FIND_EXAMPLES_TOOL_SPEC['name']}, {GITHUB_LIST_REPOS_TOOL_SPEC['name']}, {GITHUB_READ_FILE_TOOL_SPEC['name']}"
-    )
     # in order of importance
-    return [
         # Documentation search tools
         ToolSpec(
             name=EXPLORE_HF_DOCS_TOOL_SPEC["name"],
@@ -308,3 +310,8 @@ def create_builtin_tools() -> list[ToolSpec]:
             handler=github_read_file_handler,
         ),
     ]

     async def register_mcp_tools(self) -> None:
         tools = await self.mcp_client.list_tools()
+        registered_names = []
+        skipped_count = 0
         for tool in tools:
             if tool.name in NOT_ALLOWED_TOOL_NAMES:
+                skipped_count += 1
                 continue
+            registered_names.append(tool.name)
             self.register_tool(
                 ToolSpec(
                     name=tool.name,
                     handler=None,
                 )
             )
+        print(
+            f"Loaded {len(registered_names)} MCP tools: {', '.join(registered_names)} ({skipped_count} disabled)"
+        )
     async def register_openapi_tool(self) -> None:
         """Register the OpenAPI search tool (requires async initialization)"""
             search_openapi_handler,
         )
         # Register search_hf_api_endpoints with dynamic spec
         openapi_spec = await _get_api_search_tool_spec()
         self.register_tool(
                 handler=search_openapi_handler,
             )
         )
+        print(f"Loaded OpenAPI search tool: {openapi_spec['name']}")
     def get_tool_specs_for_llm(self) -> list[dict[str, Any]]:
         """Get tool specifications in OpenAI format"""
             await self.mcp_client.initialize()
             await self.register_mcp_tools()
             self._mcp_initialized = True
         # Register OpenAPI tool (requires async initialization)
         await self.register_openapi_tool()
+        total_tools = len(self.tools)
+        print(f"\nAgent ready with {total_tools} tools total\n")
         return self
     async def __aexit__(self, exc_type, exc, tb) -> None:
 def create_builtin_tools() -> list[ToolSpec]:
     """Create built-in tool specifications"""
     # in order of importance
+    tools = [
         # Documentation search tools
         ToolSpec(
             name=EXPLORE_HF_DOCS_TOOL_SPEC["name"],
             handler=github_read_file_handler,
         ),
     ]
+    tool_names = ", ".join([t.name for t in tools])
+    print(f"Loaded {len(tools)} built-in tools: {tool_names}")
+    return tools

agent/tools/docs_tools.py CHANGED Viewed

@@ -5,7 +5,6 @@ Tools for exploring and fetching HuggingFace documentation and API specification
 import asyncio
 import os
-import time
 from typing import Any
 import httpx
@@ -21,21 +20,15 @@ async def _fetch_html_page(hf_token: str, endpoint: str) -> str:
     url = f"{base_url}/{endpoint}"
     headers = {"Authorization": f"Bearer {hf_token}"}
-    fetch_start = time.perf_counter()
     async with httpx.AsyncClient(timeout=30.0, follow_redirects=True) as client:
         response = await client.get(url, headers=headers)
         response.raise_for_status()
-    fetch_time = time.perf_counter() - fetch_start
-    print(f"[DEBUG] _fetch_html_page: Fetched in {fetch_time:.2f}s")
     return response.text
 def _parse_sidebar_navigation(html_content: str) -> list[dict[str, str]]:
     """Parse the sidebar navigation and extract all links"""
-    parse_start = time.perf_counter()
     soup = BeautifulSoup(html_content, "html.parser")
     sidebar = soup.find("nav", class_=lambda x: x and "flex-auto" in x)
@@ -53,11 +46,6 @@ def _parse_sidebar_navigation(html_content: str) -> list[dict[str, str]]:
         page_url = f"https://huggingface.co{href}" if href.startswith("/") else href
         nav_data.append({"title": title, "url": page_url})
-    parse_time = time.perf_counter() - parse_start
-    print(
-        f"[DEBUG] _parse_sidebar_navigation: Parsed in {parse_time:.2f}s, found {len(nav_data)} links"
-    )
     return nav_data
@@ -96,18 +84,11 @@ async def _fetch_all_glimpses(
     hf_token: str, nav_data: list[dict[str, str]]
 ) -> list[dict[str, str]]:
     """Fetch glimpses for all pages in parallel"""
-    glimpse_start = time.perf_counter()
     async with httpx.AsyncClient(timeout=30.0, follow_redirects=True) as client:
         result_items = await asyncio.gather(
             *[_fetch_single_glimpse(client, hf_token, item) for item in nav_data]
         )
-    glimpse_time = time.perf_counter() - glimpse_start
-    print(
-        f"[DEBUG] _fetch_all_glimpses: Fetched {len(result_items)} glimpses in {glimpse_time:.2f}s"
-    )
     return list(result_items)
@@ -130,9 +111,6 @@ def _format_exploration_results(
 async def explore_hf_docs(hf_token: str, endpoint: str) -> str:
     """Main function to explore documentation structure"""
-    start_time = time.perf_counter()
-    print(f"[DEBUG] explore_hf_docs: Starting for endpoint '{endpoint}'")
     # Fetch HTML page
     html_content = await _fetch_html_page(hf_token, endpoint)
@@ -148,9 +126,6 @@ async def explore_hf_docs(hf_token: str, endpoint: str) -> str:
     # Format results
     result = _format_exploration_results(endpoint, result_items)
-    total_time = time.perf_counter() - start_time
-    print(f"[DEBUG] explore_hf_docs: Total time {total_time:.2f}s")
     return result
@@ -199,12 +174,8 @@ async def _fetch_openapi_spec() -> dict[str, Any]:
     global _openapi_spec_cache
     if _openapi_spec_cache is not None:
-        print("[DEBUG] _fetch_openapi_spec: Using cached spec")
         return _openapi_spec_cache
-    start_time = time.perf_counter()
-    print("[DEBUG] _fetch_openapi_spec: Fetching from API")
     url = "https://huggingface.co/.well-known/openapi.json"
     async with httpx.AsyncClient(timeout=30.0, follow_redirects=True) as client:
@@ -214,9 +185,6 @@ async def _fetch_openapi_spec() -> dict[str, Any]:
     spec = response.json()
     _openapi_spec_cache = spec
-    fetch_time = time.perf_counter() - start_time
-    print(f"[DEBUG] _fetch_openapi_spec: Fetched and cached in {fetch_time:.2f}s")
     return spec
@@ -457,9 +425,7 @@ async def search_openapi_handler(arguments: dict[str, Any]) -> tuple[str, bool]:
     Returns:
         Tuple of (search_results, success)
     """
-    start_time = time.perf_counter()
     tag = arguments.get("tag", "")
-    print(f"[DEBUG] search_openapi: Starting for tag '{tag}'")
     if not tag:
         return "Error: No tag provided", False
@@ -474,9 +440,6 @@ async def search_openapi_handler(arguments: dict[str, Any]) -> tuple[str, bool]:
         # Format results
         formatted = _format_openapi_results(results, tag)
-        total_time = time.perf_counter() - start_time
-        print(f"[DEBUG] search_openapi: Total time {total_time:.2f}s")
         return formatted, True
     except httpx.HTTPStatusError as e:
@@ -497,9 +460,7 @@ async def hf_docs_fetch_handler(arguments: dict[str, Any]) -> tuple[str, bool]:
     Returns:
         Tuple of (full_markdown_content, success)
     """
-    start_time = time.perf_counter()
     url = arguments.get("url", "")
-    print(f"[DEBUG] fetch_hf_docs: Starting for URL '{url}'")
     if not url:
         return "Error: No URL provided", False
@@ -521,25 +482,15 @@ async def hf_docs_fetch_handler(arguments: dict[str, Any]) -> tuple[str, bool]:
         # Make request with auth
         headers = {"Authorization": f"Bearer {hf_token}"}
-        fetch_start = time.perf_counter()
         async with httpx.AsyncClient(timeout=30.0, follow_redirects=True) as client:
             response = await client.get(url, headers=headers)
             response.raise_for_status()
-        fetch_time = time.perf_counter() - fetch_start
         content = response.text
-        content_size_kb = len(content) / 1024
-        print(
-            f"[DEBUG] fetch_hf_docs: Fetched {content_size_kb:.1f}KB in {fetch_time:.2f}s"
-        )
         # Return the markdown content directly
         result = f"Documentation from: {url}\n\n{content}"
-        total_time = time.perf_counter() - start_time
-        print(f"[DEBUG] fetch_hf_docs: Total time {total_time:.2f}s")
         return result, True
     except httpx.HTTPStatusError as e:

 import asyncio
 import os
 from typing import Any
 import httpx
     url = f"{base_url}/{endpoint}"
     headers = {"Authorization": f"Bearer {hf_token}"}
     async with httpx.AsyncClient(timeout=30.0, follow_redirects=True) as client:
         response = await client.get(url, headers=headers)
         response.raise_for_status()
     return response.text
 def _parse_sidebar_navigation(html_content: str) -> list[dict[str, str]]:
     """Parse the sidebar navigation and extract all links"""
     soup = BeautifulSoup(html_content, "html.parser")
     sidebar = soup.find("nav", class_=lambda x: x and "flex-auto" in x)
         page_url = f"https://huggingface.co{href}" if href.startswith("/") else href
         nav_data.append({"title": title, "url": page_url})
     return nav_data
     hf_token: str, nav_data: list[dict[str, str]]
 ) -> list[dict[str, str]]:
     """Fetch glimpses for all pages in parallel"""
     async with httpx.AsyncClient(timeout=30.0, follow_redirects=True) as client:
         result_items = await asyncio.gather(
             *[_fetch_single_glimpse(client, hf_token, item) for item in nav_data]
         )
     return list(result_items)
 async def explore_hf_docs(hf_token: str, endpoint: str) -> str:
     """Main function to explore documentation structure"""
     # Fetch HTML page
     html_content = await _fetch_html_page(hf_token, endpoint)
     # Format results
     result = _format_exploration_results(endpoint, result_items)
     return result
     global _openapi_spec_cache
     if _openapi_spec_cache is not None:
         return _openapi_spec_cache
     url = "https://huggingface.co/.well-known/openapi.json"
     async with httpx.AsyncClient(timeout=30.0, follow_redirects=True) as client:
     spec = response.json()
     _openapi_spec_cache = spec
     return spec
     Returns:
         Tuple of (search_results, success)
     """
     tag = arguments.get("tag", "")
     if not tag:
         return "Error: No tag provided", False
         # Format results
         formatted = _format_openapi_results(results, tag)
         return formatted, True
     except httpx.HTTPStatusError as e:
     Returns:
         Tuple of (full_markdown_content, success)
     """
     url = arguments.get("url", "")
     if not url:
         return "Error: No URL provided", False
         # Make request with auth
         headers = {"Authorization": f"Bearer {hf_token}"}
         async with httpx.AsyncClient(timeout=30.0, follow_redirects=True) as client:
             response = await client.get(url, headers=headers)
             response.raise_for_status()
         content = response.text
         # Return the markdown content directly
         result = f"Documentation from: {url}\n\n{content}"
         return result, True
     except httpx.HTTPStatusError as e: