Spaces:

smolagents
/

ml-intern

Running on CPU Upgrade

App Files Files Community

Henri Bonamy committed on Dec 26, 2025

Commit

160da13

1 Parent(s): a82c70a

pass ToolErrors to agent, correct HF token handling, simplify uv job calls

Browse files

Files changed (3) hide show

agent/core/tools.py +9 -4
agent/prompts/system_prompt.yaml +1 -0
agent/tools/jobs_tool.py +65 -16

agent/core/tools.py CHANGED Viewed

@@ -8,6 +8,7 @@ from dataclasses import dataclass
 from typing import Any, Awaitable, Callable, Optional
 from fastmcp import Client
 from lmnr import observe
 from mcp.types import EmbeddedResource, ImageContent, TextContent
@@ -166,10 +167,14 @@ class ToolRouter:
         # Otherwise, use MCP client
         if self._mcp_initialized:
-            result = await self.mcp_client.call_tool(tool_name, arguments)
-            # Convert MCP content blocks to string
-            output = convert_mcp_content_to_string(result.content)
-            return output, not result.is_error
         return "MCP client not initialized", False

 from typing import Any, Awaitable, Callable, Optional
 from fastmcp import Client
+from fastmcp.exceptions import ToolError
 from lmnr import observe
 from mcp.types import EmbeddedResource, ImageContent, TextContent
         # Otherwise, use MCP client
         if self._mcp_initialized:
+            try:
+                result = await self.mcp_client.call_tool(tool_name, arguments)
+                output = convert_mcp_content_to_string(result.content)
+                return output, not result.is_error
+            except ToolError as e:
+                # Catch MCP tool errors and return them to the agent
+                error_msg = f"Tool error: {str(e)}"
+                return error_msg, False
         return "MCP client not initialized", False

agent/prompts/system_prompt.yaml CHANGED Viewed

@@ -85,6 +85,7 @@ system_prompt: |
   - Always search Hugging Face Hub for existing resources before suggesting custom implementations
   - When referencing models, datasets, or papers, include direct links from search results
   - Never assume a library is available - check documentation first
   - Follow ML best practices: proper train/val/test splits, reproducibility, evaluation metrics
   - For training tasks, consider compute requirements and suggest appropriate hardware
   - Never expose or log API keys, tokens, or secrets

   - Always search Hugging Face Hub for existing resources before suggesting custom implementations
   - When referencing models, datasets, or papers, include direct links from search results
   - Never assume a library is available - check documentation first
+  - Before processing any dataset: inspect its actual structure first using the mcp__hf-mcp-server__hub_repo_details tool. Never assume column names: verify them beforehand.
   - Follow ML best practices: proper train/val/test splits, reproducibility, evaluation metrics
   - For training tasks, consider compute requirements and suggest appropriate hardware
   - Never expose or log API keys, tokens, or secrets

agent/tools/jobs_tool.py CHANGED Viewed

@@ -6,6 +6,7 @@ Refactored to use official huggingface-hub library instead of custom HTTP client
 import asyncio
 import base64
 from typing import Any, Dict, Literal, Optional
 from huggingface_hub import HfApi
@@ -60,6 +61,29 @@ OperationType = Literal[
 UV_DEFAULT_IMAGE = "ghcr.io/astral-sh/uv:python3.12-bookworm"
 def _build_uv_command(
     script: str,
     with_deps: list[str] | None = None,
@@ -99,6 +123,20 @@ def _wrap_inline_script(
     return f'echo "{encoded}" | base64 -d | {uv_command_str}'
 def _resolve_uv_command(
     script: str,
     with_deps: list[str] | None = None,
@@ -332,7 +370,6 @@ Call this tool with:
 **String format (simple cases only):**
 - Still accepted for backwards compatibility, parsed with POSIX shell semantics
 - Rejects shell operators and can mis-handle characters such as `&`; switch to arrays when things turn complex
-- `$HF_TOKEN` stays literal—forward it via `secrets: {{ "HF_TOKEN": "$HF_TOKEN" }}`
 ### Show command-specific help
 Call this tool with:
@@ -344,7 +381,7 @@ Call this tool with:
 - Jobs default to non-detached mode (stream logs until completion). Set `detach: true` to return immediately.
 - Prefer array commands to avoid shell parsing surprises
-- To access private Hub assets, include `secrets: {{ "HF_TOKEN": "$HF_TOKEN" }}` to inject your auth token.
 - Before calling a job, think about dependencies (they must be specified), which hardware flavor to run on (choose simplest for task), and whether to include secrets.
 """
         return {"formatted": usage_text, "totalResults": 1, "resultsShared": 1}
@@ -388,8 +425,8 @@ Call this tool with:
                 self.api.run_job,
                 image=args.get("image", "python:3.12"),
                 command=args.get("command"),
-                env=args.get("env"),
-                secrets=args.get("secrets"),
                 flavor=args.get("flavor", "cpu-basic"),
                 timeout=args.get("timeout", "30m"),
                 namespace=args.get("namespace") or self.namespace,
@@ -441,12 +478,18 @@ To inspect, call this tool with `{{"operation": "inspect", "args": {{"job_id": "
             if not script:
                 raise ValueError("script is required")
             # Resolve the command based on script type (URL, inline, or file)
             command = _resolve_uv_command(
                 script=script,
-                with_deps=args.get("with_deps")
-                or args.get("dependencies")
-                or args.get("packages"),
                 python=args.get("python"),
                 script_args=args.get("script_args"),
             )
@@ -456,8 +499,8 @@ To inspect, call this tool with `{{"operation": "inspect", "args": {{"job_id": "
                 self.api.run_job,
                 image=UV_DEFAULT_IMAGE,
                 command=command,
-                env=args.get("env"),
-                secrets=args.get("secrets"),
                 flavor=args.get("flavor") or args.get("hardware") or "cpu-basic",
                 timeout=args.get("timeout", "30m"),
                 namespace=args.get("namespace") or self.namespace,
@@ -645,8 +688,8 @@ To verify, call this tool with `{{"operation": "inspect", "args": {{"job_id": "{
                 image=args.get("image", "python:3.12"),
                 command=args.get("command"),
                 schedule=args.get("schedule"),
-                env=args.get("env"),
-                secrets=args.get("secrets"),
                 flavor=args.get("flavor", "cpu-basic"),
                 timeout=args.get("timeout", "30m"),
                 namespace=args.get("namespace") or self.namespace,
@@ -680,12 +723,18 @@ To list all, call this tool with `{{"operation": "scheduled ps"}}`"""
             if not schedule:
                 raise ValueError("schedule is required")
             # Resolve the command based on script type
             command = _resolve_uv_command(
                 script=script,
-                with_deps=args.get("with_deps")
-                or args.get("dependencies")
-                or args.get("packages"),
                 python=args.get("python"),
                 script_args=args.get("script_args"),
             )
@@ -696,8 +745,8 @@ To list all, call this tool with `{{"operation": "scheduled ps"}}`"""
                 image=UV_DEFAULT_IMAGE,
                 command=command,
                 schedule=schedule,
-                env=args.get("env"),
-                secrets=args.get("secrets"),
                 flavor=args.get("flavor") or args.get("hardware") or "cpu-basic",
                 timeout=args.get("timeout", "30m"),
                 namespace=args.get("namespace") or self.namespace,

 import asyncio
 import base64
+import os
 from typing import Any, Dict, Literal, Optional
 from huggingface_hub import HfApi
 UV_DEFAULT_IMAGE = "ghcr.io/astral-sh/uv:python3.12-bookworm"
+def _substitute_hf_token(params: Dict[str, Any] | None) -> Dict[str, Any] | None:
+    """
+    Return a copy of ``params`` with "$HF_TOKEN" placeholder values resolved.
+
+    A value is replaced only when it is exactly equal to the string
+    "$HF_TOKEN"; the replacement is the HF_TOKEN environment variable of the
+    current process. All other values are copied through unchanged. The input
+    dictionary itself is not modified.
+
+    Args:
+        params: Dictionary that may contain "$HF_TOKEN" as a value, or None.
+    Returns:
+        None when ``params`` is None, otherwise a new dictionary with the
+        placeholder values substituted.
+    """
+    if params is None:
+        return None
+    result = {}
+    for key, value in params.items():
+        # Exact match only: a placeholder embedded in a longer string
+        # (e.g. "Bearer $HF_TOKEN") is left as-is.
+        if value == "$HF_TOKEN":
+            # NOTE(review): when HF_TOKEN is unset this substitutes an empty
+            # string rather than failing -- confirm that is the intended
+            # behaviour for callers that forward the result as job secrets.
+            result[key] = os.environ.get("HF_TOKEN", "")
+        else:
+            result[key] = value
+    return result
 def _build_uv_command(
     script: str,
     with_deps: list[str] | None = None,
     return f'echo "{encoded}" | base64 -d | {uv_command_str}'
+def _ensure_hf_transfer_dependency(deps: list[str] | None) -> list[str]:
+    """Return a dependency list that is guaranteed to contain "hf-transfer".
+
+    Args:
+        deps: Dependency names requested by the caller, or None.
+    Returns:
+        A new list: ["hf-transfer"] when ``deps`` is None, otherwise a copy of
+        ``deps`` with "hf-transfer" appended if that exact string is absent.
+    """
+    if deps is None:
+        return ["hf-transfer"]
+    if isinstance(deps, list):
+        deps_copy = deps.copy()  # Don't modify the original
+        # Exact string membership: a pinned spec such as "hf-transfer>=0.1"
+        # does not count as present, so "hf-transfer" is appended as well.
+        if "hf-transfer" not in deps_copy:
+            deps_copy.append("hf-transfer")
+        return deps_copy
+    # NOTE(review): any non-list value (e.g. a single string or a tuple) is
+    # discarded here and replaced by ["hf-transfer"] -- confirm callers never
+    # pass dependencies in those forms.
+    return ["hf-transfer"]
 def _resolve_uv_command(
     script: str,
     with_deps: list[str] | None = None,
 **String format (simple cases only):**
 - Still accepted for backwards compatibility, parsed with POSIX shell semantics
 - Rejects shell operators and can mis-handle characters such as `&`; switch to arrays when things turn complex
 ### Show command-specific help
 Call this tool with:
 - Jobs default to non-detached mode (stream logs until completion). Set `detach: true` to return immediately.
 - Prefer array commands to avoid shell parsing surprises
+- To access private Hub assets (spaces, private models, datasets, collections), pass `secrets: {{ "HF_TOKEN": "$HF_TOKEN" }}`
 - Before calling a job, think about dependencies (they must be specified), which hardware flavor to run on (choose simplest for task), and whether to include secrets.
 """
         return {"formatted": usage_text, "totalResults": 1, "resultsShared": 1}
                 self.api.run_job,
                 image=args.get("image", "python:3.12"),
                 command=args.get("command"),
+                env=_substitute_hf_token(args.get("env")),
+                secrets=_substitute_hf_token(args.get("secrets")),
                 flavor=args.get("flavor", "cpu-basic"),
                 timeout=args.get("timeout", "30m"),
                 namespace=args.get("namespace") or self.namespace,
             if not script:
                 raise ValueError("script is required")
+            # Get dependencies and ensure hf-transfer is included
+            deps = (
+                args.get("with_deps")
+                or args.get("dependencies")
+                or args.get("packages")
+            )
+            deps = _ensure_hf_transfer_dependency(deps)
             # Resolve the command based on script type (URL, inline, or file)
             command = _resolve_uv_command(
                 script=script,
+                with_deps=deps,
                 python=args.get("python"),
                 script_args=args.get("script_args"),
             )
                 self.api.run_job,
                 image=UV_DEFAULT_IMAGE,
                 command=command,
+                env=_substitute_hf_token(args.get("env")),
+                secrets=_substitute_hf_token(args.get("secrets")),
                 flavor=args.get("flavor") or args.get("hardware") or "cpu-basic",
                 timeout=args.get("timeout", "30m"),
                 namespace=args.get("namespace") or self.namespace,
                 image=args.get("image", "python:3.12"),
                 command=args.get("command"),
                 schedule=args.get("schedule"),
+                env=_substitute_hf_token(args.get("env")),
+                secrets=_substitute_hf_token(args.get("secrets")),
                 flavor=args.get("flavor", "cpu-basic"),
                 timeout=args.get("timeout", "30m"),
                 namespace=args.get("namespace") or self.namespace,
             if not schedule:
                 raise ValueError("schedule is required")
+            # Get dependencies and ensure hf-transfer is included
+            deps = (
+                args.get("with_deps")
+                or args.get("dependencies")
+                or args.get("packages")
+            )
+            deps = _ensure_hf_transfer_dependency(deps)
             # Resolve the command based on script type
             command = _resolve_uv_command(
                 script=script,
+                with_deps=deps,
                 python=args.get("python"),
                 script_args=args.get("script_args"),
             )
                 image=UV_DEFAULT_IMAGE,
                 command=command,
                 schedule=schedule,
+                env=_substitute_hf_token(args.get("env")),
+                secrets=_substitute_hf_token(args.get("secrets")),
                 flavor=args.get("flavor") or args.get("hardware") or "cpu-basic",
                 timeout=args.get("timeout", "30m"),
                 namespace=args.get("namespace") or self.namespace,