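# Scraped page header (Hugging Face Space file view), kept as a comment:
#   Space: First_agent_template (status: Sleeping)
#   Author: LeVinh
#   Last commit: c09239f, "fix...", 3 months ago
#   File size: 27.5 kB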

	import os
	import tempfile
	import re
	import json
	import requests
	import cmath
	import uuid
	import numpy as np
	import pandas as pd
	from typing import List, Dict, Any, Optional
	from urllib.parse import urlparse

	from PIL import Image, ImageDraw, ImageFont, ImageEnhance, ImageFilter
	from dotenv import load_dotenv

	import sys
	import types

	# LangChain / LangGraph imports…
	from langgraph.graph import START, StateGraph, MessagesState
	from langgraph.prebuilt import ToolNode, tools_condition

	from langchain_openai import ChatOpenAI
	import base64
	from langchain_tavily import TavilySearch
	from langchain_community.document_loaders import WikipediaLoader, ArxivLoader
	from langchain_community.vectorstores import SupabaseVectorStore
	from langchain_huggingface import (
	ChatHuggingFace,
	HuggingFaceEndpoint,
	HuggingFaceEmbeddings,
	)
	from huggingface_hub import InferenceClient
	from langchain_core.messages import SystemMessage, HumanMessage
	from langchain_core.tools import tool, Tool
	from supabase.client import Client, create_client

	# Local imports
	from code_interpreter import CodeInterpreter
	from img_processing import decode_image, encode_image, save_image
	from dotenv import load_dotenv
	from multimodal_tools import (
	vision_analyze_image,
	vision_analyze_video,
	vision_analyze_document
	)

	# Load variables from a local .env file (if present) before the module reads os.environ further down.
	load_dotenv()


	# Single shared interpreter instance; execute_code_multilang delegates to it.
	interpreter_instance = CodeInterpreter()

	### BROWSER TOOLS

	@tool
	def wiki_search(query: str) -> Dict[str, str]:
	    """
	    Search Wikipedia for a query and return maximum 2 results.

	    Args:
	        query (str): The search query.

	    Returns:
	        Dict[str, str]: ``{"wiki_results": <text>}`` where the text holds every
	        hit wrapped in a ``<Document>`` tag, with hits separated by ``---``.
	    """
	    search_docs = WikipediaLoader(query=query, load_max_docs=2).load()
	    # .get() keeps one document with incomplete metadata from failing the whole search.
	    formatted_search_docs = "\n\n---\n\n".join(
	        f'<Document source="{doc.metadata.get("source", "")}" page="{doc.metadata.get("page", "")}"/>\n{doc.page_content}\n</Document>'
	        for doc in search_docs
	    )
	    return {"wiki_results": formatted_search_docs}


	@tool
	def web_search(query: str) -> Dict[str, str]:
	    """
	    Search Tavily for a query and return maximum 3 results.

	    Args:
	        query (str): The search query.

	    Returns:
	        Dict[str, str]: ``{"web_results": <text>}`` where the text holds every
	        hit wrapped in a ``<Document>`` tag, with hits separated by ``---``.
	    """
	    search_tool = TavilySearch(max_results=3)
	    search_response = search_tool.invoke({"query": query})
	    # A response without a "results" entry is treated as "no hits".
	    search_docs = search_response.get("results", [])
	    formatted_search_docs = "\n\n---\n\n".join(
	        f'<Document source="{doc.get("url", "")}" title="{doc.get("title", "")}"/>\n{doc.get("content", "")}\n</Document>'
	        for doc in search_docs
	    )
	    return {"web_results": formatted_search_docs}


	@tool
	def arxiv_search(query: str) -> Dict[str, str]:
	    """
	    Search Arxiv for a query and return maximum 3 results.

	    Args:
	        query (str): The search query.

	    Returns:
	        Dict[str, str]: ``{"arxiv_results": <text>}`` where the text holds the
	        first 1000 characters of every hit wrapped in a ``<Document>`` tag, with
	        hits separated by ``---``.
	    """

	    def _source_of(doc) -> str:
	        # ArxivLoader's default metadata may not carry a "source" key, so fall
	        # back to other identifying fields instead of raising KeyError.
	        meta = doc.metadata
	        return meta.get("source") or meta.get("entry_id") or meta.get("Title", "")

	    search_docs = ArxivLoader(query=query, load_max_docs=3).load()
	    formatted_search_docs = "\n\n---\n\n".join(
	        f'<Document source="{_source_of(doc)}" page="{doc.metadata.get("page", "")}"/>\n{doc.page_content[:1000]}\n</Document>'
	        for doc in search_docs
	    )
	    return {"arxiv_results": formatted_search_docs}


	### CODE INTERPRETER TOOLS

	@tool
	def execute_code_multilang(code: str, language: str = "python") -> str:
	    """
	    Execute code in multiple languages (Python, Bash, SQL, C, Java) and return results.

	    Args:
	        code (str): The source code to execute.
	        language (str): The language of the code. Supported: "python", "bash", "sql", "c", "java".

	    Returns:
	        str: A string summarizing the execution results.
	    """
	    supported_languages = ["python", "bash", "sql", "c", "java"]
	    language = language.lower()

	    if language not in supported_languages:
	        return f"Unsupported language: {language}. Supported languages are: {', '.join(supported_languages)}"

	    result = interpreter_instance.execute_code(code, language=language)

	    # The report is assembled piece by piece and joined with newlines at the end.
	    response = []

	    if result["status"] == "success":
	        response.append(f"--- Code executed successfully in {language.upper()}")

	        if result.get("stdout"):
	            response.append(
	                "\nStandard Output:\n```\n" + result["stdout"].strip() + "\n```"
	            )

	        if result.get("stderr"):
	            response.append(
	                "\nStandard Error (if any):\n```\n"
	                + result["stderr"].strip()
	                + "\n```"
	            )

	        # `is not None` so falsy results such as 0 or "" are still reported.
	        if result.get("result") is not None:
	            response.append(
	                "\nExecution Result:\n```\n"
	                + str(result["result"]).strip()
	                + "\n```"
	            )

	        if result.get("dataframes"):
	            for df_info in result["dataframes"]:
	                response.append(
	                    f"\nDataFrame `{df_info['name']}` (Shape: {df_info['shape']})"
	                )
	                df_preview = pd.DataFrame(df_info["head"])
	                response.append("First 5 rows:\n```\n" + str(df_preview) + "\n```")

	        if result.get("plots"):
	            response.append(
	                f"\nGenerated {len(result['plots'])} plot(s) (Image data returned separately)"
	            )

	    else:
	        response.append(f" --- Code execution failed in {language.upper()}")
	        if result.get("stderr"):
	            response.append(
	                "\nError Log:\n```\n" + result["stderr"].strip() + "\n```"
	            )

	    return "\n".join(response)


	### MATHEMATICAL TOOLS

	@tool
	def multiply(a: float, b: float) -> float:
	    """Multiply two numbers and return the product."""
	    product = a * b
	    return product


	@tool
	def add(a: float, b: float) -> float:
	    """Add two numbers and return the sum."""
	    total = a + b
	    return total


	@tool
	def subtract(a: float, b: float) -> float:
	    """Subtract the second number from the first and return the difference."""
	    difference = a - b
	    return difference


	@tool
	def divide(a: float, b: float) -> float:
	    """Divide the first number by the second.

	    Raises:
	        ValueError: If the divisor is zero.
	    """
	    if b != 0:
	        return a / b
	    raise ValueError("Cannot divide by zero.")


	@tool
	def modulus(a: int, b: int) -> int:
	    """Get the modulus of two numbers.

	    Raises:
	        ValueError: If the divisor is zero.
	    """
	    # Mirror divide(): report a zero divisor as a ValueError with a clear
	    # message rather than letting a bare ZeroDivisionError escape.
	    if b == 0:
	        raise ValueError("Cannot take modulus by zero.")
	    return a % b


	@tool
	def power(a: float, b: float) -> float:
	    """Raise the first number to the power of the second."""
	    return pow(a, b)


	@tool
	def square_root(a: float) -> float | complex:
	    """Get the square root of a number.

	    Non-negative input yields a real result; negative input yields a complex
	    result computed with cmath.sqrt.
	    """
	    if a >= 0:
	        return a**0.5
	    # Negative radicand: defer to cmath so the caller gets a complex root.
	    return cmath.sqrt(a)


	### DOCUMENT PROCESSING TOOLS

	@tool
	def save_and_read_file(content: str, filename: Optional[str] = None) -> str:
	    """
	    Save content to a file and return the path.

	    Args:
	        content (str): The content to save.
	        filename (str, optional): The name of the file. Only its final path
	            component is used, so the file is always created directly inside
	            the system temp directory. A unique name is generated when omitted.

	    Returns:
	        str: Success message with file path.
	    """
	    temp_dir = tempfile.gettempdir()

	    # Strip directory parts so the name cannot point outside the temp directory.
	    safe_name = os.path.basename(filename) if filename else ""
	    if safe_name in (".", ".."):
	        safe_name = ""

	    if safe_name:
	        filepath = os.path.join(temp_dir, safe_name)
	    else:
	        # mkstemp returns an open OS-level descriptor; close it immediately so
	        # no handle leaks and the path can be reopened on every platform.
	        fd, filepath = tempfile.mkstemp(dir=temp_dir)
	        os.close(fd)

	    # Explicit UTF-8 so the output does not depend on the host locale.
	    with open(filepath, "w", encoding="utf-8") as f:
	        f.write(content)

	    return f"File saved to {filepath}. You can read this file to process its contents."


	@tool
	def download_file_from_url(url: str, filename: Optional[str] = None) -> str:
	    """
	    Download a file from a URL.

	    Args:
	        url (str): The URL of the file.
	        filename (str, optional): The name of the file. Only its final path
	            component is used. When omitted, the name is taken from the URL
	            path, or generated if the URL has none.

	    Returns:
	        str: Success message with file path or error message.
	    """
	    request_timeout_seconds = 30

	    try:
	        # basename() drops directory parts so neither the caller-supplied name
	        # nor the URL path can place the file outside the temp directory.
	        safe_name = os.path.basename(filename) if filename else ""
	        if not safe_name:
	            safe_name = os.path.basename(urlparse(url).path)
	        if not safe_name or safe_name in (".", ".."):
	            safe_name = f"downloaded_{uuid.uuid4().hex[:8]}"

	        filepath = os.path.join(tempfile.gettempdir(), safe_name)

	        # The timeout stops an unresponsive server from blocking forever; the
	        # context manager releases the streamed connection even on failure.
	        with requests.get(url, stream=True, timeout=request_timeout_seconds) as response:
	            response.raise_for_status()

	            with open(filepath, "wb") as f:
	                for chunk in response.iter_content(chunk_size=8192):
	                    if chunk:
	                        f.write(chunk)

	        return f"File downloaded to {filepath}. You can read this file to process its contents."
	    except Exception as e:
	        # Errors are reported as text so the agent can read them as tool output.
	        return f"Error downloading file: {str(e)}"


	@tool
	def extract_text_from_image(image_path: str) -> str:
	    """
	    Extract text from an image using AI Vision (OCR).

	    Args:
	        image_path (str): The path to the image file.

	    Returns:
	        str: Extracted text or error message.
	    """
	    # NOTE(review): vision_analyze_image is also registered in the `tools` list;
	    # if it is a LangChain tool object rather than a plain function, this
	    # positional call may need to become .invoke(...) - confirm in multimodal_tools.
	    ocr_prompt = "Transcribe all text from this image verbatim."
	    return vision_analyze_image(ocr_prompt, image_path)


	@tool
	def analyze_csv_file(file_path: str, query: str) -> str:
	    """
	    Analyze a CSV file using pandas.

	    Args:
	        file_path (str): The path to the CSV file.
	        query (str): Question about the data.

	    Returns:
	        str: Analysis result or error message.
	    """
	    # `query` is accepted but not consulted below; the report is always the
	    # same shape: row/column counts, column names, describe() output.
	    try:
	        frame = pd.read_csv(file_path)
	        report_parts = [
	            f"CSV file loaded with {len(frame)} rows and {len(frame.columns)} columns.\n",
	            f"Columns: {', '.join(frame.columns)}\n\n",
	            "Summary statistics:\n",
	            str(frame.describe()),
	        ]
	        return "".join(report_parts)
	    except Exception as e:
	        return f"Error analyzing CSV file: {str(e)}"


	@tool
	def analyze_excel_file(file_path: str, query: str) -> str:
	    """
	    Analyze an Excel file using pandas.

	    Args:
	        file_path (str): The path to the Excel file.
	        query (str): Question about the data.

	    Returns:
	        str: Analysis result or error message.
	    """
	    # `query` is accepted but not consulted below; the report is always the
	    # same shape: row/column counts, column names, describe() output.
	    try:
	        df = pd.read_excel(file_path)
	        result = (
	            f"Excel file loaded with {len(df)} rows and {len(df.columns)} columns.\n"
	        )
	        # Excel headers may be numbers or dates; str.join() only accepts
	        # strings, so convert every label before joining.
	        result += f"Columns: {', '.join(map(str, df.columns))}\n\n"
	        result += "Summary statistics:\n"
	        result += str(df.describe())
	        return result
	    except Exception as e:
	        return f"Error analyzing Excel file: {str(e)}"


	### IMAGE PROCESSING AND GENERATION TOOLS
	@tool
	def analyze_image(image_base64: str) -> Dict[str, Any]:
	    """
	    Analyze basic properties of an image.

	    Args:
	        image_base64 (str): Base64 encoded image string.

	    Returns:
	        Dict[str, Any]: Dictionary with the image dimensions, mode, a colour
	        analysis (RGB/RGBA images only) and a base64 thumbnail, or
	        ``{"error": <message>}`` if anything fails.
	    """
	    try:
	        img = decode_image(image_base64)
	        width, height = img.size
	        mode = img.mode

	        if mode in ("RGB", "RGBA"):
	            arr = np.array(img)
	            # Keep only the first three channels so an RGBA alpha plane does
	            # not leak into "average_rgb" or skew the brightness figure.
	            rgb_means = arr[..., :3].mean(axis=(0, 1))
	            dominant = ["Red", "Green", "Blue"][int(np.argmax(rgb_means))]
	            color_analysis = {
	                "average_rgb": rgb_means.tolist(),
	                # Plain float keeps the payload free of NumPy scalar types.
	                "brightness": float(rgb_means.mean()),
	                "dominant_color": dominant,
	            }
	        else:
	            color_analysis = {"note": f"No color analysis for mode {mode}"}

	        # Work on a copy: thumbnail() resizes in place.
	        thumbnail = img.copy()
	        thumbnail.thumbnail((100, 100))
	        thumb_path = save_image(thumbnail, "thumbnails")
	        thumbnail_base64 = encode_image(thumb_path)

	        return {
	            "dimensions": (width, height),
	            "mode": mode,
	            "color_analysis": color_analysis,
	            "thumbnail": thumbnail_base64,
	        }
	    except Exception as e:
	        return {"error": str(e)}


	@tool
	def transform_image(
	image_base64: str, operation: str, params: Optional[Dict[str, Any]] = None
	) -> Dict[str, Any]:
	"""
	Apply transformations to an image.

	Args:
	image_base64 (str): Base64 encoded input image.
	operation (str): Transformation operation (resize, rotate, crop, flip, adjust_brightness, adjust_contrast, blur, sharpen, grayscale).
	params (Dict[str, Any], optional): Parameters for the operation.

	Returns:
	Dict[str, Any]: Dictionary with transformed image (base64).
	"""
	try:
	img = decode_image(image_base64)
	params = params or {}

	if operation == "resize":
	img = img.resize(
	(
	params.get("width", img.width // 2),
	params.get("height", img.height // 2),
	)
	)
	elif operation == "rotate":
	img = img.rotate(params.get("angle", 90), expand=True)
	elif operation == "crop":
	img = img.crop(
	(
	params.get("left", 0),
	params.get("top", 0),
	params.get("right", img.width),
	params.get("bottom", img.height),
	)
	)
	elif operation == "flip":
	if params.get("direction", "horizontal") == "horizontal":
	img = img.transpose(Image.FLIP_LEFT_RIGHT)
	else:
	img = img.transpose(Image.FLIP_TOP_BOTTOM)
	elif operation == "adjust_brightness":
	img = ImageEnhance.Brightness(img).enhance(params.get("factor", 1.5))
	elif operation == "adjust_contrast":
	img = ImageEnhance.Contrast(img).enhance(params.get("factor", 1.5))
	elif operation == "blur":
	img = img.filter(ImageFilter.GaussianBlur(params.get("radius", 2)))
	elif operation == "sharpen":
	img = img.filter(ImageFilter.SHARPEN)
	elif operation == "grayscale":
	img = img.convert("L")
	else:
	return {"error": f"Unknown operation: {operation}"}

	result_path = save_image(img)
	result_base64 = encode_image(result_path)
	return {"transformed_image": result_base64}

	except Exception as e:
	return {"error": str(e)}


	@tool
	def draw_on_image(
	image_base64: str, drawing_type: str, params: Dict[str, Any]
	) -> Dict[str, Any]:
	"""
	Draw shapes or text onto an image.

	Args:
	image_base64 (str): Base64 encoded input image.
	drawing_type (str): Drawing type (rectangle, circle, line, text).
	params (Dict[str, Any]): Drawing parameters.

	Returns:
	Dict[str, Any]: Dictionary with result image (base64).
	"""
	try:
	img = decode_image(image_base64)
	draw = ImageDraw.Draw(img)
	color = params.get("color", "red")

	if drawing_type == "rectangle":
	draw.rectangle(
	[params["left"], params["top"], params["right"], params["bottom"]],
	outline=color,
	width=params.get("width", 2),
	)
	elif drawing_type == "circle":
	x, y, r = params["x"], params["y"], params["radius"]
	draw.ellipse(
	(x - r, y - r, x + r, y + r),
	outline=color,
	width=params.get("width", 2),
	)
	elif drawing_type == "line":
	draw.line(
	(
	params["start_x"],
	params["start_y"],
	params["end_x"],
	params["end_y"],
	),
	fill=color,
	width=params.get("width", 2),
	)
	elif drawing_type == "text":
	font_size = params.get("font_size", 20)
	try:
	font = ImageFont.truetype("arial.ttf", font_size)
	except IOError:
	font = ImageFont.load_default()
	draw.text(
	(params["x"], params["y"]),
	params.get("text", "Text"),
	fill=color,
	font=font,
	)
	else:
	return {"error": f"Unknown drawing type: {drawing_type}"}

	result_path = save_image(img)
	result_base64 = encode_image(result_path)
	return {"result_image": result_base64}

	except Exception as e:
	return {"error": str(e)}


	@tool
	def generate_simple_image(
	    image_type: str,
	    width: int = 500,
	    height: int = 500,
	    params: Optional[Dict[str, Any]] = None,
	) -> Dict[str, Any]:
	    """
	    Generate a simple image.

	    Args:
	        image_type (str): Type of image (gradient, noise).
	        width (int): Width of the image. Defaults to 500.
	        height (int): Height of the image. Defaults to 500.
	        params (Dict[str, Any], optional): Specific parameters.

	    Returns:
	        Dict[str, Any]: Dictionary with generated image (base64).
	    """
	    try:
	        options = params or {}

	        if image_type == "gradient":
	            direction = options.get("direction", "horizontal")
	            start_color = options.get("start_color", (255, 0, 0))
	            end_color = options.get("end_color", (0, 0, 255))

	            img = Image.new("RGB", (width, height))
	            pen = ImageDraw.Draw(img)

	            def blend(step, span):
	                # Linear interpolation per channel at position step/span.
	                return tuple(
	                    int(
	                        start_color[channel]
	                        + (end_color[channel] - start_color[channel]) * step / span
	                    )
	                    for channel in range(3)
	                )

	            if direction == "horizontal":
	                # One vertical stroke per column.
	                for column in range(width):
	                    pen.line(
	                        [(column, 0), (column, height)], fill=blend(column, width)
	                    )
	            else:
	                # Any other direction value paints row by row.
	                for row in range(height):
	                    pen.line([(0, row), (width, row)], fill=blend(row, height))

	        elif image_type == "noise":
	            pixels = np.random.randint(0, 256, (height, width, 3), dtype=np.uint8)
	            img = Image.fromarray(pixels, "RGB")

	        else:
	            return {"error": f"Unsupported image_type {image_type}"}

	        saved_path = save_image(img)
	        return {"generated_image": encode_image(saved_path)}

	    except Exception as e:
	        return {"error": str(e)}


	@tool
	def combine_images(
	    images_base64: List[str], operation: str, params: Optional[Dict[str, Any]] = None
	) -> Dict[str, Any]:
	    """
	    Combine multiple images.

	    Args:
	        images_base64 (List[str]): List of base64 images.
	        operation (str): Combination type (stack).
	        params (Dict[str, Any], optional): Parameters.

	    Returns:
	        Dict[str, Any]: Dictionary with combined image (base64).
	    """
	    try:
	        pictures = [decode_image(encoded) for encoded in images_base64]
	        options = params or {}

	        if operation != "stack":
	            return {"error": f"Unsupported combination operation {operation}"}

	        horizontal = options.get("direction", "horizontal") == "horizontal"

	        # The canvas spans the summed extent along the stacking axis and the
	        # largest extent across it.
	        if horizontal:
	            total_width = sum(picture.width for picture in pictures)
	            max_height = max(picture.height for picture in pictures)
	            canvas = Image.new("RGB", (total_width, max_height))
	        else:
	            max_width = max(picture.width for picture in pictures)
	            total_height = sum(picture.height for picture in pictures)
	            canvas = Image.new("RGB", (max_width, total_height))

	        # Paste each picture flush against the previous one.
	        offset = 0
	        for picture in pictures:
	            if horizontal:
	                canvas.paste(picture, (offset, 0))
	                offset += picture.width
	            else:
	                canvas.paste(picture, (0, offset))
	                offset += picture.height

	        saved_path = save_image(canvas)
	        return {"combined_image": encode_image(saved_path)}

	    except Exception as e:
	        return {"error": str(e)}


	# Read the agent's system prompt from disk once, when the module is imported.
	with open("system_prompt.txt", "r", encoding="utf-8") as f:
	    system_prompt = f.read()

	# Wrap the prompt text as a SystemMessage so build_graph can add it to the message list.
	sys_msg = SystemMessage(content=system_prompt)



	# Embedding model; handed to SupabaseVectorStore further down when Supabase credentials are present.
	# It is constructed unconditionally, even if the Supabase tool ends up disabled.
	embeddings = HuggingFaceEmbeddings(
	model_name="sentence-transformers/all-mpnet-base-v2"
	)

	# Base tool set for the agent: build_graph binds this list to the LLM and serves it through the ToolNode.
	tools = [
	web_search,
	wiki_search,
	arxiv_search,
	multiply,
	add,
	subtract,
	divide,
	modulus,
	power,
	square_root,
	save_and_read_file,
	download_file_from_url,
	extract_text_from_image,
	analyze_csv_file,
	analyze_excel_file,
	execute_code_multilang,
	analyze_image,

	transform_image,
	draw_on_image,
	generate_simple_image,
	combine_images,

	# Multimodal vision tools (OpenRouter)
	vision_analyze_image,
	vision_analyze_video,
	vision_analyze_document,
	]


	# Optional Supabase-backed "question_search" tool: only registered when both
	# credentials are present and the client/vector store can be constructed.
	supabase_url = os.environ.get("SUPABASE_URL")
	supabase_key = os.environ.get("SUPABASE_SERVICE_ROLE_KEY")

	vector_store = None
	if not (supabase_url and supabase_key):
	    print("Supabase credentials not found. 'Question Search' tool will be disabled.")
	else:
	    try:
	        supabase: Client = create_client(supabase_url, supabase_key)
	        vector_store = SupabaseVectorStore(
	            client=supabase,
	            embedding=embeddings,
	            table_name="documents2",
	            query_name="match_documents_2",
	        )
	        retriever = vector_store.as_retriever()
	        retriever_tool = Tool(
	            name="question_search",
	            func=retriever.invoke,
	            description="A tool to retrieve similar questions from a vector store.",
	        )
	        # Placed at the front of the tool list, ahead of the base tools.
	        tools.insert(0, retriever_tool)
	        print("Supabase retriever tool initialized.")
	    except Exception as e:
	        # Any setup failure leaves the agent running without this tool.
	        print(f"Failed to initialize Supabase retriever: {e}")
	        vector_store = None


	def load_config() -> Dict[str, Any]:
	    """Read agent.json from the working directory.

	    Returns:
	        Dict[str, Any]: The parsed JSON content, or an empty dict when the
	        file is missing or is not valid JSON (a message is printed either way).
	    """
	    loaded: Dict[str, Any] = {}
	    try:
	        with open("agent.json", "r") as config_file:
	            loaded = json.load(config_file)
	    except FileNotFoundError:
	        print("agent.json not found. Using default configuration.")
	    except json.JSONDecodeError:
	        print("Error decoding agent.json. Using default configuration.")
	    return loaded

	def _resolve_provider(model_class: Any) -> str:
	    """Map the ``model.class`` value from agent.json to a provider name."""
	    # Only an explicit HfApiModel class selects HuggingFace; every other value
	    # (including a missing one) falls back to the OpenAI-compatible client.
	    return "huggingface" if "HfApiModel" in str(model_class) else "openai"


	def _build_huggingface_llm(model_data: Dict[str, Any]):
	    """Create the chat model for the HuggingFace provider from agent.json's model data."""
	    # All config must come from agent.json
	    if "model_id" not in model_data:
	        raise ValueError("model_id is required in agent.json for HuggingFace provider")

	    model_id = model_data["model_id"]

	    # model_id format: "model_name" or "model_name:provider"
	    # (e.g., "Qwen/Qwen3-32B:cerebras").
	    if ":" in model_id:
	        # Use router for third-party providers (cerebras, novita, etc.)
	        model_name, provider_suffix = model_id.rsplit(":", 1)
	        print(f"Using HuggingFace Router with model: {model_name}, provider: {provider_suffix}")

	        api_key = os.getenv("HF_TOKEN")
	        if not api_key:
	            raise ValueError("HF_TOKEN not found in environment variables")

	        return ChatOpenAI(
	            model=model_id,  # Full model_id with provider suffix
	            base_url="https://router.huggingface.co/v1",
	            api_key=api_key,
	            max_tokens=model_data.get("max_tokens", 4096),
	            temperature=model_data.get("temperature", 0.01),
	        )

	    # Use free serverless inference (no provider suffix)
	    print(f"Using HuggingFace Serverless Inference with model: {model_id}")

	    # Construct the serverless inference API URL to bypass router
	    serverless_url = f"https://api-inference.huggingface.co/models/{model_id}"

	    return ChatHuggingFace(
	        llm=HuggingFaceEndpoint(
	            endpoint_url=serverless_url,  # Use direct serverless API
	            task="text-generation",
	            max_new_tokens=model_data.get("max_tokens", 4096),
	            do_sample=False,
	            repetition_penalty=1.03,
	            temperature=model_data.get("temperature", 0.01),
	        ),
	        verbose=True,
	    )


	def _build_openai_llm(model_data: Dict[str, Any]):
	    """Create the chat model for an OpenAI-compatible provider from agent.json's model data."""
	    # All config must come from agent.json
	    if "model_id" not in model_data:
	        raise ValueError("model_id is required in agent.json for OpenAI provider")

	    model_id = model_data["model_id"]
	    # The name of the env var holding the key is configurable; OPENAI_API_KEY
	    # stays the default for compatibility.
	    api_key_env = model_data.get("api_key_env", "OPENAI_API_KEY")
	    api_key = os.getenv(api_key_env)
	    if not api_key:
	        raise ValueError(f"{api_key_env} not found in environment variables")

	    llm = ChatOpenAI(
	        model=model_id,
	        base_url=model_data.get("base_url"),
	        api_key=api_key,
	        max_tokens=model_data.get("max_tokens", 4096),
	        temperature=model_data.get("temperature", 0.01),
	    )
	    print(f"Using OpenAI-compatible provider with model: {model_id}")
	    return llm


	def build_graph(provider: Optional[str] = None):
	    """
	    Build the state graph for the agent.

	    Args:
	        provider (str): The LLM provider ("huggingface" or "openai"). If None,
	            it is derived from the model class in agent.json.

	    Returns:
	        CompiledGraph: The compiled state graph.

	    Raises:
	        ValueError: If the provider is unsupported, ``model_id`` is missing
	            from agent.json, or the required API key env var is not set.
	    """
	    config = load_config()
	    model_config = config.get("model", {})
	    model_data = model_config.get("data", {})

	    # Determine provider from config if not explicitly passed
	    if provider is None:
	        provider = _resolve_provider(model_config.get("class"))

	    if provider == "huggingface":
	        llm = _build_huggingface_llm(model_data)
	    elif provider == "openai":
	        llm = _build_openai_llm(model_data)
	    else:
	        raise ValueError(f"Invalid provider: {provider}. Supported: 'huggingface', 'openai'.")

	    llm_with_tools = llm.bind_tools(tools)

	    def assistant(state: MessagesState):
	        """Assistant node to invoke the LLM."""
	        return {"messages": [llm_with_tools.invoke(state["messages"])]}

	    def retriever(state: MessagesState):
	        """Entry node: adds the system message to the conversation."""
	        # Retriever disabled to avoid Supabase connection issues, so this node
	        # no longer looks up similar questions.
	        # NOTE(review): MessagesState merges returned messages into the existing
	        # list - confirm where sys_msg ends up relative to the user turn.
	        return {"messages": [sys_msg] + state["messages"]}

	    # Wiring: START -> retriever -> assistant; the assistant's output is routed
	    # by tools_condition, and the tools node feeds back into the assistant.
	    builder = StateGraph(MessagesState)
	    builder.add_node("retriever", retriever)
	    builder.add_node("assistant", assistant)
	    builder.add_node("tools", ToolNode(tools))
	    builder.add_edge(START, "retriever")
	    builder.add_edge("retriever", "assistant")
	    builder.add_conditional_edges("assistant", tools_condition)
	    builder.add_edge("tools", "assistant")

	    return builder.compile()


	if __name__ == "__main__":
	    # Smoke test: send one sample question through the graph and print every message.
	    question = "When was a picture of St. Thomas Aquinas first added to the Wikipedia page on the Principle of double effect?"
	    # provider=None will trigger loading from agent.json
	    graph = build_graph(provider=None)
	    final_state = graph.invoke({"messages": [HumanMessage(content=question)]})
	    for message in final_state["messages"]:
	        message.pretty_print()