| import requests |
| import os |
| from typing import Dict, Any, Optional, List |
| from .search_base import SearchBase |
| from .tool import Tool,Toolkit |
| from evoagentx.core.logging import logger |
| import dotenv |
| dotenv.load_dotenv() |
|
|
| class SearchGoogle(SearchBase): |
|
|
| def __init__( |
| self, |
| name: str = 'SearchGoogle', |
| num_search_pages: Optional[int] = 5, |
| max_content_words: Optional[int] = None, |
| **kwargs |
| ): |
| """ |
| Initialize the Google Search tool. |
| |
| Args: |
| name (str): The name of the search tool |
| num_search_pages (int): Number of search results to retrieve |
| max_content_words (int, optional): Maximum number of words to include in content, None means no limit |
| **kwargs: Additional data to pass to the parent class |
| """ |
| |
| super().__init__(name=name, num_search_pages=num_search_pages, max_content_words=max_content_words, **kwargs) |
| |
| def search(self, query: str, num_search_pages: int = None, max_content_words: int = None) -> Dict[str, Any]: |
| """ |
| Search Google using the Custom Search API and retrieve detailed search results with content snippets. |
| |
| Args: |
| query (str): The search query to execute on Google |
| num_search_pages (int): Number of search results to retrieve |
| max_content_words (int): Maximum number of words to include in content, None means no limit |
| |
| Returns: |
| Dict[str, Any]: Contains search results and optional error message |
| """ |
| num_search_pages = num_search_pages or self.num_search_pages |
| max_content_words = max_content_words or self.max_content_words |
| results = [] |
| |
| |
| api_key = os.getenv('GOOGLE_API_KEY', '') |
| search_engine_id = os.getenv('GOOGLE_SEARCH_ENGINE_ID', '') |
| |
| |
| |
| |
| if not api_key or not search_engine_id: |
| error_msg = ( |
| "API key and search engine ID are required. " |
| "Please set GOOGLE_API_KEY and GOOGLE_SEARCH_ENGINE_ID environment variables. " |
| "You can get these from the Google Cloud Console: https://console.cloud.google.com/apis/" |
| ) |
| logger.error(error_msg) |
| return {"results": [], "error": error_msg} |
| |
| try: |
| |
| logger.info(f"Searching Google for: {query}, num_results={num_search_pages}, max_content_words={max_content_words}") |
| search_url = "https://www.googleapis.com/customsearch/v1" |
| params = { |
| "key": api_key, |
| "cx": search_engine_id, |
| "q": query, |
| "num": num_search_pages, |
| } |
| response = requests.get(search_url, params=params) |
| data = response.json() |
|
|
| if "items" not in data: |
| return {"results": [], "error": "No search results found."} |
|
|
| search_results = data["items"] |
| logger.info(f"Found {len(search_results)} search results") |
|
|
| |
| for item in search_results: |
| url = item["link"] |
| title = item["title"] |
| try: |
| title, content = self._scrape_page(url) |
| if content: |
| |
| display_content = self._truncate_content(content, max_content_words) |
| |
| results.append({ |
| "title": title, |
| "content": display_content, |
| "url": url, |
| }) |
| except Exception as e: |
| logger.warning(f"Error processing URL {url}: {str(e)}") |
| continue |
|
|
| return {"results": results, "error": None} |
|
|
| except Exception as e: |
| logger.error(f"Error searching Google: {str(e)}") |
| return {"results": [], "error": str(e)} |
|
|
|
|
| class GoogleSearchTool(Tool): |
| name: str = "google_search" |
| description: str = "Search Google using the Custom Search API and retrieve content from search results" |
| inputs: Dict[str, Dict[str, str]] = { |
| "query": { |
| "type": "string", |
| "description": "The search query to execute on Google" |
| }, |
| "num_search_pages": { |
| "type": "integer", |
| "description": "Number of search results to retrieve. Default: 5" |
| }, |
| "max_content_words": { |
| "type": "integer", |
| "description": "Maximum number of words to include in content per result. None means no limit. Default: None" |
| } |
| } |
| required: Optional[List[str]] = ["query"] |
| |
| def __init__(self, search_google: SearchGoogle = None): |
| super().__init__() |
| self.search_google = search_google |
| |
| def __call__(self, query: str, num_search_pages: int = None, max_content_words: int = None) -> Dict[str, Any]: |
| """Execute Google search using the SearchGoogle instance.""" |
| if not self.search_google: |
| raise RuntimeError("Google search instance not initialized") |
| |
| try: |
| return self.search_google.search(query, num_search_pages, max_content_words) |
| except Exception as e: |
| return {"results": [], "error": f"Error executing Google search: {str(e)}"} |
|
|
|
|
| class GoogleSearchToolkit(Toolkit): |
| def __init__( |
| self, |
| name: str = "GoogleSearchToolkit", |
| num_search_pages: Optional[int] = 5, |
| max_content_words: Optional[int] = None, |
| **kwargs |
| ): |
| |
| search_google = SearchGoogle( |
| name="SearchGoogle", |
| num_search_pages=num_search_pages, |
| max_content_words=max_content_words, |
| **kwargs |
| ) |
| |
| |
| tools = [ |
| GoogleSearchTool(search_google=search_google) |
| ] |
| |
| |
| super().__init__(name=name, tools=tools) |
| |
| |
| self.search_google = search_google |
| |
|
|