| """ |
| Grafo principal do LangGraph para o AgentGraph |
| """ |
| import logging |
| import pandas as pd |
| import re |
| from typing import Dict, Any, Optional |
| from langgraph.graph import StateGraph, END |
| from langgraph.checkpoint.memory import MemorySaver |
| from sqlalchemy import Integer, Float, DateTime |
|
|
| from nodes.agent_node import ( |
| AgentState, |
| should_refine_response, |
| should_generate_graph, |
| should_use_processing_agent, |
| route_after_cache_check |
| ) |
| from nodes.csv_processing_node import csv_processing_node |
| from nodes.database_node import ( |
| create_database_from_dataframe_node, |
| load_existing_database_node, |
| get_database_sample_node |
| ) |
| from nodes.query_node import ( |
| validate_query_input_node, |
| prepare_query_context_node, |
| process_user_query_node |
| ) |
| from nodes.refinement_node import ( |
| refine_response_node, |
| format_final_response_node |
| ) |
| from nodes.processing_node import ( |
| process_initial_context_node, |
| validate_processing_input_node |
| ) |
| from nodes.cache_node import ( |
| check_cache_node, |
| cache_response_node, |
| update_history_node |
| ) |
| from nodes.graph_selection_node import graph_selection_node |
| from nodes.graph_generation_node import graph_generation_node |
| from nodes.custom_nodes import CustomNodeManager |
| from nodes.connection_selection_node import ( |
| connection_selection_node, |
| validate_connection_input_node, |
| route_by_connection_type |
| ) |
| from nodes.postgresql_connection_node import postgresql_connection_node |
| from agents.sql_agent import SQLAgentManager |
| from agents.tools import CacheManager |
| from utils.database import create_sql_database |
| from utils.config import get_active_csv_path, SQL_DB_PATH |
| from utils.object_manager import get_object_manager |
|
|
| class AgentGraphManager: |
| """ |
| Gerenciador principal do grafo LangGraph |
| """ |
| |
| def __init__(self): |
| self.graph = None |
| self.app = None |
| self.cache_manager = CacheManager() |
| self.custom_node_manager = CustomNodeManager() |
| self.object_manager = get_object_manager() |
| self.engine = None |
| self.sql_agent = None |
| self.db = None |
| |
| self.agent_id = None |
| self.engine_id = None |
| self.db_id = None |
| self.cache_id = None |
| self._initialize_system() |
| self._build_graph() |
| |
| def _initialize_system(self): |
| """Inicializa o sistema com banco e agente padrão""" |
| try: |
| |
| |
| import os |
| from sqlalchemy import create_engine |
|
|
| |
| if os.path.exists(SQL_DB_PATH): |
| |
| self.engine = create_engine(f"sqlite:///{SQL_DB_PATH}") |
| db = create_sql_database(self.engine) |
| logging.info("Banco existente carregado") |
| else: |
| |
| csv_path = get_active_csv_path() |
| self.engine = self._create_engine_sync(csv_path) |
| db = create_sql_database(self.engine) |
| logging.info("Novo banco criado") |
|
|
| |
| self.db = db |
| self.db_id = self.object_manager.store_database(db) |
|
|
| |
| self.sql_agent = SQLAgentManager(db, single_table_mode=False, selected_table=None) |
|
|
| |
| self.agent_id = self.object_manager.store_sql_agent(self.sql_agent, self.db_id) |
| self.engine_id = self.object_manager.store_engine(self.engine) |
| self.cache_id = self.object_manager.store_cache_manager(self.cache_manager) |
|
|
| logging.info("Sistema inicializado com sucesso") |
|
|
| except Exception as e: |
| logging.error(f"Erro ao inicializar sistema: {e}") |
| raise |
|
|
| def _create_engine_sync(self, csv_path: str): |
| """Cria engine de forma síncrona para inicialização""" |
| import pandas as pd |
| from sqlalchemy import create_engine |
| from sqlalchemy.types import DateTime, Integer, Float |
|
|
| |
| df = pd.read_csv(csv_path, sep=';') |
|
|
| |
| sql_types = {} |
| df = self._smart_type_conversion(df, sql_types) |
|
|
| |
| engine = create_engine(f"sqlite:///{SQL_DB_PATH}") |
| df.to_sql("tabela", engine, index=False, if_exists="replace", dtype=sql_types) |
|
|
| logging.info(f"Banco criado com {len(df)} registros") |
| return engine |
| |
| def _build_graph(self): |
| """Constrói o grafo LangGraph com nova arquitetura""" |
| try: |
| |
| workflow = StateGraph(AgentState) |
|
|
| |
| workflow.add_node("validate_input", validate_query_input_node) |
| workflow.add_node("check_cache", check_cache_node) |
|
|
| |
| workflow.add_node("connection_selection", connection_selection_node) |
| workflow.add_node("validate_connection", validate_connection_input_node) |
| workflow.add_node("postgresql_connection", postgresql_connection_node) |
| workflow.add_node("csv_processing", csv_processing_node) |
| workflow.add_node("create_database", create_database_from_dataframe_node) |
| workflow.add_node("load_database", load_existing_database_node) |
|
|
| workflow.add_node("validate_processing", validate_processing_input_node) |
| workflow.add_node("process_initial_context", process_initial_context_node) |
| workflow.add_node("prepare_context", prepare_query_context_node) |
| workflow.add_node("get_db_sample", get_database_sample_node) |
|
|
| |
| workflow.add_node("process_query", process_user_query_node) |
|
|
| |
| workflow.add_node("graph_selection", graph_selection_node) |
| workflow.add_node("graph_generation", graph_generation_node) |
|
|
| |
| workflow.add_node("refine_response", refine_response_node) |
| workflow.add_node("format_response", format_final_response_node) |
|
|
| |
| workflow.add_node("cache_response", cache_response_node) |
| workflow.add_node("update_history", update_history_node) |
|
|
| |
| workflow.set_entry_point("validate_input") |
|
|
| |
| workflow.add_edge("validate_input", "check_cache") |
|
|
| |
| workflow.add_conditional_edges( |
| "check_cache", |
| route_after_cache_check, |
| { |
| "update_history": "update_history", |
| "validate_processing": "validate_processing", |
| "connection_selection": "connection_selection" |
| } |
| ) |
|
|
| |
| workflow.add_edge("validate_processing", "process_initial_context") |
| workflow.add_edge("process_initial_context", "prepare_context") |
| workflow.add_edge("prepare_context", "connection_selection") |
|
|
| |
| workflow.add_edge("connection_selection", "validate_connection") |
|
|
| |
| workflow.add_conditional_edges( |
| "validate_connection", |
| route_by_connection_type, |
| { |
| "postgresql_connection": "postgresql_connection", |
| "csv_processing": "csv_processing", |
| "load_database": "load_database", |
| "get_db_sample": "get_db_sample" |
| } |
| ) |
|
|
| |
| workflow.add_edge("postgresql_connection", "get_db_sample") |
| workflow.add_edge("csv_processing", "create_database") |
| workflow.add_edge("create_database", "get_db_sample") |
| workflow.add_edge("load_database", "get_db_sample") |
| workflow.add_edge("get_db_sample", "process_query") |
|
|
| |
| workflow.add_conditional_edges( |
| "process_query", |
| should_generate_graph, |
| { |
| "graph_selection": "graph_selection", |
| "refine_response": "refine_response", |
| "cache_response": "cache_response" |
| } |
| ) |
|
|
| |
| workflow.add_edge("graph_selection", "graph_generation") |
|
|
| |
| workflow.add_conditional_edges( |
| "graph_generation", |
| should_refine_response, |
| { |
| "refine_response": "refine_response", |
| "cache_response": "cache_response" |
| } |
| ) |
|
|
| workflow.add_edge("refine_response", "format_response") |
| workflow.add_edge("format_response", "cache_response") |
| workflow.add_edge("cache_response", "update_history") |
| workflow.add_edge("update_history", END) |
|
|
| |
| memory = MemorySaver() |
| self.app = workflow.compile(checkpointer=memory) |
|
|
| logging.info("Grafo LangGraph construído com sucesso") |
|
|
| except Exception as e: |
| logging.error(f"Erro ao construir grafo: {e}") |
| raise |
| |
| async def process_query( |
| self, |
| user_input: str, |
| selected_model: str = "GPT-4o-mini", |
| advanced_mode: bool = False, |
| processing_enabled: bool = False, |
| processing_model: str = "GPT-4o-mini", |
| connection_type: str = "csv", |
| postgresql_config: Optional[Dict] = None, |
| selected_table: str = None, |
| single_table_mode: bool = False, |
| thread_id: str = "default" |
| ) -> Dict[str, Any]: |
| """ |
| Processa uma query do usuário através do grafo |
| |
| Args: |
| user_input: Entrada do usuário |
| selected_model: Modelo LLM selecionado |
| advanced_mode: Se deve usar refinamento avançado |
| processing_enabled: Se deve usar o Processing Agent |
| processing_model: Modelo para o Processing Agent |
| connection_type: Tipo de conexão ("csv" ou "postgresql") |
| postgresql_config: Configuração PostgreSQL (se aplicável) |
| selected_table: Tabela selecionada (para PostgreSQL) |
| single_table_mode: Se deve usar apenas uma tabela (PostgreSQL) |
| thread_id: ID da thread para checkpoint |
| |
| Returns: |
| Resultado do processamento |
| """ |
| try: |
| |
| current_sql_agent = self.object_manager.get_sql_agent(self.agent_id) |
| if current_sql_agent and current_sql_agent.model_name != selected_model: |
| logging.info(f"Recriando agente SQL com modelo {selected_model}") |
|
|
| |
| db_id = self.object_manager.get_db_id_for_agent(self.agent_id) |
| if db_id: |
| db = self.object_manager.get_database(db_id) |
| if db: |
| new_sql_agent = SQLAgentManager(db, selected_model, single_table_mode=False, selected_table=None) |
| self.agent_id = self.object_manager.store_sql_agent(new_sql_agent, db_id) |
| logging.info(f"Agente SQL recriado com sucesso para modelo {selected_model}") |
| else: |
| logging.error("Banco de dados não encontrado para recriar agente") |
| else: |
| logging.error("ID do banco de dados não encontrado para o agente") |
|
|
| |
| logging.info(f"[MAIN GRAPH] ===== INICIANDO PROCESSAMENTO DE QUERY =====") |
| logging.info(f"[MAIN GRAPH] User input: {user_input}") |
| logging.info(f"[MAIN GRAPH] Selected model: {selected_model}") |
| logging.info(f"[MAIN GRAPH] Advanced mode: {advanced_mode}") |
| logging.info(f"[MAIN GRAPH] Processing enabled: {processing_enabled}") |
| logging.info(f"[MAIN GRAPH] Processing model: {processing_model}") |
| logging.info(f"[MAIN GRAPH] Connection type: {connection_type}") |
| if postgresql_config: |
| logging.info(f"[MAIN GRAPH] PostgreSQL config: {postgresql_config['host']}:{postgresql_config['port']}/{postgresql_config['database']}") |
| if selected_table: |
| logging.info(f"[MAIN GRAPH] Selected table: {selected_table}") |
| logging.info(f"[MAIN GRAPH] Single table mode: {single_table_mode}") |
|
|
| |
| initial_state = { |
| "user_input": user_input, |
| "selected_model": selected_model, |
| "response": "", |
| "advanced_mode": advanced_mode, |
| "execution_time": 0.0, |
| "error": None, |
| "intermediate_steps": [], |
| "db_sample_dict": {}, |
| |
| "agent_id": self.agent_id, |
| "engine_id": self.engine_id, |
| "db_id": self.db_id, |
| "cache_id": self.cache_id, |
| |
| "query_type": "sql_query", |
| "sql_query_extracted": None, |
| "graph_type": None, |
| "graph_data": None, |
| "graph_image_id": None, |
| "graph_generated": False, |
| "graph_error": None, |
| |
| "cache_hit": False, |
| |
| "processing_enabled": processing_enabled, |
| "processing_model": processing_model, |
| "processing_agent_id": None, |
| "suggested_query": None, |
| "query_observations": None, |
| "processing_result": None, |
| "processing_success": False, |
| "processing_error": None, |
| |
| "refined": False, |
| "refinement_error": None, |
| "refinement_quality": None, |
| "quality_metrics": None, |
| |
| "sql_context": None, |
| "sql_result": None, |
| |
| "connection_type": connection_type, |
| "postgresql_config": postgresql_config, |
| "selected_table": selected_table, |
| "single_table_mode": single_table_mode, |
| "connection_success": self.db_id is not None, |
| "connection_error": None, |
| "connection_info": None |
| } |
| |
| |
| config = {"configurable": {"thread_id": thread_id}} |
| result = await self.app.ainvoke(initial_state, config=config) |
| |
| logging.info(f"Query processada com sucesso: {user_input[:50]}...") |
| return result |
| |
| except Exception as e: |
| error_msg = f"Erro ao processar query: {e}" |
| logging.error(error_msg) |
| return { |
| "user_input": user_input, |
| "response": error_msg, |
| "error": error_msg, |
| "execution_time": 0.0 |
| } |
| |
| async def handle_csv_upload(self, file_path: str) -> Dict[str, Any]: |
| """ |
| Processa upload de CSV usando nova arquitetura de nós |
| |
| Args: |
| file_path: Caminho do arquivo CSV |
| |
| Returns: |
| Resultado do upload |
| """ |
| try: |
| |
| csv_state = { |
| "file_path": file_path, |
| "success": False, |
| "message": "", |
| "csv_data_sample": {}, |
| "column_info": {}, |
| "processing_stats": {} |
| } |
|
|
| csv_result = await csv_processing_node(csv_state) |
|
|
| if not csv_result["success"]: |
| return csv_result |
|
|
| |
| db_state = csv_result.copy() |
| db_result = await create_database_from_dataframe_node(db_state) |
|
|
| if not db_result["success"]: |
| return db_result |
|
|
| |
| if db_result["success"]: |
| |
| self.engine_id = db_result["engine_id"] |
| self.db_id = db_result["db_id"] |
|
|
| |
| new_engine = self.object_manager.get_engine(self.engine_id) |
| new_db = self.object_manager.get_database(self.db_id) |
| new_sql_agent = SQLAgentManager(new_db, single_table_mode=False, selected_table=None) |
|
|
| |
| self.agent_id = self.object_manager.store_sql_agent(new_sql_agent, self.db_id) |
|
|
| |
| cache_manager = self.object_manager.get_cache_manager(self.cache_id) |
| if cache_manager: |
| cache_manager.clear_cache() |
|
|
| logging.info("[UPLOAD] Sistema atualizado com novo CSV") |
|
|
| return db_result |
|
|
| except Exception as e: |
| error_msg = f"❌ Erro no upload de CSV: {e}" |
| logging.error(error_msg) |
| return { |
| "success": False, |
| "message": error_msg |
| } |
|
|
| async def handle_postgresql_connection(self, state: Dict[str, Any]) -> Dict[str, Any]: |
| """ |
| Processa conexão PostgreSQL usando nova arquitetura de nós |
| |
| Args: |
| state: Estado contendo configuração PostgreSQL |
| |
| Returns: |
| Resultado da conexão |
| """ |
| try: |
| |
| state.update({ |
| "success": False, |
| "message": "", |
| "connection_info": {}, |
| "connection_error": None, |
| "connection_success": False |
| }) |
|
|
| |
| pg_result = await postgresql_connection_node(state) |
|
|
| if not pg_result["success"]: |
| return pg_result |
|
|
| |
| if pg_result["success"]: |
| |
| self.engine_id = pg_result["engine_id"] |
| self.db_id = pg_result["db_id"] |
|
|
| |
| new_engine = self.object_manager.get_engine(self.engine_id) |
| new_db = self.object_manager.get_database(self.db_id) |
|
|
| |
| single_table_mode = state.get("single_table_mode", False) |
| selected_table = state.get("selected_table") |
| selected_model = state.get("selected_model", "gpt-4o-mini") |
|
|
| new_sql_agent = SQLAgentManager( |
| new_db, |
| selected_model, |
| single_table_mode=single_table_mode, |
| selected_table=selected_table |
| ) |
|
|
| |
| self.agent_id = self.object_manager.store_sql_agent(new_sql_agent, self.db_id) |
|
|
| |
| connection_info = pg_result.get("connection_info", {}) |
| self.object_manager.store_connection_metadata(self.db_id, connection_info) |
|
|
| |
| cache_manager = self.object_manager.get_cache_manager(self.cache_id) |
| if cache_manager: |
| cache_manager.clear_cache() |
|
|
| logging.info("[POSTGRESQL] Sistema atualizado com nova conexão PostgreSQL") |
|
|
| return pg_result |
|
|
| except Exception as e: |
| error_msg = f"❌ Erro na conexão PostgreSQL: {e}" |
| logging.error(error_msg) |
| return { |
| "success": False, |
| "message": error_msg |
| } |
|
|
| async def reset_system(self) -> Dict[str, Any]: |
| """ |
| Reseta o sistema ao estado inicial |
| |
| Returns: |
| Resultado do reset |
| """ |
| try: |
| |
| state = { |
| "success": False, |
| "message": "", |
| "engine_id": self.engine_id, |
| "agent_id": self.agent_id, |
| "cache_id": self.cache_id |
| } |
|
|
| result = await self.custom_node_manager.execute_node("system_reset", state) |
|
|
| |
| if result.get("success"): |
| self.engine_id = result.get("engine_id", self.engine_id) |
| self.agent_id = result.get("agent_id", self.agent_id) |
| |
|
|
| logging.info("[RESET] Sistema resetado com sucesso") |
|
|
| return result |
|
|
| except Exception as e: |
| error_msg = f"❌ Erro ao resetar sistema: {e}" |
| logging.error(error_msg) |
| return { |
| "success": False, |
| "message": error_msg |
| } |
| |
| def toggle_advanced_mode(self, enabled: bool) -> str: |
| """ |
| Alterna modo avançado |
| |
| Args: |
| enabled: Se deve habilitar modo avançado |
| |
| Returns: |
| Mensagem de status |
| """ |
| message = "Modo avançado ativado." if enabled else "Modo avançado desativado." |
| logging.info(f"[MODO AVANÇADO] {'Ativado' if enabled else 'Desativado'}") |
| return message |
| |
| def get_history(self) -> list: |
| """ |
| Retorna histórico de conversas |
| |
| Returns: |
| Lista com histórico |
| """ |
| return self.cache_manager.get_history() |
| |
| def clear_cache(self): |
| """Limpa cache do sistema""" |
| self.cache_manager.clear_cache() |
| logging.info("Cache limpo") |
| |
| async def get_system_info(self) -> Dict[str, Any]: |
| """ |
| Obtém informações do sistema |
| |
| Returns: |
| Informações do sistema |
| """ |
| state = { |
| "engine": self.engine, |
| "sql_agent": self.sql_agent, |
| "cache_manager": self.cache_manager |
| } |
| |
| result = await self.custom_node_manager.execute_node("system_info", state) |
| return result.get("system_info", {}) |
| |
| async def validate_system(self) -> Dict[str, Any]: |
| """ |
| Valida o estado do sistema |
| |
| Returns: |
| Resultado da validação |
| """ |
| state = { |
| "engine": self.engine, |
| "sql_agent": self.sql_agent, |
| "cache_manager": self.cache_manager |
| } |
| |
| result = await self.custom_node_manager.execute_node("system_validation", state) |
| return result.get("validation", {}) |
|
|
| def _smart_type_conversion(self, df, sql_types): |
| """ |
| Conversão inteligente de tipos de dados com suporte a formatos brasileiros |
| """ |
| import re |
|
|
| logging.info("[TYPE_CONVERSION] 🔧 Iniciando conversão inteligente de tipos") |
|
|
| for col in df.columns: |
| col_data = df[col].dropna() |
|
|
| if len(col_data) == 0: |
| continue |
|
|
| |
| sample = col_data.head(100).astype(str) |
|
|
| logging.debug(f"[TYPE_CONVERSION] 📊 Analisando coluna: {col}") |
|
|
| |
| if self._is_date_column(sample): |
| try: |
| df[col] = self._convert_to_date(df[col]) |
| sql_types[col] = DateTime |
| logging.debug(f"[TYPE_CONVERSION] ✅ {col} → DATETIME") |
| continue |
| except Exception as e: |
| logging.warning(f"[TYPE_CONVERSION] ⚠️ Falha ao converter {col} para data: {e}") |
|
|
| |
| if self._is_integer_column(sample): |
| try: |
| |
| def clean_integer(value): |
| if pd.isna(value): |
| return None |
| value_str = str(value).strip() |
| |
| clean_value = ''.join(c for c in value_str if c.isdigit() or c == '-') |
| if clean_value and clean_value != '-': |
| return int(clean_value) |
| return None |
|
|
| df[col] = df[col].apply(clean_integer).astype('Int64') |
| sql_types[col] = Integer |
| logging.debug(f"[TYPE_CONVERSION] ✅ {col} → INTEGER") |
| continue |
| except Exception as e: |
| logging.warning(f"[TYPE_CONVERSION] ⚠️ Falha ao converter {col} para inteiro: {e}") |
|
|
| |
| if self._is_monetary_column(sample): |
| try: |
| df[col] = self._convert_to_monetary(df[col]) |
| sql_types[col] = Float |
| logging.debug(f"[TYPE_CONVERSION] ✅ {col} → FLOAT (monetário)") |
| continue |
| except Exception as e: |
| logging.warning(f"[TYPE_CONVERSION] ⚠️ Falha ao converter {col} para monetário: {e}") |
|
|
| |
| if self._is_float_column(sample): |
| try: |
| df[col] = self._convert_to_float(df[col]) |
| sql_types[col] = Float |
| logging.debug(f"[TYPE_CONVERSION] ✅ {col} → FLOAT") |
| continue |
| except Exception as e: |
| logging.warning(f"[TYPE_CONVERSION] ⚠️ Falha ao converter {col} para float: {e}") |
|
|
| |
| logging.debug(f"[TYPE_CONVERSION] 📝 {col} → TEXT (padrão)") |
|
|
| |
| type_summary = {} |
| for col, sql_type in sql_types.items(): |
| type_name = sql_type.__name__ if hasattr(sql_type, '__name__') else str(sql_type).split('.')[-1].replace('>', '') |
| if type_name not in type_summary: |
| type_summary[type_name] = 0 |
| type_summary[type_name] += 1 |
|
|
| summary_text = ", ".join([f"{count} {type_name}" for type_name, count in type_summary.items()]) |
| logging.info(f"[TYPE_CONVERSION] ✅ Conversão concluída: {summary_text}") |
| return df |
|
|
| def _is_date_column(self, sample): |
| """Detecta se uma coluna contém datas BASEADO APENAS NOS VALORES""" |
| import re |
|
|
| |
| date_patterns = [ |
| r'^\d{1,2}[\/\-\.]\d{1,2}[\/\-\.]\d{4}$', |
| r'^\d{4}[\/\-\.]\d{1,2}[\/\-\.]\d{1,2}$', |
| r'^\d{1,2}[\/\-\.]\d{1,2}[\/\-\.]\d{2}$', |
| ] |
|
|
| |
| date_count = 0 |
| for value in sample: |
| if pd.isna(value) or value == '': |
| continue |
| for pattern in date_patterns: |
| if re.match(pattern, str(value).strip()): |
| date_count += 1 |
| break |
|
|
| return date_count / len(sample) >= 0.7 |
|
|
| def _is_monetary_column(self, sample): |
| """Detecta se uma coluna contém valores monetários BASEADO APENAS NOS VALORES""" |
| import re |
|
|
| |
| money_patterns = [ |
| r'^R\$\s*\d+[,\.]\d{2}$', |
| r'^\d+[,\.]\d{2}$', |
| r'^R\$\s*\d+$', |
| r'^\$\s*\d+[,\.]\d{2}$', |
| r'^\$\s*\d+$', |
| ] |
|
|
| |
| money_count = 0 |
| for value in sample: |
| if pd.isna(value) or value == '': |
| continue |
| value_str = str(value).strip() |
| for pattern in money_patterns: |
| if re.match(pattern, value_str): |
| money_count += 1 |
| break |
|
|
| return money_count / len(sample) >= 0.6 |
|
|
| def _is_integer_column(self, sample): |
| """Detecta se uma coluna contém números inteiros""" |
| try: |
| |
| has_decimal_separators = False |
| valid_numeric_count = 0 |
| integer_count = 0 |
|
|
| for value in sample: |
| if pd.isna(value) or value == '': |
| continue |
|
|
| value_str = str(value).strip() |
|
|
| |
| if (',' in value_str and any(c.isdigit() for c in value_str.split(',')[-1])) or \ |
| ('.' in value_str and any(c.isdigit() for c in value_str.split('.')[-1])): |
| has_decimal_separators = True |
| break |
|
|
| |
| try: |
| |
| clean_value = ''.join(c for c in value_str if c.isdigit() or c == '-') |
| if clean_value and clean_value != '-': |
| num_value = int(clean_value) |
| valid_numeric_count += 1 |
| integer_count += 1 |
| except: |
| |
| try: |
| float_value = float(value_str) |
| valid_numeric_count += 1 |
| |
| if float_value == int(float_value): |
| integer_count += 1 |
| except: |
| continue |
|
|
| |
| if has_decimal_separators: |
| return False |
|
|
| |
| if valid_numeric_count == 0 or valid_numeric_count / len(sample) < 0.8: |
| return False |
|
|
| |
| return integer_count / valid_numeric_count >= 0.95 |
|
|
| except Exception as e: |
| logging.debug(f"Erro na detecção de inteiros: {e}") |
| return False |
|
|
| def _is_float_column(self, sample): |
| """Detecta se uma coluna contém números decimais (com vírgula ou ponto)""" |
| try: |
| has_decimal_values = False |
| valid_numeric_count = 0 |
|
|
| for value in sample: |
| if pd.isna(value) or value == '': |
| continue |
|
|
| value_str = str(value).strip() |
|
|
| |
| if (',' in value_str and any(c.isdigit() for c in value_str.split(',')[-1])) or \ |
| ('.' in value_str and any(c.isdigit() for c in value_str.split('.')[-1])): |
| has_decimal_values = True |
|
|
| |
| try: |
| clean_value = value_str.replace(',', '.') |
| float(clean_value) |
| valid_numeric_count += 1 |
| except: |
| continue |
|
|
| |
| if not has_decimal_values: |
| return False |
|
|
| return valid_numeric_count / len(sample) >= 0.8 |
|
|
| except Exception as e: |
| logging.debug(f"Erro na detecção de floats: {e}") |
| return False |
|
|
| def _convert_to_date(self, series): |
| """Converte série para datetime com formatos brasileiros""" |
| |
| date_formats = [ |
| '%d/%m/%Y', |
| '%d-%m-%Y', |
| '%d.%m.%Y', |
| '%Y-%m-%d', |
| '%Y/%m/%d', |
| '%d/%m/%y', |
| ] |
|
|
| for fmt in date_formats: |
| try: |
| return pd.to_datetime(series, format=fmt, errors='raise') |
| except: |
| continue |
|
|
| |
| try: |
| return pd.to_datetime(series, dayfirst=True, errors='coerce') |
| except: |
| raise ValueError("Não foi possível converter para data") |
|
|
| def _convert_to_monetary(self, series): |
| """Converte série para valores monetários (float)""" |
| def clean_monetary(value): |
| if pd.isna(value): |
| return None |
|
|
| |
| value_str = str(value).strip() |
|
|
| |
| value_str = value_str.replace('R$', '').replace('$', '').strip() |
|
|
| |
| if ',' in value_str and '.' in value_str: |
| |
| value_str = value_str.replace('.', '').replace(',', '.') |
| elif ',' in value_str: |
| |
| value_str = value_str.replace(',', '.') |
|
|
| try: |
| return float(value_str) |
| except: |
| return None |
|
|
| return series.apply(clean_monetary) |
|
|
| def _convert_to_float(self, series): |
| """Converte série para float com formato brasileiro""" |
| def clean_float(value): |
| if pd.isna(value): |
| return None |
|
|
| value_str = str(value).strip() |
|
|
| |
| if ',' in value_str: |
| value_str = value_str.replace(',', '.') |
|
|
| try: |
| return float(value_str) |
| except: |
| return None |
|
|
| return series.apply(clean_float) |
|
|
| |
| _graph_manager: Optional[AgentGraphManager] = None |
|
|
| def get_graph_manager() -> AgentGraphManager: |
| """ |
| Retorna instância singleton do gerenciador de grafo |
| |
| Returns: |
| AgentGraphManager |
| """ |
| global _graph_manager |
| if _graph_manager is None: |
| _graph_manager = AgentGraphManager() |
| return _graph_manager |
|
|
| async def initialize_graph() -> AgentGraphManager: |
| """ |
| Inicializa o grafo principal |
| |
| Returns: |
| AgentGraphManager inicializado |
| """ |
| try: |
| manager = get_graph_manager() |
| |
| |
| validation = await manager.validate_system() |
| if not validation.get("overall_valid", False): |
| logging.warning("Sistema não passou na validação completa") |
| |
| logging.info("Grafo principal inicializado e validado") |
| return manager |
| |
| except Exception as e: |
| logging.error(f"Erro ao inicializar grafo: {e}") |
| raise |
|
|
| |
|
|