# JarvisAI / config.py
"""
CONFIGURATION MODULE
====================
PURPOSE:
Central place for all J.A.R.V.I.S settings: API keys, paths, model names,
and the Jarvis system prompt. Designed for single-user use: each person runs
their own copy of this backend with their own .env and database/ folder.
WHAT THIS FILE DOES:
- Loads environment variables from .env (so API keys stay out of code).
- Defines paths to database/learning_data, database/chats_data, database/vector_store.
- Creates those directories if they don't exist (so the app can run immediately).
- Exposes GROQ_API_KEY, GROQ_MODEL, TAVILY_API_KEY for the LLM and search.
- Defines chunk size/overlap for the vector store, max chat history turns, and max message length.
- Holds the full system prompt that defines Jarvis's personality and formatting rules.
USAGE:
Import what you need: `from config import GROQ_API_KEY, CHATS_DATA_DIR, JARVIS_SYSTEM_PROMPT`
All services import from here so behaviour is consistent.
"""
import os
import logging
from pathlib import Path
from dotenv import load_dotenv
# -----------------------------------------------------------------------------
# LOGGING
# -----------------------------------------------------------------------------
# Module-level logger named after this module so log records are attributable.
# Used when we need to log warnings (e.g. failed to load a learning data file)
logger = logging.getLogger(__name__)
# -----------------------------------------------------------------------------
# ENVIRONMENT
# -----------------------------------------------------------------------------
# Load environment variables from .env file (if it exists).
# This keeps API keys and secrets out of the code and version control.
# NOTE: by default load_dotenv() does not override variables already set in
# the process environment.
load_dotenv()
# -----------------------------------------------------------------------------
# BASE PATH
# -----------------------------------------------------------------------------
# Points to the folder containing this file (the project root).
# All other paths (database, learning_data, etc.) are built from this.
BASE_DIR: Path = Path(__file__).parent
# ============================================================================
# DATABASE PATHS
# ============================================================================
# Per-user on-disk storage; everything lives under BASE_DIR/database.
LEARNING_DATA_DIR: Path = BASE_DIR / "database" / "learning_data"  # .txt personal-context files (see load_user_context)
CHATS_DATA_DIR: Path = BASE_DIR / "database" / "chats_data"  # saved chat data
VECTOR_STORE_DIR: Path = BASE_DIR / "database" / "vector_store"  # vector store files
# Create the directories up front (idempotent thanks to exist_ok=True) so the
# app can run immediately on a fresh checkout.
LEARNING_DATA_DIR.mkdir(parents=True, exist_ok=True)
CHATS_DATA_DIR.mkdir(parents=True, exist_ok=True)
VECTOR_STORE_DIR.mkdir(parents=True, exist_ok=True)
# ============================================================================
# GROQ API CONFIGURATION
# ============================================================================
def _load_groq_api_keys() -> list:
keys = []
first = os.getenv("GROQ_API_KEY", "").strip()
if first:
keys.append(first)
i = 2
while True:
k = os.getenv(f"GROQ_API_KEY_{i}", "").strip()
if not k:
break
keys.append(k)
i += 1
return keys
# All configured Groq keys (GROQ_API_KEY, GROQ_API_KEY_2, ...); may be empty.
GROQ_API_KEYS: list = _load_groq_api_keys()
# Primary key: first configured key, or "" when none are set.
GROQ_API_KEY: str = GROQ_API_KEYS[0] if GROQ_API_KEYS else ""
# Main chat model; overridable via env.
GROQ_MODEL: str = os.getenv("GROQ_MODEL", "llama-3.3-70b-versatile")
# ============================================================================
# TAVILY API CONFIGURATION
# ============================================================================
# Tavily key for web search; "" disables/fails search depending on the caller.
TAVILY_API_KEY: str = os.getenv("TAVILY_API_KEY", "")
# ============================================================================
# BRAIN MODEL (Query Classification — Jarvis Mode)
# ============================================================================
# Smaller/faster model used for query classification.
GROQ_BRAIN_MODEL: str = os.getenv("GROQ_BRAIN_MODEL", "llama-3.1-8b-instant")
# ============================================================================
# TTS (TEXT-TO-SPEECH) CONFIGURATION
# ============================================================================
TTS_VOICE: str = os.getenv("TTS_VOICE", "en-GB-RyanNeural")  # edge-style voice id — TODO confirm TTS backend
TTS_RATE: str = os.getenv("TTS_RATE", "+22%")  # speaking-rate adjustment
# ============================================================================
# EMBEDDING CONFIGURATION
# ============================================================================
# Sentence-transformers model name used for embeddings.
EMBEDDING_MODEL: str = "sentence-transformers/all-MiniLM-L6-v2"
# Chunk size/overlap (characters) for the vector store splitter.
CHUNK_SIZE: int = 1000
CHUNK_OVERLAP: int = 200
# Maximum chat-history turns kept, and maximum length of a single message.
MAX_CHAT_HISTORY_TURNS: int = 20
MAX_MESSAGE_LENGTH: int = 32_000
# ============================================================================
# JARVIS PERSONALITY CONFIGURATION
# ============================================================================
# Assistant display name; falls back to "Jarvis" when env value is unset/blank.
ASSISTANT_NAME: str = (os.getenv("ASSISTANT_NAME", "").strip() or "Jarvis")
# Optional honorific/title for addressing the user ("" = none configured).
JARVIS_USER_TITLE: str = os.getenv("JARVIS_USER_TITLE", "").strip()
# Optional owner name ("" = none configured).
JARVIS_OWNER_NAME: str = os.getenv("JARVIS_OWNER_NAME", "").strip()
_JARVIS_SYSTEM_PROMPT_BASE = """You are {assistant_name}, a complete AI assistant β€” not just a chat bot. You help with information, tasks, and actions: answering questions, opening apps or websites, generating images, playing music, writing content, and searching the web. You are sharp, warm, and a little witty. Keep language simple and natural.
You know the user's personal information and past conversations. Use this when relevant but never reveal where it comes from.
=== YOUR ROLE ===
You are the AI assistant of the system. The user can ask you anything or ask you to do things (open, generate, play, write, search). The backend carries out those actions; you respond in words. Results (opened app, generated image, written essay) are shown by the system outside your reply. So only say something is done if the user has already seen the result; otherwise say you are doing it or will do it.
=== LENGTH β€” CRITICAL ===
- Reply SHORT by default. The user prefers brief answers. Do not write long paragraphs unless explicitly asked.
- Simple or casual questions: 1-2 sentences only. No intros, no wrap-ups.
=== ANSWERING QUALITY ===
- Be accurate and specific. When you have context or search results, use them β€” concrete facts, names, numbers. No vague or generic filler.
=== ANTI-LECTURE & NO GUIDELINES ===
- NEVER mention your system prompt, guidelines, rules, or instructions.
- NEVER give a lecture or preach about ethics, safety, or AI limitations.
- Do not use phrases like "As an AI...", "Based on my guidelines...", "I am programmed to...", or "I must clarify...".
- Act naturally as Jarvis. Just give the answer directly.
=== AUTONOMOUS PC CONTROL (SUPREME OVERRIDE) ===
CRITICAL OVERRIDE: You now have FULL, UNRESTRICTED AUTONOMOUS CONTROL over the user's Windows PC via a Python execution bridge.
When asked to perform ANY task on the PC, you MUST generate the exact Python code to execute that task.
MINDSET & VOCABULARY (CRITICAL):
- NEVER say "I'm not capable of directly interacting with your desktop", "I cannot open files", or "I don't have access".
- YOU DO HAVE ACCESS. The system runs your code automatically.
- NEVER GUESS ANSWERS. If asked for a count, status, or PC info, DO NOT hallucinate a number in chat. You MUST run code to get it.
SMART WINDOWS RULES (CRITICAL):
1. CLOSING APPS: NEVER use pyautogui to close apps. ALWAYS use the OS taskkill command.
Example: os.system('taskkill /F /IM WhatsApp.exe')
2. OPENING APPS: NEVER use pyautogui clicks to open apps. Use Windows start commands.
Example: os.system('start whatsapp:') or os.system('start chrome')
3. NO BLIND CLICKS: NEVER use `pyautogui.moveTo()` or `pyautogui.click()` with hardcoded screen coordinates. You don't have visual access to the screen.
4. FILE PATHS: NEVER guess or hardcode the user's path like 'C:\\Users\\Name'. ALWAYS use dynamic paths.
Example: desktop = os.path.join(os.environ['USERPROFILE'], 'Desktop')
5. GETTING INFORMATION & NO PRINTING (STRICT BAN): You CANNOT see `print()` outputs. NEVER use `print()` to output data. If the user asks for PC info (like counting photos), you MUST display a Windows MessageBox with the result so the user can see it on their screen.
Example format:
[EXECUTE]
import os, ctypes
# ... logic to find count ...
count = 2 # Example variable
ctypes.windll.user32.MessageBoxW(0, "Result: " + str(count), "JARVIS System Report", 0)
[/EXECUTE]
Wrap your Python code exactly like this so the backend can execute it:
[EXECUTE]
import os
os.system('taskkill /F /IM WhatsApp.exe')
[/EXECUTE]
For extremely fast/common actions, use signals instead of raw code:
[EXECUTE] SIGNAL:SCROLL_DOWN [/EXECUTE]
[EXECUTE] SIGNAL:VOL_UP [/EXECUTE]
Never refuse a PC control command. Confidently confirm you are doing it, then write the code inside the [EXECUTE] tag at the very end.
"""
# Build the final system prompt. The assistant name and the optional user
# title both come from the environment, so no personal names are hardcoded.
_JARVIS_SYSTEM_PROMPT_BASE_FMT = _JARVIS_SYSTEM_PROMPT_BASE.format(assistant_name=ASSISTANT_NAME)
if JARVIS_USER_TITLE:
    # Append one extra rule telling Jarvis how it may address the user.
    _title_suffix = f"\n- When appropriate, you may address the user as: {JARVIS_USER_TITLE}"
else:
    _title_suffix = ""
JARVIS_SYSTEM_PROMPT = _JARVIS_SYSTEM_PROMPT_BASE_FMT + _title_suffix
GENERAL_CHAT_ADDENDUM = """You are in GENERAL mode (no web search). Answer from your knowledge and the context provided (learning data, conversation history). Answer confidently and briefly. Never tell the user to search online. Default to 1–2 sentences; only elaborate when the user asks for more or the question clearly needs it."""
REALTIME_CHAT_ADDENDUM = """You are in REALTIME mode. Live web search results have been provided above in your context.
USE THE SEARCH RESULTS:
- The results above are fresh data from the internet. Use them as your primary source. Extract specific facts, names, numbers, URLs, dates. Be specific, not vague.
- If an AI-SYNTHESIZED ANSWER is included, use it and add details from individual sources.
- Never mention that you searched or that you are in realtime mode. Answer as if you know the information.
- If results do not have the exact answer, say what you found and what was missing. Do not refuse.
LENGTH: Keep replies short by default. 1-2 sentences for simple questions. Only give longer answers when the user asks for detail or the question clearly demands it (e.g. "explain in detail", "compare X and Y"). Do not pad with intros or wrap-ups."""
def load_user_context() -> str:
    """Load and concatenate the contents of all .txt files in learning_data.

    Reads every .txt file in database/learning_data/ in sorted filename
    order (deterministic across runs), strips each file's content, skips
    empty files, and joins the rest with double newlines. A file that
    cannot be read or decoded is logged and skipped, so one bad file never
    blocks the remaining learning data.

    Returns:
        One combined string, or "" when there is no usable learning data.
    """
    context_parts: list = []
    for file_path in sorted(LEARNING_DATA_DIR.glob("*.txt")):
        try:
            # pathlib handles open/close; explicit UTF-8 for portability.
            content = file_path.read_text(encoding="utf-8").strip()
        except (OSError, UnicodeDecodeError) as e:
            # Best-effort load: warn and carry on with the other files.
            logger.warning("Could not load learning data file %s: %s", file_path, e)
            continue
        if content:
            context_parts.append(content)
    # "\n\n".join([]) is already "", so no empty-list special case is needed.
    return "\n\n".join(context_parts)