"""
Streaming & Async Engine — Real-time token streaming and concurrent execution.

Adds streaming support to all modules:
  - Actor streams its thought process as it reasons
  - Purpose Function streams its evaluation
  - Orchestrator streams step-by-step progress

Async support via asyncio:
  - All core operations have async variants
  - Concurrent tool execution
  - Background experience replay updates

Pattern: sync methods remain the default. Async wrappers use asyncio.to_thread
for backends that don't support native async (per smolagents pattern).
"""

from __future__ import annotations

import asyncio
import json
import logging
import time
from typing import Any, AsyncIterator, Iterator

from purpose_agent.types import State, Trajectory, TrajectoryStep
from purpose_agent.llm_backend import ChatMessage, LLMBackend

logger = logging.getLogger(__name__)
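
# Example (sketch): the "concurrent tool execution" mentioned in the module
# docstring is just asyncio.gather over asyncio.to_thread. `tool_calls` is a
# hypothetical list of (callable, kwargs) pairs from your own tool layer, not
# something this module defines:
#
#     async def run_tools_concurrently(tool_calls):
#         return await asyncio.gather(
#             *(asyncio.to_thread(fn, **kwargs) for fn, kwargs in tool_calls)
#         )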


# ---------------------------------------------------------------------------
# Streaming Mixin — adds generate_stream to any LLMBackend
# ---------------------------------------------------------------------------

class StreamingMixin:
    """
    Mixin that adds streaming to any LLMBackend that doesn't natively support it.
    
    Falls back to returning the full response as a single chunk.
    Override generate_stream() for native streaming.
    """

    def generate_stream(
        self,
        messages: list[ChatMessage],
        temperature: float = 0.7,
        max_tokens: int = 2048,
    ) -> Iterator[str]:
        """
        Stream tokens. Default: generate full response, yield as one chunk.
        Override in subclasses for real token-level streaming.
        """
        full = self.generate(messages, temperature=temperature, max_tokens=max_tokens)
        yield full

    async def agenerate(
        self,
        messages: list[ChatMessage],
        temperature: float = 0.7,
        max_tokens: int = 2048,
        stop: list[str] | None = None,
    ) -> str:
        """Async wrapper around sync generate."""
        return await asyncio.to_thread(
            self.generate, messages, temperature, max_tokens, stop
        )

    async def agenerate_structured(
        self,
        messages: list[ChatMessage],
        schema: dict[str, Any],
        temperature: float = 0.3,
        max_tokens: int = 1024,
    ) -> dict[str, Any]:
        """Async wrapper around sync generate_structured."""
        return await asyncio.to_thread(
            self.generate_structured, messages, schema, temperature, max_tokens
        )

    async def agenerate_stream(
        self,
        messages: list[ChatMessage],
        temperature: float = 0.7,
        max_tokens: int = 2048,
    ) -> AsyncIterator[str]:
        """Async streaming. Default: wrap sync stream in async iterator."""
        loop = asyncio.get_event_loop()
        # Run sync generator in thread, yield results
        gen = self.generate_stream(messages, temperature, max_tokens)
        while True:
            try:
                token = await asyncio.to_thread(next, gen)
                yield token
            except StopIteration:
                break
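
# Example (sketch): overriding generate_stream for real token-level streaming.
# `MyStreamingBackend` and `client.stream_chat` are hypothetical placeholders,
# not part of purpose_agent; adapt to whatever streaming API your backend
# actually exposes:
#
#     class MyStreamingBackend(StreamingMixin, LLMBackend):
#         def generate_stream(self, messages, temperature=0.7, max_tokens=2048):
#             for chunk in self.client.stream_chat(
#                 messages, temperature=temperature, max_tokens=max_tokens
#             ):
#                 yield chunk.text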


# ---------------------------------------------------------------------------
# Event types for streaming orchestration
# ---------------------------------------------------------------------------

class StreamEvent:
    """An event emitted during streaming orchestration."""

    def __init__(
        self,
        event_type: str,
        data: dict[str, Any] | None = None,
        step: int = 0,
        token: str = "",
    ):
        self.event_type = event_type  # "step_start", "token", "score", "step_end", "task_end", etc.
        self.data = data or {}
        self.step = step
        self.token = token
        self.timestamp = time.time()

    def __repr__(self) -> str:
        if self.token:
            return f"StreamEvent({self.event_type}, token='{self.token[:20]}')"
        return f"StreamEvent({self.event_type}, step={self.step})"


# ---------------------------------------------------------------------------
# Async Orchestrator — streams events during task execution
# ---------------------------------------------------------------------------

class AsyncOrchestrator:
    """
    Async wrapper around the synchronous Orchestrator that streams events.
    
    Usage:
        async for event in async_orch.run_task_stream(purpose="...", ...):
            if event.event_type == "token":
                print(event.token, end="", flush=True)
            elif event.event_type == "score":
                print(f"\\nΦ: {event.data['phi_before']:.1f} → {event.data['phi_after']:.1f}")
    """

    def __init__(self, orchestrator):
        self.orch = orchestrator

    async def run_task_stream(
        self,
        purpose: str,
        initial_state: State | None = None,
        max_steps: int = 20,
        early_stop_phi: float = 9.0,
    ) -> AsyncIterator[StreamEvent]:
        """Run a task and stream events as they happen."""

        current_state = initial_state or self.orch.environment.reset()
        self.orch.purpose_fn.reset_trajectory_stats()

        trajectory = Trajectory(task_description=purpose, purpose=purpose)
        history: list[dict[str, Any]] = []

        yield StreamEvent("task_start", {"purpose": purpose, "max_steps": max_steps})

        for step_idx in range(max_steps):
            yield StreamEvent("step_start", {"step": step_idx + 1}, step=step_idx + 1)

            # Actor decides (run in thread to not block)
            action = await asyncio.to_thread(
                self.orch.actor.decide, purpose, current_state, history
            )

            yield StreamEvent("action", {
                "name": action.name,
                "thought": action.thought,
                "expected_delta": action.expected_delta,
            }, step=step_idx + 1)

            if action.name.upper() == "DONE":
                yield StreamEvent("done", {}, step=step_idx + 1)
                break

            # Environment executes
            try:
                new_state = await asyncio.to_thread(
                    self.orch.environment.execute, action, current_state
                )
            except Exception as e:
                new_state = State(data={**current_state.data, "_error": str(e)})
                yield StreamEvent("error", {"error": str(e)}, step=step_idx + 1)

            # Purpose Function scores
            score = await asyncio.to_thread(
                self.orch.purpose_fn.evaluate, current_state, action, new_state, purpose
            )

            yield StreamEvent("score", {
                "phi_before": score.phi_before,
                "phi_after": score.phi_after,
                "delta": score.delta,
                "confidence": score.confidence,
                "improved": score.improved,
                "evidence": score.evidence,
            }, step=step_idx + 1)

            # Record step
            step = TrajectoryStep(
                state_before=current_state, action=action, state_after=new_state,
                score=score, step_index=step_idx + 1,
            )
            trajectory.steps.append(step)
            history.append({
                "action": f"{action.name}({json.dumps(action.params, default=str)})",
                "result": new_state.describe()[:200],
                "score": f"Δ={score.delta:+.2f}",
            })

            yield StreamEvent("step_end", {
                "state_summary": new_state.describe()[:200],
            }, step=step_idx + 1)

            if score.phi_after >= early_stop_phi:
                yield StreamEvent("early_stop", {"phi": score.phi_after}, step=step_idx + 1)
                break

            if self.orch.environment.is_terminal(new_state):
                yield StreamEvent("terminal", {}, step=step_idx + 1)
                break

            current_state = new_state

        # Post-task (run in background)
        await asyncio.to_thread(self.orch.post_task, trajectory, [])

        yield StreamEvent("task_end", {
            "total_steps": len(trajectory.steps),
            "cumulative_reward": trajectory.cumulative_reward,
            "success_rate": trajectory.success_rate,
            "final_phi": trajectory.final_phi,
        })

    async def run_task(self, **kwargs):
        """Non-streaming async task execution; returns the orchestrator's TaskResult."""
        return await asyncio.to_thread(self.orch.run_task, **kwargs)
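
# Example (sketch): driving the stream end to end. `build_orchestrator` is a
# hypothetical factory for the sync Orchestrator; it is not defined here:
#
#     async def main() -> None:
#         async_orch = AsyncOrchestrator(build_orchestrator())
#         async for event in async_orch.run_task_stream(purpose="triage the bug"):
#             if event.event_type == "token":
#                 print(event.token, end="", flush=True)
#             elif event.event_type == "task_end":
#                 print(f"\nfinal Φ: {event.data['final_phi']:.1f}")
#
#     asyncio.run(main())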