Spaces:
Sleeping
Sleeping
File size: 1,784 Bytes
b1100bc | 1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24 25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48 | """StabilizerForge environment client (sync + async via openenv core)."""
from __future__ import annotations
from typing import Any
from openenv.core import EnvClient
from openenv.core.client_types import StepResult
from openenv.core.env_server.types import State
from .models import StabilizerAction, StabilizerObservation
class StabilizerForgeEnv(EnvClient[StabilizerAction, StabilizerObservation, State]):
    """Client for the StabilizerForge environment server.

    Translates between the typed action/observation models and the plain
    dict payloads exchanged with the server.

    Example:
        with StabilizerForgeEnv(base_url="http://localhost:8000") as client:
            result = client.reset(task_id="steane_7_1_3")
            result = client.step(StabilizerAction(op="H", qubits=[0]))
            ...
            result = client.step(StabilizerAction(op="FINALIZE"))
    """

    def _step_payload(self, action: StabilizerAction) -> dict[str, Any]:
        """Serialize *action* into the dict payload sent for a step.

        Args:
            action: The action to send; its ``op`` and ``qubits`` are read.

        Returns:
            A dict with keys ``"op"`` and ``"qubits"`` (always a fresh list).
        """
        # Qubit-less actions (e.g. FINALIZE in the class example) may carry
        # ``qubits=None`` depending on the model default -- TODO confirm.
        # Normalise to an empty list instead of failing in ``list(None)``.
        qubits = action.qubits if action.qubits is not None else ()
        return {"op": action.op, "qubits": list(qubits)}

    def _parse_result(
        self, payload: dict[str, Any]
    ) -> StepResult[StabilizerObservation]:
        """Build a ``StepResult`` from a server response payload.

        Top-level ``"done"`` / ``"reward"`` keys, when present, override the
        values carried inside ``"observation"``. When they are absent, the
        observation's own values are used, so the ``StepResult`` and the
        observation it wraps always agree.

        Args:
            payload: Decoded response dict; may contain ``"observation"``,
                ``"reward"`` and ``"done"``.

        Returns:
            A ``StepResult`` wrapping the parsed observation.
        """
        # A missing, null or empty observation yields a default observation.
        obs_data = payload.get("observation") or {}
        observation = StabilizerObservation(**obs_data)

        if "done" in payload:
            done = bool(payload["done"])
            observation.done = done
        else:
            # No top-level flag: trust whatever the observation carried.
            done = bool(getattr(observation, "done", False))

        if "reward" in payload:
            reward = payload["reward"]
            observation.reward = reward
        else:
            reward = getattr(observation, "reward", None)

        return StepResult(observation=observation, reward=reward, done=done)

    def _parse_state(self, payload: dict[str, Any]) -> State:
        """Build a ``State`` from a server state payload.

        Args:
            payload: Decoded response dict; ``"episode_id"`` and
                ``"step_count"`` are read.

        Returns:
            A ``State`` with ``episode_id`` (``None`` when absent) and
            ``step_count`` (``0`` when absent).
        """
        return State(
            episode_id=payload.get("episode_id"),
            step_count=payload.get("step_count", 0),
        )
|