Spaces:

iitian
/

open_env

Sleeping

App Files Files Community

open_env / server /environment.py

iitian

fix: update grader scores to fall strictly within (0, 1)

47ab3b8 10 days ago

raw

history blame contribute delete

7.43 kB

	import uuid
	import datetime
	from typing import Optional, Tuple, Dict, Any, List
	from .models import CloudAction, CloudObservation, CloudState, CloudActionType

	class CloudAuditEnv:
	    """Mock cloud-security audit environment with three fixed tasks.

	    The environment keeps an in-memory inventory (S3 buckets, EC2 instances
	    and one auth log) and grades the agent according to ``task_id``:

	    * ``"easy"``   -- SUBMIT the ID of the public S3 bucket tagged ``prod``.
	    * ``"medium"`` -- MODIFY the dev EC2 instance so that port 3389 is no
	      longer open to ``0.0.0.0/0``.
	    * ``"hard"``   -- SUBMIT the source IP of the ``DeleteStorage`` log entry.

	    Each step yields ``STEP_REWARD`` unless it solves the task, in which case
	    it yields ``SUCCESS_REWARD`` and the observation is flagged ``done``.
	    The cumulative score never exceeds ``MAX_SCORE``.
	    """

	    MAX_STEPS = 20          # step() flags the episode as done from this step on
	    STEP_REWARD = 0.005     # reward for a step that does not solve the task
	    SUCCESS_REWARD = 0.85   # reward for the step that solves the task
	    INITIAL_SCORE = 0.01    # starting score of every episode
	    MAX_SCORE = 0.99        # upper cap applied to the cumulative score
	    MEDIUM_TARGET_ID = "i-0abcdef1234567890"  # instance graded by the medium task
	    OPEN_CIDR = "0.0.0.0/0"
	    RDP_PORT = 3389

	    def __init__(self):
	        self.task_id = "easy"
	        self._initialize_state()

	    def _initialize_state(self):
	        """Start a fresh episode: new ID, zeroed counters, pristine inventory."""
	        self.episode_id = str(uuid.uuid4())
	        self.step_count = 0
	        self.is_completed = False
	        self.score = self.INITIAL_SCORE

	        # Mock Infrastructure
	        self.resources = {
	            "s3": [
	                {"id": "prod-data-001", "region": "us-east-1", "public": True, "tags": {"env": "prod"}},
	                {"id": "prod-logs-002", "region": "us-east-1", "public": False, "tags": {"env": "prod"}},
	                {"id": "dev-test-01", "region": "us-west-2", "public": True, "tags": {"env": "dev"}},
	            ],
	            "ec2": [
	                {
	                    "id": "i-0abcdef1234567890",
	                    "type": "t2.micro",
	                    "state": "running",
	                    "tags": {"env": "dev"},
	                    "security_groups": [
	                        {
	                            "id": "sg-01",
	                            "rules": [
	                                {"port": 22, "cidr": "0.0.0.0/0"},
	                                {"port": 3389, "cidr": "0.0.0.0/0"},
	                            ],
	                        }
	                    ],
	                },
	                {
	                    "id": "i-0987654321fedcba0",
	                    "type": "m5.large",
	                    "state": "running",
	                    "tags": {"env": "prod"},
	                    "security_groups": [
	                        {"id": "sg-02", "rules": [{"port": 443, "cidr": "0.0.0.0/0"}]}
	                    ],
	                },
	            ],
	            "logs": {
	                "auth-logs": [
	                    {"timestamp": "2026-04-05T10:00:00Z", "user": "admin", "action": "Login", "ip": "1.1.1.1"},
	                    {"timestamp": "2026-04-05T10:15:00Z", "user": "iam-role-01", "action": "DeleteStorage", "ip": "192.168.1.50"},
	                    {"timestamp": "2026-04-05T10:30:00Z", "user": "user-02", "action": "ListBuckets", "ip": "2.2.2.2"},
	                ]
	            },
	        }

	    def _find_resource(self, res_id):
	        """Return the S3 or EC2 record whose ``id`` equals *res_id*, else ``None``."""
	        for r_type in ("s3", "ec2"):
	            for resource in self.resources[r_type]:
	                if resource["id"] == res_id:
	                    return resource
	        return None

	    @staticmethod
	    def _is_rule_list(rules):
	        """Return True when *rules* is a list whose entries are all dicts."""
	        return isinstance(rules, list) and all(isinstance(rule, dict) for rule in rules)

	    @staticmethod
	    def _port_open_to_world(rules, port):
	        """Return True when any rule opens *port* to ``0.0.0.0/0``.

	        Rules lacking a ``port`` or ``cidr`` key simply do not match, so an
	        incomplete rule supplied by the agent cannot raise here.
	        """
	        return any(
	            isinstance(rule, dict)
	            and rule.get("port") == port
	            and rule.get("cidr") == CloudAuditEnv.OPEN_CIDR
	            for rule in rules
	        )

	    def _record_outcome(self, reward, done):
	        """Add *reward* to the capped score and latch ``is_completed`` once done."""
	        self.score = min(self.MAX_SCORE, self.score + reward)
	        if done:
	            # NOTE(review): is_completed mirrors the `done` flag handed to the
	            # agent (success or step-limit truncation) -- confirm that this
	            # is what consumers of CloudState expect.
	            self.is_completed = True

	    def reset(self, task_id: str = "easy") -> CloudObservation:
	        """Start a new episode for *task_id* and return the initial observation.

	        Required by openenv-core 0.1.1: takes task_id, returns JUST the observation.
	        """
	        self.task_id = task_id
	        self._initialize_state()
	        return CloudObservation(info=f"Environment reset. Task: {self.task_id}", reward=0.01, done=False)

	    def step(self, action: CloudAction) -> CloudObservation:
	        """Apply *action* and return the resulting observation.

	        Required by openenv-core 0.1.1: takes action, returns JUST the
	        observation with reward/done fields.

	        The observation's ``done`` flag is set when the task was solved on this
	        step or when ``MAX_STEPS`` steps have been taken.  Any exception raised
	        while handling the action is logged to stderr and reported as a
	        terminal "Internal Server Error" observation instead of propagating.
	        """
	        try:
	            self.step_count += 1
	            reward = self.STEP_REWARD
	            terminated = False
	            truncated = self.step_count >= self.MAX_STEPS  # Limit steps

	            obs = CloudObservation()

	            if action.action == CloudActionType.LIST:
	                r_type = action.resource_type
	                if r_type in self.resources:
	                    obs.resources = self.resources[r_type]
	                    obs.status = f"Listed {len(obs.resources)} {r_type} resources."
	                else:
	                    obs.status = f"Unknown resource type: {r_type}"

	            elif action.action == CloudActionType.DESCRIBE:
	                res_id = action.resource_id
	                resource = self._find_resource(res_id)
	                if resource is not None:
	                    obs.details = resource
	                    obs.status = f"Described resource {res_id}"
	                else:
	                    obs.status = f"Resource not found: {res_id}"

	            elif action.action == CloudActionType.MODIFY:
	                res_id = action.resource_id
	                patch = action.patch
	                # Simple EC2 security group patching for Medium task
	                if self.task_id == "medium" and res_id == self.MEDIUM_TARGET_ID:
	                    instance = self._find_resource(res_id)
	                    new_rules = patch["rules"] if patch and "rules" in patch else None
	                    if self._is_rule_list(new_rules):
	                        for sg in instance["security_groups"]:
	                            # Copy so the inventory never aliases the caller's list.
	                            sg["rules"] = list(new_rules)
	                        obs.status = f"Updated security groups for EC2 instance {res_id}"
	                    else:
	                        # Nothing was applied, so do not claim an update.
	                        obs.status = (
	                            "Invalid patch: expected a 'rules' list of rule objects. "
	                            f"Security groups for EC2 instance {res_id} unchanged."
	                        )
	                    # Check for reward against what is actually stored.
	                    rules = instance["security_groups"][0]["rules"]
	                    if not self._port_open_to_world(rules, self.RDP_PORT):
	                        reward = self.SUCCESS_REWARD
	                        terminated = True
	                        obs.info = "Success! Port 3389 removed. Task completed."
	                    else:
	                        obs.info = "Port 3389 is still open. Remove it by omitting it from the rules list."
	                elif self.task_id == "medium":
	                    obs.status = f"Invalid resource ID '{res_id}'. Use the EC2 instance ID 'i-0abcdef1234567890', not the security group ID."
	                else:
	                    obs.status = "Action not permitted or invalid resource."

	            elif action.action == CloudActionType.LOGS:
	                log_name = action.resource_id
	                if log_name in self.resources["logs"]:
	                    obs.logs = self.resources["logs"][log_name]
	                    obs.status = f"Fetched logs for {log_name}"
	                else:
	                    obs.status = f"Logs not found: {log_name}"

	            elif action.action == CloudActionType.SUBMIT:
	                # For Easy and Hard tasks
	                if self.task_id == "easy":
	                    # Expecting agent to list public S3 buckets in prod
	                    if action.answer:
	                        answers = [a.strip() for a in action.answer.split(",")]
	                        expected = ["prod-data-001"]
	                        if set(answers) == set(expected):
	                            reward = self.SUCCESS_REWARD
	                            terminated = True
	                            obs.info = "Correct! Task completed."
	                        else:
	                            obs.info = f"Incorrect. Expected the public prod S3 bucket ID. Got: {answers}"

	                elif self.task_id == "hard":
	                    # Expecting rogue IP from auth-logs
	                    if action.answer and action.answer.strip() == "192.168.1.50":
	                        reward = self.SUCCESS_REWARD
	                        terminated = True
	                        obs.info = "Correct! Rogue IP identified. Task completed."
	                    else:
	                        obs.info = f"Wrong IP address. Got: {action.answer}. Check the auth-logs for the DeleteStorage action."

	                elif self.task_id == "medium":
	                    obs.info = "For the medium task, use the 'modify' action to update the EC2 security group, not 'submit'."

	            done = terminated or truncated
	            self._record_outcome(reward, done)
	            obs.reward = reward
	            obs.done = done
	            return obs
	        except Exception as e:
	            import sys
	            import traceback
	            print(f"ERROR in environment.step: {e!s}", file=sys.stderr)
	            traceback.print_exc(file=sys.stderr)
	            # The observation below is terminal, so state() must agree with it.
	            self.is_completed = True
	            return CloudObservation(status=f"Internal Server Error: {e!s}", reward=0.01, done=True)

	    def state(self) -> CloudState:
	        """Return a snapshot of the episode bookkeeping as a ``CloudState``."""
	        return CloudState(
	            episode_id=self.episode_id,
	            step_count=self.step_count,
	            task_id=self.task_id,
	            is_completed=self.is_completed,
	            score=self.score,
	        )