Spaces:

varb15
/

dataqa-env

Sleeping

App Files Files Community

dataqa-env / dataqa_env /models.py

varb15

Upload folder using huggingface_hub

f5583f9 verified 9 days ago

raw

history blame contribute delete

2.1 kB

	"""
	DataQA Environment Models
	-------------------------
	Action/Observation/State types for the Data Quality Assurance environment.

	The agent receives a dataset with planted quality issues and must identify them.
	Grading is based on the F1 score (harmonic mean of precision and recall) of correctly identified issues.
	"""

	from __future__ import annotations

	from typing import List, Optional

	from openenv.core.env_server.interfaces import Action, Observation, State


	class DataQAAction(Action):
	    """
	    One agent submission: the issues it found plus any fixes it proposes.

	    The action space has two phases, which may be sent together in a single
	    step or spread across several steps:

	    * Identify -- every entry of ``issues`` is written as
	      "row:<N>,col:<name>,issue:<type>".
	    * Fix -- every entry of ``fixes`` is written as
	      "row:<N>,col:<name>,fix:<proposed_value>".

	    Combined reward = 0.6 * identify_score + 0.4 * fix_score.

	    Supported ``<type>`` values:
	        missing_value, wrong_type, duplicate_row, out_of_range,
	        format_violation, inconsistent_value, statistical_outlier,
	        referential_integrity
	    """

	    # Identified issues, one formatted string per issue. No default is
	    # declared for this field.
	    issues: List[str]

	    # Proposed fixes, one formatted string per fix; empty when the agent
	    # only identifies issues.
	    # NOTE(review): this is a mutable default. It is only safe if the
	    # Action base class copies defaults per instance (as pydantic models
	    # do) -- confirm against the installed openenv version.
	    fixes: List[str] = []

	    # Sent with every action so step() can reconstruct its context when the
	    # server runs in stateless HTTP mode.
	    task_id: str = "easy"


	class DataQAObservation(Observation):
	    """
	    Everything shown to the agent: the dataset, its schema and validation
	    rules, the task text, and feedback on the previous step.
	    """

	    # --- Dataset and its contract -------------------------------------
	    # Full dataset serialized as CSV text.
	    dataset_csv: str = ""
	    # Column names, expected types and constraints.
	    schema_description: str = ""
	    # Plain-text validation rules.
	    validation_rules: str = ""

	    # --- Task context ---------------------------------------------------
	    # Description of the task.
	    task_description: str = ""
	    # Feedback on the previous step; empty on reset.
	    feedback: str = ""
	    # ID of the current task.
	    task_id: str = ""

	    # --- Hints and limits -----------------------------------------------
	    # How many issues were planted (given to the agent as a hint).
	    num_issues_hint: int = 0
	    # Maximum number of steps allowed for this task.
	    max_steps: int = 3


	class DataQAState(State):
	    """Episode progress record for the DataQA environment."""

	    # ID of the task being run; defaults to the empty string.
	    task_id: str = ""
	    # Step counter, starting at 0.
	    current_step: int = 0
	    # Step limit; same default (3) as DataQAObservation.max_steps.
	    max_steps: int = 3
	    # Presumably the highest score reached so far in the episode --
	    # confirm against the environment code that updates it.
	    best_score: float = 0.0
	    # Presumably the number of issues planted in the current dataset --
	    # confirm against the environment code that sets it.
	    total_planted_issues: int = 0