Spaces:

Sizzing
/

aws_rl_env

Running

App Files Files Community

aws_rl_env / models.py

Sizzing

Upload folder using huggingface_hub

0f8f2c1 verified about 1 month ago

raw

history blame contribute delete

10.9 kB

	"""
	Data models for the AWS RL environment.
	"""

	from enum import Enum
	from typing import NewType

	from openenv.core.env_server.types import Action, Observation, State
	from pydantic import BaseModel, Field

	# ---------------------------------------------------------------------------
	# Core Types
	# ---------------------------------------------------------------------------

	# Distinct static-typing aliases for plain identifiers. NewType creates no
	# runtime wrapper class, so values stay ordinary int / str objects.
	# Integer-backed identifiers:
	TaskID = NewType("TaskID", int)
	StepCount = NewType("StepCount", int)
	# String-backed identifier:
	EpisodeID = NewType("EpisodeID", str)


	class AwsService(str, Enum):
	    # String-valued enumeration of the AWS services this module knows about.
	    # Because of the ``str`` mixin every member compares equal to its value.
	    # Presumably the values are the service identifiers used on the AWS CLI
	    # command line -- confirm against the code that consumes them.

	    # --- Core services ---
	    S3 = "s3"
	    EC2 = "ec2"
	    DYNAMODB = "dynamodb"
	    LAMBDA = "lambda"
	    SQS = "sqs"
	    SNS = "sns"
	    IAM = "iam"
	    APIGATEWAY = "apigateway"
	    SECRETSMANAGER = "secretsmanager"

	    # --- Compute & containers ---
	    ECS = "ecs"

	    # --- Data & analytics ---
	    RDS = "rds"
	    ELASTICACHE = "elasticache"
	    ATHENA = "athena"
	    GLUE = "glue"
	    FIREHOSE = "firehose"
	    EMR = "emr"

	    # --- Networking & routing ---
	    APIGATEWAYV2 = "apigatewayv2"
	    ROUTE53 = "route53"
	    ELBV2 = "elbv2"

	    # --- Storage ---
	    EBS = "ebs"
	    EFS = "efs"

	    # --- Identity & config ---
	    # Note: the next member's value ("cognito-idp") differs from its name.
	    COGNITO = "cognito-idp"
	    SSM = "ssm"
	    # Note: value is "events", not "eventbridge".
	    EVENTBRIDGE = "events"

	    # --- Monitoring ---
	    CLOUDWATCH = "cloudwatch"

	    # --- Infrastructure as code ---
	    CLOUDFORMATION = "cloudformation"


	# ---------------------------------------------------------------------------
	# RL Task Definition
	# ---------------------------------------------------------------------------


	class TaskDifficulty(str, Enum):
	    # Difficulty tiers a task can be assigned to. Members are declared (and
	    # therefore iterate) from the easiest-sounding tier to the hardest; the
	    # ``str`` mixin makes each member compare equal to its lowercase value.
	    WARMUP = "warmup"
	    BEGINNER = "beginner"
	    INTERMEDIATE = "intermediate"
	    ADVANCED = "advanced"
	    EXPERT = "expert"


	class TierConfig(BaseModel):
	    """Configuration for a single difficulty tier's promotion and mastery rules."""

	    # --- Required settings (no default; must be supplied) ---

	    # Non-negative episode count.
	    min_episodes: int = Field(
	        ...,
	        description="Minimum episodes before promotion eligible",
	        ge=0,
	    )
	    # Rate constrained to the closed interval [0.0, 1.0].
	    advance_rate: float = Field(
	        ...,
	        description="Tier success rate to advance",
	        ge=0.0,
	        le=1.0,
	    )

	    # --- Optional settings (validated defaults) ---

	    # Window must hold at least one episode.
	    mastery_window: int = Field(
	        default=10,
	        description="Sliding window size for success rate",
	        ge=1,
	    )
	    mastery_threshold: float = Field(
	        default=0.7,
	        description="Per-task graduation threshold",
	        ge=0.0,
	        le=1.0,
	    )
	    fast_track_rate: float = Field(
	        default=0.9,
	        description="Success rate for early promotion after 3 episodes",
	        ge=0.0,
	        le=1.0,
	    )
	    # Defaults to 0.0, i.e. no chaos unless a tier opts in.
	    chaos_probability: float = Field(
	        default=0.0,
	        description="Probability of chaos injection per step",
	        ge=0.0,
	        le=1.0,
	    )


	class SpacedRepState(BaseModel):
	    """Tracks spaced repetition schedule for a graduated task."""

	    # Must be at least 1; starts at 3 when not specified.
	    interval: int = Field(
	        default=3,
	        description="Episodes until next re-test",
	        ge=1,
	    )
	    # Non-negative episode index; 0 is the default.
	    last_graduated_episode: int = Field(
	        default=0,
	        description="Episode number when task was last graduated",
	        ge=0,
	    )


	class SetupCommand(BaseModel):
	    """A single AWS CLI command executed during environment setup before the agent acts."""

	    # Required: the command line itself.
	    command: str = Field(..., description="AWS CLI command to execute")
	    # Optional free-text note; None when no explanation is provided.
	    # (Union restored to `|`; the escaped `\|` form is not valid Python.)
	    description: str | None = Field(
	        default=None,
	        description="Human-readable explanation of what this command sets up",
	    )
	    # Opt-in tolerance flag; failures are not ignored by default.
	    ignore_failure: bool = Field(
	        default=False,
	        description="If True, continue setup even if this command fails",
	    )


	class ResourceExistsCheck(BaseModel):
	    """Checks that a specific named resource exists in MiniStack."""

	    # Both fields are required; there are no defaults.
	    # `service` is validated against the AwsService enum.
	    service: AwsService = Field(
	        ...,
	        description="AWS service to verify the resource in",
	    )
	    name: str = Field(
	        ...,
	        description="Exact resource name to verify",
	    )


	class StepCriteria(BaseModel):
	    """A single required step in a multi-step task."""

	    # Required operation name.
	    operation: str = Field(..., description="AWS CLI operation, e.g. 'create-bucket'")
	    # Optional target; None means no specific resource is named for the step.
	    # (Union restored to `|`; the escaped `\|` form is not valid Python.)
	    resource: str | None = Field(
	        default=None, description="Resource name the operation must target"
	    )


	class StateCheck(BaseModel):
	    """An assertion about the environment's end-state, evaluated via AWS CLI."""

	    # Required: the verification command.
	    command: str = Field(..., description="AWS CLI command to run for verification")

	    # The remaining fields are all optional and default to None. How they are
	    # combined is decided by the evaluator, which is not part of this module.
	    # (Unions restored to `|`; the escaped `\|` form is not valid Python.)
	    output_contains: str | None = Field(
	        default=None, description="Substring that must appear in stdout"
	    )
	    json_path: str | None = Field(
	        default=None,
	        description="JSON path to extract from stdout, e.g. '$.Table.Name'",
	    )
	    # Accepts any JSON scalar type (number, string, boolean) or None.
	    expected: int | float | str | bool | None = Field(
	        default=None, description="Expected value at json_path"
	    )


	class SuccessCriteria(BaseModel):
	    """Machine-readable criteria to evaluate task completion.

	    Different tiers populate different fields:
	    - Warmup: command_contains + operation
	    - Beginner: command_contains + operation + resource_exists
	    - Intermediate: steps
	    - Advanced: services + steps
	    - Expert: services + state_checks + steps (optional)
	    """

	    # Every field is optional, so an empty SuccessCriteria() is valid.
	    # (Unions restored to `|`; the escaped `\|` form is not valid Python.)

	    # --- Single-command criteria (default None) ---
	    command_contains: str | None = Field(
	        default=None, description="Substring the agent's command must contain"
	    )
	    operation: str | None = Field(
	        default=None, description="AWS CLI operation the agent must invoke"
	    )
	    resource_exists: ResourceExistsCheck | None = Field(
	        default=None, description="Resource that must exist after the agent acts"
	    )

	    # --- Multi-step / multi-service criteria ---
	    # default_factory=list gives each instance its own fresh empty list.
	    steps: list[StepCriteria] = Field(
	        default_factory=list, description="Ordered sequence of required operations"
	    )
	    services: list[AwsService] = Field(
	        default_factory=list, description="AWS services the agent must interact with"
	    )
	    state_checks: list[StateCheck] = Field(
	        default_factory=list,
	        description="End-state assertions — source of truth for expert/SRE tasks",
	    )


	class Task(BaseModel):
	    """Defines a task the RL agent must accomplish in the AWS environment."""

	    # --- Identity and presentation ---
	    # Required, non-negative identifier.
	    task_id: TaskID = Field(..., ge=0, description="Unique task identifier")
	    # Falls back to the WARMUP tier when not specified.
	    difficulty: TaskDifficulty = Field(
	        default=TaskDifficulty.WARMUP, description="Task difficulty level"
	    )
	    description: str = Field(..., description="Human-readable task description")

	    # --- Evaluation ---
	    # Defaults to an empty SuccessCriteria (all of its fields are optional).
	    success_criteria: SuccessCriteria = Field(
	        default_factory=SuccessCriteria,
	        description="Machine-readable criteria to evaluate task completion",
	    )

	    # --- Initial state and drift ---
	    setup_commands: list[SetupCommand] = Field(
	        default_factory=list,
	        description="Commands to run during reset to set up initial state (e.g. for SRE tasks)",
	    )
	    # (Union restored to `|`; the escaped `\|` form is not valid Python.)
	    desired_state_spec: str | None = Field(
	        default=None,
	        description="Natural-language specification of the desired end state (shown to agent for drift tasks)",
	    )
	    # Reuses the SetupCommand model for each candidate mutation.
	    possible_drifts: list[SetupCommand] = Field(
	        default_factory=list,
	        description="Pool of mutations the DriftEngine may randomly apply after setup",
	    )


	class TaskInfo(BaseModel):
	    """Agent-visible subset of Task — masks success_criteria, setup_commands, and possible_drifts."""

	    # The four fields below mirror the same-named fields on Task, with the
	    # same types, defaults and constraints.
	    task_id: TaskID = Field(..., ge=0, description="Unique task identifier")
	    difficulty: TaskDifficulty = Field(
	        default=TaskDifficulty.WARMUP, description="Task difficulty level"
	    )
	    description: str = Field(..., description="Human-readable task description")
	    # (Union restored to `|`; the escaped `\|` form is not valid Python.)
	    desired_state_spec: str | None = Field(
	        default=None,
	        description="Natural-language specification of the desired end state (shown to agent for drift tasks)",
	    )

	    @classmethod
	    def from_task(cls, task: Task) -> "TaskInfo":
	        """Create a masked TaskInfo from a full Task."""
	        # Copy only the agent-visible fields; success_criteria,
	        # setup_commands and possible_drifts are deliberately not carried over.
	        return cls(
	            task_id=task.task_id,
	            difficulty=task.difficulty,
	            description=task.description,
	            desired_state_spec=task.desired_state_spec,
	        )


	# ---------------------------------------------------------------------------
	# Environment State
	# ---------------------------------------------------------------------------


	class TrackerState(BaseModel):
	    """Serializable snapshot of the EpisodeTracker."""

	    # --- Counters (non-negative, start at zero) ---
	    step_count: int = Field(
	        default=0,
	        description="Steps taken this episode",
	        ge=0,
	    )
	    hints_used: int = Field(
	        default=0,
	        description="Hints requested this episode",
	        ge=0,
	    )

	    # Fraction constrained to the closed interval [0.0, 1.0].
	    progress: float = Field(
	        default=0.0,
	        description="Current partial progress",
	        ge=0.0,
	        le=1.0,
	    )

	    # --- Histories (each instance gets its own fresh empty list) ---
	    commands_executed: list[str] = Field(
	        description="Commands executed this episode",
	        default_factory=list,
	    )
	    # NOTE(review): typed as list[str] although the description speaks of
	    # (operation, resource) pairs; how a pair is encoded as a single string
	    # is not visible in this module -- confirm against the tracker.
	    credited_operations: list[str] = Field(
	        description="(operation, resource) pairs that earned credit",
	        default_factory=list,
	    )


	class AwsRlState(State):
	    """Full environment state including task, tracker, and infrastructure."""

	    # Fields here are added on top of whatever the imported `State` base
	    # class already declares (its definition is outside this module).

	    # None until a task has been assigned.
	    # (Union restored to `|`; the escaped `\|` form is not valid Python.)
	    current_task: Task | None = Field(
	        default=None, description="The task assigned for this episode"
	    )
	    # Defaults to a fresh TrackerState (all counters zero, empty histories).
	    tracker: TrackerState = Field(
	        default_factory=TrackerState,
	        description="Episode tracker snapshot",
	    )
	    # Untyped mapping; the value schema is not specified in this module.
	    infra_state: dict = Field(
	        default_factory=dict,
	        description="AWS infrastructure state keyed by service name",
	    )
	    chaos_occurred: bool = Field(
	        default=False, description="Whether chaos was injected this episode"
	    )
	    # NOTE(review): plain str rather than TaskDifficulty; the default equals
	    # TaskDifficulty.WARMUP's value. Confirm whether other tier names occur.
	    current_tier: str = Field(
	        default="warmup", description="Agent's current difficulty tier"
	    )


	# ---------------------------------------------------------------------------
	# Action & Observation
	# ---------------------------------------------------------------------------


	class AwsRlAction(Action):
	    """Action for the Aws Rl Env environment — an AWS CLI command to execute against MiniStack."""

	    # The only field this subclass adds to the imported `Action` base.
	    # It is required and is an unparsed command-line string.
	    command: str = Field(
	        ...,
	        description="AWS CLI command to execute, e.g. 'aws s3 ls', 'aws ec2 describe-instances'",
	    )


	class AwsRlObservation(Observation):
	    """Observation returned after each step in the AWS RL environment."""

	    # Fields here are added on top of whatever the imported `Observation`
	    # base class already declares (its definition is outside this module).

	    # --- Episode bookkeeping (required) ---
	    episode_id: EpisodeID = Field(..., description="Unique identifier for the episode")
	    step_count: StepCount = Field(
	        ..., ge=0, description="Current step count in the episode"
	    )

	    # --- Result of the executed command ---
	    command_success: bool = Field(
	        ..., description="Whether the CLI command executed successfully"
	    )
	    # Both output fields default to the empty string rather than None.
	    command_output: str = Field(
	        default="", description="Stdout from the executed AWS CLI command"
	    )
	    error: str = Field(default="", description="Stderr if the command failed")

	    # --- Task context and progress ---
	    # Uses TaskInfo (the masked view), not the full Task.
	    # (Union restored to `|`; the escaped `\|` form is not valid Python.)
	    task: TaskInfo | None = Field(
	        default=None, description="The task the agent is trying to accomplish (masked)"
	    )
	    task_achieved: bool = Field(
	        default=False, description="Whether the task has been achieved"
	    )
	    partial_progress: float = Field(
	        default=0.0,
	        ge=0.0,
	        le=1.0,
	        description="Current task progress (0.0 to 1.0)",
	    )

	    # --- Hints ---
	    hints_used: int = Field(
	        default=0, ge=0, description="Number of hints requested this episode"
	    )
	    hint_text: str = Field(
	        default="", description="Text of the most recently requested hint"
	    )