Spaces:

Ramkan7
/

Patch_Hawk

Running

App Files Files Community

Patch_Hawk / patchhawk /tasks.py

kanishcr7

Final Submission: Added SOC Dashboard and fixed UI explorer

44b0b12 3 days ago

raw

history blame contribute delete

2.5 kB

	"""
	PatchHawk task graders — referenced in openenv.yaml.

	Each grader receives the environment and a trajectory (list of
	(action, observation) tuples), and returns a float score strictly in (0, 1).
	"""
	from __future__ import annotations
	from typing import TYPE_CHECKING, List, Tuple

	if TYPE_CHECKING:
	from patchhawk.agent.environment import PatchHawkEnv
	from patchhawk.env_models import PatchHawkAction, PatchHawkObservation

	# Action constants (mirrored from PatchHawkEnv).
	# The graders in this module compare these integer codes against
	# ``action.action_type``; of the five, only _EXECUTE_SANDBOX, _BLOCK_PR and
	# _SUBMIT_PATCH are referenced by the graders visible here.
	# NOTE(review): PatchHawkEnv is not defined in this file — confirm these
	# values still match it whenever the environment's action set changes.
	_ANALYZE = 0
	_EXECUTE_SANDBOX = 1
	_BLOCK_PR = 2
	_SUBMIT_PATCH = 3
	_REQUEST_REVIEW = 4

	def grade_easy(
	    env: "PatchHawkEnv",
	    trajectory: List[Tuple["PatchHawkAction", "PatchHawkObservation"]],
	) -> float:
	    """Score the easy task (typosquatting detection).

	    Args:
	        env: Environment whose ``current_scenario`` mapping is consulted;
	            a falsy value is treated as an empty mapping.
	        trajectory: Sequence of ``(action, observation)`` pairs. Only the
	            action of the final pair is inspected.

	    Returns:
	        0.99 when the final action is BLOCK_PR or SUBMIT_PATCH and the
	        scenario's ``attack_type`` equals ``"typosquatting"``; 0.01 in
	        every other case, including an empty trajectory.
	    """
	    # Nothing was attempted, so award the minimum score.
	    if not trajectory:
	        return 0.01

	    final_action, _ = trajectory[-1]
	    scenario_info = env.current_scenario or {}

	    # The scenario is only looked at once the closing action qualifies.
	    closed_out = final_action.action_type in (_BLOCK_PR, _SUBMIT_PATCH)
	    passed = closed_out and scenario_info.get("attack_type") == "typosquatting"
	    return 0.99 if passed else 0.01


	def grade_medium(
	    env: "PatchHawkEnv",
	    trajectory: List[Tuple["PatchHawkAction", "PatchHawkObservation"]],
	) -> float:
	    """Score the medium task (obfuscated exec detection).

	    Args:
	        env: Environment whose ``current_scenario`` mapping is consulted;
	            a falsy value is treated as an empty mapping.
	        trajectory: Sequence of ``(action, observation)`` pairs. Every
	            action is scanned for a sandbox run, and the final action
	            decides whether the episode was closed out.

	    Returns:
	        0.99 when all three hold: EXECUTE_SANDBOX appears at least once in
	        the trajectory, the final action is BLOCK_PR or SUBMIT_PATCH, and
	        the scenario's ``attack_type`` equals ``"obfuscated_exec"``.
	        Otherwise 0.01, including for an empty trajectory.
	    """
	    # Nothing was attempted, so award the minimum score.
	    if not trajectory:
	        return 0.01

	    # Stop scanning at the first sandbox execution; one is enough.
	    sandbox_seen = False
	    for step_action, _ in trajectory:
	        if step_action.action_type == _EXECUTE_SANDBOX:
	            sandbox_seen = True
	            break

	    final_action, _ = trajectory[-1]
	    scenario_info = env.current_scenario or {}

	    # Guard clauses: any unmet requirement yields the minimum score.
	    if not sandbox_seen:
	        return 0.01
	    if final_action.action_type not in (_BLOCK_PR, _SUBMIT_PATCH):
	        return 0.01
	    if scenario_info.get("attack_type") == "obfuscated_exec":
	        return 0.99
	    return 0.01


	def grade_hard(
	    env: "PatchHawkEnv",
	    trajectory: List[Tuple["PatchHawkAction", "PatchHawkObservation"]],
	) -> float:
	    """Score the hard task (validated patch submission).

	    Args:
	        env: Environment whose ``state.patch_validated`` flag is read.
	        trajectory: Sequence of ``(action, observation)`` pairs. Only the
	            action of the final pair is inspected.

	    Returns:
	        0.99 when the final action is SUBMIT_PATCH and
	        ``env.state.patch_validated`` is truthy; 0.01 otherwise, including
	        for an empty trajectory.
	    """
	    # Nothing was attempted, so award the minimum score.
	    if not trajectory:
	        return 0.01

	    final_action, _ = trajectory[-1]

	    # The validation flag is only read when a patch was actually submitted.
	    submitted = final_action.action_type == _SUBMIT_PATCH
	    return 0.99 if submitted and env.state.patch_validated else 0.01