Spaces:

Codex47
/

SmartContractAudit

Sleeping

SmartContractAudit / server /tasks /task3 /grader.py

ajaxwin

refactor: Reward clamping in graders

41a051f 22 days ago

2.2 kB

	"""
	grader.py (Task 3 – Rule Checker)
	------------------------------------
	Deterministic grader for function-identification submissions.

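	Grade table (base rewards; grade() multiplies the base reward by a
	step/cost factor and clamps the result to [0.001, 0.999])
	───────────
	1     → submitted function is the exact target (case-insensitive)
	0.50  → submitted function name appears in the target's code
	        (intended: a direct internal subfunction of the target)
	0.001 → anything else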

	"""

	import json
	from math import exp
	from typing import Dict, Any

	class Task3Grader:
	"""
	Grades a Task 3 submit_function submission.

	Parameters
	----------
	target_function : dict with at least 'name' and 'code' keys
	property_specification : the property the target function violates
	"""

	REWARD_CORRECT = 1
	REWARD_PARTIAL = 0.5
	REWARD_WRONG = 0.001

	def __init__(self, target_function: Dict[str, Any], property_specification: Dict \| str, max_steps: int) -> None:
	self.target_function = target_function
	self.property_specification = property_specification
	self.max_steps = max_steps
	self._decay = 0.01

	def _clamp(self, reward: float) -> float:
	return max(0.001, min(0.999, reward))

	def grade(self, submitted_function: str, steps: int, cummulative_cost: int) -> float:
	"""Returns deterministic grade strictly in (0, 1)."""

	norm = submitted_function.strip().lower()
	reward = self.REWARD_WRONG
	if norm == self.target_function["name"].strip().lower():
	reward = self.REWARD_CORRECT
	elif norm in self.target_function.get("code", "").strip().lower():
	reward = self.REWARD_PARTIAL

	penalty = self._decay ** (-(steps * cummulative_cost) / self.max_steps)
	return self._clamp(reward * penalty)

	def get_canonical_answer(self) -> Dict[str, Dict \| str]:
	"""For debugging / logging only — do not expose to the agent."""
	return {
	"target_function": self.target_function,
	"property_specification": json.dumps(self.property_specification)
	if isinstance(self.property_specification, dict) else self.property_specification,
	}