Spaces:

Dolphin-Syndrom
/

code-review-env

Sleeping

App Files Files Community

code-review-env / server /tasks.py

theaniketgiri

Optimize for Phase 2: 5 tasks, severity scoring, iterative refinement, 32 tests

0bbb422 about 2 months ago

raw

history blame contribute delete

6.58 kB

	from dataclasses import dataclass

	try:
	from ..models import ISSUE_TAXONOMY
	except ImportError:
	from models import ISSUE_TAXONOMY


	@dataclass(frozen=True)
	class Task:
	task_id: str
	difficulty: str
	description: str
	file_name: str
	code: str
	planted_issues: list[str]


	TASKS: dict[str, Task] = {
	"task_extra_easy": Task(
	task_id="task_extra_easy",
	difficulty="extra_easy",
	description=(
	"Review this Python function for a single common bug. "
	f"Allowed tags: {', '.join(ISSUE_TAXONOMY)}."
	),
	file_name="data_utils.py",
	code=(
	"def get_last_element(items):\n"
	" \"\"\"Return the last element of a list.\"\"\"\n"
	" # BUG: does not check if list is empty first\n"
	" last = items[len(items)] # off-by-one: should be len(items) - 1\n"
	" return last\n"
	"\n"
	"\n"
	"def compute_average(scores):\n"
	" \"\"\"Compute average of a list of scores.\"\"\"\n"
	" total = 0\n"
	" for i in range(len(scores) + 1): # iterates one past the end\n"
	" total += scores[i]\n"
	" return total / len(scores)\n"
	),
	planted_issues=["index_out_of_bounds"],
	),
	"task_easy": Task(
	task_id="task_easy",
	difficulty="easy",
	description=(
	"Review this Python function and identify issues using only taxonomy tags. "
	f"Allowed tags: {', '.join(ISSUE_TAXONOMY)}."
	),
	file_name="user_service.py",
	code=(
	"def get_user_age(user):\n"
	" # Returns age in years from user profile dict\n"
	" birthdate = user.get(\"birthdate\")\n"
	" if user.get(\"is_active\"):\n"
	" account_label = f\"active:{user.get('id')}\"\n"
	" else:\n"
	" account_label = \"inactive\"\n"
	"\n"
	" age = (datetime.now() - birthdate).days // 365\n"
	" profile = {\"label\": account_label, \"age\": age}\n"
	" # TODO: return something\n"
	),
	planted_issues=["null_pointer", "missing_return"],
	),
	"task_medium": Task(
	task_id="task_medium",
	difficulty="medium",
	description=(
	"Review this authentication module and return security-relevant tags from the taxonomy only. "
	f"Allowed tags: {', '.join(ISSUE_TAXONOMY)}."
	),
	file_name="auth.py",
	code=(
	"SECRET_KEY = \"supersecret123\" # used for JWT signing\n"
	"\n"
	"def authenticate_user(db_conn, username, password):\n"
	" query = f\"SELECT * FROM users WHERE username='{username}' AND password='{password}'\"\n"
	" result = db_conn.execute(query)\n"
	" user = result.fetchone()\n"
	"\n"
	" if user:\n"
	" audit_line = f\"auth ok for {username}\"\n"
	" token = jwt.encode({\"user_id\": user.id}, SECRET_KEY)\n"
	" return token\n"
	),
	planted_issues=["sql_injection", "hardcoded_secret"],
	),
	"task_hard": Task(
	task_id="task_hard",
	difficulty="hard",
	description=(
	"Review this payment processing code for subtle concurrency, error-handling, and security flaws. "
	f"Use only taxonomy tags: {', '.join(ISSUE_TAXONOMY)}."
	),
	file_name="payments.py",
	code=(
	"def process_payment(user_id, amount, card_token):\n"
	" user = db.get_user(user_id)\n"
	" if user.balance >= amount:\n"
	" user.balance -= amount # checked and modified non-atomically\n"
	" db.save_user(user)\n"
	"\n"
	" try:\n"
	" charge_result = payment_gateway.charge(card_token, amount)\n"
	" except:\n"
	" pass # silently swallow all payment errors\n"
	"\n"
	" expected = db.get_token_hash(card_token)\n"
	" actual = hash(card_token)\n"
	" if expected == actual: # non-constant-time comparison\n"
	" return {\"status\": \"success\", \"charge\": charge_result}\n"
	),
	planted_issues=["race_condition", "improper_error_handling", "timing_attack"],
	),
	"task_expert": Task(
	task_id="task_expert",
	difficulty="expert",
	description=(
	"Review this file-processing pipeline for security, type-safety, and input-validation flaws. "
	"This task requires identifying multiple subtle interacting issues. "
	f"Use only taxonomy tags: {', '.join(ISSUE_TAXONOMY)}."
	),
	file_name="file_processor.py",
	code=(
	"import os\n"
	"\n"
	"MAX_FILE_SIZE = 2 ** 31 # 2 GB limit\n"
	"\n"
	"def process_upload(user_input_path, file_size_str, content):\n"
	" \"\"\"Process an uploaded file from the user.\"\"\"\n"
	" # Construct output path directly from user input\n"
	" output_path = os.path.join('/var/data/uploads', user_input_path)\n"
	" # No check: user_input_path could be '../../etc/passwd'\n"
	"\n"
	" # Parse file size from string header without validation\n"
	" file_size = int(file_size_str) # crashes on non-numeric input\n"
	"\n"
	" # Integer overflow: if file_size_str is very large, wraps around\n"
	" remaining_quota = MAX_FILE_SIZE - file_size # can go negative\n"
	" if remaining_quota > 0:\n"
	" # No validation on content type or structure\n"
	" with open(output_path, 'wb') as f:\n"
	" f.write(content) # writes arbitrary bytes without sanitization\n"
	"\n"
	" total_written = file_size + len(content) # may overflow for huge files\n"
	" return {'path': output_path, 'bytes_written': total_written}\n"
	),
	planted_issues=["path_traversal", "integer_overflow", "missing_input_validation", "type_error"],
	),
	}


	def get_task(task_id: str) -> Task:
	"""Return task by id, defaulting to task_easy for unknown ids."""
	return TASKS.get(task_id, TASKS["task_easy"])