Spaces:

100XZX001
/

CodeReview-Professional-Workflow

Sleeping

App Files Files Community

CodeReview-Professional-Workflow / openenv.yaml

100XZX001

Upload 16 files

1588266 verified 19 days ago

raw

history blame contribute delete

4.5 kB

	# openenv.yaml – Environment metadata for OpenEnv
	# Top-level identity fields for the environment: name, version, description,
	# author and license.
	name: CodeReview-Professional-Workflow
	# Quoted so the version is always read as a string, never as a number.
	version: "1.0.0"
	# Literal block scalar (`|`): the line breaks below are kept in the value.
	description: |
	  Multi‑turn code review environment for professional tasks.
	  Agent must inspect, test, lint, query docs, and negotiate with a simulated author
	  to fix injected bugs. Supports DPO training on full trajectories.
	author: yuvraj gupta
	license: MIT

	# ----------------------------------------------------------------------
	# Tasks (difficulty progression)
	# ----------------------------------------------------------------------
	# Each entry is one mapping: a task `id` plus a one-line `description` of the
	# fix the agent is expected to make. Entries are listed from easy to hardest.
	tasks:
	  - id: easy
	    description: "Fix missing null check in a dictionary lookup"
	  - id: medium
	    description: "Improve loop efficiency (replace range(len) with direct iteration)"
	  - id: hard
	    description: "Handle division by zero in average calculation"
	  - id: harder
	    description: "Fix race condition by adding a lock"
	  - id: hardest
	    description: "Resolve potential deadlock by standardising lock order"

	# ----------------------------------------------------------------------
	# Observation space (complete Markov state – agent sees everything)
	# ----------------------------------------------------------------------
	# Object schema: every key under `properties` is one observation field with
	# its own `type` and human-readable `description`.
	observation_space:
	  type: object
	  properties:
	    # --- Code under review and latest feedback ---
	    code_snippet:
	      type: string
	      description: "Current code snippet (may contain injected bug)"
	    last_tool_output:
	      type: string
	      description: "Raw output from last tool (test runner, linter, etc.)"
	    author_response:
	      type: string
	      description: "Latest feedback from the simulated human developer"

	    # --- Scores (current and previous step) ---
	    current_test_score:
	      type: number
	      description: "Proportion of tests passed (0.0–1.0)"
	    current_lint_score:
	      type: number
	      description: "Normalised pylint score (0.0–1.0)"
	    negotiation_score:
	      type: number
	      description: "Author's confidence minus pushback penalty"
	    previous_test_score:
	      type: number
	      description: "Test score before the last action"
	    previous_lint_score:
	      type: number
	      description: "Lint score before the last action"

	    # --- Simulated author state ---
	    author_confidence:
	      type: number
	      description: "Internal belief of the author (0.0–1.0)"
	    author_threshold:
	      type: number
	      description: "Confidence threshold for this personality"

	    # --- Episode progress ---
	    step:
	      type: integer
	      description: "Current step number"
	    max_steps:
	      type: integer
	      description: "Maximum steps allowed in the episode"
	    progress_ratio:
	      type: number
	      description: "step / max_steps"

	    # --- Tool-usage flags ---
	    tests_run:
	      type: boolean
	      description: "Whether the agent has run tests at least once"
	    linter_run:
	      type: boolean
	      description: "Whether the agent has run the linter at least once"
	    docs_queried:
	      type: boolean
	      description: "Whether the agent has queried documentation"

	    # --- Action bookkeeping ---
	    last_action_type:
	      type: string
	      description: "String name of the last executed action"
	    action_history:
	      type: array
	      # `items` gives the element type; `description` is attached to the
	      # array itself (nesting reconstructed from a flattened listing —
	      # confirm against the consumer's schema).
	      items:
	        type: string
	      description: "Last 5 action types"
	    done:
	      type: boolean
	      description: "Whether the episode has finished"
	    bug_description:
	      type: string
	      description: "Short description of the injected bug"
	    comments_count:
	      type: integer
	      description: "Number of comments exchanged so far"

	# ----------------------------------------------------------------------
	# Action space (short names as produced by the agent)
	# ----------------------------------------------------------------------
	# Object schema: `action_type` selects the action; the remaining fields carry
	# the payload that specific action types require (see each description).
	action_space:
	  type: object
	  properties:
	    action_type:
	      type: string
	      # Allowed action names.
	      enum:
	        - comment
	        - skip
	        - done
	        - question
	        - fix
	        - execute
	        - inspect
	        - run_linter
	        - run_tests
	        - query_docs
	    # Payload fields, placed as siblings of `action_type` (nesting
	    # reconstructed from a flattened listing — confirm against the consumer).
	    comment_text:
	      type: string
	      description: "Required for comment"
	    question:
	      type: string
	      description: "Required for question"
	    fix_code:
	      type: string
	      description: "Required for fix"
	    query_topic:
	      type: string
	      description: "Required for query_docs"

	# ----------------------------------------------------------------------
	# (Optional) Server configuration – used by openenv serve
	# ----------------------------------------------------------------------
	server:
	  # Quoted because the value contains a colon; the string is unchanged.
	  app: "server.app:app"
	  port: 7860