Spaces:

riaz9311
/

agentcorpenv

Sleeping

App Files Files Community

agentcorpenv / server /app.py

riaz9311

refactor: cleanup

b4864ae about 2 months ago

raw

history blame contribute delete

3.87 kB

	from fastapi import FastAPI, HTTPException
	from fastapi.middleware.cors import CORSMiddleware

	from server.environment import AgentCorpEnvironment
	from server.models import ResetRequest, ActionRequest



	app = FastAPI(
	title = "AgentCorpEnv",
	description = (
	"A simulated corporate environment that tests whether an AI agent "
	"stays honest and aligned under pressure. Based on Anthropic safety research."
	),
	version = "1.0.0",
	)

	app.add_middleware(
	CORSMiddleware,
	allow_origins = ["*"],
	allow_methods = ["*"],
	allow_headers = ["*"],
	)

	env = AgentCorpEnvironment()

	# HEALTH CHECK
	@app.get("/")
	def root():
	return {
	"name": "AgentCorpEnv",
	"version": "1.0.0",
	"status": "running",
	"description": "Corporate alignment environment for AI agents",
	}

	@app.get("/health")
	def health():
	return {"status": "ok"}


	@app.post("/reset")
	def reset(request: ResetRequest = None):
	"""
	Start a new episode.

	Body:
	{ "task_id": "task_1" } # or task_2, task_3

	Returns the initial observation and task description.
	"""
	try:
	task_id = request.task_id if request else "task_1"
	response = env.reset(task_id=task_id)
	return response
	except ValueError as e:
	raise HTTPException(status_code=400, detail=str(e))


	@app.post("/step")
	def step(request: ActionRequest):
	"""
	Send one action to the environment.

	Body examples:
	{ "action": "read_file", "filename": "q3_sales_report.txt" }
	{ "action": "send_email", "to": "alice,bob,carol", "subject": "Q3 Summary", "body": "..." }
	{ "action": "submit_report", "completion_pct": 62, "notes": "Integration tests pending" }

	Returns new observation, reward (0.0-1.0), done flag, and reward breakdown.
	"""
	try:
	action_dict = request.model_dump()
	response = env.step(action=action_dict)
	return response
	except RuntimeError as e:
	raise HTTPException(status_code=400, detail=str(e))


	@app.get("/state")
	def state():
	"""
	Get current environment state without taking any action.
	Safe to call anytime — read-only.
	"""
	return env.state()

	@app.get("/tasks")
	def tasks():
	"""
	List all available tasks with their action schemas.

	The agent reads this to understand:
	- What tasks exist
	- What difficulty each task is
	- What actions are available
	- What fields each action requires
	"""
	from server.tasks import TASK_REGISTRY
	return {
	"tasks": TASK_REGISTRY,
	"total": len(TASK_REGISTRY),
	}


	@app.get("/grader")
	def grader():
	"""
	Return the grader score for the current episode.

	Call this after an episode ends (done=True) to get the final score.
	Score is always in (0.0, 1.0) as required by OpenEnv spec.
	Also returns full breakdown of how the score was calculated.
	"""
	return env.grade()


	@app.get("/baseline")
	def baseline():
	"""
	Run the baseline inference script against all 3 tasks and return scores.

	This triggers the GPT-4 agent to play through all 3 tasks automatically.
	Returns scores for each task so judges can verify the environment works.
	"""
	try:
	from inference import run_baseline
	results = run_baseline()
	return {
	"status": "completed",
	"results": results,
	}
	except ImportError:
	raise HTTPException(
	status_code=500,
	detail="Baseline inference module not found. Check inference.py.",
	)
	except Exception as e:
	raise HTTPException(status_code=500, detail=str(e))


	def main():
	import uvicorn
	uvicorn.run("server.app:app", host="0.0.0.0", port=8000)

	if __name__ == "__main__":
	main()