Spaces:

thesupremeguy
/

hackathon

Sleeping

hackathon / inference.py

suhaas-code

phase2-graders-8

f3a7559 about 1 month ago

13.9 kB

	from __future__ import annotations

	import json
	import os
	import re
	from pathlib import Path
	from typing import Any, Dict, Optional
	from urllib.parse import urlparse

	try:
	from dotenv import load_dotenv
	except Exception:
	def load_dotenv(_args: Any, *_kwargs: Any) -> bool:
	return False

	try:
	from openai import OpenAI
	except Exception:
	OpenAI = None # type: ignore[assignment]

	from env.farm_env import FarmAction, FarmEnv, FarmState
	from tasks.graders import grade_all
	from tasks.task_definitions import get_all_tasks

	PROJECT_ROOT = Path(__file__).resolve().parent
	ENV_FILE = PROJECT_ROOT / ".env"
	load_dotenv(ENV_FILE)


	def require_env(name: str) -> str:
	value = os.getenv(name, "").strip()
	if not value:
	raise RuntimeError(
	f"Missing required environment variable '{name}'. "
	f"Set it in shell or in {ENV_FILE}."
	)
	return value


	API_BASE_URL = os.getenv("API_BASE_URL", "https://api.openai.com/v1").strip()
	MODEL_NAME = os.getenv("MODEL_NAME", "gpt-4o-mini").strip()
	BENCHMARK = os.getenv("BENCHMARK", "farmrl").strip()


	def resolve_task_ids() -> list[str]:
	configured = os.getenv("TASK_NAMES", "").strip()
	available_task_ids = [task["id"] for task in get_all_tasks()]

	if configured:
	requested = [item.strip() for item in configured.split(",") if item.strip()]
	filtered = [task_id for task_id in requested if task_id in available_task_ids]
	if filtered:
	return filtered

	legacy_single_task = os.getenv("TASK_NAME", "").strip()
	if legacy_single_task and legacy_single_task in available_task_ids:
	return [legacy_single_task]

	return available_task_ids


	TASK_IDS = resolve_task_ids()


	def resolve_api_key() -> str:
	api_key = os.getenv("API_KEY", "").strip()
	if api_key:
	return api_key
	return os.getenv("OPENAI_API_KEY", "").strip()


	API_KEY = resolve_api_key()

	PLACEHOLDER_TOKENS = {
	"your_openai_api_key_here",
	"replace_with_openai_api_key",
	"replace-me",
	"replace_me",
	}

	EPISODES = 3
	STEPS_PER_EPISODE = 20
	SUCCESS_SCORE_THRESHOLD = 0.10


	def clamp(value: float, low: float, high: float) -> float:
	return max(low, min(high, value))


	def clamp_score(score: float) -> float:
	return max(0.001, min(0.994, float(score)))


	def compute_yield_proxy(state: FarmState) -> float:
	moisture_score = clamp(state.soil_moisture / 100.0, 0.0, 1.0)
	temperature_factor = clamp(
	1.0 - abs(state.temperature - 26.0) / 16.0, 0.0, 1.0)
	rainfall_factor = clamp(1.0 - abs(state.rainfall - 60.0) / 60.0, 0.0, 1.0)
	return 0.4 * moisture_score + 0.3 * temperature_factor + 0.3 * rainfall_factor


	def build_prompt(state: FarmState, step: int, recent_actions: list[dict[str, float]]) -> str:
	recent_actions_text = "none"
	if recent_actions:
	recent_actions_text = json.dumps(recent_actions[-3:])
	previous_action_text = "none"
	if recent_actions:
	previous_action_text = json.dumps(recent_actions[-1])

	return (
	"Farm state:\n"
	f"step: {step}\n"
	f"soil moisture: {state.soil_moisture:.2f}\n"
	f"temperature: {state.temperature:.2f}\n"
	f"rainfall: {state.rainfall:.2f}\n"
	f"crop stage: {state.crop_stage}\n"
	f"day: {state.day}\n"
	f"previous action: {previous_action_text}\n"
	f"recent actions: {recent_actions_text}\n\n"
	"Choose action values in bounds:\n"
	"water: 0 to 50\n"
	"fertilizer: 0 to 20\n"
	"pesticide: 0 to 10\n\n"
	"Output must be a single valid JSON object with exactly these numeric keys: "
	"water, fertilizer, pesticide.\n"
	"If the previous action is identical, change at least one field by >= 2 unless safety constraints require otherwise."
	)


	def build_client() -> Optional[Any]:
	if OpenAI is None:
	raise RuntimeError("openai_sdk_unavailable")

	if not API_BASE_URL:
	raise RuntimeError(
	"Missing required environment variable 'API_BASE_URL'.")

	base_lower = API_BASE_URL.lower()
	if "huggingface.co" in base_lower:
	raise RuntimeError(
	"Disallowed API_BASE_URL host 'huggingface.co' for submission."
	)

	api_key = API_KEY
	if not api_key or api_key.lower() in PLACEHOLDER_TOKENS:
	raise RuntimeError(
	"Missing API key. Expected API_KEY (or OPENAI_API_KEY compatibility fallback)."
	)

	base_host = urlparse(API_BASE_URL).netloc or API_BASE_URL
	print(
	f"[INFO] llm_config base_host={base_host} model={MODEL_NAME}",
	flush=True,
	)
	return OpenAI(base_url=API_BASE_URL, api_key=api_key)


	def extract_json_object(text: str) -> Optional[Dict[str, Any]]:
	text = text.strip()
	if not text:
	return None

	try:
	parsed = json.loads(text)
	if isinstance(parsed, dict):
	return parsed
	except json.JSONDecodeError:
	pass

	match = re.search(r"\{.*\}", text, flags=re.DOTALL)
	if not match:
	return None

	try:
	parsed = json.loads(match.group(0))
	if isinstance(parsed, dict):
	return parsed
	except json.JSONDecodeError:
	return None
	return None


	def coerce_action(payload: Dict[str, Any]) -> FarmAction:
	if "water" not in payload or "fertilizer" not in payload or "pesticide" not in payload:
	raise ValueError(
	"Model response must include water, fertilizer, and pesticide.")

	water = float(payload["water"])
	fertilizer = float(payload["fertilizer"])
	pesticide = float(payload["pesticide"])

	normalized = {
	"water": clamp(water, 0.0, 50.0),
	"fertilizer": clamp(fertilizer, 0.0, 20.0),
	"pesticide": clamp(pesticide, 0.0, 10.0),
	}
	return FarmAction(**normalized)


	def choose_fallback_action(state: FarmState, recent_actions: list[dict[str, float]]) -> FarmAction:
	# Rule-based action used when LLM is unavailable or returns invalid output.
	target_moisture = 62.0 if state.crop_stage < 3 else 68.0
	moisture_gap = target_moisture - state.soil_moisture
	rain_adjustment = max(0.0, 50.0 - state.rainfall) * 0.1

	water = clamp(12.0 + 0.8 * moisture_gap + rain_adjustment, 0.0, 50.0)
	fertilizer = clamp(
	(6.0 if state.crop_stage < 4 else 4.0)
	- 0.05 * max(0, state.day - 10)
	- 0.1 * max(state.temperature - 32.0, 0.0),
	0.0,
	20.0,
	)

	pesticide = 1.0
	if state.crop_stage >= 2 and state.rainfall > 70.0:
	pesticide = 3.0
	pesticide = clamp(pesticide, 0.0, 10.0)

	action = {
	"water": water,
	"fertilizer": fertilizer,
	"pesticide": pesticide,
	}

	if recent_actions and action == recent_actions[-1]:
	action["water"] = clamp(action["water"] + 2.0, 0.0, 50.0)

	return FarmAction(**action)


	def choose_action(
	client: Optional[Any],
	state: FarmState,
	step: int,
	recent_actions: list[dict[str, float]],
	) -> FarmAction:
	if client is None:
	raise RuntimeError("llm_client_unavailable")

	prompt = build_prompt(state, step=step, recent_actions=recent_actions)
	completion = client.chat.completions.create(
	model=MODEL_NAME,
	messages=[
	{
	"role": "system",
	"content": (
	"You are a farm operations optimizer. "
	"Produce state-dependent control decisions and avoid repetitive action loops. "
	"Return strict JSON with numeric keys: water, fertilizer, pesticide. "
	"No markdown, no prose, no extra keys. "
	"Do not output the same action repeatedly across steps unless explicitly necessary."
	),
	},
	{"role": "user", "content": prompt},
	],
	temperature=0.35,
	top_p=0.9,
	frequency_penalty=0.6,
	response_format={"type": "json_object"},
	seed=42 + step,
	max_tokens=160,
	)

	content = (completion.choices[0].message.content or "").strip()
	payload = extract_json_object(content)
	if payload is None:
	raise ValueError("Model did not return valid JSON action payload.")
	return coerce_action(payload)


	def to_action_string(action: FarmAction) -> str:
	return json.dumps(action.model_dump(), separators=(",", ":"), sort_keys=True)


	def log_start(task_id: str) -> None:
	print(
	f"[START] task={task_id} env={BENCHMARK} model={MODEL_NAME}", flush=True)


	def log_step(step: int, action: FarmAction, reward: float, done: bool, error: Optional[str]) -> None:
	error_value = error if error else "null"
	done_value = str(done).lower()
	action_str = to_action_string(action)
	print(
	f"[STEP] step={step} action={action_str} reward={reward:.2f} "
	f"done={done_value} error={error_value}",
	flush=True,
	)


	def log_end(success: bool, steps: int, score: float, rewards: list[float]) -> None:
	rewards_str = ",".join(f"{value:.2f}" for value in rewards)
	print(
	f"[END] success={str(success).lower()} steps={steps} "
	f"score={score:.3f} rewards={rewards_str}",
	flush=True,
	)


	def run_inference() -> None:
	dataset_path = Path(__file__).resolve().parent / \
	"farmer_advisor_dataset.csv"
	env = FarmEnv(dataset_path=dataset_path, seed=42, max_days=30)
	try:
	client = build_client()
	except Exception as exc:
	client = None
	print(
	f"[WARN] llm_client_init_failed error={exc.__class__.__name__}",
	flush=True,
	)

	llm_attempts_total = 0
	llm_successes_total = 0
	llm_failures_total = 0

	for task_id in TASK_IDS:
	total_reward = 0.0
	total_yield = 0.0
	total_fertilizer = 0.0
	total_pesticide = 0.0
	total_steps = 0
	soil_moisture_sum = 0.0
	soil_ph_sum = 0.0
	soil_observation_count = 0
	rewards: list[float] = []
	recent_actions: list[dict[str, float]] = []
	aborted = False

	log_start(task_id=task_id)

	for episode in range(EPISODES):
	state = env.reset(seed=42 + episode)

	for _ in range(STEPS_PER_EPISODE):
	step_error: Optional[str] = None

	llm_attempts_total += 1
	try:
	action = choose_action(
	client=client,
	state=state,
	step=total_steps + 1,
	recent_actions=recent_actions,
	)
	llm_successes_total += 1
	except Exception as exc:
	llm_failures_total += 1
	step_error = f"llm_error:{exc.__class__.__name__}"
	action = choose_fallback_action(state, recent_actions)

	try:
	step_result = env.step(action)
	except Exception as exc:
	aborted = True
	log_step(
	step=total_steps + 1,
	action=action,
	reward=0.0,
	done=True,
	error=f"env_error:{exc.__class__.__name__}",
	)
	break

	total_steps += 1
	total_reward += step_result.reward
	total_yield += compute_yield_proxy(step_result.observation)
	total_fertilizer += action.fertilizer
	total_pesticide += action.pesticide
	soil_moisture_sum += step_result.observation.soil_moisture
	soil_ph_sum += step_result.observation.soil_ph
	soil_observation_count += 1
	rewards.append(step_result.reward)
	recent_actions.append(action.model_dump())

	log_step(
	step=total_steps,
	action=action,
	reward=step_result.reward,
	done=step_result.done,
	error=step_error,
	)
	state = step_result.observation

	if step_result.done:
	break

	if aborted:
	break

	avg_soil_moisture = (
	soil_moisture_sum / soil_observation_count if soil_observation_count > 0 else 50.0
	)
	avg_soil_ph = soil_ph_sum / soil_observation_count if soil_observation_count > 0 else 6.8

	task_scores = grade_all(
	total_reward=total_reward,
	total_yield=total_yield,
	total_fertilizer=total_fertilizer,
	total_pesticide=total_pesticide,
	total_steps=total_steps,
	avg_soil_moisture=avg_soil_moisture,
	avg_soil_ph=avg_soil_ph,
	)

	task_result = task_scores.get(task_id, {"score": 0.001})
	try:
	task_score = clamp_score(float(task_result.get("score", 0.001)))
	except Exception:
	task_score = 0.001

	success = task_score >= SUCCESS_SCORE_THRESHOLD
	log_end(success=success, steps=total_steps, score=task_score, rewards=rewards)

	if llm_attempts_total == 0:
	raise RuntimeError("No LLM calls were attempted during inference.")

	print(
	f"[INFO] llm_calls attempts={llm_attempts_total} successes={llm_successes_total} failures={llm_failures_total}",
	flush=True,
	)


	def main() -> int:
	try:
	run_inference()
	except Exception as exc:
	fatal_error = re.sub(
	r"\s+",
	" ",
	f"{exc.__class__.__name__}:{exc}",
	).strip()
	print(f"[FATAL] error={fatal_error}", flush=True)
	log_end(success=False, steps=0, score=0.001, rewards=[])
	return 1
	return 0


	if __name__ == "__main__":
	raise SystemExit(main())