# data-cleaning-openenv / inference.py
# Author: Manas281 — "Update inference.py" (commit b871adb, verified)
"""
inference.py β€” OpenEnv submission file
"""
import os, json, sys
from openai import OpenAI
from data_cleaning_env import DataCleaningEnvironment, CleaningAction
# ── Config ────────────────────────────────────────────────────────────────────
# Endpoint and model are overridable via environment variables; the defaults
# target Groq's OpenAI-compatible API.
API_BASE_URL = os.getenv("API_BASE_URL", "https://api.groq.com/openai/v1")
MODEL_NAME = os.getenv("MODEL_NAME", "openai/gpt-oss-120b") # Groq model name
# NOTE(review): HF_TOKEN is passed straight through as the API key for the
# endpoint above — confirm the deployment injects the right credential here.
HF_TOKEN = os.getenv("HF_TOKEN")
if HF_TOKEN is None:
    raise ValueError("HF_TOKEN environment variable is required")
client = OpenAI(base_url=API_BASE_URL, api_key=HF_TOKEN)
# System prompt pins the model's reply to a bare JSON action object so that
# parse_llm_response can decode it without markdown stripping heroics.
SYSTEM_PROMPT = (
    "You are a data cleaning expert. "
    "Respond ONLY with a valid JSON object, no markdown, no explanation.\n"
    'Format: {"action_type": "<remove_nulls|fix_dates|remove_outliers>", "column": "<col_or_null>"}'
)
# Task id → human-readable task name, used only for log lines.
TASK_NAMES = {1: "remove_nulls", 2: "fix_dates", 3: "remove_outliers"}
ENV_NAME = "data_cleaning"
def parse_llm_response(text: str, task_id: int) -> CleaningAction:
    """Parse the LLM's reply into a CleaningAction.

    Strips markdown code fences, then parses only the outermost ``{...}``
    span so that replies wrapped in extra prose still decode (the original
    fed the whole reply to ``json.loads`` and fell back to keyword guessing
    whenever any prose surrounded the JSON). Unknown action types are
    normalized to ``"remove_nulls"``; on a total parse failure, keyword
    heuristics pick a plausible action.

    Args:
        text: Raw assistant message content.
        task_id: Task id to stamp onto the returned action.

    Returns:
        A CleaningAction; never raises on malformed input.
    """
    text = text.strip().replace("```json", "").replace("```", "").strip()
    # Tolerate prose around the JSON: decode only the outermost {...} span.
    start, end = text.find("{"), text.rfind("}")
    candidate = text[start:end + 1] if start != -1 and end > start else text
    try:
        data = json.loads(candidate)
        if not isinstance(data, dict):
            # e.g. a bare string or list — original code would have hit an
            # AttributeError on .get; treat it as a parse failure instead.
            raise ValueError("expected a JSON object")
        action_type = data.get("action_type", "remove_nulls")
        if action_type not in ("remove_nulls", "fix_dates", "remove_outliers"):
            action_type = "remove_nulls"
        return CleaningAction(
            task_id=task_id,
            action_type=action_type,
            column=data.get("column"),
        )
    except (ValueError, TypeError):
        # json.JSONDecodeError subclasses ValueError. Keyword fallback:
        lowered = text.lower()
        if "date" in lowered:
            return CleaningAction(task_id=task_id, action_type="fix_dates", column="hire_date")
        if "outlier" in lowered:
            return CleaningAction(task_id=task_id, action_type="remove_outliers", column="all")
        return CleaningAction(task_id=task_id, action_type="remove_nulls")
def heuristic_action(task_id: int, obs) -> CleaningAction:
    """Rule-based fallback: choose an action from the observed issue counts.

    Priority order: remove nulls first, then fix malformed dates, and only
    then sweep outliers across all columns.
    """
    if obs.null_count > 0:
        return CleaningAction(task_id=task_id, action_type="remove_nulls")
    if obs.date_format_errors > 0:
        return CleaningAction(task_id=task_id, action_type="fix_dates", column="hire_date")
    return CleaningAction(task_id=task_id, action_type="remove_outliers", column="all")
def run_episode(task_id: int, seed: int):
    """Run a single environment episode for one task.

    Tries the LLM first; if the API call or parsing raises, falls back to
    the local heuristic so the episode always produces an action.

    Args:
        task_id: Which cleaning task (1..3) to run.
        seed: Environment seed for this episode.

    Returns:
        Tuple of (reward, action_str, done, error_str); ``error_str`` is
        ``"null"`` unless the LLM call failed.
    """
    env = DataCleaningEnvironment(task_id=task_id, seed=seed)
    try:
        obs = env.reset()
        error_str = "null"
        action = None
        user_msg = (
            f"Task {task_id}: {obs.task_description}\n"
            f"Nulls: {obs.null_count}, Date errors: {obs.date_format_errors}, "
            f"Outliers: {obs.outlier_count}\n"
            f"Preview:\n{obs.dataset_preview}\n"
            f"Respond with JSON only."
        )
        # ── Primary: LLM via OpenAI client ───────────────────────────────────
        try:
            resp = client.chat.completions.create(
                model=MODEL_NAME,
                messages=[
                    {"role": "system", "content": SYSTEM_PROMPT},
                    {"role": "user", "content": user_msg},
                ],
                max_tokens=100,
                temperature=0.1,
            )
            action = parse_llm_response(resp.choices[0].message.content, task_id)
        except Exception as e:
            # Best-effort: record the failure and fall through to the heuristic.
            error_str = str(e).replace("\n", " ")
        # ── Fallback: heuristic if LLM failed ────────────────────────────────
        if action is None:
            action = heuristic_action(task_id, obs)
        col = action.column if action.column else "null"
        action_str = f"{action.action_type}('{col}')"
        _, reward, done, _ = env.step(action)
        return float(reward), action_str, bool(done), error_str
    finally:
        # Original only closed the env on the success path; close it even when
        # reset()/step() raises so episodes don't leak environment resources.
        if hasattr(env, "close"):
            env.close()
def main():
    """Run N_EPISODES episodes for each of the three tasks and write scores.json.

    Each task's score is its mean episode reward, clamped to [0, 1]. A task
    that raises mid-run no longer aborts the whole submission: the exception
    is logged, a partial score is salvaged from completed episodes, and the
    remaining tasks still run so scores.json is always written (the original
    had no ``except`` clause, so one failing episode killed the entire run).
    """
    all_results = {}
    n_episodes = int(os.getenv("N_EPISODES", "10"))
    for task_id in [1, 2, 3]:
        task_name = TASK_NAMES[task_id]
        print(f"[START] task={task_name} env={ENV_NAME} model={MODEL_NAME}", flush=True)
        episode_rewards = []
        success = False
        score = 0.0
        try:
            for seed in range(n_episodes):
                reward, action_str, done, error_str = run_episode(task_id, seed)
                episode_rewards.append(reward)
                print(
                    f"[STEP] step={seed + 1} action={action_str} "
                    f"reward={reward:.2f} done={str(done).lower()} error={error_str}",
                    flush=True,
                )
            score = sum(episode_rewards) / len(episode_rewards)
            score = round(min(max(score, 0.0), 1.0), 2)
            all_results[task_id] = score
            success = score > 0.0
        except Exception as e:
            # Salvage a partial score from completed episodes and keep going.
            print(f"[ERROR] task={task_name} {str(e)}".replace("\n", " "), flush=True)
            if episode_rewards:
                score = round(min(max(sum(episode_rewards) / len(episode_rewards), 0.0), 1.0), 2)
            all_results[task_id] = score
            success = score > 0.0
        finally:
            rewards_str = ",".join(f"{r:.2f}" for r in episode_rewards)
            # ── [END] with score= field as required ──────────────────────────
            print(
                f"[END] success={str(success).lower()} "
                f"steps={len(episode_rewards)} "
                f"score={score:.2f} "
                f"rewards={rewards_str}",
                flush=True,
            )
    overall = round(sum(all_results.values()) / max(len(all_results), 1), 4)
    with open("scores.json", "w") as f:
        json.dump({"tasks": all_results, "overall": overall}, f, indent=2)
    print(f"[SUMMARY] overall_score={overall} task_scores={all_results}", flush=True)
if __name__ == "__main__":
    main()