Spaces:

mg643
/

offrails

Sleeping

updated requirements, created docker file for HF deployment, modified lifespan to load model, stopped tracking joblib files

83a4e77 about 2 months ago

raw

history blame contribute delete

3.91 kB

	"""
	Agent Trace Anomaly Detection — FastAPI Backend

	This is the API layer that wraps the ML pipeline built in scripts/.
	All model training, feature extraction, and inference logic lives
	in the partner's code (scripts/inference.py). This file just serves it.

	Run from the OffRails project root:
	uvicorn app.main:app --reload --host 0.0.0.0 --port 8000

	Interactive docs:
	http://localhost:8000/docs
	"""

	from __future__ import annotations

	import os
	import sys
	import logging

	from fastapi import FastAPI
	from fastapi.middleware.cors import CORSMiddleware

	from contextlib import asynccontextmanager

	# ── Make partner's scripts/ importable ───────────────────────────────────────
	# inference.py does `from model import ...` and `from build_features import ...`
	# so scripts/ must be on sys.path. SCRIPTS_DIR is the "scripts" folder that
	# sits beside this file's parent directory.
	SCRIPTS_DIR = os.path.join(
	    os.path.dirname(os.path.dirname(os.path.abspath(__file__))),
	    "scripts",
	)
	if SCRIPTS_DIR not in sys.path:
	    sys.path.insert(0, SCRIPTS_DIR)

	# Import everything from app.api.routes in one place, and only AFTER the path
	# tweak above: the first import of that module is the one that executes it, so
	# importing `_state` earlier would run it without scripts/ on sys.path.
	from app.api.routes import _state, router

	# ── Logging ──────────────────────────────────────────────────────────────────

	# Root logging configuration: INFO and above, with a time-of-day stamp,
	# a padded level name, the logger name and the message.
	_LOG_FORMAT = "%(asctime)s %(levelname)-8s %(name)s — %(message)s"
	_LOG_DATE_FORMAT = "%H:%M:%S"

	logging.basicConfig(
	    datefmt=_LOG_DATE_FORMAT,
	    format=_LOG_FORMAT,
	    level=logging.INFO,
	)

	# Module-level logger, named after this module.
	logger = logging.getLogger(__name__)

	# ── App ──────────────────────────────────────────────────────────────────────

	@asynccontextmanager
	async def lifespan(app: FastAPI):
	    """Try to preload the XGBoost detector at startup, then run the app.

	    Downloads ``xgboost_model.joblib`` from the ``mg643/offrails-models`` Hub
	    repository, builds a ``TraceAnomalyDetector`` from the directory holding
	    the downloaded file, and stores it in the shared ``_state`` dict under
	    ``"detector"`` (with ``"model_type"`` set to ``"xgboost"``).

	    Loading is best-effort: any ``Exception`` raised while importing the
	    optional dependencies, downloading, or constructing the detector is
	    logged as a warning and the application still starts.

	    Args:
	        app: The FastAPI application instance (not used by this function).

	    Yields:
	        None. Nothing is done after the yield.
	    """
	    try:
	        # Lazy imports live inside the try so that a missing or broken
	        # dependency degrades to the same warning as a failed download
	        # instead of aborting startup.
	        from huggingface_hub import hf_hub_download
	        from scripts.inference import TraceAnomalyDetector

	        model_path = hf_hub_download(
	            repo_id="mg643/offrails-models",
	            filename="xgboost_model.joblib",
	        )
	        # The detector is given the directory that contains the download.
	        _state["detector"] = TraceAnomalyDetector(
	            model_dir=os.path.dirname(model_path),
	            model_type="xgboost",
	        )
	        _state["model_type"] = "xgboost"
	        logger.info("XGBoost model loaded from HF Hub")
	    except Exception as e:
	        # Deliberately broad: startup must not fail because of the model.
	        # exc_info keeps the traceback so the root cause is still visible.
	        logger.warning("Could not load model: %s", e, exc_info=True)
	    yield

	# Markdown shown on the interactive docs page; one entry per output line
	# (the final empty entry yields the trailing newline).
	_API_DESCRIPTION = "\n".join(
	    [
	        "Detects anomalous agent execution traces — unnecessary tool calls, "
	        "circular reasoning, and goal drift.",
	        "",
	        "ML models (XGBoost, DistilBERT) are trained via the pipeline in `scripts/`.",
	        "This API serves predictions from those trained models.",
	        "",
	        "## Workflow",
	        "1. Train models: `python setup.py` (or `POST /pipeline/train`)",
	        "2. Load a model: `POST /models/load`",
	        "3. Predict: `POST /predict`",
	        "4. Compare models: `POST /predict/compare`",
	        "",
	    ]
	)

	# The application object; `lifespan` runs its startup logic before serving.
	app = FastAPI(
	    title="Agent Trace Anomaly Detection API",
	    description=_API_DESCRIPTION,
	    version="1.0.0",
	    lifespan=lifespan,
	)

	# Allow Gradio / any frontend to call the API: every origin, method and
	# header is accepted, and credentials are enabled.
	# NOTE(review): the FastAPI CORS docs advise against combining wildcard
	# origins with allow_credentials=True — confirm credentials are needed.
	_CORS_OPTIONS = {
	    "allow_origins": ["*"],
	    "allow_credentials": True,
	    "allow_methods": ["*"],
	    "allow_headers": ["*"],
	}
	app.add_middleware(CORSMiddleware, **_CORS_OPTIONS)

	# Register the endpoints exposed by the router from app.api.routes.
	app.include_router(router)


	# ── Root ─────────────────────────────────────────────────────────────────────

	@app.get("/", include_in_schema=False)
	def root():
	    """Return a short service descriptor for the bare ``/`` URL.

	    The route is hidden from the generated schema. The response names the
	    service, points at the docs path and lists the usage steps in order.
	    """
	    workflow_steps = [
	        "1. Train models: python setup.py",
	        "2. POST /models/load (load xgboost or distilbert)",
	        "3. POST /predict (classify a trace)",
	        "4. POST /predict/compare (run both models)",
	    ]
	    info = {"service": "Agent Trace Anomaly Detection API"}
	    info["docs"] = "/docs"
	    info["workflow"] = workflow_steps
	    return info