Spaces:

GambitFlow
/

Nexus-Nano-Inference-api

Sleeping

App Files Files Community

Nexus-Nano-Inference-api / app.py

Rafs-an09002

Update app.py

d03718f verified about 2 months ago

raw

history blame

9.14 kB

	"""
	Nexus-Nano Inference API - Path Fixed
	Model: /app/models/nexus-nano.onnx
	Ultra-lightweight single-file engine
	"""

	from fastapi import FastAPI, HTTPException
	from fastapi.middleware.cors import CORSMiddleware
	from pydantic import BaseModel, Field
	import onnxruntime as ort
	import numpy as np
	import chess
	import time
	import logging
	import os
	from typing import Optional, Tuple

	logging.basicConfig(
	level=logging.INFO,
	format='%(asctime)s - %(levelname)s - %(message)s'
	)
	logger = logging.getLogger(__name__)

	# ==================== NANO ENGINE ====================

	class NexusNanoEngine:
	"""Ultra-lightweight chess engine"""

	PIECE_VALUES = {
	chess.PAWN: 1, chess.KNIGHT: 3, chess.BISHOP: 3,
	chess.ROOK: 5, chess.QUEEN: 9, chess.KING: 0
	}

	def __init__(self, model_path: str):
	if not os.path.exists(model_path):
	raise FileNotFoundError(f"Model not found: {model_path}")

	logger.info(f"📦 Loading model: {model_path}")
	logger.info(f"💾 Size: {os.path.getsize(model_path)/(1024*1024):.2f} MB")

	sess_options = ort.SessionOptions()
	sess_options.intra_op_num_threads = 2
	sess_options.graph_optimization_level = ort.GraphOptimizationLevel.ORT_ENABLE_ALL

	self.session = ort.InferenceSession(
	model_path,
	sess_options=sess_options,
	providers=['CPUExecutionProvider']
	)

	self.input_name = self.session.get_inputs()[0].name
	self.output_name = self.session.get_outputs()[0].name
	self.nodes = 0

	logger.info("✅ Engine ready!")

	def fen_to_tensor(self, fen: str) -> np.ndarray:
	board = chess.Board(fen)
	tensor = np.zeros((1, 12, 8, 8), dtype=np.float32)

	piece_map = {
	chess.PAWN: 0, chess.KNIGHT: 1, chess.BISHOP: 2,
	chess.ROOK: 3, chess.QUEEN: 4, chess.KING: 5
	}

	for sq, piece in board.piece_map().items():
	r, f = divmod(sq, 8)
	ch = piece_map[piece.piece_type] + (6 if piece.color == chess.BLACK else 0)
	tensor[0, ch, r, f] = 1.0

	return tensor

	def evaluate(self, board: chess.Board) -> float:
	self.nodes += 1
	tensor = self.fen_to_tensor(board.fen())
	output = self.session.run([self.output_name], {self.input_name: tensor})
	score = float(output[0][0][0]) * 400.0
	return -score if board.turn == chess.BLACK else score

	def order_moves(self, board: chess.Board, moves):
	scored = []
	for m in moves:
	s = 0
	if board.is_capture(m):
	v = board.piece_at(m.to_square)
	a = board.piece_at(m.from_square)
	if v and a:
	s = self.PIECE_VALUES.get(v.piece_type, 0) * 10
	s -= self.PIECE_VALUES.get(a.piece_type, 0)
	if m.promotion == chess.QUEEN:
	s += 90
	scored.append((s, m))
	scored.sort(key=lambda x: x[0], reverse=True)
	return [m for _, m in scored]

	def alpha_beta(
	self,
	board: chess.Board,
	depth: int,
	alpha: float,
	beta: float
	) -> Tuple[float, Optional[chess.Move]]:

	if board.is_game_over():
	return (-10000 if board.is_checkmate() else 0), None

	if depth == 0:
	return self.evaluate(board), None

	moves = list(board.legal_moves)
	if not moves:
	return 0, None

	moves = self.order_moves(board, moves)

	best_move = moves[0]
	best_score = float('-inf')

	for move in moves:
	board.push(move)
	score, _ = self.alpha_beta(board, depth - 1, -beta, -alpha)
	score = -score
	board.pop()

	if score > best_score:
	best_score = score
	best_move = move

	alpha = max(alpha, score)
	if alpha >= beta:
	break

	return best_score, best_move

	def search(self, fen: str, depth: int = 3):
	board = chess.Board(fen)
	self.nodes = 0

	moves = list(board.legal_moves)
	if len(moves) == 0:
	return {'best_move': '0000', 'evaluation': 0.0, 'nodes': 0, 'depth': 0}

	if len(moves) == 1:
	return {
	'best_move': moves[0].uci(),
	'evaluation': round(self.evaluate(board) / 100.0, 2),
	'nodes': 1,
	'depth': 0
	}

	best_move = moves[0]
	best_score = float('-inf')
	current_depth = 1

	for d in range(1, depth + 1):
	try:
	score, move = self.alpha_beta(board, d, float('-inf'), float('inf'))
	if move:
	best_move = move
	best_score = score
	current_depth = d
	except:
	break

	return {
	'best_move': best_move.uci(),
	'evaluation': round(best_score / 100.0, 2),
	'depth': current_depth,
	'nodes': self.nodes
	}


	# ==================== FASTAPI APP ====================

	app = FastAPI(
	title="Nexus-Nano Inference API",
	description="Ultra-lightweight chess engine",
	version="1.0.0"
	)

	app.add_middleware(
	CORSMiddleware,
	allow_origins=["*"],
	allow_credentials=True,
	allow_methods=["*"],
	allow_headers=["*"],
	)

	engine = None


	class MoveRequest(BaseModel):
	fen: str
	depth: Optional[int] = Field(3, ge=1, le=5)


	class MoveResponse(BaseModel):
	best_move: str
	evaluation: float
	depth_searched: int
	nodes_evaluated: int
	time_taken: int


	@app.on_event("startup")
	async def startup():
	global engine
	logger.info("🚀 Starting Nexus-Nano API...")

	# FIXED: Correct path with hyphen
	model_path = "/app/models/nexus-nano.onnx"

	logger.info(f"🔍 Looking for: {model_path}")

	if os.path.exists("/app/models"):
	logger.info("📂 Files in /app/models/:")
	for f in os.listdir("/app/models"):
	full_path = os.path.join("/app/models", f)
	if os.path.isfile(full_path):
	size = os.path.getsize(full_path) / (1024*1024)
	logger.info(f" ✓ {f} ({size:.2f} MB)")
	else:
	logger.error("❌ /app/models/ not found!")
	raise FileNotFoundError("/app/models/ directory missing")

	if not os.path.exists(model_path):
	logger.error(f"❌ Model not found: {model_path}")
	logger.error("💡 Available:", os.listdir("/app/models"))
	raise FileNotFoundError(f"Missing: {model_path}")

	try:
	engine = NexusNanoEngine(model_path)
	logger.info("🎉 Nexus-Nano ready!")
	except Exception as e:
	logger.error(f"❌ Load failed: {e}", exc_info=True)
	raise


	@app.get("/health")
	async def health():
	return {
	"status": "healthy" if engine else "unhealthy",
	"model": "nexus-nano",
	"version": "1.0.0",
	"model_loaded": engine is not None,
	"model_path": "/app/models/nexus-nano.onnx"
	}


	@app.post("/get-move", response_model=MoveResponse)
	async def get_move(req: MoveRequest):
	if not engine:
	raise HTTPException(status_code=503, detail="Engine not loaded")

	try:
	chess.Board(req.fen)
	except:
	raise HTTPException(status_code=400, detail="Invalid FEN")

	start = time.time()

	try:
	result = engine.search(req.fen, req.depth)
	elapsed = int((time.time() - start) * 1000)

	logger.info(
	f"✓ Move: {result['best_move']} \| "
	f"Eval: {result['evaluation']:+.2f} \| "
	f"Depth: {result['depth']} \| "
	f"Nodes: {result['nodes']} \| "
	f"Time: {elapsed}ms"
	)

	return MoveResponse(
	best_move=result['best_move'],
	evaluation=result['evaluation'],
	depth_searched=result['depth'],
	nodes_evaluated=result['nodes'],
	time_taken=elapsed
	)

	except Exception as e:
	logger.error(f"❌ Search error: {e}", exc_info=True)
	raise HTTPException(status_code=500, detail=str(e))


	@app.get("/")
	async def root():
	return {
	"name": "Nexus-Nano Inference API",
	"version": "1.0.0",
	"model": "2.8M parameters",
	"architecture": "Compact ResNet",
	"speed": "0.2-0.5s per move @ depth 3",
	"status": "online" if engine else "starting",
	"endpoints": {
	"POST /get-move": "Get best move",
	"GET /health": "Health check",
	"GET /docs": "API docs"
	}
	}


	if __name__ == "__main__":
	import uvicorn
	uvicorn.run(
	app,
	host="0.0.0.0",
	port=7860,
	log_level="info",
	access_log=True
	)