# Hugging Face Space: eaglelandsonce — "Update app.py" (commit 35ce27f, verified)
import gradio as gr
import numpy as np
import onnxruntime as ort
from pathlib import Path
import traceback
MODEL_PATH = Path("model.onnx")
# Lazy-load so the Space doesn't crash on startup if model is missing
_SESSION = None
_INPUT_NAME = None
def load_session():
global _SESSION, _INPUT_NAME
if _SESSION is not None:
return _SESSION, _INPUT_NAME
if not MODEL_PATH.exists():
raise FileNotFoundError(
"model.onnx not found in the Space root.\n"
"Upload your ONNX model to the Space and name it exactly: model.onnx"
)
# CPU provider is most compatible on Spaces
sess = ort.InferenceSession(str(MODEL_PATH), providers=["CPUExecutionProvider"])
inp_name = sess.get_inputs()[0].name
_SESSION = sess
_INPUT_NAME = inp_name
return _SESSION, _INPUT_NAME
def predict_5(ret_1, ret_5, sma_ratio, rsi, vol):
"""
For your stock-signal wrapper ONNX that expects RAW features in this order:
[ret_1, ret_5, sma_ratio, rsi, vol]
Output is p_up (probability-like) if you exported with sigmoid in the wrapper.
"""
try:
sess, inp_name = load_session()
x = np.array([[ret_1, ret_5, sma_ratio, rsi, vol]], dtype=np.float32)
y = sess.run(None, {inp_name: x})[0]
p_up = float(np.array(y).reshape(-1)[0])
# Optional simple signal thresholds for display
if p_up >= 0.55:
signal = "BUY (signal)"
elif p_up <= 0.45:
signal = "SELL (signal)"
else:
signal = "HOLD (signal)"
details = {
"input_order": ["ret_1", "ret_5", "sma_ratio", "rsi", "vol"],
"p_up": p_up,
"signal": signal,
}
return p_up, signal, details, "OK"
except Exception:
return None, None, None, traceback.format_exc()
def predict_vector(vector_text: str):
"""
Generic mode if you want to paste a vector:
"0.001, 0.01, 0.02, 55, 0.012"
"""
try:
sess, inp_name = load_session()
parts = [p for p in vector_text.replace(",", " ").split() if p.strip()]
vals = [float(p) for p in parts]
x = np.array([vals], dtype=np.float32)
y = sess.run(None, {inp_name: x})[0]
out = np.array(y).reshape(-1)
return float(out[0]), out.tolist(), "OK"
except Exception:
return None, None, traceback.format_exc()
with gr.Blocks(title="ONNX Inference (model.onnx)") as demo:
gr.Markdown(
"""
# ONNX Inference (Hugging Face Space)
**How to use:**
1. Upload your ONNX model file into the Space repo root and name it **`model.onnx`**
2. Use the **5-Feature Input** tab (recommended) or the **Vector Input** tab.
This Space runs ONNX Runtime on CPU for maximum compatibility.
"""
)
with gr.Tab("5-Feature Input (recommended)"):
with gr.Row():
ret_1 = gr.Number(label="ret_1", value=0.001)
ret_5 = gr.Number(label="ret_5", value=0.01)
sma_ratio = gr.Number(label="sma_ratio", value=0.02)
rsi = gr.Number(label="rsi", value=55.0)
vol = gr.Number(label="vol", value=0.012)
run_btn = gr.Button("Run inference", variant="primary")
p_out = gr.Number(label="p_up (model output)")
signal_out = gr.Textbox(label="Signal (optional thresholds)", lines=1)
details_out = gr.JSON(label="Details")
status_out = gr.Textbox(label="Status / Error", lines=10)
run_btn.click(
fn=predict_5,
inputs=[ret_1, ret_5, sma_ratio, rsi, vol],
outputs=[p_out, signal_out, details_out, status_out],
)
with gr.Tab("Vector Input (any shape)"):
vector_text = gr.Textbox(
label="Input vector (comma or space separated)",
value="0.001, 0.01, 0.02, 55.0, 0.012",
)
run_btn2 = gr.Button("Run inference (vector)", variant="primary")
first_out = gr.Number(label="First output value")
full_out = gr.JSON(label="Full output array")
status_out2 = gr.Textbox(label="Status / Error", lines=10)
run_btn2.click(
fn=predict_vector,
inputs=[vector_text],
outputs=[first_out, full_out, status_out2],
)
if __name__ == "__main__":
demo.launch()