Spaces:
Sleeping
Sleeping
| #!/usr/bin/env python3 | |
| """OpenAI-compatible Chat Completions API server for the Fourth GPT model.""" | |
| import time | |
| import uuid | |
| import json | |
| import os | |
| from fastapi import FastAPI, HTTPException, Header | |
| from fastapi.middleware.cors import CORSMiddleware | |
| from pydantic import BaseModel | |
| from typing import Optional | |
| from model import FourthModel | |
# Application singleton plus the model it serves.
app = FastAPI(title="Fourth GPT API", version="1.0.0")

# Wide-open CORS so browser clients on any origin can call the API.
app.add_middleware(
    CORSMiddleware,
    allow_origins=["*"],
    allow_methods=["*"],
    allow_headers=["*"],
)

# Single shared model instance; weights are loaded at startup, not here.
fourth = FourthModel()
class Message(BaseModel):
    """One chat turn: a role ("user"/"assistant"/...) and its text content."""

    role: str
    content: str
class ChatCompletionRequest(BaseModel):
    """Request body for POST /v1/chat/completions (OpenAI-compatible subset)."""

    model: str = "fourth-gpt"
    messages: list[Message]
    max_tokens: int = 128
    temperature: float = 0.5
    stream: bool = False
class Choice(BaseModel):
    """A single completion candidate; this server always returns exactly one."""

    index: int = 0
    message: Message
    finish_reason: str = "stop"
class Usage(BaseModel):
    """Token accounting mirrored from the OpenAI response schema."""

    prompt_tokens: int
    completion_tokens: int
    total_tokens: int
class ChatCompletionResponse(BaseModel):
    """Top-level response body, shaped like OpenAI's chat.completion object."""

    id: str
    object: str = "chat.completion"
    created: int
    model: str
    choices: list[Choice]
    usage: Usage
class ModelInfo(BaseModel):
    """One entry in the /v1/models listing."""

    id: str
    object: str = "model"
    created: int = 0
    owned_by: str = "fourth"
class ModelList(BaseModel):
    """Envelope for the model listing, matching OpenAI's list shape."""

    object: str = "list"
    data: list[ModelInfo]
@app.on_event("startup")
def startup():
    """Load model weights once when the server starts.

    NOTE(review): the decorator was missing in the reviewed copy, so the
    model was never loaded — restored here. Without it every request would
    hit an unloaded model.
    """
    fourth.load()
@app.get("/")
def root():
    """Liveness/info endpoint for the root path.

    NOTE(review): route decorator restored — without it this handler was
    never registered and GET / returned 404.
    """
    return {"message": "Fourth GPT API is running", "model": "fourth-gpt", "params": 344256}
@app.get("/v1/models")
def list_models() -> ModelList:
    """List available models (OpenAI-compatible /v1/models).

    NOTE(review): route decorator restored — handler was not registered in
    the reviewed copy.
    """
    return ModelList(data=[
        ModelInfo(id="fourth-gpt", created=int(time.time())),
    ])
@app.get("/v1/models/{model_id}")
def get_model(model_id: str) -> ModelInfo:
    """Fetch a single model's metadata; 404 for any id other than fourth-gpt.

    NOTE(review): route decorator restored — handler was not registered in
    the reviewed copy.
    """
    if model_id != "fourth-gpt":
        raise HTTPException(status_code=404, detail="Model not found")
    return ModelInfo(id="fourth-gpt", created=int(time.time()))
@app.post("/v1/chat/completions")
def chat_completions(
    req: ChatCompletionRequest,
    authorization: Optional[str] = Header(None),
) -> ChatCompletionResponse:
    """OpenAI-compatible chat completion.

    Generates a reply to the most recent user message only (earlier turns
    and system messages are ignored by this server).

    Raises:
        HTTPException 400: empty ``messages``, no user message, or
            ``stream=True`` (this server does not implement SSE streaming,
            so silently returning a non-stream body would break streaming
            clients — fail loudly instead).

    NOTE(review): the route decorator was missing in the reviewed copy and
    has been restored.
    """
    if not req.messages:
        raise HTTPException(status_code=400, detail="messages must not be empty")
    if req.stream:
        raise HTTPException(status_code=400, detail="stream=true is not supported by this server")

    # Walk backwards to find the latest user turn.
    user_msg = None
    for msg in reversed(req.messages):
        if msg.role == "user":
            user_msg = msg.content
            break
    if user_msg is None:
        raise HTTPException(status_code=400, detail="No user message found")

    response_text = fourth.generate(
        prompt=user_msg,
        max_tokens=req.max_tokens,
        temperature=req.temperature,
    )

    # Character counts stand in for token counts — a crude proxy; exact
    # usage would require the model's tokenizer. TODO confirm acceptable.
    prompt_tokens = len(user_msg)
    completion_tokens = len(response_text)

    return ChatCompletionResponse(
        id=f"chatcmpl-{uuid.uuid4().hex[:12]}",
        created=int(time.time()),
        model=req.model,
        choices=[
            Choice(
                message=Message(role="assistant", content=response_text),
            )
        ],
        usage=Usage(
            prompt_tokens=prompt_tokens,
            completion_tokens=completion_tokens,
            total_tokens=prompt_tokens + completion_tokens,
        ),
    )
@app.get("/health")
def health():
    """Health probe: reports whether model weights have been loaded.

    NOTE(review): route decorator restored — handler was not registered in
    the reviewed copy.
    """
    return {"status": "ok", "model_loaded": fourth.model is not None}
if __name__ == "__main__":
    # Local/dev entry point; PORT env var overrides the default (7860 is
    # the Hugging Face Spaces convention).
    import uvicorn

    listen_port = int(os.environ.get("PORT", 7860))
    uvicorn.run(app, host="0.0.0.0", port=listen_port)