Spaces:

zeeshan391
/

fast_api_deploy

Sleeping

App Files Files Community

fast_api_deploy / app.py

zeeshan391

updated

357c729 verified over 1 year ago

raw

history blame contribute delete

5.33 kB

	from fastapi import FastAPI, HTTPException
	from pydantic import BaseModel
	from langchain_community.llms import LlamaCpp
	from huggingface_hub.file_download import http_get
	from llama_cpp import Llama
	from langchain_core.callbacks import CallbackManager, StreamingStdOutCallbackHandler
	from langchain_core.prompts import ChatPromptTemplate

	import os
	import fal_client

	# FastAPI app
	app = FastAPI()

	# Set the environment variable
	os.environ['FAL_KEY'] = 'bb79b746-999d-4bec-af22-04fddb05d087:49350e8b76fd8dda0fb9dd8442a9ccf5'

	# Request body model
	class StoryRequest(BaseModel):
	mood: str
	story_type: str
	theme: str
	num_scenes: int
	txt: str

	# Initialize the LLM
	callback_manager = CallbackManager([StreamingStdOutCallbackHandler()])

	def load_model(
	directory: str = ".",
	model_name: str = "natsumura-storytelling-rp-1.0-llama-3.1-8B.Q3_K_M.gguf",
	model_url: str = "https://huggingface.co/tohur/natsumura-storytelling-rp-1.0-llama-3.1-8b-GGUF/resolve/main/natsumura-storytelling-rp-1.0-llama-3.1-8B.Q3_K_M.gguf"
	):
	final_model_path = os.path.join(directory, model_name)

	print("Downloading all files...")
	if not os.path.exists(final_model_path):
	with open(final_model_path, "wb") as f:
	http_get(model_url, f)
	os.chmod(final_model_path, 0o777)
	print("Files downloaded!")

	# model = Llama(
	# model_path=final_model_path,
	# n_ctx=1024
	# )

	# model = LlamaCpp(
	# model_path=final_model_path,
	# temperature=0.3,
	# max_tokens=2000,
	# top_p=1,
	# n_ctx=1024,
	# callback_manager=callback_manager,
	# verbose=True,
	# )

	model = Llama(
	model_path=final_model_path,
	temperature=0.3,
	max_tokens=2000,
	n_ctx=1024,
	top_p=1,
	# n_threads=8,
	echo=False
	)


	print("Model loaded!")
	return model


	llm = load_model()




	# Create a prompt template
	# system = """You are a helpful and creative assistant that specializes in generating engaging and imaginative stories for kids.
	# Based on the user's provided mood, preferred story type, theme, age, and desired story length of 500-600 words, create a unique and captivating story.
	# Always start with Story Title then generate a single story and dont ask for any feedback at the end just sign off with a cute closing inviting the reader
	# to create another adventure soon!
	# """

	system = """You are a helpful and creative assistant that specializes in generating engaging and imaginative short storie for kids.
	Based on the user's provided mood, preferred story type, theme, age, and desired story length of 500-600 words, create a unique and captivating story.
	Always start with Story Title then generate a single story.Storie begin on Page 1(also mention the all pages headings in bold) and end on Page 7.
	Total pages in storie are seven each page have one short paragraph and dont ask for any feedback at the end just sign off with a cute closing inviting the reader
	to create another adventure soon!
	"""

	prompt_template = ChatPromptTemplate.from_messages([("system", system), ("human", "{text}")])

	# FastAPI endpoint to generate the story
	@app.post("/generate_story/")
	async def generate_story(story_request: StoryRequest):
	story = f"""here are the inputs from user:
	- Mood: {story_request.mood}
	- Story Type: {story_request.story_type}
	- Theme: {story_request.theme}
	- Details Provided: {story_request.txt}
	"""

	response = llm.create_chat_completion(
	messages = [
	{"role": "system", "content": system},
	{"role": "user","content": story}
	]
	)

	# final_prompt = prompt_template.format(text=story)

	# # Create the LLMChain
	# # chain = LLMChain(llm=llm, prompt=prompt_template)
	# chain = llm \| prompt_template

	# # try:
	# # response = chain.invoke(final_prompt)
	# # return {"story": response}
	# # except Exception as e:
	# # raise HTTPException(status_code=500, detail=str(e))
	# response = chain.invoke(final_prompt)



	if not response:
	raise HTTPException(status_code=500, detail="Failed to generate the story")

	images = []
	for i in range(story_request.num_scenes):
	# image_prompt = f"Generate an image for Scene {i+1} based on this story: Mood: {story_request.mood}, Story Type: {story_request.story_type}, Theme: {story_request.theme}. Story: {response}"
	image_prompt = (
	f"Generate an image for Scene {i+1}. "
	f"This image should represent the details described in paragraph {i+1} of the story. "
	f"Mood: {story_request.mood}, Story Type: {', '.join(story_request.story_type)}, Theme: {story_request.theme}. "
	f"Story: {response} "
	f"Focus on the key elements in paragraph {i+1}."
	)
	handler = fal_client.submit(
	"fal-ai/flux/schnell",
	arguments={
	"prompt": image_prompt,
	"num_images": 1,
	"enable_safety_checker": True
	},
	)
	result = handler.get()
	image_url = result['images'][0]['url']
	images.append(image_url)

	return {
	"story": response,
	"images": images
	}