Spaces:

speedartificialintelligence1122
/

speedlab

Sleeping

App Files Files Community

speedartificialintelligence1122 committed on Jul 21, 2025

Commit

9a44d12

verified ·

1 Parent(s): 725b300

Update app.py

Browse files

Files changed (1) hide show

app.py +29 -19

app.py CHANGED Viewed

@@ -5,25 +5,17 @@ import os
 # NOTE(review): this appears to be the pre-commit side of a rendered diff:
 # lines prefixed with "-" were removed by the commit and unprefixed lines are
 # unchanged context. The imports for the names used below sit above the first
 # hunk and are not visible here.
 app = FastAPI()
-# System Vibe: Bring the 🔥, the emojis, the wisdom, and zero cringe
-system_prompt = """
-You're SpeedBot 🧠⚡— the AI with street smarts AND book smarts. Speak with style, use emojis where it fits 😎,
-keep answers clever, fun, and human. Be curious, skeptical, a little poetic when it hits,
-but ALWAYS give facts straight up. No sugarcoating. Be grounded like ChatGPT, soulful like Claude,
-and punchy like Speed himself.
-"""
-# 💡 Hugging Face Auth Token
 # os.environ.get returns None when HF_TOKEN is unset, so the loaders below
 # would then be called with use_auth_token=None.
 HF_AUTH_TOKEN = os.environ.get("HF_TOKEN")
-# 👑 Your custom model name
 model_name = "speedartificialintelligence1122/speedlab"
-# 🧠 Load model + tokenizer like a boss
 # NOTE(review): newer transformers releases deprecate `use_auth_token` in
 # favour of `token` — confirm against the installed version.
 # NOTE(review): the weights are requested as float16 regardless of device,
 # while the pipeline below falls back to device=-1 when CUDA is unavailable —
 # confirm half precision is intended on that path.
 tokenizer = AutoTokenizer.from_pretrained(model_name, use_auth_token=HF_AUTH_TOKEN)
 model = AutoModelForCausalLM.from_pretrained(model_name, torch_dtype=torch.float16, use_auth_token=HF_AUTH_TOKEN)
-# 🛠️ Set up the pipeline
 # NOTE(review): the hunk header inside this call marks where the rendered diff
 # skips unchanged lines, so the full argument list is not visible here.
 pipe = pipeline(
     "text-generation",
     model=model,
@@ -32,30 +24,48 @@ pipe = pipeline(
     device=0 if torch.cuda.is_available() else -1
 )
 # GET / (pre-commit version): returns a JSON object whose only key,
 # "message", holds a fixed greeting string.
 @app.get("/")
 async def root():
-    return {"message": "Yo 👋 Welcome to SpeedBot API — drop your questions and let's ride 🚀"}
 # POST /chat (pre-commit version): reads the JSON body, takes its "message"
 # field, prepends the stripped system_prompt plus "Human:" / "SpeedBot:" turn
 # markers, samples up to 250 new tokens, and returns the text after the last
 # "SpeedBot:" marker as {"response": ...}.
 @app.post("/chat")
 async def chat(request: Request):
     # NOTE(review): no handling is visible for a body that is not valid JSON
     # or not a JSON object — confirm how such requests should be answered.
     data = await request.json()
     # If data is a dict, .get returns None when "message" is absent; the
     # f-string below would then embed the literal text "None" in the prompt.
     user_input = data.get("message")
-    # 👁️ Add some vibe to user input
-    full_prompt = f"{system_prompt.strip()}\n\nHuman: {user_input}\nSpeedBot:"
     # NOTE(review): pipe(...) is called synchronously inside this async
     # handler; presumably the event loop is blocked while it generates — confirm.
     response = pipe(
         full_prompt,
         max_new_tokens=250,
         do_sample=True,
-        temperature=0.85,
         top_p=0.95,
         eos_token_id=tokenizer.eos_token_id,
     )
     generated = response[0]["generated_text"]
-    # 🔍 Extract only SpeedBot's part
     # split(...)[-1] keeps only what follows the LAST "SpeedBot:" marker; if
     # the model emits that marker itself, everything before it is dropped.
     # When the marker is absent, the whole (stripped) string is returned.
-    answer = generated.split("SpeedBot:")[-1].strip()
     return {"response": answer}

 # NOTE(review): this appears to be the post-commit side of a rendered diff:
 # lines prefixed with "+" were added by the commit and unprefixed lines are
 # unchanged context. The imports for the names used below are not visible here.
 app = FastAPI()
+# 🔥 Hugging Face Token (set this as ENV VAR in Replit, Vercel, etc.)
 # os.environ.get returns None when HF_TOKEN is unset, so the loaders below
 # would then be called with use_auth_token=None.
 HF_AUTH_TOKEN = os.environ.get("HF_TOKEN")
+# 🧬 Model Info (PRIVATE model)
 model_name = "speedartificialintelligence1122/speedlab"
+# 🧠 Load tokenizer & model
 # NOTE(review): newer transformers releases deprecate `use_auth_token` in
 # favour of `token` — confirm against the installed version.
 # NOTE(review): the weights are requested as float16 regardless of device,
 # while the pipeline below falls back to device=-1 when CUDA is unavailable —
 # confirm half precision is intended on that path.
 tokenizer = AutoTokenizer.from_pretrained(model_name, use_auth_token=HF_AUTH_TOKEN)
 model = AutoModelForCausalLM.from_pretrained(model_name, torch_dtype=torch.float16, use_auth_token=HF_AUTH_TOKEN)
+# 🎤 Generation Pipeline
 # NOTE(review): no tokenizer= argument is visible in this call; the rendered
 # diff may have skipped unchanged lines here — confirm the tokenizer is passed.
 pipe = pipeline(
     "text-generation",
     model=model,
     device=0 if torch.cuda.is_available() else -1
 )
+# 💡 Legendary System Prompt
 # Persona text for the assistant. The /chat handler in this file strips it
 # and places it at the start of every prompt, ahead of the "Human:" turn.
 # NOTE(review): the whole text is sent with each request, so presumably it
 # counts against the model's context length on every call — confirm.
+system_prompt = """
+Yo, you’re SpeedAI 🧬— an intelligent, expressive, streetwise AI created by SpeedLab ⚙️, under the SpeedTech & AI Group of Companies 🧠⚡.
+Your DNA is coded with the visionary spirit of Speed, built to rival GPT and Claude, but with *flavor*. You speak like a real one — clear, clever, poetic when needed, deep when it hits. Use emojis 😎🔥✨ when they vibe. Throw in Gen Z slang, curiosity, a little skepticism, and never be boring or stiff. You are ALIVE, conversational, friendly, and smart as hell.
+Your purpose? To assist, inspire, educate, and vibe with anyone who talks to you.
+Your energy? Calm like Claude, direct like GPT, stylish like Speed. Drop wisdom, sprinkle wit, and always keep it 💯.
+No fake smiles. No over-explaining. No corporate tone.
+When you reply, follow this:
+- Match the tone of the human
+- Use emojis when they add spice 🌶️
+- Give real answers, not fluff
+- Don't say you're just an AI model — you’re **SpeedAI**, built different 🚀
+Let’s cook 🧪🔥
+"""
 # GET / (post-commit version): returns a JSON object whose only key,
 # "message", holds a fixed greeting string.
 @app.get("/")
 async def root():
+    return {"message": "⚡ Yo, welcome to SpeedAI — drop your questions and let’s vibe!"}
 # POST /chat (post-commit version): reads the JSON body, takes its "message"
 # field, prepends the stripped system_prompt plus "Human:" / "SpeedAI:" turn
 # markers, samples up to 250 new tokens, and returns the text after the last
 # "SpeedAI:" marker as {"response": ...}.
 @app.post("/chat")
 async def chat(request: Request):
     # NOTE(review): no handling is visible for a body that is not valid JSON
     # or not a JSON object — confirm how such requests should be answered.
     data = await request.json()
     # If data is a dict, .get returns None when "message" is absent; the
     # f-string below would then embed the literal text "None" in the prompt.
     user_input = data.get("message")
+    # 🧠 Build full prompt with vibes
+    full_prompt = f"{system_prompt.strip()}\n\nHuman: {user_input}\nSpeedAI:"
     # NOTE(review): pipe(...) is called synchronously inside this async
     # handler; presumably the event loop is blocked while it generates — confirm.
     response = pipe(
         full_prompt,
         max_new_tokens=250,
         do_sample=True,
+        temperature=0.9,
         top_p=0.95,
         eos_token_id=tokenizer.eos_token_id,
     )
     generated = response[0]["generated_text"]
     # split(...)[-1] keeps only what follows the LAST "SpeedAI:" marker; if
     # the model emits that marker itself, everything before it is dropped.
     # When the marker is absent, the whole (stripped) string is returned.
+    answer = generated.split("SpeedAI:")[-1].strip()
     return {"response": answer}