Spaces:
Sleeping
Sleeping
Update server.js
Browse files
server.js
CHANGED
|
@@ -51,27 +51,31 @@ async function initModel() {
|
|
| 51 |
----------------------- */
|
| 52 |
|
| 53 |
app.post("/generate", async (req, res) => {
|
| 54 |
-
// 1. Check if the model is still loading in the background
|
| 55 |
if (!isModelReady) {
|
| 56 |
return res.status(503).json({
|
| 57 |
error: "The AI model is still loading into memory. Please wait a few seconds and try again."
|
| 58 |
});
|
| 59 |
}
|
| 60 |
|
|
|
|
|
|
|
| 61 |
try {
|
| 62 |
const {
|
| 63 |
user_input,
|
| 64 |
-
user_temp = 0.
|
| 65 |
-
user_inst = "You are an AI assistant. Give short clear answers.",
|
| 66 |
-
user_max_token =
|
| 67 |
} = req.body;
|
| 68 |
|
| 69 |
if (!user_input) {
|
| 70 |
return res.status(400).json({ error: "Missing required field: user_input" });
|
| 71 |
}
|
| 72 |
|
|
|
|
|
|
|
|
|
|
| 73 |
const session = new LlamaChatSession({
|
| 74 |
-
contextSequence:
|
| 75 |
systemPrompt: user_inst
|
| 76 |
});
|
| 77 |
|
|
@@ -88,6 +92,11 @@ app.post("/generate", async (req, res) => {
|
|
| 88 |
} catch (err) {
|
| 89 |
console.error("Error during generation:", err);
|
| 90 |
res.status(500).json({ error: "An internal error occurred during text generation." });
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 91 |
}
|
| 92 |
});
|
| 93 |
|
|
@@ -95,12 +104,11 @@ app.post("/generate", async (req, res) => {
|
|
| 95 |
STARTUP SEQUENCE
|
| 96 |
----------------------- */
|
| 97 |
|
| 98 |
-
// 1. START THE SERVER IMMEDIATELY (This satisfies Hugging Face's health check)
|
| 99 |
app.listen(PORT, "0.0.0.0", () => {
|
| 100 |
console.log(`✅ Web server is listening on port ${PORT}`);
|
| 101 |
console.log(`⏳ Starting background model load...`);
|
| 102 |
|
| 103 |
-
//
|
| 104 |
initModel().catch(err => {
|
| 105 |
console.error("Critical Failure: Failed to load the AI model.", err);
|
| 106 |
});
|
|
|
|
| 51 |
----------------------- */
|
| 52 |
|
| 53 |
app.post("/generate", async (req, res) => {
|
|
|
|
| 54 |
if (!isModelReady) {
|
| 55 |
return res.status(503).json({
|
| 56 |
error: "The AI model is still loading into memory. Please wait a few seconds and try again."
|
| 57 |
});
|
| 58 |
}
|
| 59 |
|
| 60 |
+
let sequence; // Define this here so we can clean it up in the 'finally' block
|
| 61 |
+
|
| 62 |
try {
|
| 63 |
const {
|
| 64 |
user_input,
|
| 65 |
+
user_temp = 0.2,
|
| 66 |
+
user_inst = "You are an Wrld-Gpt AI assistant. Give short clear answers. Do not make assumptions",
|
| 67 |
+
user_max_token = 1024
|
| 68 |
} = req.body;
|
| 69 |
|
| 70 |
if (!user_input) {
|
| 71 |
return res.status(400).json({ error: "Missing required field: user_input" });
|
| 72 |
}
|
| 73 |
|
| 74 |
+
// Grab a sequence memory slot for this specific request
|
| 75 |
+
sequence = contextInstance.getSequence();
|
| 76 |
+
|
| 77 |
const session = new LlamaChatSession({
|
| 78 |
+
contextSequence: sequence,
|
| 79 |
systemPrompt: user_inst
|
| 80 |
});
|
| 81 |
|
|
|
|
| 92 |
} catch (err) {
|
| 93 |
console.error("Error during generation:", err);
|
| 94 |
res.status(500).json({ error: "An internal error occurred during text generation." });
|
| 95 |
+
} finally {
|
| 96 |
+
// CRITICAL FIX: Always free up the sequence slot when done, even if an error occurs!
|
| 97 |
+
if (sequence) {
|
| 98 |
+
sequence.dispose();
|
| 99 |
+
}
|
| 100 |
}
|
| 101 |
});
|
| 102 |
|
|
|
|
| 104 |
STARTUP SEQUENCE
|
| 105 |
----------------------- */
|
| 106 |
|
|
|
|
| 107 |
app.listen(PORT, "0.0.0.0", () => {
|
| 108 |
console.log(`✅ Web server is listening on port ${PORT}`);
|
| 109 |
console.log(`⏳ Starting background model load...`);
|
| 110 |
|
| 111 |
+
// Load the model in the background (non-blocking, after the server is up)
|
| 112 |
initModel().catch(err => {
|
| 113 |
console.error("Critical Failure: Failed to load the AI model.", err);
|
| 114 |
});
|