Spaces:

Tech-Meld
/

Hajax_Chat_Official

Sleeping

Tech-Meld committed on Jun 12, 2024

Commit

fa136e4

verified ·

1 Parent(s): 6bc76bb

Update app.py

Files changed (1) hide show

app.py CHANGED Viewed

@@ -1,8 +1,8 @@
 import gradio as gr
 from transformers import AutoModelForCausalLM, AutoTokenizer
-@gr.cache(allow_output_mutation=True)
 def load_model():
     model_id = "Tech-Meld/Hajax_Chat_1.0"
     tokenizer = AutoTokenizer.from_pretrained(model_id)
@@ -15,17 +15,20 @@ def get_response(input_text, model, tokenizer):
     response = tokenizer.decode(outputs[:, inputs.shape[-1]:][0], skip_special_tokens=True)
     return response
-model, tokenizer = load_model()
 def chat(input_text):
-  response = get_response(input_text, model, tokenizer)
-  return response
 iface = gr.Interface(
     chat,
     "text",
     "text",
-    title="Chat with Hajax",
     description="Type your message and press Enter to chat with the AI.",
 )
 iface.launch()

 import gradio as gr
 from transformers import AutoModelForCausalLM, AutoTokenizer
+model_cache = {}
 def load_model():
     model_id = "Tech-Meld/Hajax_Chat_1.0"
     tokenizer = AutoTokenizer.from_pretrained(model_id)
     response = tokenizer.decode(outputs[:, inputs.shape[-1]:][0], skip_special_tokens=True)
     return response
 def chat(input_text):
+    global model_cache
+    if "model" not in model_cache:
+        model_cache["model"], model_cache["tokenizer"] = load_model()
+    model = model_cache["model"]
+    tokenizer = model_cache["tokenizer"]
+    response = get_response(input_text, model, tokenizer)
+    return response
 iface = gr.Interface(
     chat,
     "text",
     "text",
+    title="Chat with AI",
     description="Type your message and press Enter to chat with the AI.",
 )
 iface.launch()