Spaces:

ostarling
/

MiniMax-M2.5-Chat

Running

ostarling committed 21 days ago

Commit

30ed0b7

verified ·

1 Parent(s): 852c5e1

Update app.py

Files changed (1) hide show

app.py CHANGED Viewed

@@ -5,7 +5,10 @@ from huggingface_hub import InferenceClient
 MODEL_ID = "MiniMaxAI/MiniMax-M2.5"
 SYSTEM_PROMPT = "You are a helpful assistant. Your name is MiniMax-M2.5 and is built by MiniMax."
-client = InferenceClient(MODEL_ID, token=os.environ.get("HF_TOKEN"))
 def respond(message, history, system_message, max_tokens, temperature, top_p):
@@ -21,7 +24,8 @@ def respond(message, history, system_message, max_tokens, temperature, top_p):
     response = ""
     for chunk in client.chat_completion(
-        messages,
         max_tokens=max_tokens,
         stream=True,
         temperature=temperature,

 MODEL_ID = "MiniMaxAI/MiniMax-M2.5"
 SYSTEM_PROMPT = "You are a helpful assistant. Your name is MiniMax-M2.5 and is built by MiniMax."
+client = InferenceClient(
+    provider="novita",
+    api_key=os.environ.get("HF_TOKEN"),
+)
 def respond(message, history, system_message, max_tokens, temperature, top_p):
     response = ""
     for chunk in client.chat_completion(
+        MODEL_ID,
+        messages=messages,
         max_tokens=max_tokens,
         stream=True,
         temperature=temperature,