Adding chat format to Models? - What will wind.surf do?
app.py
CHANGED
@@ -6,11 +6,13 @@ import requests
 MODELS = {
     "Llama-3.2-3B": {
         "repo_id": "lmstudio-community/Llama-3.2-3B-Instruct-GGUF",
-        "filename": "*Q4_K_M.gguf"
+        "filename": "*Q4_K_M.gguf",
+        "chat_format": "chatml"
     },
-    "Llama-3.2-1B": {
+    "Llama-3.2-5B": {
         "repo_id": "lmstudio-community/Llama-3.2-1B-Instruct-GGUF",
-        "filename": "*Q4_K_M.gguf"
+        "filename": "*Q4_K_M.gguf",
+        "chat_format": "chatml"
     }
 }
 
@@ -26,7 +28,7 @@ def load_model(model_name):
         verbose=True,
         n_ctx=32768,
         n_threads=2,
-        chat_format="
+        chat_format=model_info["chat_format"]
     )
     return current_model
 
@@ -74,7 +76,7 @@ def respond(
     yield message_repl
 
 def get_chat_title(model_name):
-    return f"{model_name} -
+    return f"{model_name} < - Load different model in Additional Inputs"
 
 demo = gr.ChatInterface(
     respond,
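
Taken together, the hunks move a hardcoded chat_format out of load_model and into the per-model MODELS entries. Below is a minimal sketch of that pattern in isolation, assuming the app builds models with llama-cpp-python's Llama.from_pretrained (consistent with the repo_id/filename glob fields and the constructor arguments visible in the diff); the single-entry MODELS and the module-level current_model cache are assumptions about the surrounding code, not the author's exact file:

# Sketch of the pattern this commit lands: chat_format lives next to
# repo_id/filename in MODELS and is forwarded to the Llama constructor.
# The one-entry MODELS and the current_model cache are assumptions.
from llama_cpp import Llama

MODELS = {
    "Llama-3.2-3B": {
        "repo_id": "lmstudio-community/Llama-3.2-3B-Instruct-GGUF",
        "filename": "*Q4_K_M.gguf",
        "chat_format": "chatml",  # template name llama-cpp-python applies to messages
    },
}

current_model = None  # assumption: the app keeps one loaded model at a time

def load_model(model_name):
    global current_model
    model_info = MODELS[model_name]
    # Llama.from_pretrained downloads the first Hub file matching the glob in
    # "filename" and forwards the remaining kwargs to the Llama constructor.
    current_model = Llama.from_pretrained(
        repo_id=model_info["repo_id"],
        filename=model_info["filename"],
        verbose=True,
        n_ctx=32768,
        n_threads=2,
        chat_format=model_info["chat_format"],  # per-model, no longer hardcoded
    )
    return current_model

With the format stored alongside repo_id and filename, adding or switching a model becomes a single MODELS edit; load_model itself no longer needs to change when a new model uses a different chat template.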