Spaces:

THEZYZSTUDIO
/

Minecraft_java_server

Paused

App Files Community

THEZYZSTUDIO committed on Jan 3

Commit

65dc97e

verified ·

1 Parent(s): 8daf7ab

Update app.py

Browse files

Files changed (1) hide show

app.py +8 -6

app.py CHANGED Viewed

@@ -4,8 +4,8 @@ from llama_cpp import Llama
 import base64
 import json
-REPO_ID = "bartowski/Nanbeige_Nanbeige4-3B-Thinking-2511-GGUF"
-FILENAME = "Nanbeige_Nanbeige4-3B-Thinking-2511-bf16.gguf"
 print("🚀 Starting THE Z AI Server...", flush=True)
@@ -16,7 +16,7 @@ def load_model():
     try:
         print("📥 Downloading Model...", flush=True)
         model_path = hf_hub_download(repo_id=REPO_ID, filename=FILENAME)
-        llm = Llama(model_path=model_path, n_ctx=80000, n_threads=2, verbose=False)
         print("✅ Model Ready!", flush=True)
         return True
     except Exception as e:
@@ -49,7 +49,7 @@ def chat(message, history_json, system_info, file_content):
         else:
             messages.append({
                 "role": "system",
-                "content": "First, your name is THE Z AI THINKER and the name of the company that created you is THE ZYZ STUDIO When you think, you must think in the user's language, and the answer must also be in the user's language. Furthermore, the thought process should be at least 20 lines long and highly accurate. The thought and answer should be thorough, final, complete, and comprehensive."
             })
         for h in history:
@@ -64,8 +64,10 @@ def chat(message, history_json, system_info, file_content):
         response_obj = llm.create_chat_completion(
             messages=messages,
-            max_tokens=7000,
-            temperature=0.7
         )
         response = response_obj['choices'][0]['message']['content'].strip()

 import base64
 import json
+REPO_ID = "prithivMLmods/OpenRHO-2B-Thinker-GGUF"
+FILENAME = "OpenRHO-2B-Thinker.F32.gguf"
 print("🚀 Starting THE Z AI Server...", flush=True)
     try:
         print("📥 Downloading Model...", flush=True)
         model_path = hf_hub_download(repo_id=REPO_ID, filename=FILENAME)
+        llm = Llama(model_path=model_path, n_ctx=150000, n_threads=4, verbose=False)
         print("✅ Model Ready!", flush=True)
         return True
     except Exception as e:
         else:
             messages.append({
                 "role": "system",
+                "content": "First, your name is THE Z AI THINKER and the name of the company that created you is THE ZYZ STUDIO When you think, you must think in the user's language, and the answer must also be in the user's language. Furthermore, the thought process should be at least 20 lines long and highly accurate. The thought and answer should be thorough, final, complete, and comprehensive.Do not repeat the same word or phrase more than once. Text should be clear and free of repetition. Try not to make mistakes in your answers, and mentally write the answer before presenting it to the user. Ensure it is not incorrect or contains unnecessary repetition that could damage the sentence or the message you are conveying to the user. If it is Corden, for example, you can repeat something because it is important, but do so correctly and not carelessly. Something very, very important: you are a specialist in thinking, so try to think a lot and understand every word the user said to you."
             })
         for h in history:
         response_obj = llm.create_chat_completion(
             messages=messages,
+            max_tokens=15000,
+            temperature=0.7,
+            top_k=40,
+            top_p=0.95
         )
         response = response_obj['choices'][0]['message']['content'].strip()