Spaces:

Drakkarious
/

hackerai

Sleeping

Drakkarious committed on Apr 23

Commit

399b95d

verified ·

1 Parent(s): b7bb791

Update app.py

Files changed (1) hide show

app.py CHANGED Viewed

@@ -6,44 +6,45 @@ from llama_cpp import Llama
 # 1. Faster downloads
 os.environ["HF_HUB_ENABLE_HF_TRANSFER"] = "1"
-# 2. Define local paths
 CACHE_DIR = os.path.join(os.getcwd(), "model_cache")
-print("--- Starting AI Sandbox ---")
 try:
-    print("--- Downloading 26B Model (16.7GB) to local cache ---")
     model_path = hf_hub_download(
         repo_id="BugTraceAI/BugTraceAI-Apex-G4-26B-Q4",
         filename="BugTraceAI-Apex-G4-26B-Q4.gguf",
         cache_dir=CACHE_DIR
     )
-    print(f"--- Loading Model: {model_path} ---")
-    # Low-RAM configuration for Free Tier
     llm = Llama(
         model_path=model_path,
         n_ctx=2048,
         n_threads=2,
-        use_mmap=True, # Critical for large models on 16GB RAM
-        n_gpu_layers=0 # CPU Only
     )
-    def chat(prompt):
         output = llm(
-            f"User: {prompt}\nAssistant:",
             max_tokens=256,
             stop=["User:", "\n"],
             echo=False
         )
-        return output["choices"][0]["text"]
-    print("\n✅ Sandbox Ready!")
-    print("To chat, use the logs terminal or call: chat('your prompt')")
-    # Keeps the container alive and interactive
-    import IPython
-    IPython.embed()
 except Exception as e:
-    print(f"❌ Error during startup: {e}")
     sys.exit(1)

 # 1. Faster downloads
 os.environ["HF_HUB_ENABLE_HF_TRANSFER"] = "1"
 CACHE_DIR = os.path.join(os.getcwd(), "model_cache")
+print("--- Initializing AI Sandbox ---")
 try:
+    print("--- Downloading Model (16.7GB)... This will take a moment. ---")
     model_path = hf_hub_download(
         repo_id="BugTraceAI/BugTraceAI-Apex-G4-26B-Q4",
         filename="BugTraceAI-Apex-G4-26B-Q4.gguf",
         cache_dir=CACHE_DIR
     )
+    print(f"--- Loading Model into RAM (mmap enabled) ---")
     llm = Llama(
         model_path=model_path,
         n_ctx=2048,
         n_threads=2,
+        use_mmap=True,
+        n_gpu_layers=0
     )
+    print("\n✅ SANDBOX READY")
+    print("------------------------------------------")
+    print("Enter your prompt below. Type 'exit' to quit.")
+    # Standard terminal loop (Stable for Docker Logs)
+    while True:
+        user_input = input("\n[Terminal] User: ")
+        if user_input.lower() in ["exit", "quit"]:
+            break
         output = llm(
+            f"User: {user_input}\nAssistant:",
             max_tokens=256,
             stop=["User:", "\n"],
             echo=False
         )
+        print(f"Assistant: {output['choices'][0]['text']}")
 except Exception as e:
+    print(f"❌ CRITICAL ERROR: {e}")
     sys.exit(1)