Commit · aa50189
1 Parent(s): f507f45
refactor(core): Switch to TinyLlama to resolve memory issues
Browse files
- api/main.py +2 -2
api/main.py
CHANGED
|
@@ -45,8 +45,8 @@ ROOT_DIR = os.path.dirname(os.path.dirname(os.path.abspath(__file__)))
|
|
| 45 |
MODELS_DIR = os.path.join(ROOT_DIR, 'models')
|
| 46 |
|
| 47 |
# ✅ FIX: Swapped to a smaller, memory-friendly model to avoid crashing on free tier
|
| 48 |
-
MODEL_REPO = "TheBloke/
|
| 49 |
-
MODEL_FILENAME = "
|
| 50 |
|
| 51 |
MODEL_SAVE_DIRECTORY = os.path.join(os.environ.get("WRITABLE_DIR", "/data"), "llm_model")
|
| 52 |
LLAMA_MODEL_PATH = os.path.join(MODEL_SAVE_DIRECTORY, MODEL_FILENAME)
|
|
|
|
| 45 |
MODELS_DIR = os.path.join(ROOT_DIR, 'models')
|
| 46 |
|
| 47 |
# ✅ FIX: Swapped to a smaller, memory-friendly model to avoid crashing on free tier
|
| 48 |
+
MODEL_REPO = "TheBloke/TinyLlama-1.1B-Chat-v1.0-GGUF"
|
| 49 |
+
MODEL_FILENAME = "tinyllama-1.1b-chat-v1.0.Q2_K.gguf"
|
| 50 |
|
| 51 |
MODEL_SAVE_DIRECTORY = os.path.join(os.environ.get("WRITABLE_DIR", "/data"), "llm_model")
|
| 52 |
LLAMA_MODEL_PATH = os.path.join(MODEL_SAVE_DIRECTORY, MODEL_FILENAME)
|