amitbhatt6075 committed on
Commit
aa50189
·
1 Parent(s): f507f45

refactor(core): Switch to TinyLlama to resolve memory issues

Browse files
Files changed (1) hide show
  1. api/main.py +2 -2
api/main.py CHANGED
@@ -45,8 +45,8 @@ ROOT_DIR = os.path.dirname(os.path.dirname(os.path.abspath(__file__)))
45
  MODELS_DIR = os.path.join(ROOT_DIR, 'models')
46
 
47
  # ✅ FIX: Swapped to a smaller, memory-friendly model to avoid crashing on free tier
48
- MODEL_REPO = "TheBloke/phi-2-GGUF"
49
- MODEL_FILENAME = "phi-2.Q2_K.gguf"
50
 
51
  MODEL_SAVE_DIRECTORY = os.path.join(os.environ.get("WRITABLE_DIR", "/data"), "llm_model")
52
  LLAMA_MODEL_PATH = os.path.join(MODEL_SAVE_DIRECTORY, MODEL_FILENAME)
 
45
  MODELS_DIR = os.path.join(ROOT_DIR, 'models')
46
 
47
  # ✅ FIX: Swapped to a smaller, memory-friendly model to avoid crashing on free tier
48
+ MODEL_REPO = "TheBloke/TinyLlama-1.1B-Chat-v1.0-GGUF"
49
+ MODEL_FILENAME = "tinyllama-1.1b-chat-v1.0.Q2_K.gguf"
50
 
51
  MODEL_SAVE_DIRECTORY = os.path.join(os.environ.get("WRITABLE_DIR", "/data"), "llm_model")
52
  LLAMA_MODEL_PATH = os.path.join(MODEL_SAVE_DIRECTORY, MODEL_FILENAME)