Kalpokoch committed on
Commit
848fa19
·
verified ·
1 Parent(s): 81212b1

Update app/app.py

Browse files
Files changed (1) hide show
  1. app/app.py +13 -9
app/app.py CHANGED
@@ -7,24 +7,28 @@ import requests
7
  from app.policy_vector_db import PolicyVectorDB, ensure_db_populated
8
 
9
  MODEL_URL = "https://huggingface.co/Kalpokoch/QuantizedFineTunedPhi1.5/resolve/main/dop-phi-1.5-Q4_K_M.gguf"
10
- MODEL_DIR = "/app/models"
11
- MODEL_PATH = os.path.join(MODEL_DIR, "dop-phi-1.5-Q4_K_M.gguf")
12
- CHUNKS_PATH = "/app/processed_chunks_final.json"
13
 
14
  # Download the model if not already present
15
  def download_model():
16
  if not os.path.exists(MODEL_PATH):
 
17
  print("🔽 Downloading model...")
18
- response = requests.get(MODEL_URL, stream=True)
19
- with open(MODEL_PATH, "wb") as f:
20
- for chunk in response.iter_content(chunk_size=8192):
21
- f.write(chunk)
22
- print("✅ Model downloaded.")
 
 
 
 
23
 
24
  download_model()
25
 
26
  # Initialize model and vector database
27
- llm = Llama(model_path=MODEL_PATH, n_ctx=2048)
28
  vector_db = PolicyVectorDB(CHUNKS_PATH)
29
  ensure_db_populated(vector_db)
30
 
 
7
  from app.policy_vector_db import PolicyVectorDB, ensure_db_populated
8
 
9
  MODEL_URL = "https://huggingface.co/Kalpokoch/QuantizedFineTunedPhi1.5/resolve/main/dop-phi-1.5-Q4_K_M.gguf"
10
+ MODEL_PATH = "/tmp/models/dop-phi-1.5-Q4_K_M.gguf"
11
+ CHUNKS_PATH = "/app/processed_chunks.json"
 
12
 
13
  # Download the model if not already present
14
  def download_model():
15
  if not os.path.exists(MODEL_PATH):
16
+ os.makedirs(os.path.dirname(MODEL_PATH), exist_ok=True)
17
  print("🔽 Downloading model...")
18
+ url = "https://huggingface.co/Kalpokoch/QuantizedFineTunedPhi1.5/resolve/main/dop-phi-1.5-Q4_K_M.gguf"
19
+ response = requests.get(url, stream=True)
20
+ if response.status_code == 200:
21
+ with open(MODEL_PATH, "wb") as f:
22
+ for chunk in response.iter_content(chunk_size=8192):
23
+ f.write(chunk)
24
+ print("✅ Model downloaded successfully.")
25
+ else:
26
+ raise Exception(f"Failed to download model: {response.status_code}")
27
 
28
  download_model()
29
 
30
  # Initialize model and vector database
31
+ llm = Llama(model_path=MODEL_PATH, n_ctx=2048, n_threads=4)
32
  vector_db = PolicyVectorDB(CHUNKS_PATH)
33
  ensure_db_populated(vector_db)
34