Spaces:
Sleeping
Sleeping
Update app/app.py
Browse files- app/app.py +13 -9
app/app.py
CHANGED
|
@@ -7,24 +7,28 @@ import requests
|
|
| 7 |
from app.policy_vector_db import PolicyVectorDB, ensure_db_populated
|
| 8 |
|
| 9 |
MODEL_URL = "https://huggingface.co/Kalpokoch/QuantizedFineTunedPhi1.5/resolve/main/dop-phi-1.5-Q4_K_M.gguf"
|
| 10 |
-
|
| 11 |
-
|
| 12 |
-
CHUNKS_PATH = "/app/processed_chunks_final.json"
|
| 13 |
|
| 14 |
# Download the model if not already present
|
| 15 |
def download_model():
|
| 16 |
if not os.path.exists(MODEL_PATH):
|
|
|
|
| 17 |
print("🔽 Downloading model...")
|
| 18 |
-
|
| 19 |
-
|
| 20 |
-
|
| 21 |
-
|
| 22 |
-
|
|
|
|
|
|
|
|
|
|
|
|
|
| 23 |
|
| 24 |
download_model()
|
| 25 |
|
| 26 |
# Initialize model and vector database
|
| 27 |
-
llm = Llama(model_path=MODEL_PATH, n_ctx=2048)
|
| 28 |
vector_db = PolicyVectorDB(CHUNKS_PATH)
|
| 29 |
ensure_db_populated(vector_db)
|
| 30 |
|
|
|
|
| 7 |
from app.policy_vector_db import PolicyVectorDB, ensure_db_populated
|
| 8 |
|
| 9 |
MODEL_URL = "https://huggingface.co/Kalpokoch/QuantizedFineTunedPhi1.5/resolve/main/dop-phi-1.5-Q4_K_M.gguf"
|
| 10 |
+
MODEL_PATH = "/tmp/models/dop-phi-1.5-Q4_K_M.gguf"
|
| 11 |
+
CHUNKS_PATH = "/app/processed_chunks.json"
|
|
|
|
| 12 |
|
| 13 |
# Download the model if not already present
|
| 14 |
def download_model(url=None, dest=None):
    """Download the GGUF model file unless it is already present on disk.

    The payload is streamed into a temporary ``<dest>.part`` file and only
    renamed to ``dest`` once the transfer has finished, so an interrupted
    download can never be mistaken for a complete model on the next start.

    Args:
        url: Source URL. Defaults to the module-level ``MODEL_URL``.
        dest: Destination file path. Defaults to the module-level
            ``MODEL_PATH``.

    Raises:
        Exception: If the server answers with a status code other than 200.
        requests.RequestException: If the connection fails or times out.
    """
    dest = MODEL_PATH if dest is None else dest
    if os.path.exists(dest):
        return
    url = MODEL_URL if url is None else url

    # dirname is empty for a bare file name; fall back to the current dir.
    os.makedirs(os.path.dirname(dest) or ".", exist_ok=True)
    print("🔽 Downloading model...")

    partial_path = dest + ".part"
    # (connect, read) timeouts: without them a stalled connection would
    # block application start-up forever.
    with requests.get(url, stream=True, timeout=(10, 60)) as response:
        if response.status_code != 200:
            raise Exception(f"Failed to download model: {response.status_code}")
        try:
            with open(partial_path, "wb") as f:
                for chunk in response.iter_content(chunk_size=8192):
                    f.write(chunk)
        except BaseException:
            # Do not leave a truncated file behind on any failure.
            try:
                os.remove(partial_path)
            except OSError:
                pass
            raise

    # Atomic rename: dest only ever exists as a fully written file.
    os.replace(partial_path, dest)
    print("✅ Model downloaded successfully.")
|
| 27 |
|
| 28 |
download_model()
|
| 29 |
|
| 30 |
# Initialize model and vector database
|
| 31 |
+
llm = Llama(model_path=MODEL_PATH, n_ctx=2048, n_threads=4)
|
| 32 |
vector_db = PolicyVectorDB(CHUNKS_PATH)
|
| 33 |
ensure_db_populated(vector_db)
|
| 34 |
|