therandomuser03 committed on
Commit
8d1fac5
·
1 Parent(s): 561a3db

update backend - HF

Browse files
Dockerfile CHANGED
@@ -40,6 +40,7 @@ RUN python download_models.py
40
  # 9. Environment & Port settings (7860 is HF Spaces standard)
41
  ENV PYTHONPATH=/app
42
  ENV USE_EMBEDDED_LLM=True
 
43
  EXPOSE 7860
44
 
45
  # 10. Run the app with Uvicorn
 
40
  # 9. Environment & Port settings (7860 is HF Spaces standard)
41
  ENV PYTHONPATH=/app
42
  ENV USE_EMBEDDED_LLM=True
43
+ ENV HF_HUB_OFFLINE=1
44
  EXPOSE 7860
45
 
46
  # 10. Run the app with Uvicorn
app/services/crisis_engine.py CHANGED
@@ -63,10 +63,14 @@ def initialize_crisis_classifier() -> None:
63
  global _zero_shot_pipeline, _load_error
64
  try:
65
  from transformers import pipeline as hf_pipeline
66
- logger.info("Loading crisis zero-shot classifier...")
 
 
 
 
67
  _zero_shot_pipeline = hf_pipeline(
68
  "zero-shot-classification",
69
- model="cross-encoder/nli-MiniLM2-L6-H768",
70
  device=-1, # CPU
71
  )
72
  logger.info("✅ Crisis classifier loaded.")
 
63
  global _zero_shot_pipeline, _load_error
64
  try:
65
  from transformers import pipeline as hf_pipeline
66
+ import os
67
+
68
+ local_path = os.path.join("app", "ml_assets", "crisis_model")
69
+ logger.info("Loading crisis zero-shot classifier from %s", local_path)
70
+
71
  _zero_shot_pipeline = hf_pipeline(
72
  "zero-shot-classification",
73
+ model=local_path if os.path.exists(local_path) else "cross-encoder/nli-MiniLM2-L6-H768",
74
  device=-1, # CPU
75
  )
76
  logger.info("✅ Crisis classifier loaded.")
app/services/text_emotion_engine.py CHANGED
@@ -23,10 +23,15 @@ def _load_pipeline(model_name: str) -> None:
23
  global _pipeline, _load_error
24
  try:
25
  from transformers import pipeline as hf_pipeline
26
- logger.info("Loading DistilBERT text emotion model: %s", model_name)
 
 
 
 
 
27
  _pipeline = hf_pipeline(
28
  "text-classification",
29
- model=model_name,
30
  top_k=None, # Return ALL labels
31
  truncation=True,
32
  max_length=512,
 
23
  global _pipeline, _load_error
24
  try:
25
  from transformers import pipeline as hf_pipeline
26
+ import os
27
+
28
+ # Determine local path
29
+ local_path = os.path.join("app", "ml_assets", "distilbert_model")
30
+
31
+ logger.info("Loading DistilBERT text emotion model from %s", local_path)
32
  _pipeline = hf_pipeline(
33
  "text-classification",
34
+ model=local_path if os.path.exists(local_path) else model_name,
35
  top_k=None, # Return ALL labels
36
  truncation=True,
37
  max_length=512,
download_models.py CHANGED
@@ -16,6 +16,13 @@ FACE_MODEL_PATH = os.path.join(ML_ASSETS, "emotion_model_trained.h5")
16
  MEDS_CSV_PATH = os.path.join(ML_ASSETS, "MEDICATION.csv")
17
  LLAMA_GGUF_PATH = os.path.join(ML_ASSETS, "llama-3-8b-instruct.Q4_K_M.gguf")
18
 
 
 
 
 
 
 
 
19
  def download_drive_file(file_id, output_path):
20
  if not os.path.exists(output_path):
21
  os.makedirs(os.path.dirname(output_path), exist_ok=True)
@@ -42,6 +49,19 @@ def download_hf_model(repo_id, filename, output_path):
42
  else:
43
  print(f"✅ Found {output_path}, skipping.")
44
 
 
 
 
 
 
 
 
 
 
 
 
 
 
45
  if __name__ == "__main__":
46
  print("🚀 Starting Production Model Sync...")
47
 
@@ -53,6 +73,13 @@ if __name__ == "__main__":
53
  try:
54
  download_hf_model(LLAMA_REPO, LLAMA_FILE, LLAMA_GGUF_PATH)
55
  except Exception as e:
56
- print(f"⚠️ HF Download failed (expected on local dev if no internet): {e}")
 
 
 
 
 
 
 
57
 
58
  print("✅ All models synchronized!")
 
16
  MEDS_CSV_PATH = os.path.join(ML_ASSETS, "MEDICATION.csv")
17
  LLAMA_GGUF_PATH = os.path.join(ML_ASSETS, "llama-3-8b-instruct.Q4_K_M.gguf")
18
 
19
+ # HF Transformers (Downloaded via snapshot_download for full directory)
20
+ CRISIS_MODEL_REPO = "cross-encoder/nli-MiniLM2-L6-H768"
21
+ DISTILBERT_MODEL_REPO = "bhadresh-savani/distilbert-base-uncased-emotion"
22
+
23
+ CRISIS_MODEL_PATH = os.path.join(ML_ASSETS, "crisis_model")
24
+ DISTILBERT_MODEL_PATH = os.path.join(ML_ASSETS, "distilbert_model")
25
+
26
  def download_drive_file(file_id, output_path):
27
  if not os.path.exists(output_path):
28
  os.makedirs(os.path.dirname(output_path), exist_ok=True)
 
49
  else:
50
  print(f"✅ Found {output_path}, skipping.")
51
 
52
+ def download_hf_directory(repo_id, output_dir):
53
+ from huggingface_hub import snapshot_download
54
+ if not os.path.exists(output_dir) or not os.listdir(output_dir):
55
+ print(f"⬇️ Downloading HF repo: {repo_id} to {output_dir}...")
56
+ snapshot_download(
57
+ repo_id=repo_id,
58
+ local_dir=output_dir,
59
+ local_dir_use_symlinks=False,
60
+ ignore_patterns=["*.msgpack", "*.h5", "*.ot", "rust_model.ot"] # save space, only PyTorch/Safetensors needed
61
+ )
62
+ else:
63
+ print(f"✅ Found {output_dir}, skipping.")
64
+
65
  if __name__ == "__main__":
66
  print("🚀 Starting Production Model Sync...")
67
 
 
73
  try:
74
  download_hf_model(LLAMA_REPO, LLAMA_FILE, LLAMA_GGUF_PATH)
75
  except Exception as e:
76
+ print(f"⚠️ HF LLaMA Download failed (expected on local dev if no internet): {e}")
77
+
78
+ # 3. HF Transformers Pipeline Models
79
+ try:
80
+ download_hf_directory(CRISIS_MODEL_REPO, CRISIS_MODEL_PATH)
81
+ download_hf_directory(DISTILBERT_MODEL_REPO, DISTILBERT_MODEL_PATH)
82
+ except Exception as e:
83
+ print(f"⚠️ HF Transformers Download failed: {e}")
84
 
85
  print("✅ All models synchronized!")