Spaces:

Nishan30
/

n8n-workflow-generator-app

Running

Nishan30 committed 8 days ago

Commit

10104ce

verified ·

1 Parent(s): 8a622dc

Upload app.py with huggingface_hub

Files changed (1) hide show

app.py CHANGED Viewed

@@ -28,11 +28,12 @@ def load_model():
     """Load model once and cache it"""
     print("Loading model...")
-    # Prepare model loading kwargs
     model_kwargs = {
         "device_map": "auto",
         "trust_remote_code": True,
         "low_cpu_mem_usage": True,
     }
     # Use 8-bit quantization if enabled (saves memory)

     """Load model once and cache it"""
     print("Loading model...")
+    # Prepare model loading kwargs with disk offloading for limited memory
     model_kwargs = {
         "device_map": "auto",
         "trust_remote_code": True,
         "low_cpu_mem_usage": True,
+        "offload_folder": "offload",  # Enable disk offloading for HF Space
     }
     # Use 8-bit quantization if enabled (saves memory)