Runtime error
Update Dockerfile
app.py CHANGED
@@ -128,33 +128,29 @@ CACHE_DIR = "/cache/models"
 DEVICE = "cuda" if torch.cuda.is_available() else "cpu"
 
 def load_model():
-    """Load model
+    """Load model with automatic cache handling"""
     try:
-        #
-        print("
-        model = AutoModelForCausalLM.from_pretrained(
+        # First try with local files only (uses cache if available)
+        print("Checking for cached model...")
+        return AutoModelForCausalLM.from_pretrained(
             MODEL_ID,
             cache_dir=CACHE_DIR,
-            local_files_only=True #
-        ).to(DEVICE)
-        tokenizer = AutoTokenizer.from_pretrained(
+            local_files_only=True  # Will fail if not cached
+        ).to(DEVICE), AutoTokenizer.from_pretrained(
             MODEL_ID,
             cache_dir=CACHE_DIR,
             local_files_only=True
         )
     except OSError:
-        # Fallback to download if cache
-        print("
-        model = AutoModelForCausalLM.from_pretrained(
+        # Fallback to download if not in cache
+        print("Downloading model...")
+        return AutoModelForCausalLM.from_pretrained(
             MODEL_ID,
             cache_dir=CACHE_DIR
-        ).to(DEVICE)
-        tokenizer = AutoTokenizer.from_pretrained(
+        ).to(DEVICE), AutoTokenizer.from_pretrained(
             MODEL_ID,
             cache_dir=CACHE_DIR
         )
-
-    return model, tokenizer
 
 # Load model
 model, tokenizer = load_model()
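For reference, below is load_model() as it reads after this commit, assembled from the hunk into a self-contained, runnable sketch. The imports and the MODEL_ID value are assumptions: MODEL_ID is defined earlier in app.py, outside this hunk, so "gpt2" is a hypothetical stand-in. Everything else is copied from the new side of the diff.

import torch
from transformers import AutoModelForCausalLM, AutoTokenizer

MODEL_ID = "gpt2"  # hypothetical placeholder; the real value is set earlier in app.py
CACHE_DIR = "/cache/models"
DEVICE = "cuda" if torch.cuda.is_available() else "cpu"

def load_model():
    """Load model with automatic cache handling"""
    try:
        # First try with local files only (uses cache if available)
        print("Checking for cached model...")
        return AutoModelForCausalLM.from_pretrained(
            MODEL_ID,
            cache_dir=CACHE_DIR,
            local_files_only=True  # Will fail if not cached
        ).to(DEVICE), AutoTokenizer.from_pretrained(
            MODEL_ID,
            cache_dir=CACHE_DIR,
            local_files_only=True
        )
    except OSError:
        # Fallback to download if not in cache
        print("Downloading model...")
        return AutoModelForCausalLM.from_pretrained(
            MODEL_ID,
            cache_dir=CACHE_DIR
        ).to(DEVICE), AutoTokenizer.from_pretrained(
            MODEL_ID,
            cache_dir=CACHE_DIR
        )

# Load model
model, tokenizer = load_model()

On the design: from_pretrained() raises OSError when local_files_only=True and the files are not present under cache_dir, which is what routes the first attempt into the download branch. Returning the (model, tokenizer) tuple directly drops the intermediate variables the old version used; it also means that if the model is cached but the tokenizer is not, the OSError from the tokenizer call sends both loads back through the download path.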