Fred808 committed on
Commit
ca8b343
·
verified ·
1 Parent(s): 7bcdb30

Update app.py

Browse files
Files changed (1) hide show
  1. app.py +11 -2
app.py CHANGED
@@ -144,9 +144,18 @@ async def split_model_weights():
144
  import torch
145
  import math
146
 
147
- # Load the full model weights without forcing CPU - let tensor servers handle device placement
148
  model_file = next(f for f in state.model_files.values() if f.endswith('.safetensors') or f.endswith('.bin'))
149
- weights = torch.load(model_file, weights_only=False) # Explicitly allow non-weights for compatibility
 
 
 
 
 
 
 
 
 
150
 
151
  # Calculate total model size and chunks
152
  total_size_bytes = sum(p.nelement() * p.element_size() for p in weights.values())
 
144
  import torch
145
  import math
146
 
147
+ # Load the full model weights
148
  model_file = next(f for f in state.model_files.values() if f.endswith('.safetensors') or f.endswith('.bin'))
149
+ loaded_weights = torch.load(model_file, weights_only=False) # Explicitly allow non-weights for compatibility
150
+
151
+ # For OPT models, weights are stored under model.decoder
152
+ if isinstance(loaded_weights, dict):
153
+ if 'model.decoder' in str(list(loaded_weights.keys())):
154
+ # Get all weights that are part of the decoder
155
+ weights = {k: v for k, v in loaded_weights.items() if k.startswith('model.decoder')}
156
+ else:
157
+ # Just use all weights if no decoder prefix found
158
+ weights = loaded_weights
159
 
160
  # Calculate total model size and chunks
161
  total_size_bytes = sum(p.nelement() * p.element_size() for p in weights.values())