Spaces:

apehex
/

de-generate

Sleeping

apehex committed on Mar 13

Commit

2699bf3

1 Parent(s): 75344c6

Download the models without instantiating them.

Files changed (2) hide show

app.py CHANGED Viewed

@@ -1,4 +1,5 @@
 import gradio
 import spaces
 import psaiops.common.model
@@ -9,12 +10,13 @@ import psaiops.score.human.app as _app
 # META #########################################################################
 # additional args used when loading the model
-_CONFIG = {}
 _app.MODELS = ['qwen/qwen3.5-9b', 'qwen/qwen3.5-27b']
 # frontload the models on the CPU to avoid downloading them from the GPU slot
 for __m in _app.MODELS:
-    psaiops.common.model.get_model(name=__m, device='cpu', **_CONFIG)
 # but do not instantiate unless necessary
 _MODEL = None
@@ -34,7 +36,7 @@ def fetch_model() -> object:
     global _MODEL
     # control when the model is downloaded to avoid moving it to the CPU
     if _MODEL is None:
-        _MODEL = psaiops.common.model.get_model(name=_app.MODELS[0], device='cuda', **_CONFIG)
     # tuple of objects or (None, None)
     return _MODEL

 import gradio
+import huggingface_hub
 import spaces
 import psaiops.common.model
 # META #########################################################################
 # additional args used when loading the model
+_MODEL_CFG = {}
+_LOAD_CFG = {'repo_type': 'model', 'ignore_patterns': ['*.onnx', '*.tflite', '*.msgpack'],}
 _app.MODELS = ['qwen/qwen3.5-9b', 'qwen/qwen3.5-27b']
 # frontload the models on the CPU to avoid downloading them from the GPU slot
 for __m in _app.MODELS:
+    huggingface_hub.snapshot_download(repo_id=__m, **_LOAD_CFG)
 # but do not instantiate unless necessary
 _MODEL = None
     global _MODEL
     # control when the model is downloaded to avoid moving it to the CPU
     if _MODEL is None:
+        _MODEL = psaiops.common.model.get_model(name=_app.MODELS[0], device='cuda', **_MODEL_CFG)
     # tuple of objects or (None, None)
     return _MODEL

requirements.txt CHANGED Viewed

@@ -1,5 +1,6 @@
 accelerate>=1.11
 gradio>=6.0
 kernels>=0.11
 psaiops>=0.10.3
 spaces>=0.47

 accelerate>=1.11
 gradio>=6.0
+huggingface_hub>=1.5
 kernels>=0.11
 psaiops>=0.10.3
 spaces>=0.47