Spaces:
Runtime error
Runtime error
Commit ·
487e5c0
1
Parent(s): 0f055ca
Fix: increase GPU timeout to 180s, remove torch_dtype kwarg
Browse files
3.25GB download + 5 inference passes were exceeding 120s.
Let from_pretrained use its default dtype (avoids deprecation warning).
Co-Authored-By: Claude Opus 4.6 (1M context) <noreply@anthropic.com>
app.py
CHANGED
|
@@ -30,7 +30,7 @@ GRAPH = None
|
|
| 30 |
MODEL_NAME = "gpt2-large"
|
| 31 |
|
| 32 |
|
| 33 |
-
@spaces.GPU(duration=120)
|
| 34 |
def load_and_train():
|
| 35 |
"""Load model + train predictor in a single GPU call."""
|
| 36 |
global MODEL, TOKENIZER, MEMBRANE, PREDICTOR, GRAPH
|
|
@@ -45,10 +45,7 @@ def load_and_train():
|
|
| 45 |
TOKENIZER.pad_token = TOKENIZER.eos_token
|
| 46 |
|
| 47 |
# Load model directly to GPU
|
| 48 |
-
MODEL = AutoModelForCausalLM.from_pretrained(
|
| 49 |
-
MODEL_NAME,
|
| 50 |
-
torch_dtype=torch.float32,
|
| 51 |
-
)
|
| 52 |
MODEL.eval()
|
| 53 |
MODEL.to("cuda")
|
| 54 |
|
|
|
|
| 30 |
MODEL_NAME = "gpt2-large"
|
| 31 |
|
| 32 |
|
| 33 |
+
@spaces.GPU(duration=180)
|
| 34 |
def load_and_train():
|
| 35 |
"""Load model + train predictor in a single GPU call."""
|
| 36 |
global MODEL, TOKENIZER, MEMBRANE, PREDICTOR, GRAPH
|
|
|
|
| 45 |
TOKENIZER.pad_token = TOKENIZER.eos_token
|
| 46 |
|
| 47 |
# Load model directly to GPU
|
| 48 |
+
MODEL = AutoModelForCausalLM.from_pretrained(MODEL_NAME)
|
|
|
|
|
|
|
|
|
|
| 49 |
MODEL.eval()
|
| 50 |
MODEL.to("cuda")
|
| 51 |
|