Executor-Tyrant-Framework Claude Opus 4.6 (1M context) committed on
Commit
487e5c0
·
1 Parent(s): 0f055ca

Fix: increase GPU timeout to 180s, remove torch_dtype kwarg

Browse files

The 3.25GB download plus 5 inference passes were exceeding the 120s GPU timeout.
Let from_pretrained use its default dtype (avoids deprecation warning).

Co-Authored-By: Claude Opus 4.6 (1M context) <noreply@anthropic.com>

Files changed (1) hide show
  1. app.py +2 -5
app.py CHANGED
@@ -30,7 +30,7 @@ GRAPH = None
30
  MODEL_NAME = "gpt2-large"
31
 
32
 
33
- @spaces.GPU(duration=120)
34
  def load_and_train():
35
  """Load model + train predictor in a single GPU call."""
36
  global MODEL, TOKENIZER, MEMBRANE, PREDICTOR, GRAPH
@@ -45,10 +45,7 @@ def load_and_train():
45
  TOKENIZER.pad_token = TOKENIZER.eos_token
46
 
47
  # Load model directly to GPU
48
- MODEL = AutoModelForCausalLM.from_pretrained(
49
- MODEL_NAME,
50
- torch_dtype=torch.float32,
51
- )
52
  MODEL.eval()
53
  MODEL.to("cuda")
54
 
 
30
  MODEL_NAME = "gpt2-large"
31
 
32
 
33
+ @spaces.GPU(duration=180)
34
  def load_and_train():
35
  """Load model + train predictor in a single GPU call."""
36
  global MODEL, TOKENIZER, MEMBRANE, PREDICTOR, GRAPH
 
45
  TOKENIZER.pad_token = TOKENIZER.eos_token
46
 
47
  # Load model directly to GPU
48
+ MODEL = AutoModelForCausalLM.from_pretrained(MODEL_NAME)
 
 
 
49
  MODEL.eval()
50
  MODEL.to("cuda")
51