tlam committed on
Commit
19ec6fa
·
verified ·
1 Parent(s): ed2b2b2

Upload 3 files

Browse files
Files changed (1) hide show
  1. app.py +3 -2
app.py CHANGED
@@ -16,8 +16,9 @@ processor = AutoProcessor.from_pretrained(MODEL_ID)
16
  # Load Model
17
  model = Qwen2_5_VLForConditionalGeneration.from_pretrained(
18
  MODEL_ID,
19
- torch_dtype=torch.float16
20
- ).to(device).eval()
 
21
  print("Model loaded.")
22
 
23
  @spaces.GPU
 
16
  # Load Model
17
  model = Qwen2_5_VLForConditionalGeneration.from_pretrained(
18
  MODEL_ID,
19
+ torch_dtype=torch.bfloat16,
20
+ low_cpu_mem_usage=True,
21
+ ).eval()
22
  print("Model loaded.")
23
 
24
  @spaces.GPU