Spaces: Running on Zero
Update app.py
Browse files
app.py
CHANGED
|
@@ -87,7 +87,7 @@ model = AutoModel.from_pretrained(
|
|
| 87 |
torch_dtype=torch.bfloat16,
|
| 88 |
attn_implementation='flash_attention_2',
|
| 89 |
low_cpu_mem_usage=True,
|
| 90 |
- trust_remote_code=True).eval().cuda()
|
| 91 |
processor = AutoProcessor.from_pretrained(model_name, trust_remote_code=True, token=auth_token)
|
| 92 |
streamer = TextIteratorStreamer(processor.tokenizer, skip_prompt=True, skip_special_tokens=True, timeout=15)
|
| 93 |
|
|
|
|
| 87 |
torch_dtype=torch.bfloat16,
|
| 88 |
attn_implementation='flash_attention_2',
|
| 89 |
low_cpu_mem_usage=True,
|
| 90 |
+ trust_remote_code=True, token=auth_token).eval().cuda()
|
| 91 |
processor = AutoProcessor.from_pretrained(model_name, trust_remote_code=True, token=auth_token)
|
| 92 |
streamer = TextIteratorStreamer(processor.tokenizer, skip_prompt=True, skip_special_tokens=True, timeout=15)
|
| 93 |
|