Spaces:
Runtime error
Runtime error
Update app.py
Browse files
app.py
CHANGED
|
@@ -30,14 +30,14 @@ tokenizer = AutoTokenizer.from_pretrained(model_name)
|
|
| 30 |
model = AutoModelForCausalLM.from_pretrained(
|
| 31 |
model_name,
|
| 32 |
device_map=device,
|
| 33 |
-
torch_dtype=torch.
|
| 34 |
)
|
| 35 |
#model = AutoModelForCausalLM.from_pretrained(model_name, device_map="auto", torch_dtype="auto")
|
| 36 |
qa_pipeline = pipeline(
|
| 37 |
"text-generation",
|
| 38 |
model=model,
|
| 39 |
tokenizer=tokenizer,
|
| 40 |
-
max_new_tokens=
|
| 41 |
pad_token_id=tokenizer.eos_token_id
|
| 42 |
)
|
| 43 |
|
|
|
|
| 30 |
model = AutoModelForCausalLM.from_pretrained(
|
| 31 |
model_name,
|
| 32 |
device_map=device,
|
| 33 |
+
torch_dtype=torch.float16 if device == "cuda" else torch.float32
|
| 34 |
)
|
| 35 |
#model = AutoModelForCausalLM.from_pretrained(model_name, device_map="auto", torch_dtype="auto")
|
| 36 |
qa_pipeline = pipeline(
|
| 37 |
"text-generation",
|
| 38 |
model=model,
|
| 39 |
tokenizer=tokenizer,
|
| 40 |
+
max_new_tokens=1500,
|
| 41 |
pad_token_id=tokenizer.eos_token_id
|
| 42 |
)
|
| 43 |
|