eikarna
committed on
Commit
·
c376a77
1
Parent(s):
f858b89
Minor Update
Browse files
app.py
CHANGED
|
@@ -36,7 +36,7 @@ def load_model():
|
|
| 36 |
model = AutoModelForCausalLM.from_pretrained(
|
| 37 |
MODEL_NAME,
|
| 38 |
trust_remote_code=True,
|
| 39 |
-
torch_dtype=torch.
|
| 40 |
device_map="auto"
|
| 41 |
)
|
| 42 |
|
|
@@ -71,7 +71,6 @@ def generate_response(prompt: str, settings: Dict[str, Any]) -> str:
|
|
| 71 |
max_new_tokens=settings["max_tokens"],
|
| 72 |
temperature=settings["temperature"],
|
| 73 |
top_p=settings["top_p"],
|
| 74 |
-
do_sample=True,
|
| 75 |
pad_token_id=st.session_state.tokenizer.eos_token_id
|
| 76 |
)
|
| 77 |
|
|
|
|
| 36 |
model = AutoModelForCausalLM.from_pretrained(
|
| 37 |
MODEL_NAME,
|
| 38 |
trust_remote_code=True,
|
| 39 |
+
torch_dtype=torch.float16,
|
| 40 |
device_map="auto"
|
| 41 |
)
|
| 42 |
|
|
|
|
| 71 |
max_new_tokens=settings["max_tokens"],
|
| 72 |
temperature=settings["temperature"],
|
| 73 |
top_p=settings["top_p"],
|
|
|
|
| 74 |
pad_token_id=st.session_state.tokenizer.eos_token_id
|
| 75 |
)
|
| 76 |
|