Spaces:
Sleeping
Upload app.py with huggingface_hub
Browse files
app.py
CHANGED
|
@@ -194,19 +194,21 @@ def generate_spec(
|
|
| 194 |
{"role": "user", "content": user_content},
|
| 195 |
]
|
| 196 |
|
| 197 |
-
|
| 198 |
-
messages, tokenize=
|
| 199 |
-
)
|
|
|
|
|
|
|
| 200 |
|
| 201 |
outputs = model.generate(
|
| 202 |
-
|
| 203 |
max_new_tokens=max_tokens,
|
| 204 |
temperature=temperature,
|
| 205 |
top_p=top_p,
|
| 206 |
do_sample=True,
|
| 207 |
)
|
| 208 |
|
| 209 |
-
generated = outputs[0][
|
| 210 |
return tokenizer.decode(generated, skip_special_tokens=True)
|
| 211 |
|
| 212 |
|
|
|
|
| 194 |
{"role": "user", "content": user_content},
|
| 195 |
]
|
| 196 |
|
| 197 |
+
input_text = tokenizer.apply_chat_template(
|
| 198 |
+
messages, tokenize=False, add_generation_prompt=True
|
| 199 |
+
)
|
| 200 |
+
inputs = tokenizer(input_text, return_tensors="pt").to(model.device)
|
| 201 |
+
input_len = inputs["input_ids"].shape[-1]
|
| 202 |
|
| 203 |
outputs = model.generate(
|
| 204 |
+
**inputs,
|
| 205 |
max_new_tokens=max_tokens,
|
| 206 |
temperature=temperature,
|
| 207 |
top_p=top_p,
|
| 208 |
do_sample=True,
|
| 209 |
)
|
| 210 |
|
| 211 |
+
generated = outputs[0][input_len:]
|
| 212 |
return tokenizer.decode(generated, skip_special_tokens=True)
|
| 213 |
|
| 214 |
|