Spaces:
Sleeping
Sleeping
Update app.py
Browse files
app.py
CHANGED
|
@@ -16,10 +16,20 @@ import os
|
|
| 16 |
|
| 17 |
def http_bot_yield(prompt):
|
| 18 |
headers = {"User-Agent": "vLLM Client"}
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 19 |
pload = {
|
| 20 |
-
"prompt": f"<s>[INST] {prompt} [/INST] ",
|
| 21 |
"stream": True,
|
| 22 |
-
"max_tokens": 1024,
|
| 23 |
"temperature": 0.1
|
| 24 |
}
|
| 25 |
response = requests.post(
|
|
|
|
| 16 |
|
| 17 |
def http_bot_yield(prompt):
|
| 18 |
headers = {"User-Agent": "vLLM Client"}
|
| 19 |
+
system_message = """
|
| 20 |
+
Below is an instruction that describes a task. Write a response that appropriately completes the request.
|
| 21 |
+
"""
|
| 22 |
+
# pload = {
|
| 23 |
+
# "prompt": f"<s>[INST] {prompt} [/INST] ",
|
| 24 |
+
# "stream": True,
|
| 25 |
+
# "max_tokens": 1024,
|
| 26 |
+
# "temperature": 0.1
|
| 27 |
+
# }
|
| 28 |
+
|
| 29 |
pload = {
|
| 30 |
+
"prompt": f"### System:\n{system_message}\n\n\n\n### Instruction:\n{prompt}\n\n### Response:\n",
|
| 31 |
"stream": True,
|
| 32 |
+
"max_tokens": 2048,
|
| 33 |
"temperature": 0.1
|
| 34 |
}
|
| 35 |
response = requests.post(
|