Update app.py
Browse files
app.py
CHANGED
|
@@ -8,10 +8,10 @@ print(os.environ)
|
|
| 8 |
openai.api_base = os.environ.get("OPENAI_API_BASE")
|
| 9 |
openai.api_key = os.environ.get("OPENAI_API_KEY")
|
| 10 |
|
| 11 |
-
BASE_SYSTEM_MESSAGE = """"""
|
| 12 |
|
| 13 |
def make_prediction(prompt, max_tokens=None, temperature=None, top_p=None, top_k=None, repetition_penalty=None):
|
| 14 |
-
completion = openai.Completion.create(model="
|
| 15 |
for chunk in completion:
|
| 16 |
yield chunk["choices"][0]["text"]
|
| 17 |
|
|
@@ -33,10 +33,10 @@ def chat(history, system_message, max_tokens, temperature, top_p, top_k, repetit
|
|
| 33 |
history = history or []
|
| 34 |
|
| 35 |
messages = BASE_SYSTEM_MESSAGE + system_message.strip() + "\n" + \
|
| 36 |
-
"\n".join(["\n".join(["User
|
| 37 |
for item in history])
|
| 38 |
# strip the last `<|end_of_turn|>` from the messages
|
| 39 |
-
messages = messages.rstrip("<|end_of_turn|>")
|
| 40 |
# remove last space from assistant, some models output a ZWSP if you leave a space
|
| 41 |
messages = messages.rstrip()
|
| 42 |
|
|
|
|
| 8 |
openai.api_base = os.environ.get("OPENAI_API_BASE")
|
| 9 |
openai.api_key = os.environ.get("OPENAI_API_KEY")
|
| 10 |
|
| 11 |
+
BASE_SYSTEM_MESSAGE = """### System Prompt\n"""
|
| 12 |
|
| 13 |
def make_prediction(prompt, max_tokens=None, temperature=None, top_p=None, top_k=None, repetition_penalty=None):
|
| 14 |
+
completion = openai.Completion.create(model="Phind/Phind-CodeLlama-34B-v2", prompt=prompt, max_tokens=max_tokens, temperature=temperature, top_p=top_p, top_k=top_k, repetition_penalty=repetition_penalty, stream=True, stop=["</s>", "<|im_end|>"])
|
| 15 |
for chunk in completion:
|
| 16 |
yield chunk["choices"][0]["text"]
|
| 17 |
|
|
|
|
| 33 |
history = history or []
|
| 34 |
|
| 35 |
messages = BASE_SYSTEM_MESSAGE + system_message.strip() + "\n" + \
|
| 36 |
+
"\n".join(["\n".join(["### User Message\n"+item[0]+"\n\n", "### Assistant\n"+item[1]+"\n\n"])
|
| 37 |
for item in history])
|
| 38 |
# strip the last `<|end_of_turn|>` from the messages
|
| 39 |
+
#messages = messages.rstrip("<|end_of_turn|>")
|
| 40 |
# remove last space from assistant, some models output a ZWSP if you leave a space
|
| 41 |
messages = messages.rstrip()
|
| 42 |
|