Commit
·
3247c3a
1
Parent(s):
b748e45
testing num return sequences
Browse files
README.md
CHANGED
|
@@ -5,7 +5,7 @@ colorFrom: gray
|
|
| 5 |
colorTo: purple
|
| 6 |
sdk: gradio
|
| 7 |
sdk_version: 3.37.0
|
| 8 |
-
app_file: app
|
| 9 |
pinned: true
|
| 10 |
license: bigcode-openrail-m
|
| 11 |
tags:
|
|
|
|
| 5 |
colorTo: purple
|
| 6 |
sdk: gradio
|
| 7 |
sdk_version: 3.37.0
|
| 8 |
+
app_file: app.py
|
| 9 |
pinned: true
|
| 10 |
license: bigcode-openrail-m
|
| 11 |
tags:
|
app.py
CHANGED
|
@@ -139,7 +139,7 @@ def generate(input_message: str, db_info="", temperature=0.2, top_p=0.9, top_k=0
|
|
| 139 |
|
| 140 |
input_ids = tok(messages, return_tensors="pt").input_ids
|
| 141 |
input_ids = input_ids.to(m.device)
|
| 142 |
-
streamer = TextIteratorStreamer(tok, timeout=1000.0, skip_prompt=True, skip_special_tokens=True)
|
| 143 |
generate_kwargs = dict(
|
| 144 |
input_ids=input_ids,
|
| 145 |
max_new_tokens=max_new_tokens,
|
|
@@ -147,27 +147,36 @@ def generate(input_message: str, db_info="", temperature=0.2, top_p=0.9, top_k=0
|
|
| 147 |
top_p=top_p,
|
| 148 |
top_k=top_k,
|
| 149 |
repetition_penalty=repetition_penalty,
|
| 150 |
-
streamer=streamer,
|
| 151 |
stopping_criteria=StoppingCriteriaList([stop]),
|
| 152 |
num_return_sequences=num_return_sequences,
|
| 153 |
num_beams=num_beams,
|
| 154 |
do_sample=do_sample,
|
| 155 |
)
|
| 156 |
|
| 157 |
-
stream_complete = Event()
|
| 158 |
|
| 159 |
-
def generate_and_signal_complete():
|
| 160 |
-
|
| 161 |
-
|
| 162 |
|
| 163 |
-
t1 = Thread(target=generate_and_signal_complete)
|
| 164 |
-
t1.start()
|
| 165 |
|
| 166 |
-
|
| 167 |
-
for new_text in streamer:
|
| 168 |
-
partial_text += new_text
|
| 169 |
|
| 170 |
-
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 171 |
|
| 172 |
if log:
|
| 173 |
# Log the request to Firestore
|
|
|
|
| 139 |
|
| 140 |
input_ids = tok(messages, return_tensors="pt").input_ids
|
| 141 |
input_ids = input_ids.to(m.device)
|
| 142 |
+
#streamer = TextIteratorStreamer(tok, timeout=1000.0, skip_prompt=True, skip_special_tokens=True)
|
| 143 |
generate_kwargs = dict(
|
| 144 |
input_ids=input_ids,
|
| 145 |
max_new_tokens=max_new_tokens,
|
|
|
|
| 147 |
top_p=top_p,
|
| 148 |
top_k=top_k,
|
| 149 |
repetition_penalty=repetition_penalty,
|
| 150 |
+
#streamer=streamer,
|
| 151 |
stopping_criteria=StoppingCriteriaList([stop]),
|
| 152 |
num_return_sequences=num_return_sequences,
|
| 153 |
num_beams=num_beams,
|
| 154 |
do_sample=do_sample,
|
| 155 |
)
|
| 156 |
|
| 157 |
+
#stream_complete = Event()
|
| 158 |
|
| 159 |
+
# def generate_and_signal_complete():
|
| 160 |
+
# m.generate(**generate_kwargs)
|
| 161 |
+
# stream_complete.set()
|
| 162 |
|
| 163 |
+
# t1 = Thread(target=generate_and_signal_complete)
|
| 164 |
+
# t1.start()
|
| 165 |
|
| 166 |
+
tokens = m.generate(**generate_kwargs)
|
|
|
|
|
|
|
| 167 |
|
| 168 |
+
responses = []
|
| 169 |
+
for response in tokens:
|
| 170 |
+
response_text = tok.decode(response, skip_special_tokens=True)
|
| 171 |
+
|
| 172 |
+
# Only take what comes after ### Response:
|
| 173 |
+
response_text = response_text.split("### Response:")[1].strip()
|
| 174 |
+
|
| 175 |
+
formatted_text = format(response_text) if format_sql else response_text
|
| 176 |
+
responses.append(formatted_text)
|
| 177 |
+
|
| 178 |
+
# Concat responses to be a single string separated by a newline
|
| 179 |
+
output = "\n".join(responses)
|
| 180 |
|
| 181 |
if log:
|
| 182 |
# Log the request to Firestore
|