Spaces:

ping98k
/

LLM-Brainstorming

Sleeping

App Files Files Community

ping98k committed on Jun 25, 2025

Commit

753833c

1 Parent(s): 2584782

Update main.py

Browse files

Files changed (1) hide show

main.py +43 -29

main.py CHANGED Viewed

@@ -1,21 +1,31 @@
-import os, json
 from concurrent.futures import ThreadPoolExecutor, as_completed
 from tqdm import tqdm
 from litellm import completion
-import gradio as gr
-NUM_TOP_PICKS = int(os.getenv("NUM_TOP_PICKS", 5))
-POOL_SIZE = int(os.getenv("POOL_SIZE", 20))
-MAX_WORKERS = int(os.getenv("MAX_WORKERS", 10))
-def run_tournament(instruction_input, criteria_input):
     instruction = instruction_input.strip()
     criteria_list = [c.strip() for c in criteria_input.split(",") if c.strip()] or [
-        "Factuality",
-        "Instruction Following",
-        "Precision",
     ]
     def criteria_block():
         return "\n".join(f"{i + 1}) {c}" for i, c in enumerate(criteria_list))
@@ -24,7 +34,7 @@ def run_tournament(instruction_input, criteria_input):
         prompt = f"""Evaluate the output below on the following criteria:
 {criteria_block()}
-Return JSON exactly like: {{\"score\": [{', '.join(['1-10'] * len(criteria_list))}]}}.
 Instruction:
 {instruction}
@@ -33,7 +43,7 @@ Output:
 {player}"""
         response = completion(
             model="gpt-4o-mini",
-            messages=[{"role": "system", "content": prompt}],
         )
         return response.choices[0].message.content.strip()
@@ -49,7 +59,7 @@ Output:
         prompt = f"""Compare the two players below using:
 {criteria_block()}
-Return ONLY JSON {{\"winner\": \"A\"}} or {{\"winner\": \"B\"}}.
 Instruction:
 {instruction}
@@ -59,7 +69,7 @@ Players:
 <B>{b}</B>"""
         response = completion(
             model="gpt-4o-mini",
-            messages=[{"role": "system", "content": prompt}],
         )
         return response.choices[0].message.content.strip()
@@ -104,28 +114,28 @@ Players:
     def playoff(candidates, executor):
         wins = {p: 0 for p in candidates}
-        pairs = [
-            (candidates[i], candidates[j])
-            for i in range(len(candidates))
-            for j in range(i + 1, len(candidates))
-        ]
         futures = {executor.submit(play, a, b): (a, b) for a, b in pairs}
         for fut in tqdm(as_completed(futures), total=len(futures)):
             wins[fut.result()] += 1
         return sorted(candidates, key=lambda p: wins[p], reverse=True)
-    def get_top(players, executor, k=NUM_TOP_PICKS):
         champion, lost_to = tournament(players, executor)
         runner_up = lost_to.get(champion)
         finalists = [champion] + ([runner_up] if runner_up else [])
-        semifinalists = [p for p, o in lost_to.items() if o in finalists and p not in finalists]
-        candidates = set(finalists + semifinalists + get_candidates(champion, lost_to))
-        return playoff(list(candidates), executor)[:k]
-    all_players = [f"S{i}" for i in range(1, 10)]
-    with ThreadPoolExecutor(max_workers=MAX_WORKERS) as ex:
         scores = precompute_scores(all_players, ex)
-        top_players = sorted(all_players, key=scores.get, reverse=True)[:POOL_SIZE]
         top_k = get_top(top_players, ex)
     return ", ".join(top_k)
@@ -134,8 +144,12 @@ demo = gr.Interface(
     inputs=[
         gr.Textbox(lines=2, label="Instruction"),
         gr.Textbox(lines=1, label="Criteria (comma separated)"),
     ],
-    outputs=gr.Textbox(label="Top picks"),
 )
 if __name__ == "__main__":

+import os, json, gradio as gr
 from concurrent.futures import ThreadPoolExecutor, as_completed
 from tqdm import tqdm
 from litellm import completion
+NUM_TOP_PICKS_DEFAULT = int(os.getenv("NUM_TOP_PICKS", 5))
+POOL_SIZE_DEFAULT = int(os.getenv("POOL_SIZE", 20))
+MAX_WORKERS_DEFAULT = int(os.getenv("MAX_WORKERS", 10))
+NUM_GENERATIONS_DEFAULT = int(os.getenv("NUM_GENERATIONS", 100))
+def generate_players(instruction, n):
+    response = completion(
+        model="gpt-4o-mini",
+        messages=[{"role": "user", "content": instruction}],
+        n=n
+    )
+    return [c.message.content.strip() for c in response.choices]
+def run_tournament(instruction_input, criteria_input, n_gen,
+                   num_top_picks, pool_size, max_workers):
     instruction = instruction_input.strip()
     criteria_list = [c.strip() for c in criteria_input.split(",") if c.strip()] or [
+        "Factuality", "Instruction Following", "Precision"
     ]
+    n_gen = int(n_gen)
+    num_top_picks = int(num_top_picks)
+    pool_size = int(pool_size)
+    max_workers = int(max_workers)
     def criteria_block():
         return "\n".join(f"{i + 1}) {c}" for i, c in enumerate(criteria_list))
         prompt = f"""Evaluate the output below on the following criteria:
 {criteria_block()}
+Return JSON exactly like: {{"score": [{', '.join(['1-10'] * len(criteria_list))}]}}.
 Instruction:
 {instruction}
 {player}"""
         response = completion(
             model="gpt-4o-mini",
+            messages=[{"role": "system", "content": prompt}]
         )
         return response.choices[0].message.content.strip()
         prompt = f"""Compare the two players below using:
 {criteria_block()}
+Return ONLY JSON {{"winner": "A"}} or {{"winner": "B"}}.
 Instruction:
 {instruction}
 <B>{b}</B>"""
         response = completion(
             model="gpt-4o-mini",
+            messages=[{"role": "system", "content": prompt}]
         )
         return response.choices[0].message.content.strip()
     def playoff(candidates, executor):
         wins = {p: 0 for p in candidates}
+        pairs = [(candidates[i], candidates[j])
+                 for i in range(len(candidates))
+                 for j in range(i + 1, len(candidates))]
         futures = {executor.submit(play, a, b): (a, b) for a, b in pairs}
         for fut in tqdm(as_completed(futures), total=len(futures)):
             wins[fut.result()] += 1
         return sorted(candidates, key=lambda p: wins[p], reverse=True)
+    def get_top(players, executor):
         champion, lost_to = tournament(players, executor)
         runner_up = lost_to.get(champion)
         finalists = [champion] + ([runner_up] if runner_up else [])
+        semifinalists = [p for p, o in lost_to.items()
+                         if o in finalists and p not in finalists]
+        candidates = set(finalists + semifinalists +
+                         get_candidates(champion, lost_to))
+        return playoff(list(candidates), executor)[:num_top_picks]
+    all_players = generate_players(instruction, n_gen)
+    with ThreadPoolExecutor(max_workers=max_workers) as ex:
         scores = precompute_scores(all_players, ex)
+        top_players = sorted(all_players, key=scores.get, reverse=True)[:pool_size]
         top_k = get_top(top_players, ex)
     return ", ".join(top_k)
     inputs=[
         gr.Textbox(lines=2, label="Instruction"),
         gr.Textbox(lines=1, label="Criteria (comma separated)"),
+        gr.Number(value=NUM_GENERATIONS_DEFAULT, label="Number of Generations"),
+        gr.Number(value=NUM_TOP_PICKS_DEFAULT, label="Top Picks (k)"),
+        gr.Number(value=POOL_SIZE_DEFAULT, label="Pool Size"),
+        gr.Number(value=MAX_WORKERS_DEFAULT, label="Max Workers")
     ],
+    outputs=gr.Textbox(label="Top picks")
 )
 if __name__ == "__main__":