Update app.py
app.py CHANGED
@@ -24,57 +24,6 @@ def generate_conversation_id():
     return str(uuid.uuid4())[:8]
 
 
-'''def generate_response(user_message, max_tokens, temperature, top_p, history_state):
-    if not user_message.strip():
-        return history_state, history_state
-
-    start_tag = "<|im_start|>"
-    sep_tag = "<|im_sep|>"
-    end_tag = "<|im_end|>"
-
-    system_message = "Your role as an assistant..."
-    messages = [{"role": "system", "content": system_message}]
-    for message in history_state:
-        messages.append({"role": message["role"], "content": message["content"]})
-    messages.append({"role": "user", "content": user_message})
-
-    try:
-        response = client.chat.completions.create(
-            model="tgi",
-            messages=messages,
-            max_tokens=int(max_tokens),
-            temperature=temperature,
-            top_p=top_p,
-            stream=True,
-            extra_body={"max_new_tokens": int(max_tokens)}
-        )
-    except Exception as e:
-        print(f"[ERROR] OpenAI API call failed: {e}")
-        yield history_state + [{"role": "user", "content": user_message},
-                               {"role": "assistant", "content": "⚠️ Generation failed."}], history_state
-        return
-
-    assistant_response = ""
-    new_history = history_state + [
-        {"role": "user", "content": user_message},
-        {"role": "assistant", "content": ""}
-    ]
-
-    try:
-        for chunk in response:
-            if not chunk.choices or not chunk.choices[0].delta or not chunk.choices[0].delta.content:
-                continue
-            token = chunk.choices[0].delta.content
-            assistant_response += token
-            new_history[-1]["content"] = assistant_response.strip()
-            yield new_history, new_history
-    except Exception:
-        pass
-
-    yield new_history, new_history'''
-
-
 import tiktoken
 enc = tiktoken.encoding_for_model("gpt-3.5-turbo")  # any OpenAI encoding works
 
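Side note on the two lines added above: the tiktoken encoder is presumably used later in app.py to count prompt tokens before calling the backend. A minimal sketch of that usage, assuming a token-counting helper (the count_tokens name is hypothetical, not part of this commit):

    import tiktoken

    enc = tiktoken.encoding_for_model("gpt-3.5-turbo")  # any OpenAI encoding works

    def count_tokens(text: str) -> int:
        # encode() maps the string to a list of token ids; its length is the token count
        return len(enc.encode(text))

    print(count_tokens("Hello, world!"))  # -> 4 with this encoding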
@@ -272,4 +221,14 @@ with gr.Blocks(theme=gr.themes.Soft()) as demo:
     example3_button.click(fn=lambda: gr.update(value=example_messages["JEE Main 2025 Probability & Statistics"]), inputs=None, outputs=user_input)
     example4_button.click(fn=lambda: gr.update(value=example_messages["JEE Main 2025 Laws of Motion"]), inputs=None, outputs=user_input)
 
-demo.launch(share=True, ssr_mode=False)
+#demo.launch(share=True, ssr_mode=False)
+
+if __name__ == "__main__":
+    demo.queue(               # turn the queue on
+        concurrency_count=8,  # how many jobs run simultaneously
+        max_size=40,          # 40-8 = 32 jobs can wait in line
+        api_open=False        # no public /queue/status endpoint
+    ).launch(
+        share=True,
+        ssr_mode=False
+    )
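One compatibility note on the queue settings: concurrency_count is the Gradio 3.x parameter name; Gradio 4 removed it from queue() in favor of default_concurrency_limit. If this Space is ever bumped to Gradio 4, the equivalent launch block would look roughly like this (same 8-worker / 40-slot intent assumed, not verified against this app):

    if __name__ == "__main__":
        demo.queue(
            default_concurrency_limit=8,  # Gradio 4.x replacement for concurrency_count
            max_size=40,                  # queue holds at most 40 pending events
            api_open=False                # keep the queue endpoints private
        ).launch(share=True, ssr_mode=False)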