Spaces:
Sleeping
Sleeping
File size: 3,638 Bytes
c361120 46b4ec1 3079076 c361120 3079076 9696916 3079076 223064e 3079076 9696916 3079076 5a6dbf1 c361120 3079076 9696916 9c3f222 3079076 46b4ec1 3079076 c361120 46b4ec1 3079076 9696916 3079076 c361120 9696916 c361120 3079076 9696916 5636348 3079076 5636348 3079076 6518aba 5636348 c361120 5636348 3079076 5636348 3079076 5636348 c361120 5636348 3079076 5636348 3079076 5636348 c361120 9696916 |
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24 25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48 49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65 66 67 68 69 70 71 72 73 74 75 76 77 78 79 80 81 82 83 84 85 86 87 88 89 90 91 92 93 94 95 96 97 98 99 100 101 102 103 104 105 106 107 |
import gradio as gr
from transformers import AutoTokenizer, AutoModelForCausalLM
from peft import PeftModel
import torch
# --- Load tokenizer, base model, and LoRA adapter for CPU-only inference ---
BASE_MODEL_ID = "unsloth/Qwen3-1.7B"
ADAPTER_ID = "khazarai/BioGenesis-ToT"

tokenizer = AutoTokenizer.from_pretrained(BASE_MODEL_ID)

# Full-precision float32 weights pinned to CPU (this Space has no GPU; the
# fine-tune itself ran in float16 on GPU, per the note shown in the UI).
base_model = AutoModelForCausalLM.from_pretrained(
    BASE_MODEL_ID,
    dtype=torch.float32,
    device_map={"": "cpu"},
)

# Stack the fine-tuned PEFT adapter on top of the frozen base weights.
model = PeftModel.from_pretrained(base_model, ADAPTER_ID).to("cpu")
# --- Chatbot logic ---
def _history_pairs(chat_history):
    """Convert a {'role','content'} message list into the (user, assistant)
    tuple pairs that gr.Chatbot renders.

    Pairs each user message with the message that immediately follows it;
    assumes the history alternates user/assistant as built by
    generate_response.
    """
    return [
        (msg["content"], chat_history[i + 1]["content"])
        for i, msg in enumerate(chat_history[:-1])
        if msg["role"] == "user"
    ]


def generate_response(user_input, chat_history):
    """Run one chat turn: append the user message, sample a reply, append it.

    Parameters
    ----------
    user_input : str
        Raw textbox contents; blank/whitespace-only input is a no-op.
    chat_history : list[dict]
        Mutable {'role','content'} message history held in gr.State;
        mutated in place.

    Returns
    -------
    tuple[list[tuple[str, str]], list[dict]]
        (chatbot display pairs, updated message history).
    """
    # No-op on blank input, but still return the *pair* format for the
    # Chatbot component. (Bug fix: the original returned the raw dict
    # history here, which is not what gr.Chatbot renders.)
    if not user_input.strip():
        return _history_pairs(chat_history), chat_history

    chat_history.append({"role": "user", "content": user_input})

    # Serialize the whole conversation through the model's chat template,
    # leaving the generation prompt open for the assistant turn.
    text = tokenizer.apply_chat_template(
        chat_history,
        tokenize=False,
        add_generation_prompt=True,
        enable_thinking=True,
    )
    inputs = tokenizer(text, return_tensors="pt").to("cpu")

    output_tokens = model.generate(
        **inputs,
        max_new_tokens=2200,
        temperature=0.6,
        top_p=0.95,
        top_k=20,
        do_sample=True,
    )

    # Decode only the newly generated tokens. (Bug fix: the original decoded
    # the full sequence and split on `user_input`, which breaks whenever the
    # user's text reappears in the reply or in the templated prompt.)
    prompt_len = inputs["input_ids"].shape[1]
    response = tokenizer.decode(
        output_tokens[0][prompt_len:], skip_special_tokens=True
    ).strip()

    chat_history.append({"role": "assistant", "content": response})
    return _history_pairs(chat_history), chat_history
# --- UI Design ---
with gr.Blocks(theme=gr.themes.Soft(primary_hue="emerald", secondary_hue="slate")) as demo:
    # Page header banner.
    gr.HTML("""
    <div style="text-align: center; margin-bottom: 20px;">
        <h1 style="font-family: 'Inter', sans-serif; font-weight: 800; color: #047857; font-size: 2.2em;">
            🧬 BioGenesis-ToT Chatbot
        </h1>
        <p style="color: #4B5563; font-size: 1.05em; margin-top: -10px;">
            Your AI companion for biology, biochemistry, and life sciences.
        </p>
        <p style="color: #4B5563; font-size: 1.05em; margin-top: -10px;">
            NOTE: The model's answers may be shorter or slightly different because this instance runs on CPU using float32, unlike the GPU float16 setup used during fine-tuning.
        </p>
    </div>
    """)

    with gr.Row():
        with gr.Column(scale=6):
            chatbot = gr.Chatbot(
                label="BioGenesis Chat",
                height=600,
                # NOTE(review): bubble_full_width is deprecated/removed in
                # recent Gradio releases — confirm the pinned version.
                bubble_full_width=True,
                show_copy_button=True,
                avatar_images=(
                    "https://cdn-icons-png.flaticon.com/512/1077/1077012.png",  # user icon
                    "https://cdn-icons-png.flaticon.com/512/4140/4140048.png",  # bot icon
                ),
            )
            user_input = gr.Textbox(
                placeholder="Ask me about cell biology, molecular structure, or biochemistry...",
                label="💬 Your question",
                lines=3,
                autofocus=True,
            )
            with gr.Row():
                send_btn = gr.Button("🚀 Send", variant="primary")
                clear_btn = gr.Button("🧹 Clear Chat")

    # Conversation history in {'role','content'} dict form, shared by all callbacks.
    state = gr.State([])

    # Button click and textbox Enter both route through the same handler.
    send_btn.click(generate_response, [user_input, state], [chatbot, state])
    user_input.submit(generate_response, [user_input, state], [chatbot, state])
    # Reset both the rendered chat and the stored history.
    clear_btn.click(lambda: ([], []), None, [chatbot, state])

    # Footer credit line.
    gr.HTML("""
    <div style="text-align: center; margin-top: 25px; color: #6B7280; font-size: 0.9em;">
        Powered by <b>Qwen3-1.7B + BioGenesis-ToT</b> | Built with ❤️ using Gradio
    </div>
    """)

demo.launch(share=True)