# OIC
#
# Runtime error
#
# File size: 46,348 Bytes

# -*- coding: utf-8 -*-
import gradio as gr 
import requests 
import json 
import os 
import datetime 
import textwrap 
import random 
import threading
import webbrowser 
import shutil 
import time

# ========================================================= 
# --- VERSIONING --- 
# =========================================================
# Client version string; interpolated into the Gradio page title and the hidden heading.
VERSION = "1.0h"  # v1.0h: CRITICAL SPACING FIX: Replaced restrictive .isalnum() space re-insertion logic to correctly add spaces after punctuation marks when followed by a word token.

# ========================================================= 
# --- CONFIGURATION & DATA PERSISTENCE --- 
# ========================================================= 
# JSON file holding all presets plus the name of the last-used preset.
SETTINGS_FILE = "openrouter_settings.json"
# JSON file holding the list of saved chat sessions.
HISTORY_FILE = "openrouter_history.json"
# Model identifier used by DEFAULT_SETTINGS.
DEFAULT_MODEL = "deepseek/deepseek-chat-v3.1:free"
# Default number of rolling settings backups (<file>.b1 .. <file>.bN) kept by create_rolling_backup.
MAX_BACKUPS = 5 

# Baseline preset. Also the source of keys/values used to back-fill presets
# that are missing entries when settings are loaded.
DEFAULT_SETTINGS = {
    "api_key": "",
    "system_prompt": "You are a helpful, creative, and friendly AI assistant running on an Android device.",
    "model": DEFAULT_MODEL,
    "temperature": 0.7,
    # Stored and shown in the settings form; call_openrouter_api does not send this value.
    "max_tokens": 1024,
    # Sent to the API as "max_tokens" only when greater than 0.
    "response_tokens": 0,
    "top_p": 0.9,
    "frequency_penalty": 0.0,
    "presence_penalty": 0.0,
    # Stored only; call_openrouter_api always requests a streamed response first.
    "stream": True,
    # The values below are "disabled" sentinels: call_openrouter_api omits
    # top_k == 0, min_p/top_a == 0.0, repetition_penalty == 1.0 and seed == -1
    # from the request payload.
    "top_k": 0,
    "min_p": 0.0,
    "top_a": 0.0,
    "repetition_penalty": 1.0,
    "seed": -1
}

# Template copied by create_new_preset when the user creates a new preset.
NEW_PRESET_SETTINGS = {
    # A single space: call_openrouter_api strips the key, so this counts as "not set".
    "api_key": " ",
    "system_prompt": "You are a helpful assistant.",
    "model": "cognitivecomputations/dolphin-mistral-24b-venice-edition:free",
    "temperature": 1.05,
    "max_tokens": 0,
    # Sent to the API as "max_tokens" because it is greater than 0.
    "response_tokens": 2272,
    "top_p": 0.65,
    "frequency_penalty": 0.0,
    "presence_penalty": 0.0,
    "stream": True,
    "top_k": 0,
    "min_p": 0.0,
    "top_a": 0.0,
    # Differs from the 1.0 sentinel, so it is included in the request payload.
    "repetition_penalty": 1.39,
    "seed": -1
}

# =========================================================
# --- Globals for incremental logging (in-memory only) ---
# =========================================================
# Number of sanitized turns written by the most recent save_current_session call.
last_logged_index = 0
# Name of the history entry the live chat is being saved into (None = no active session).
active_session_name = None
# Wall-clock time of the last save performed by chat_interface.
_last_save_time = 0.0
# NOTE(review): not referenced in the visible part of the file; presumably a
# minimum interval (seconds) between saves -- confirm against the rest of the file.
_save_interval = 0.5 

def load_data(file_path, default_data=None):
    """Load JSON from ``file_path``, falling back to ``default_data``.

    The type of ``default_data`` selects the expected shape of the file:

    * list default (history file): a JSON list is returned as-is, a JSON
      object holding a list under ``"history"`` is unwrapped, and anything
      else yields the default.
    * any other default (settings file): a JSON object is returned after each
      preset dict under ``"presets"`` has been back-filled with the keys it is
      missing relative to ``DEFAULT_SETTINGS``; anything else yields the
      default.

    Args:
        file_path: Path of the JSON file to read.
        default_data: Value returned when the file is missing, unreadable,
            not valid JSON, or of an unexpected shape. ``None`` means ``{}``.

    Returns:
        The parsed (and, for settings, back-filled) data, or ``default_data``.
    """
    if default_data is None:
        default_data = {}

    if not os.path.exists(file_path):
        return default_data

    try:
        with open(file_path, "r", encoding="utf-8") as f:
            data = json.load(f)
    except (ValueError, OSError):
        # ValueError covers json.JSONDecodeError and undecodable bytes.
        print(f"Warning: Could not parse {file_path}, using default.")
        return default_data

    if isinstance(default_data, list):
        if isinstance(data, list):
            return data
        if isinstance(data, dict) and isinstance(data.get("history"), list):
            return data["history"]
        return default_data

    if not isinstance(data, dict):
        return default_data

    # Back-fill missing keys; malformed "presets" structures are left untouched
    # here so the caller's own structure check can replace them.
    presets = data.get("presets")
    if isinstance(presets, dict):
        for preset in presets.values():
            if not isinstance(preset, dict):
                continue
            for key, default_val in DEFAULT_SETTINGS.items():
                preset.setdefault(key, default_val)
    return data

def save_data(file_path, data):
    """Write ``data`` to ``file_path`` as indented, non-ASCII-preserving JSON.

    I/O failures are reported on stdout and otherwise ignored.
    """
    try:
        with open(file_path, "w", encoding="utf-8") as out_file:
            json.dump(
                data,
                out_file,
                indent=4,
                ensure_ascii=False,
            )
    except IOError as err:
        print(f"Error saving {file_path}: {err}")

def create_rolling_backup(file_path, max_backups=MAX_BACKUPS):
    """Rotate ``<file_path>.b1 .. .bN`` and copy the current file into ``.b1``.

    Does nothing when ``file_path`` does not exist. The oldest slot
    (``.b<max_backups>``) is deleted, every remaining slot is shifted up by
    one, and the live file is then copied into slot 1.
    """
    if not os.path.exists(file_path):
        return

    def slot(number):
        return f"{file_path}.b{number}"

    # Drop the oldest backup so the shift below has a free target.
    if os.path.exists(slot(max_backups)):
        os.remove(slot(max_backups))

    # Shift from the highest remaining slot downwards so nothing is overwritten.
    for number in reversed(range(1, max_backups)):
        src, dst = slot(number), slot(number + 1)
        if not os.path.exists(src):
            continue
        try:
            os.rename(src, dst)
        except OSError as e:
            print(f"Warning: Could not rename {src} to {dst}: {e}")

    newest_backup = slot(1)
    try:
        shutil.copy2(file_path, newest_backup)
        print(f"Settings backed up to {newest_backup}")
    except IOError as e:
        print(f"Error creating backup {newest_backup}: {e}")

def save_settings_to_disk(file_path, data):
    """Rotate the backups of ``file_path``, then overwrite it with ``data`` as JSON.

    Write failures are reported on stdout and otherwise ignored.
    """
    create_rolling_backup(file_path)
    try:
        with open(file_path, "w", encoding="utf-8") as settings_file:
            json.dump(data, settings_file, indent=4)
    except IOError as err:
        print(f"Error saving {file_path}: {err}")

# Settings container: read from disk, or a single "Default" preset when no usable file exists
all_settings = load_data(
    SETTINGS_FILE,
    {"presets": {"Default": DEFAULT_SETTINGS}, "last_preset_name": "Default"},
)

# Structure guard: anything without a dict under "presets" is replaced wholesale
if not ("presets" in all_settings and isinstance(all_settings["presets"], dict)):
    all_settings = {"presets": {"Default": DEFAULT_SETTINGS}, "last_preset_name": "Default"}

# Saved chat sessions (list of {"name", "history"} entries)
chat_history = load_data(HISTORY_FILE, [])
if not isinstance(chat_history, list):
    chat_history = []

# Working copy of the most recently used preset
last_preset_name = all_settings.get("last_preset_name", "Default")
current_settings = all_settings["presets"].get(last_preset_name, DEFAULT_SETTINGS).copy()

# ========================================================= 
# --- Stop control (thread-safe) ---
# =========================================================
# Set by set_stop_event; polled once per received line by call_openrouter_api
# and cleared at the start of chat_interface.
stop_event = threading.Event()

def quit_app():
    """Schedule process termination and return the UI updates to show first.

    The process is ended with ``os._exit(0)`` from a timer thread 0.1 s after
    this call, so the handler has a chance to return its response.

    Returns:
        A 2-tuple of component updates: one that makes the shutdown message
        visible, and one that disables a component.
    """
    print("Quitting application...")
    # Exit after a slight delay to allow the server to send the response.
    threading.Timer(0.1, os._exit, args=[0]).start()
    # Component-level ``gr.Markdown.update`` no longer exists in Gradio 4+
    # (which this file requires for ``gr.Chatbot(type='messages')``); use the
    # generic ``gr.update`` like the rest of the file.
    return gr.update(value="ðŸ‘‹ Shutting down...", visible=True), gr.update(interactive=False)

# ========================================================= 
# --- OPENROUTER API INTERACTION (STREAMING & FALLBACK) --- 
# ========================================================= 

def call_openrouter_api(messages, settings):
    """Stream a chat completion from OpenRouter, yielding text chunks.

    The request is first made with ``stream=True``. If the stream ends without
    producing any content, the same payload is re-sent once as a non-streaming
    request and its content is yielded as a single chunk. The
    ``<|begin of sentence|>`` marker (both spellings listed below) is removed
    from all content.

    Failures are not raised; they are yielded as strings starting with
    ``ERROR:``, ``STREAM ERROR:`` or one of the symbol prefixes used below,
    and a stop request is reported with the "Inference stopped" message.

    Args:
        messages: List of ``{"role", "content"}`` dicts sent as the conversation.
        settings: Preset dict (see ``DEFAULT_SETTINGS`` for the keys read here).

    Yields:
        Content chunks, or a single error/stop message.
    """
    # ``or ""`` keeps a missing or None key from raising AttributeError.
    api_key = (settings.get("api_key") or "").strip()
    if not api_key:
        yield "ERROR: API Key not set in Settings."
        return

    url = "https://openrouter.ai/api/v1/chat/completions"

    try:
        payload = {
            "model": settings["model"],
            "messages": messages,
            "temperature": float(settings.get("temperature", 0.7)),
            "top_p": float(settings.get("top_p", 0.9)),
            "frequency_penalty": float(settings.get("frequency_penalty", 0.0)),
            "presence_penalty": float(settings.get("presence_penalty", 0.0)),
            "stream": True,
        }

        # Only cap the response length when the user asked for a cap.
        response_tokens = int(settings.get("response_tokens", 0))
        if response_tokens > 0:
            payload["max_tokens"] = response_tokens

        # Optional samplers are omitted while they hold their "disabled" value.
        for k in ["top_k", "min_p", "top_a", "repetition_penalty", "seed"]:
            v = settings.get(k)
            if v is not None:
                if k == "top_k" and int(v) == 0: continue
                if k in ("min_p", "top_a") and float(v) == 0.0: continue
                if k == "repetition_penalty" and float(v) == 1.0: continue
                if k == "seed" and int(v) == -1: continue
                payload[k] = v

    except (KeyError, TypeError, ValueError) as e:
        # KeyError: no "model"; TypeError: e.g. float(None); ValueError: bad text.
        yield f"ERROR: Invalid setting type. {e}"
        return

    headers = {
        "Authorization": f"Bearer {api_key}",
        "Content-Type": "application/json"
    }

    # Filter tokens (v1.0a: half-width, v1.0g: full-width)
    TOKEN_TO_FILTER_HALF = "<|begin of sentence|>"
    TOKEN_TO_FILTER_FULL = "<ï½œbegin of sentenceï½œ>"

    try:
        got_content = False

        # The context manager releases the streamed connection on every exit
        # path, including the early returns below.
        with requests.post(url, headers=headers, json=payload, stream=True, timeout=60) as response:
            if response.status_code != 200:
                try:
                    msg = response.json().get('error', {}).get('message', response.text)
                except Exception:
                    msg = response.text
                yield f"âŒ API request failed ({response.status_code}): {msg}"
                return

            for line_bytes in response.iter_lines():
                if stop_event.is_set():
                    yield "â›” Inference stopped by user."
                    return

                if not line_bytes:
                    continue

                try:
                    line = line_bytes.decode('utf-8')
                except UnicodeDecodeError:
                    print("Warning: Failed to decode a line from API stream.")
                    continue

                if line.startswith("data:"):
                    data_str = line[len("data:"):].strip()
                    if data_str == "[DONE]":
                        break

                    try:
                        chunk = json.loads(data_str)
                    except Exception:
                        # Non-JSON data lines are skipped.
                        continue

                    choices = chunk.get("choices", [])
                    if not choices:
                        continue

                    choice0 = choices[0]
                    delta = choice0.get("delta", {})
                    content = delta.get("content")

                    if content:
                        content = content.replace(TOKEN_TO_FILTER_FULL, "").replace(TOKEN_TO_FILTER_HALF, "")

                        # Strip leading whitespace potentially left by token removal.
                        content = content.lstrip()

                        if content:  # Anything left after filtering?
                            got_content = True
                            yield content

                    if choice0.get("finish_reason") is not None:
                        break

                elif line.startswith("event: error"):
                    try:
                        errdata = json.loads(line[len("event: error"):].strip())
                        yield f"STREAM ERROR: {errdata.get('message', 'Unknown Stream Error')}"
                    except Exception:
                        yield "STREAM ERROR: unknown"
                    return

        if not got_content:
            # Silent fallback to non-streaming
            payload["stream"] = False
            try:
                r2 = requests.post(url, headers=headers, json=payload, timeout=60)
                if r2.status_code == 200:
                    j = r2.json()
                    content = None
                    choices = j.get("choices", [])
                    if choices:
                        first = choices[0]
                        if isinstance(first.get("message"), dict):
                            content = first["message"].get("content")
                        elif "text" in first:
                            content = first.get("text")
                        elif isinstance(first.get("delta"), dict):
                            content = first["delta"].get("content")

                    if content:
                        content = content.replace(TOKEN_TO_FILTER_FULL, "").replace(TOKEN_TO_FILTER_HALF, "")

                        # Strip leading/trailing whitespace
                        content = content.strip()

                        if content:  # Anything left after stripping?
                            yield content
                    else:
                        yield "âš ï¸ No content received from fallback response."

                else:
                    yield f"âŒ Fallback failed ({r2.status_code}): {r2.text}"

            except requests.exceptions.RequestException as e:
                yield f"âŒ Fallback request error: {e}"

    except requests.exceptions.RequestException as e:
        yield f"âŒ Request error: {e}"
    except Exception as e:
        yield f"ðŸ’¥ Unexpected error: {e}"


# ========================================================= 
# --- CHAT FUNCTIONALITY & STATE MANAGEMENT --- 
# ========================================================= 

# Helper function to convert Gradio's old list-of-tuples history to new messages format
def convert_to_messages_format(history):
    """Flatten ``(user, assistant)`` pairs into a list of role/content dicts.

    Empty or ``None`` sides of a pair are skipped; order is preserved, with
    the user entry of each pair preceding its assistant entry.
    """
    messages = []
    for turn in history:
        user_text, assistant_text = turn
        for role, text in (("user", user_text), ("assistant", assistant_text)):
            if text:
                messages.append({"role": role, "content": text})
    return messages

def chat_interface(user_input, history_state):
    """Handle one chat submission, streaming the reply into the UI.

    Args:
        user_input: Text typed by the user.
        history_state: List of ``[user_msg, bot_msg]`` pairs; mutated in place.

    Yields:
        3-tuples of (history in messages format for the chatbot, the pair-list
        state, an update for the input box). The input box is disabled while a
        reply is being streamed and re-enabled on every terminal path.
    """
    global current_settings, _last_save_time

    # A stop request left over from a previous run must not cancel this one.
    if stop_event.is_set():
        stop_event.clear()

    if not user_input.strip():
        # Nothing to send: echo the current state back and keep the input usable.
        yield convert_to_messages_format(history_state), history_state, gr.update(interactive=True)
        return

    # Add user message to the internal list-of-pairs state
    history_state.append([user_input, None])

    # 1. Save the user message immediately, before waiting on the network.
    save_current_session(history_state)
    _last_save_time = time.time()

    # Show the user message, clear the input box and disable it.
    yield convert_to_messages_format(history_state), history_state, gr.update(value="", interactive=False)

    # Build the API conversation: system prompt, earlier turns, then the new message.
    messages = [{"role": "system", "content": current_settings["system_prompt"]}]

    for user_msg, bot_msg in history_state[:-1]:
        if user_msg: messages.append({"role": "user", "content": user_msg})
        if bot_msg: messages.append({"role": "assistant", "content": bot_msg})

    messages.append({"role": "user", "content": user_input})

    # Prefixes of the failure messages yielded by call_openrouter_api.
    # "STREAM ERROR:" is listed explicitly because it does not start with "ERROR:".
    error_prefixes = ("ERROR:", "STREAM ERROR:", "âŒ", "ðŸ’¥")

    full_reply = ""
    for chunk in call_openrouter_api(messages, current_settings):
        is_text = isinstance(chunk, str)

        if is_text and chunk.startswith(error_prefixes):
            # Keep any partial reply and append the error below it.
            full_reply += ("\n\n" + chunk) if full_reply else chunk
            history_state[-1][1] = full_reply
            save_current_session(history_state)
            yield convert_to_messages_format(history_state), history_state, gr.update(interactive=True)
            return

        if is_text and chunk.startswith("â›” Inference stopped"):
            full_reply += "\n\n*(Inference stopped)*"
            history_state[-1][1] = full_reply
            save_current_session(history_state)
            yield convert_to_messages_format(history_state), history_state, gr.update(interactive=True)
            return

        # Chunks arrive with leading whitespace stripped, so re-insert a space
        # when the reply does not end in one and the chunk starts with a letter
        # or digit.
        if full_reply and chunk:
            if full_reply[-1] != ' ' and chunk[0].isalnum():
                full_reply += " " + chunk
            else:
                full_reply += chunk
        else:
            full_reply += chunk  # Handles the very first chunk

        history_state[-1][1] = full_reply

        # Push the partial reply to the UI; input stays disabled while streaming.
        yield convert_to_messages_format(history_state), history_state, gr.update(interactive=False)

    # 2. Final save of the completed assistant message.
    history_state[-1][1] = full_reply
    save_current_session(history_state)
    _last_save_time = time.time()

    # Send the final state and re-enable the input box.
    yield convert_to_messages_format(history_state), history_state, gr.update(interactive=True)


def save_current_session(history):
    """Persist the live chat into the history file, updating the active entry.

    Turns without a user message are dropped and missing bot replies are
    stored as ``*(Incomplete Response)*``. The live chat is treated as a
    continuation of the last stored session when that session is the active
    one, or when its stored turns are a prefix of the live turns; otherwise a
    new session named ``"<timestamp> - <first user message, shortened>"`` is
    appended.

    Args:
        history: List of ``[user_msg, bot_msg]`` pairs for the live chat.
    """
    global chat_history, last_logged_index, active_session_name

    if not history or not any(user_msg for user_msg, _ in history):
        return

    sanitized = [
        [user_msg, bot_msg if bot_msg else "*(Incomplete Response)*"]
        for user_msg, bot_msg in history if user_msg
    ]

    is_continuation = False
    last_entry = chat_history[-1] if chat_history else None

    if last_entry:
        if active_session_name and active_session_name == last_entry.get("name"):
            is_continuation = True
        else:
            # Adopt the last stored session when it is a prefix of the live chat.
            existing_hist = last_entry.get("history", [])
            if len(existing_hist) <= len(sanitized) and existing_hist == sanitized[:len(existing_hist)]:
                active_session_name = last_entry.get("name")
                last_logged_index = len(existing_hist)
                is_continuation = True

    if is_continuation and last_entry:
        updated_history = last_entry.get("history", []).copy()

        # Case 1: same length -> the last turn was completed/changed; replace it.
        if len(sanitized) == len(updated_history) and len(sanitized) > 0:
            updated_history[-1] = sanitized[-1]

        # Case 2: live chat is longer -> append only the new turns.
        elif len(sanitized) > len(updated_history):
            start_idx = len(updated_history)
            novel_portion = sanitized[start_idx:]
            updated_history.extend(novel_portion)

        # NOTE(review): a live chat shorter than the stored one leaves the
        # stored turns unchanged -- confirm that is intended.

        chat_history[-1] = {"name": last_entry.get("name"), "history": updated_history}
        save_data(HISTORY_FILE, chat_history)

        last_logged_index = len(sanitized)

    else:
        # Name the session after the first turn that has a user message;
        # history[0][0] may be None/empty, which textwrap.shorten cannot handle.
        first_message = sanitized[0][0]
        name_base = textwrap.shorten(first_message, width=30, placeholder="...")
        proposed_name = f"{datetime.datetime.now().strftime('%Y-%m-%d %H:%M:%S')} - {name_base}"

        chat_history.append({"name": proposed_name, "history": sanitized})
        save_data(HISTORY_FILE, chat_history)

        active_session_name = proposed_name
        last_logged_index = len(sanitized)


def new_chat(history):
    """Save the current chat (if any) and start an empty one.

    Resets the incremental-logging globals and returns two empty lists: one
    for the chatbot display and one for the pair-list state.
    """
    global last_logged_index, active_session_name

    if history:
        save_current_session(history)

    last_logged_index, active_session_name = 0, None

    cleared_display, cleared_state = [], []
    return cleared_display, cleared_state

def get_history_names():
    """Return the names of all stored chat sessions, in stored order."""
    names = []
    for session in chat_history:
        names.append(session["name"])
    return names

def load_history_session(name):
    """Return the named session in messages format, or ``[]`` if absent.

    ``None`` (nothing selected) also yields an empty list.
    """
    if name is not None:
        for entry in chat_history:
            if entry["name"] != name:
                continue
            # Stored as pairs; the display expects role/content dicts.
            return convert_to_messages_format(entry["history"])
    return []

def refresh_history_dropdown(history):
    """Build a dropdown update listing all session names with no selection.

    ``history`` is accepted for event wiring but not used.
    """
    session_names = get_history_names()
    return gr.update(choices=session_names, value=None)

def set_stop_event():
    """Signal the streaming loop to stop by setting ``stop_event``."""
    stop_event.set()

def clear_history_log():
    """Back up the history file, then clear history on disk and in memory.

    The history file is copied to ``<HISTORY_FILE>.<timestamp>.ahv`` before it
    is removed. If that backup copy fails, nothing is cleared, so that a later
    save cannot overwrite the only copy of the log.

    Returns:
        A 5-tuple for the UI: history display value, two history-dropdown
        updates, a status message, and a preset-dropdown update.
    """
    global chat_history, last_logged_index, active_session_name

    message = "History log already clear."

    if os.path.exists(HISTORY_FILE):
        timestamp = datetime.datetime.now().strftime('%Y%m%d_%H%M%S')
        backup_file = f"{HISTORY_FILE}.{timestamp}.ahv"

        try:
            shutil.copy2(HISTORY_FILE, backup_file)
        except OSError as e:
            # No backup exists: leave the file, the in-memory history and the
            # UI untouched (an argument-less gr.update() changes nothing).
            return (
                gr.update(),
                gr.update(),
                gr.update(),
                f"ERROR backing up/clearing log: {e}",
                gr.update(choices=get_preset_names()),
            )

        try:
            os.remove(HISTORY_FILE)
            message = f"History log backed up to `{backup_file}` and cleared."
        except OSError as e:
            # The backup exists, so clearing in memory below is still safe.
            message = f"ERROR backing up/clearing log: {e}"

    chat_history = []
    last_logged_index = 0
    active_session_name = None

    return (
        [], # Clear history_display (messages format)
        gr.update(value=None, choices=[]), # Clear visible_history_dropdown
        gr.update(value=None, choices=[]), # Clear history_dropdown_ref
        message, # Update history_message
        gr.update(choices=get_preset_names()) # Refresh preset_dropdown choices (completes the output list)
    )

def copy_all_session_text(name):
    """Render the named session as plain text suitable for copying.

    Returns a fixed notice when no name is given or no session matches.
    """
    if name is None:
        return "No session selected."

    selected = next((s for s in chat_history if s["name"] == name), None)
    if selected is None:
        return "Session not found."

    pieces = [f"--- Session: {name} ---\n\n"]
    for user_msg, bot_msg in selected["history"]:
        pieces.append(f"USER: {user_msg}\n")
        pieces.append(f"ASSISTANT: {bot_msg}\n\n")
    return "".join(pieces)

# ========================================================= 
# --- SETTINGS FUNCTIONALITY --- 
# ========================================================= 

def get_preset_names():
    """Return the names of all stored presets, in stored order."""
    presets = all_settings["presets"]
    return [preset_name for preset_name in presets]

def save_settings(
    preset_name, api_key, sys_prompt, model, temp, tokens, response_tokens, top_p, freq_p, pres_p, 
    top_k, min_p, top_a, rep_p, seed 
):
    """Save the form values as a preset, make it active, and persist to disk.

    A blank or missing ``preset_name`` falls back to the last-used preset
    name. The saved preset becomes both the last-used preset and the working
    ``current_settings``. Writing to disk rotates the settings backups first.

    Returns:
        A 2-tuple: status message, and a dropdown update listing all presets
        with the saved one selected.
    """
    global all_settings, current_settings

    # ``preset_name`` may be None when nothing is selected/typed in the UI.
    if preset_name and preset_name.strip():
        name_to_save = preset_name
    else:
        name_to_save = all_settings.get("last_preset_name", "Default")

    new_settings = {
        "api_key": api_key, "system_prompt": sys_prompt, "model": model, "temperature": temp, 
        "max_tokens": tokens, "response_tokens": response_tokens, "top_p": top_p, 
        "frequency_penalty": freq_p, "presence_penalty": pres_p, 
        # "stream" has no form field here; carry over the current value.
        "stream": current_settings.get("stream", True), "top_k": top_k, "min_p": min_p, 
        "top_a": top_a, "repetition_penalty": rep_p, "seed": seed,
    }

    all_settings["presets"][name_to_save] = new_settings
    all_settings["last_preset_name"] = name_to_save

    save_settings_to_disk(SETTINGS_FILE, all_settings)

    # The saved preset is by construction the last-used one, so it is always
    # the active preset from here on.
    current_settings = new_settings.copy()

    return f"Settings saved as '{name_to_save}'. Backups created (max {MAX_BACKUPS}).", gr.update(choices=get_preset_names(), value=name_to_save)


def load_settings(preset_name):
    """Activate a preset and return the values needed to refresh the UI.

    An unknown or ``None`` preset name leaves the current settings active.
    A known, non-empty name is also recorded as the last-used preset and
    persisted to disk.

    Returns:
        A 17-tuple: the 14 setting values in form order (api_key,
        system_prompt, model, temperature, max_tokens, response_tokens, top_p,
        frequency_penalty, presence_penalty, top_k, min_p, top_a,
        repetition_penalty, seed), a status message, the "Current Model"
        markdown text, and a dropdown update selecting ``preset_name``.
    """
    global all_settings, current_settings

    is_known = preset_name is not None and preset_name in all_settings["presets"]
    source = all_settings["presets"][preset_name] if is_known else current_settings

    # Back-fill missing keys BEFORE activating the settings, so that
    # current_settings always carries every key other functions index directly.
    settings_to_load = source.copy()
    for key, default_val in DEFAULT_SETTINGS.items():
        settings_to_load.setdefault(key, default_val)

    current_settings = settings_to_load.copy()

    if preset_name and is_known:
        all_settings["last_preset_name"] = preset_name
        save_settings_to_disk(SETTINGS_FILE, all_settings)

    return (
        settings_to_load["api_key"], settings_to_load["system_prompt"], settings_to_load["model"],
        settings_to_load["temperature"], settings_to_load["max_tokens"],
        settings_to_load["response_tokens"],
        settings_to_load["top_p"], settings_to_load["frequency_penalty"], settings_to_load["presence_penalty"],
        settings_to_load["top_k"], settings_to_load["min_p"],
        settings_to_load["top_a"],
        settings_to_load["repetition_penalty"],
        settings_to_load["seed"],
        f"Settings '{preset_name}' loaded.", f"### Current Model: `{settings_to_load['model']}`",
        gr.update(value=preset_name)
    )

def create_new_preset(new_preset_name):
    """Create a preset from ``NEW_PRESET_SETTINGS``, activate it, refresh the UI.

    A blank name reloads the last-used preset unchanged; a name that already
    exists reloads the last-used preset and reports an error message instead.

    Returns:
        An 18-tuple: the 17 values of ``load_settings`` (with the message,
        model text and dropdown update replaced as needed) followed by one
        more dropdown update carrying the refreshed preset choices.
    """
    global all_settings

    if not new_preset_name or not new_preset_name.strip():
        load_results = load_settings(all_settings.get("last_preset_name", "Default"))
        return load_results + (gr.update(choices=get_preset_names()),)

    name = new_preset_name.strip()

    if name in all_settings["presets"]:
        load_results = load_settings(all_settings.get("last_preset_name", "Default"))
        # Swap only the status message (third from the end) for the error text.
        load_results = load_results[:-3] + (f"Error: Preset '{name}' already exists.",) + load_results[-2:]
        return load_results + (gr.update(choices=get_preset_names()),)

    all_settings["presets"][name] = NEW_PRESET_SETTINGS.copy()
    all_settings["last_preset_name"] = name

    # load_settings persists the settings file for a known preset, so no
    # separate save is done here; saving twice would rotate the rolling
    # backups twice for a single change.
    load_results = load_settings(name)

    return load_results[:-3] + (
        f"Preset '{name}' created and loaded.",
        f"### Current Model: `{NEW_PRESET_SETTINGS['model']}`",
        gr.update(value=name), 
        gr.update(choices=get_preset_names(), value=name), 
    )

# ========================================================= 
# --- GRADIO UI (MAIN) --- 
# ========================================================= 

# Height passed to the gr.Chatbot component (CSS viewport units).
CHATBOT_HEIGHT = "50vh"

# Stylesheet passed to gr.Blocks(css=...). It is an f-string with no
# placeholders: every brace is doubled so the CSS braces come out literally.
# Note that #user_input_wrapper is styled twice; the later `padding` rule
# overrides the earlier `padding-top`.
custom_css = f"""
/* Target the user_input Textbox. */
.gradio-container #user_input_wrapper textarea {{
    min-height: 40px !important; 
    transition: min-height 0.2s ease-in-out;
}}
/* Hide Gradio footer (v1.0a) */
footer {{ visibility: hidden !important; height: 0 !important; }}

/* Reduce space between chatbot and input (v1.0a) */
.gradio-container #user_input_wrapper {{
    margin-top: 5px !important;
    padding-top: 0 !important;
}}

/* Ensure the main title is gone (v1.0a) */
.gradio-container h2:first-child {{
    display: none !important;
}}

/* Hide Gradio settings button in the top right (v1.0a) */
.gradio-container button[aria-label="Settings"] {{
    display: none !important;
}}

/* Fix for tab label text padding after removing text (v1.0e) */
.gradio-container .tabs > div > button.selected {{
    padding: 0 10px !important;
}}

/* --- NEW FULL-WIDTH FIXES --- */

/* 1. Target the main content area inside the container and remove default padding */
.gradio-container .main {{
    padding-left: 0 !important;
    padding-right: 0 !important;
}}

/* 2. Target the main page wrapper/block and remove default padding */
.gradio-container .block {{
    padding-left: 0 !important;
    padding-right: 0 !important;
}}

/* 3. Ensure the Tabs content container also takes full width and remove its internal padding */
.gradio-container .tabitem {{
    padding: 0 !important;
}}

/* 4. Ensure the Chatbot itself takes the full width and apply a minimal buffer (5px) on the sides */
.gradio-container .gradio-chatbot {{
    width: 100% !important;
    margin: 0 !important;
    padding: 0 5px !important; 
}}

/* 5. Apply the minimal buffer (5px) to the User Input/Controls Row to align with the Chatbot */
.gradio-container #user_input_wrapper {{
    padding: 0 5px !important;
}}

/* Apply 5px padding to the button row (requires the new elem_classes=["send_btn_row"] on the gr.Row) */
.gradio-container .send_btn_row {{
    padding: 0 5px !important;
}}
"""

with gr.Blocks(title=f"Termux LLM Client (OpenRouter) v{VERSION}", css=custom_css) as app: 
    # Store history as a list of tuples (user_msg, bot_msg) to simplify API and saving logic
    session_history = gr.State(value=[])
    current_model_display = gr.Markdown(f"### Current Model: `{current_settings['model']}`", visible=False) 
    
    # Hide the main title (v1.0a)
    gr.Markdown(f"## ðŸ¤– Termux LLM Client (OpenRouter) v{VERSION}", visible=False) 

    # CRITICAL FIX v1.0d: Define the shutdown component explicitly for use in outputs list
    shutdown_message = gr.Markdown("", visible=False) 

    with gr.Row(visible=False):
        pass
        
    # --- Tab Bar with Quit Button (v1.0e: Isolated Quit Button and Tabs) ---
    with gr.Row(variant="compact", equal_height=False): 
        # QUIT BUTTON: scale=0 ensures minimum width, positioned on the far left (Fix 2)
        quit_btn = gr.Button("âŒ", variant="stop", scale=0, min_width=40)
        
        # COLUMN WRAPPER: Takes all remaining horizontal space for the tabs, preventing UI squeeze (Fix 2)
        with gr.Column(scale=100): 
            # TABS (Fix 3: Icons only)
            with gr.Tabs() as tabs: 
                
                # ---------------------- CHAT TAB (ðŸ’¬) ----------------------
                with gr.TabItem("ðŸ’¬"): # Fix 3: Icon only
                    # Use type='messages' (v1.0c)
                    chatbot = gr.Chatbot(
                        label="Chat History", 
                        height=CHATBOT_HEIGHT, 
                        show_copy_button=True,
                        type='messages' 
                    )
                    
                    with gr.Row(elem_id="user_input_wrapper"):
                        user_input = gr.Textbox(
                            placeholder="Type your message...",
                            label="Your Prompt",
                            show_label=False,
                            lines=3, 
                        )
                    
                    # MODIFIED: Added elem_classes to apply the CSS padding fix
                    with gr.Row(variant="compact", elem_classes=["send_btn_row"]):
                        send_btn = gr.Button("âž¤", variant="primary", scale=1, min_width=0)
                        stop_btn = gr.Button("â›”", variant="stop", scale=1, min_width=0)
                        new_chat_btn = gr.Button("ðŸ—‘ï¸", variant="secondary", scale=1, min_width=0)

                    with gr.Row(visible=False):
                        history_dropdown_ref = gr.Dropdown(
                            label="Hidden History Dropdown Ref",
                            choices=get_history_names(),
                            value=None,
                            interactive=True
                        )
                    
                    def _refresh_history_dropdown_output(history):
                        return refresh_history_dropdown(history)

                    # Chat wiring. The send button and pressing Enter in the prompt box run
                    # the same pipeline: chat_interface(user_input, session_history) writes to
                    # chatbot, session_history and user_input, after which the hidden history
                    # dropdown is refreshed from the updated session_history.
                    for chat_trigger in (send_btn.click, user_input.submit):
                        chat_trigger(
                            chat_interface,
                            inputs=[user_input, session_history],
                            outputs=[chatbot, session_history, user_input],
                            show_progress=True,
                        ).then(
                            _refresh_history_dropdown_output,
                            inputs=[session_history],
                            outputs=[history_dropdown_ref],
                        )

                    # Stop button: takes no inputs and updates no components.
                    stop_btn.click(set_stop_event, inputs=[], outputs=[])

                    # New chat: new_chat's two return values replace the chatbot display
                    # and the session state, then the hidden dropdown is refreshed.
                    new_chat_btn.click(
                        new_chat,
                        inputs=[session_history],
                        outputs=[chatbot, session_history],
                        show_progress=False,
                    ).then(
                        _refresh_history_dropdown_output,
                        inputs=[session_history],
                        outputs=[history_dropdown_ref],
                    )

                    # Resend/Retry logic (adapted for new 'messages' type)
                    try:
                        def get_user_msg_for_resend(idx, h):
                            """Return the idx-th (0-based) non-empty user message in *h*.

                            *h* is iterated as a sequence of (user_message, reply) pairs;
                            pairs whose user message is empty are not counted.
                            Returns "" when *idx* is None, *h* is empty/None, or fewer
                            than idx + 1 user messages exist.
                            """
                            # Same guard as the retry handler: nothing to look up.
                            if idx is None or not h:
                                return ""

                            user_index_counter = -1
                            for u_msg, _ in h:
                                if not u_msg:
                                    continue
                                user_index_counter += 1
                                if user_index_counter == idx:
                                    return u_msg
                            return ""

                        # NOTE(review): `chatbot.message_event` and `gr.Index` could not be
                        # confirmed against the Gradio API from this file. If either is
                        # missing, registration is skipped and the warning below is printed.
                        chatbot.message_event(
                            get_user_msg_for_resend,
                            inputs=[gr.Index(), session_history], 
                            outputs=[user_input], 
                            label="Resend User"
                        )
                    except Exception as resend_err:
                        # Best-effort feature: keep building the UI, but say why it is missing.
                        print(f"[warn] 'Resend User' message action not registered: {resend_err!r}")
                    
                    try:
                        def _retry(idx, h):
                            """Re-run the conversation turn that contains message number *idx*.

                            *idx* is treated as a 0-based message index in which user and
                            assistant messages alternate, so the turn is ``idx // 2``.
                            *h* is the session history as a list of (user, reply) pairs.

                            Returns the result of ``chat_interface(user_msg, h[:turn])``.
                            When the request cannot be mapped to a turn with a non-empty
                            user message, returns the unchanged triple
                            ``(convert_to_messages_format(h), h, gr.update(interactive=True))``.
                            """
                            def _unchanged():
                                # Leave the display and state as they are; re-enable the input box.
                                return convert_to_messages_format(h), h, gr.update(interactive=True)

                            if idx is None or not h:
                                return _unchanged()

                            # A negative index would silently address turns from the end of
                            # the history; a non-integer cannot be a message position.
                            if not isinstance(idx, int) or idx < 0:
                                return _unchanged()

                            # Message 0 is user 1, message 1 is bot 1, message 2 is user 2, ...
                            turn_idx = idx // 2
                            if turn_idx >= len(h):
                                # Clicked a message outside the range (e.g., if history was cleared)
                                return _unchanged()

                            user_msg = h[turn_idx][0]
                            if not user_msg:
                                # This should not happen if the click was on a valid turn
                                return _unchanged()

                            # Keep only the turns *before* the one being retried.
                            # NOTE(review): if chat_interface is a generator function, this
                            # returns the generator object from a plain function; confirm
                            # Gradio streams it as intended.
                            return chat_interface(user_msg, h[:turn_idx])

                        chatbot.message_event(
                            _retry, 
                            inputs=[gr.Index(), session_history], 
                            outputs=[chatbot, session_history, user_input], 
                            label="Retry Assistant"
                        )
                    except Exception as retry_err:
                        # Best-effort feature: keep building the UI, but say why it is missing.
                        print(f"[warn] 'Retry Assistant' message action not registered: {retry_err!r}")


                # ---------------------- SETTINGS TAB (⚙️) ----------------------
                # The tab label is icon-only, so it must be the real Unicode glyph.
                with gr.TabItem("⚙️"): # Fix 3: Icon only
                    settings_message = gr.Markdown(f"Loaded preset: **{all_settings.get('last_preset_name', 'Default')}**")
                    
                    with gr.Row():
                        preset_dropdown = gr.Dropdown(
                            label="Select Preset (Loads on selection)",
                            choices=get_preset_names(), # Fix 1: Correctly uses get_preset_names()
                            value=all_settings.get("last_preset_name", "Default"),
                            interactive=True, scale=2
                        )
                        # Hidden textbox holding the name of the preset currently being edited.
                        save_name_input = gr.Textbox(
                            label="Current Preset Name", value=all_settings.get("last_preset_name", "Default"), visible=False
                        )
                        new_preset_btn = gr.Button("✨ New Preset", variant="secondary", scale=1)
                        save_btn = gr.Button("💾 Save Current", variant="primary", scale=1)

                    # Hidden textbox used to carry a new preset name into the UI.
                    new_preset_name_box = gr.Textbox(visible=False)

                    def _setting(key):
                        """Return current_settings[key], or DEFAULT_SETTINGS[key] when the preset lacks it.

                        Every widget below reads its initial value through this helper so a
                        preset saved without one of the keys cannot raise KeyError at build time.
                        """
                        return current_settings.get(key, DEFAULT_SETTINGS[key])

                    gr.Markdown("---")
                    gr.Markdown("### API and Model Parameters")

                    # NOTE(review): the key is displayed in plaintext (type="text"), as the
                    # label states; consider type="password" if shoulder-surfing is a concern.
                    api_key_input = gr.Textbox(label="OpenRouter API Key (Plaintext)", value=_setting("api_key"), type="text", info="Saved in openrouter_settings.json")
                    system_prompt_input = gr.Textbox(label="System Prompt", value=_setting("system_prompt"), lines=3)

                    with gr.Row():
                        model_input = gr.Textbox(label="Model Name", value=_setting("model"), info="deepseek/deepseek-chat-v3.1:free\nopenai/gpt-oss-20b:free\ncognitivecomputations/dolphin-mistral-24b-venice-edition:free", scale=2)
                        temperature_input = gr.Slider(label="Temperature", minimum=0.0, maximum=2.0, step=0.05, value=_setting("temperature"), scale=1)
                        max_tokens_input = gr.Slider(label="Max Tokens (Model Limit Dependent)", minimum=0, maximum=130000, step=1, value=_setting("max_tokens"), scale=1)

                    with gr.Row():
                        response_tokens_input = gr.Slider(label="Response Tokens (0 = model decides)", minimum=0, maximum=32768, step=1, value=_setting("response_tokens"), scale=1)
                        top_p_input = gr.Slider(label="Top P", minimum=0.0, maximum=1.0, step=0.05, value=_setting("top_p"), scale=1)
                        freq_p_input = gr.Slider(label="Frequency Penalty", minimum=0, maximum=2.0, step=0.05, value=_setting("frequency_penalty"), scale=1)
                        pres_p_input = gr.Slider(label="Presence Penalty", minimum=0, maximum=2.0, step=0.05, value=_setting("presence_penalty"), scale=1)
                    
                    gr.Markdown("---")
                    gr.Markdown("### Advanced Sampling Controls")

                    with gr.Row():
                        top_k_input = gr.Slider(label="Top K (0 to disable)", minimum=0, maximum=100, step=1, value=_setting("top_k"), scale=1)
                        min_p_input = gr.Slider(label="Min P (0.0 to disable)", minimum=0.0, maximum=1.0, step=0.01, value=_setting("min_p"), scale=1)
                        top_a_input = gr.Slider(label="Top A (0.0 to disable)", minimum=0.0, maximum=1.0, step=0.01, value=_setting("top_a"), scale=1)

                    with gr.Row():
                        rep_p_input = gr.Slider(label="Repetition Penalty (1.0 is neutral)", minimum=0.0, maximum=2.0, step=0.01, value=_setting("repetition_penalty"), scale=1)
                        seed_input = gr.Number(label="Seed (-1 for random)", minimum=-1, value=_setting("seed"), scale=1)
                    
                    # The parameter widgets, in the positional order used both for
                    # save_settings' arguments (after the preset name) and for the leading
                    # outputs of the load/create handlers.
                    param_components = [
                        api_key_input, system_prompt_input, model_input,
                        temperature_input, max_tokens_input, response_tokens_input,
                        top_p_input, freq_p_input, pres_p_input,
                        top_k_input, min_p_input, top_a_input,
                        rep_p_input, seed_input,
                    ]
                    # Loading a preset also updates the status line, the model display
                    # and the hidden preset-name box.
                    preset_load_outputs = param_components + [
                        settings_message, current_model_display, save_name_input,
                    ]

                    # Save the current widget values under the name held in save_name_input.
                    save_btn.click(
                        save_settings,
                        inputs=[save_name_input] + param_components,
                        outputs=[settings_message, preset_dropdown],
                    )

                    # Selecting a preset loads it into every widget.
                    preset_dropdown.change(
                        load_settings,
                        inputs=[preset_dropdown],
                        outputs=preset_load_outputs,
                    )

                    # "New Preset" runs only browser-side JS: the prompt() result (or ''
                    # when it is falsy) is written into the hidden name box.
                    new_preset_btn.click(
                        None,
                        inputs=[],
                        outputs=[new_preset_name_box],
                        js="""() => prompt('Enter a name for the new preset:') || ''""",
                    )

                    # A change of the hidden name box triggers create_new_preset, which
                    # additionally updates the preset dropdown.
                    new_preset_name_box.change(
                        create_new_preset,
                        inputs=[new_preset_name_box],
                        outputs=preset_load_outputs + [preset_dropdown],
                    )


                # ---------------------- HISTORY TAB (📜) ----------------------
                # The tab label is icon-only, so it must be the real Unicode glyph.
                with gr.TabItem("📜"): # Fix 3: Icon only
                    history_message = gr.Markdown("### Historical Chat Sessions")
                    
                    with gr.Row():
                        visible_history_dropdown = gr.Dropdown(
                            label="Load Session",
                            choices=get_history_names(),
                            value=None,
                            interactive=True, scale=2
                        )
                        load_history_btn = gr.Button("View Session", variant="secondary", scale=1)
                        # COPY ALL BUTTON (v1.0a)
                        copy_all_btn = gr.Button("📋 Copy All", variant="secondary", scale=1)
                        # CLEAR LOG BUTTON (v1.0a)
                        clear_log_btn = gr.Button("🗑️ Clear Log", variant="secondary", scale=1)
                        
                    # Use type='messages' (v1.0c)
                    history_display = gr.Chatbot(
                        label="Historical Session Content", 
                        height=CHATBOT_HEIGHT, 
                        type='messages',
                        show_copy_button=True # Per-message copy (v1.0a)
                    )
                    
                    # Hidden element to hold the text for the Copy All functionality
                    copy_text_output = gr.Textbox(visible=False, label="Copy Text")

                    # Event Handlers
                    # Mirror the hidden relay dropdown into the visible one, re-reading the
                    # list of session names each time.
                    history_dropdown_ref.change(
                        lambda value: gr.update(choices=get_history_names(), value=value),
                        inputs=[history_dropdown_ref], outputs=[visible_history_dropdown], show_progress=False
                    )
                    
                    # Both selecting a session and pressing "View Session" load it into the viewer.
                    visible_history_dropdown.change(
                        load_history_session, inputs=[visible_history_dropdown], outputs=[history_display]
                    )

                    load_history_btn.click(
                        load_history_session, inputs=[visible_history_dropdown], outputs=[history_display]
                    )

                    def _report_copied_length(copied_text):
                        """Return (status-line update, cleared hidden textbox) after a Copy All.

                        Uses gr.update(...) because the per-component ``gr.Markdown.update``
                        class method no longer exists in Gradio 4+. A None value from the
                        hidden textbox is counted as zero characters.
                        """
                        char_count = len(copied_text) if copied_text else 0
                        return (
                            gr.update(value=f"Copied {char_count} characters from session."),
                            gr.update(value=""),
                        )

                    # Copy All handler (v1.0a)
                    # NOTE(review): nothing visible in this chain writes to the browser
                    # clipboard; confirm copy_all_session_text or page JS performs the copy.
                    copy_all_btn.click(
                        copy_all_session_text,
                        inputs=[visible_history_dropdown],
                        outputs=[copy_text_output]
                    ).then(
                        _report_copied_length,
                        inputs=[copy_text_output],
                        outputs=[history_message, copy_text_output]
                    )
                    
                    # Clear Log handler (v1.0a)
                    clear_log_btn.click(
                        clear_history_log,
                        inputs=[],
                        outputs=[history_display, visible_history_dropdown, history_dropdown_ref, history_message, preset_dropdown]
                    )
        
    # --- Quit Button Handler (placed outside tabs for global visibility) ---
    # CRITICAL FIX v1.0d: outputs are component objects; quit_app's return values
    # are applied to shutdown_message and quit_btn, in that order.
    quit_btn.click(quit_app, outputs=[shutdown_message, quit_btn])


# =========================================================
# --- LAUNCH (HUGGING FACE SPACES FIX) ---
# =========================================================

if __name__ == "__main__":
    # The port is fixed at 7860, the value the Hugging Face Spaces router expects
    # (CRITICAL FIX 1). No browser is opened from here (CRITICAL FIX 2): that is
    # not possible in the cloud environment.
    PORT = 7860

    print(f"Launching Termux LLM Client v{VERSION} on 0.0.0.0:{PORT} (Hugging Face Mode)")

    launch_options = {
        "server_name": "0.0.0.0",   # listen on all interfaces
        "server_port": PORT,
        "inbrowser": False,         # never try to launch a browser
        "debug": False,             # debug output is too verbose for the Spaces logs
        "quiet": False,             # keep the startup logs visible
    }
    app.launch(**launch_options)