# Spaces: Nyanfa / claude-chat-ui (Running)
# File size: 28,205 Bytes

import anthropic
import streamlit as st
from streamlit.components.v1 import html
from streamlit_extras.stylable_container import stylable_container
import re
import urllib.parse
import traceback
import os

st.title("Claude Chat UI")

# Load a saved API key once per session. An empty (or whitespace-only) first
# line is ignored so the manual prompt below is still shown instead of an
# unusable empty key being stored.
if "api_key" not in st.session_state and os.path.exists("api_key.dat"):
    with open("api_key.dat", "r", encoding="utf-8") as f:
        saved_api_key = f.readline().strip()
    if saved_api_key:
        st.session_state.api_key = saved_api_key

if "api_key" not in st.session_state:
    # Pasted keys often carry stray whitespace; remove it before validating.
    api_key = st.text_input("Enter your API Key", type="password").strip()

    if not api_key:
        st.warning("Please enter your API key to use the app.")
        st.stop()

    if not api_key.isascii():
        st.warning("Please enter your API key correctly.")
        st.stop()

    st.session_state.api_key = api_key
    # Rerun so the script starts over with the key stored in session state.
    st.rerun()

# Reached only when a key is available in session state.
client = anthropic.Anthropic(api_key=st.session_state.api_key)

# Seed per-session state on the first run; keys that already exist are left
# untouched so values survive Streamlit reruns.
_SESSION_DEFAULTS = {
    "messages": [],
    "prefill": "",
    "use_continue": False,
    "message_continue": "",
    "exception": None,
    "use_thinking": False,
    "thinking_budget_tokens": 1024,
    "last_thinking": "",
}
for _state_key, _default_value in _SESSION_DEFAULTS.items():
    if _state_key not in st.session_state:
        st.session_state[_state_key] = _default_value

def count_tokens(text):
    """Return the number of input tokens the API reports for ``text``.

    The text is sent as a single user message to
    ``client.messages.count_tokens`` using the module-level ``client`` and the
    currently selected ``model``.

    Empty or whitespace-only text is counted as 0 without contacting the API.
    Results are memoized per ``(model, text)`` in ``st.session_state`` so that
    Streamlit reruns do not repeat an identical request for unchanged text.

    Args:
        text (str): Text to measure.

    Returns:
        int: Token count, or 0 when there is nothing to count.
    """
    if not text or not text.strip():
        return 0

    if "token_count_cache" not in st.session_state:
        st.session_state.token_count_cache = {}
    cache = st.session_state.token_count_cache

    cache_key = (model, text)
    if cache_key not in cache:
        response = client.messages.count_tokens(
            model=model,
            messages=[{"role": "user", "content": text}],
        )
        # Crude bound so a long session cannot grow the cache without limit.
        if len(cache) >= 1024:
            cache.clear()
        cache[cache_key] = response.input_tokens
    return cache[cache_key]
    
def get_truncated_index(messages, limit_val, limit_unit, additional_tokens):
    """ Locate the first message that stays inside the truncated context

    The conversation is scanned from the newest message to the oldest. The
    returned index always points at a user message (or is ``len(messages)``
    in "Tokens" mode when no user message fits within the limit).

    Args:
        messages (list): Input messages for anthropic API
        limit_val (int): Context length limitation (0 disables truncation)
        limit_unit (str): "Turns" or "Tokens"
        additional_tokens (int): Token count of system prompt

    Returns:
        int: index of first message within truncated context
    """
    # A limit of 0 means "no limit": keep everything.
    if limit_val == 0:
        return 0

    newest_first = range(len(messages) - 1, -1, -1)

    if limit_unit == "Turns":
        # Unit: Turns -- count user messages until the limit is reached.
        user_turns_seen = 0
        for idx in newest_first:
            if messages[idx]["role"] != "user":
                continue
            user_turns_seen += 1
            if user_turns_seen == limit_val:
                return idx
        # Fewer user turns than the limit: the whole history fits.
        return 0

    # Unit: Tokens -- accumulate token counts on top of the system prompt and
    # remember the most recent user message that still fits.
    start_index = len(messages)
    running_total = additional_tokens
    for idx in newest_first:
        entry = messages[idx]
        running_total += count_tokens(entry["content"])
        if running_total > limit_val:
            break
        if entry["role"] == "user":
            start_index = idx
    return start_index

def get_truncated_context(messages, limit_val, limit_unit, additional_tokens):
    """ Return the tail of the conversation that fits the context limit

    Args:
        messages (list): Input messages for anthropic API
        limit_val (int): Context length limitation
        limit_unit (str): "Turns" or "Tokens"
        additional_tokens (int): Token count of system prompt

    Returns:
        list: Truncated input messages for anthropic API (an empty list when
            the computed start index lies past the last message)
    """
    start = get_truncated_index(messages, limit_val, limit_unit, additional_tokens)
    return [] if start >= len(messages) else messages[start:]

def get_ai_response(messages):
    """Stream an assistant reply for ``messages`` and return the accumulated text.

    Side effects on ``st.session_state``:
        - ``is_streaming`` is True while this function runs and False on return.
        - ``response`` accumulates the reply text (seeded with the continue
          text or prefill, when present).
        - ``last_thinking`` accumulates thinking deltas.
        - ``exception`` is cleared before the request and set to any exception
          raised while rendering or streaming.
        - ``message_continue`` and ``prefill`` are stripped in place.

    Reads the module-level settings ``model``, ``max_tokens``,
    ``system_prompt``, ``temperature``, ``top_p``, ``top_k``, ``limit_val``
    and ``limit_unit``.

    Args:
        messages (list): Conversation as dicts with "role" and "content".
            An assistant entry is appended to this list when continue text or
            a prefill is used, so callers pass a copy.

    Returns:
        str: ``st.session_state.response`` -- whatever text was accumulated,
        even if streaming ended with an exception.
    """
    # Mark a generation as in progress. The top-level "After Stop generating"
    # section checks this flag on the next script run.
    st.session_state.is_streaming = True
    st.session_state.response = ""
    shown_message = ""
    st.session_state.last_thinking = ""

    st.session_state.message_continue = st.session_state.message_continue.strip()
    st.session_state.prefill = st.session_state.prefill.strip()
    # Continue text takes precedence over the prefill. Whichever is used is
    # sent as a trailing assistant message and also seeds the stored response
    # and the text shown in the placeholder.
    if st.session_state.message_continue != "":
        messages.append({"role": "assistant", "content": st.session_state.message_continue})
        st.session_state.response += st.session_state.message_continue
        shown_message = st.session_state.message_continue.replace("\n", "  \n")
    elif st.session_state.prefill:
        messages.append({"role": "assistant", "content": st.session_state.prefill})
        st.session_state.response += st.session_state.prefill
        shown_message = st.session_state.prefill.replace("\n", "  \n")

    # Copy only role/content so extra keys such as "thinking" are not sent.
    api_messages = []
    for msg in messages:
        api_msg = {"role": msg["role"], "content": msg["content"]}
        api_messages.append(api_msg)

    # NOTE: this token count runs outside the try block below, so a failure
    # here propagates to the caller with is_streaming still True.
    api_messages = get_truncated_context(api_messages, limit_val, limit_unit, count_tokens(system_prompt))
    st.session_state.exception = None

    try:
        with st.chat_message("assistant", avatar=st.session_state.assistant_avatar):
            placeholder = st.empty()

            # Fixed-position button. Its return value is not read here;
            # presumably clicking it triggers a Streamlit rerun that
            # interrupts this function -- TODO confirm.
            with stylable_container(
                key="stop_generating",
                css_styles="""
                    button {
                        position: fixed;
                        bottom: 100px;
                        left: 50%;
                        transform: translateX(-50%);
                        z-index: 1;
                    }
                    """,
            ):
                st.button("Stop generating")

            # Configure thinking parameter
            thinking_param = None
            if st.session_state.use_thinking:
                thinking_param = {
                    "type": "enabled",
                    "budget_tokens": st.session_state.thinking_budget_tokens
                }

            # Prepare kwargs for the API call
            # NOTE(review): temperature and any prefill are sent even when
            # thinking is enabled; the Anthropic extended-thinking docs appear
            # to restrict both -- confirm.
            stream_kwargs = {
                "messages": api_messages,
                "model": model,
                "max_tokens": max_tokens,
                "system": system_prompt,
                "temperature": temperature,
            }

            # Add thinking parameter if enabled
            if thinking_param:
                stream_kwargs["thinking"] = thinking_param
            elif "-4-5-" not in model:
                # Only add top_p and top_k when thinking is disabled and not a 4-5 model
                # Claude 4-5 models don't support temperature + top_p/top_k simultaneously
                stream_kwargs["top_p"] = top_p
                stream_kwargs["top_k"] = top_k

            with client.messages.stream(**stream_kwargs) as stream:
                # Stream event handling
                # Type of the content block currently being streamed; deltas
                # are only accepted when they match it.
                current_block_type = None

                for event in stream:
                    if event.type == "content_block_start":
                        current_block_type = event.content_block.type

                    elif event.type == "content_block_delta":
                        if event.delta.type == "thinking_delta" and current_block_type == "thinking":
                            # Thinking is stored separately but rendered in the
                            # same placeholder as the reply text.
                            content = str(event.delta.thinking) if event.delta.thinking is not None else ""
                            st.session_state.last_thinking += content
                            shown_message += content.replace("\n", "  \n")\
                                                  .replace("<", "\\<")\
                                                  .replace(">", "\\>")
                            placeholder.markdown(shown_message)
                        elif event.delta.type == "text_delta" and current_block_type == "text":
                            # Raw text goes into the stored response; the
                            # displayed copy gets Markdown line breaks and
                            # escaped angle brackets.
                            content = str(event.delta.text) if event.delta.text is not None else ""
                            st.session_state.response += content
                            shown_message += content.replace("\n", "  \n")\
                                                  .replace("<", "\\<")\
                                                  .replace(">", "\\>")
                            placeholder.markdown(shown_message)

    except Exception as e:
        # Kept for display_messages(), which shows it after the history.
        st.session_state.exception = e

    st.session_state.is_streaming = False
    return st.session_state.response

def normalize_code_block(match):
    """Undo display escaping inside a fenced code block.

    Intended as a ``re.sub`` callback: takes the whole matched text and turns
    Markdown hard line breaks back into plain newlines and escaped angle
    brackets back into literal ones.

    Args:
        match (re.Match): Match whose full text is a code block.

    Returns:
        str: The matched text with the escaping reverted.
    """
    restored = match.group(0)
    for escaped, plain in (("  \n", "\n"), ("\\<", "<"), ("\\>", ">")):
        restored = restored.replace(escaped, plain)
    return restored

def normalize_inline(match):
    """Undo angle-bracket escaping inside an inline code span.

    Intended as a ``re.sub`` callback.

    Args:
        match (re.Match): Match whose full text is an inline code span.

    Returns:
        str: The matched text with ``\\<`` and ``\\>`` turned back into
        ``<`` and ``>``.
    """
    span = match.group(0)
    span = span.replace("\\<", "<")
    return span.replace("\\>", ">")

# Fenced code block: everything between a pair of triple backticks
# (non-greedy; used with re.DOTALL so it can span lines).
code_block_pattern = r"(```.*?```)"
# Inline code span: a single-line run of non-backtick characters between
# two backticks.
inline_pattern = r"`([^`\n]+?)`"

def _to_display_markdown(raw_text):
    """Prepare raw message text for ``st.markdown``.

    Newlines become Markdown hard breaks and angle brackets are escaped;
    the escaping is then reverted inside fenced code blocks and inline code
    spans so code is shown verbatim.
    """
    prepared = raw_text.replace("\n", "  \n")
    prepared = prepared.replace("<", "\\<")
    prepared = prepared.replace(">", "\\>")
    if "```" in prepared:
        # Replace "  \n" with "\n" within code blocks
        prepared = re.sub(code_block_pattern, normalize_code_block, prepared, flags=re.DOTALL)
    if "`" in prepared:
        prepared = re.sub(inline_pattern, normalize_inline, prepared)
    return prepared


def display_messages():
    """Render the stored conversation with per-message controls.

    For every message in ``st.session_state.messages`` this draws the chat
    bubble (with an expander for stored thinking on assistant messages), an
    optional token count, and Edit / Delete / Copy buttons. The last message
    additionally gets a Retry button when it is an assistant message. The
    message selected via ``edit_index`` is followed by an edit form. Any
    exception stored in ``st.session_state.exception`` is shown at the end.
    """
    # Widget keys include the history length; it does not change during the
    # loop because every mutation is followed by an immediate rerun.
    message_count = len(st.session_state.messages)

    for i, message in enumerate(st.session_state.messages):
        avatar = (
            st.session_state.user_avatar
            if message["role"] == "user"
            else st.session_state.assistant_avatar
        )

        with st.chat_message(message["role"], avatar=avatar):
            # Add expander for thinking if it exists
            if message["role"] == "assistant" and message.get("thinking"):
                with st.expander("Show Claude's thinking process"):
                    st.markdown(_to_display_markdown(message["thinking"]))

            st.markdown(_to_display_markdown(message["content"]))

            if st.session_state.get("show_message_tokens"):
                message_tokens = count_tokens(message["content"])
                st.info(f'Tokens: {message_tokens}')

            edit_col, delete_col, copy_col, retry_col = st.columns([1, 1, 1, 1])

            with edit_col:
                if st.button("Edit", key=f"edit_{i}_{message_count}"):
                    st.session_state.edit_index = i
                    st.rerun()

            with delete_col:
                # The Delete button is only created while delete mode is on.
                if st.session_state.is_delete_mode and st.button("Delete", key=f"delete_{i}_{message_count}"):
                    del st.session_state.messages[i]
                    st.rerun()

            with copy_col:
                # Percent-encode the text so it can sit inside a JS string
                # literal; the script decodes it again before copying.
                encoded_text = urllib.parse.quote(message["content"])

                copy_button_html = f"""
                <button id="copy-msg-btn-{i}" style='font-size: 1em; padding: 0.5em;' onclick='copyMessage("{i}")'>Copy</button>
                
                <script>
                function copyMessage(index) {{
                    navigator.clipboard.writeText(decodeURIComponent("{encoded_text}"));
                    let copyBtn = document.getElementById("copy-msg-btn-" + index);
                    copyBtn.innerHTML = "Copied!";
                    setTimeout(function(){{ copyBtn.innerHTML = "Copy"; }}, 2000);
                }}
                </script>
                """
                html(copy_button_html, height=50)

            is_last_assistant = i == message_count - 1 and message["role"] == "assistant"
            if is_last_assistant:
                with retry_col:
                    if st.button("Retry", key=f"retry_{i}_{message_count}") and message_count >= 2:
                        # In "continue" mode the removed reply is kept as the
                        # text the next generation continues from.
                        if st.session_state.get("use_continue"):
                            st.session_state.message_continue = st.session_state.messages[-1]["content"]
                        del st.session_state.messages[-1]
                        st.session_state.retry_flag = True
                        st.rerun()

        if st.session_state.get("edit_index") == i:
            with st.form(key=f"edit_form_{i}_{message_count}"):
                new_content = st.text_area("Edit message", height=200, value=st.session_state.messages[i]["content"])
                save_col, cancel_col = st.columns([1, 1])
                with save_col:
                    if st.form_submit_button("Save"):
                        st.session_state.messages[i]["content"] = new_content
                        del st.session_state.edit_index
                        st.rerun()
                with cancel_col:
                    if st.form_submit_button("Cancel"):
                        del st.session_state.edit_index
                        st.rerun()

    if st.session_state.exception:
        st.exception(st.session_state.exception)
    
# Add sidebar for advanced settings
with st.sidebar:
    settings_tab, appearance_tab = st.tabs(["Settings", "Appearance"])

    with settings_tab:
        st.markdown("Help (Japanese): https://rentry.org/9hgneofz")

        # Serialize the conversation into the plain-text log format used by
        # the copy button, the code-block view and "Restore History":
        # a <USER>/<ASSISTANT> marker line, an optional <THINKING> section,
        # then the content followed by a blank line.
        log_parts = []
        for message in st.session_state.messages:
            if message["role"] == "user":
                log_parts.append("<USER>\n")
            else:
                log_parts.append("<ASSISTANT>\n")
                if message.get("thinking"):
                    log_parts.append("<THINKING>\n" + message["thinking"] + "\n</THINKING>\n")
            log_parts.append(message["content"] + "\n\n")
        log_text = "".join(log_parts).rstrip("\n")
            
        # Encode the string to escape
        # (percent-encoding lets the log sit inside the JS string literal
        # below; the script decodes it with decodeURIComponent)
        log_text_escaped = urllib.parse.quote(log_text)
        
        # Button that copies the whole log to the clipboard; the same copy is
        # bound to the "Pause" key on the parent document.
        # NOTE(review): the keydown listener is added to window.parent.document
        # each time this HTML is rendered and is never removed -- it looks
        # like listeners accumulate across reruns; confirm.
        copy_log_button_html = f"""
        <button id="copy-log-btn" style='font-size: 1em; padding: 0.5em;' onclick='copyLog()'>Copy Conversation History</button>
        
        <script>
        const log_text_escaped = "{log_text_escaped}";
        function copyLog() {{
            navigator.clipboard.writeText(decodeURIComponent(log_text_escaped));
            const copyBtn = document.getElementById("copy-log-btn");
            copyBtn.innerHTML = "Copied!";
            setTimeout(function(){{ copyBtn.innerHTML = "Copy Conversation History"; }}, 2000);
        }}
        window.parent.document.addEventListener('keydown', (e) => {{
            if ( e.code == "Pause" ){{
                window.parent.navigator.clipboard.writeText(decodeURIComponent(log_text_escaped));
                const copyBtn = document.getElementById("copy-log-btn");
                copyBtn.innerHTML = "Copied!";
                setTimeout(function(){{ copyBtn.innerHTML = "Copy Conversation History"; }}, 2000);
            }}
        }} , false);
        </script>
        """
        html(copy_log_button_html, height=50)

        # Toggle between a "show" and a "hide" button; while shown, the log is
        # rendered as a code block below the button.
        if st.session_state.get("is_history_shown") != True:
            if st.button("Display History as Code Block"):
                st.session_state.is_history_shown = True
                st.rerun()
        else:
            if st.button("Hide History"):
                st.session_state.is_history_shown = False
                st.rerun()
            st.code(log_text)
            
        # is_delete_mode gates the per-message Delete button and use_continue
        # changes what Retry does (both are read in display_messages).
        st.session_state.is_delete_mode = st.toggle("Enable Delete button")
        st.session_state.use_continue = st.toggle("Use Continue instead of Retry", value=st.session_state.use_continue)
        
        # Generation settings. The names bound here (model, system_prompt,
        # temperature, top_k, top_p, max_tokens) are module-level values read
        # by count_tokens() and get_ai_response().
        st.header("Advanced Settings")
        model_list = ["claude-sonnet-4-5-20250929",
                      "claude-opus-4-5-20251101",
                      "claude-haiku-4-5-20251001",
                      "claude-opus-4-1-20250805",
                      "claude-opus-4-20250514",
                      "claude-sonnet-4-20250514",
                      "claude-3-7-sonnet-20250219",
                      "claude-3-5-haiku-20241022",
                      "claude-3-haiku-20240307",
                      "claude-3-opus-20240229",
                      ]
        # index=0: the first entry of model_list is the default selection.
        model = st.selectbox("Model", options=model_list, index=0)
        system_prompt = st.text_area("System prompt", height=200)
    
        # The prefill lives in session state because the chat handler can also
        # set it through the @prefill command.
        st.session_state.prefill = st.text_area("Prefill", height=68, value=st.session_state.prefill,
                                                help="You can prefill the assistant's responses. You can also directly type the @prefill command into the chat field (e.g., \"Write a novel. @prefill Sure! I'd be happy to write a novel for you.\")")
        # When off, the chat handler restores the previous sidebar prefill
        # after a message that used @prefill.
        save_prefill = st.toggle("Save the @prefill command input in the sidebar", value=True)
        
        temperature = st.slider("Temperature", min_value=0.0, max_value=1.0, value=1.0, step=0.1)
        top_k = st.slider("Top-K", min_value=0, max_value=500, value=0, step=1)
        top_p = st.slider("Top-P", min_value=0.01, max_value=1.00, value=1.00, step=0.01)
        max_tokens = st.slider("Max Output Tokens", min_value=1, max_value=4096, value=4096, step=1)

        st.header("Extended Thinking")
        st.session_state.use_thinking = st.toggle(
            "Enable extended thinking", 
            value=st.session_state.use_thinking,
            help="Enable Claude's enhanced reasoning capabilities"
        )
        # The budget slider is only shown while extended thinking is enabled.
        if st.session_state.use_thinking:
            st.session_state.thinking_budget_tokens = st.slider(
                "Thinking budget tokens", 
                min_value=1024, 
                max_value=4000, 
                value=st.session_state.thinking_budget_tokens, 
                step=100,
                help="Maximum tokens Claude can use for internal reasoning"
            )
            
            # Check relationship between max_tokens and budget_tokens
            # (warning only; the values are not adjusted here)
            if st.session_state.thinking_budget_tokens >= max_tokens:
                st.warning("Thinking budget tokens must be less than Max Output Tokens")
        
        # limit_val / limit_unit are passed to get_truncated_context() by
        # get_ai_response(); a limit of 0 disables truncation.
        st.header("Context limitation")
        col_limit_val, col_limit_unit = st.columns([1, 1])
        with col_limit_val:
            limit_val = st.number_input("Limit", min_value=0, max_value=200000, value="min", help="0 means no limit")
        with col_limit_unit:
            limit_unit = st.selectbox("Unit", options=["Turns","Tokens"], index=0, help="Tokens Unit is a rough estimate")

        st.header("Tokens")
        st.session_state.show_message_tokens = st.toggle("Show message tokens")

        # Count each part separately so the table can show a breakdown.
        system_prompt_tokens = count_tokens(system_prompt)
        prefill_tokens = count_tokens(st.session_state.prefill)
        messages_tokens = sum(
            count_tokens(entry["content"]) for entry in st.session_state.messages
        )
        total_tokens = system_prompt_tokens + prefill_tokens + messages_tokens

        # Markdown table; the "Message" row also shows the number of messages
        # in parentheses.
        tokens_table_md = "\n".join([
            "| Part | Tokens |",
            "| ---- | ---- |",
            f"| System | {system_prompt_tokens} |",
            f"| Prefill | {prefill_tokens} |",
            f"| Message | {messages_tokens}({len(st.session_state.messages)}) |",
            f"| Total | {total_tokens} |",
            "",
            "These token counts are very rough estimates.",
            "",
        ])
        st.markdown(tokens_table_md)

        st.header("Restore History")
        history_input = st.text_area("Paste conversation history:", height=200)
        if st.button("Restore History"):
            # Replace the current conversation with the pasted log.
            st.session_state.messages = []
            st.session_state.exception = None

            # Splitting on a capturing group yields
            # [preamble, marker, body, marker, body, ...]. Text before the
            # first marker has no role and is discarded instead of being
            # merged into the first restored message.
            history_parts = re.split(r"^(<USER>|<ASSISTANT>)\n", history_input, flags=re.MULTILINE)

            # The exported log is right-stripped, so the closing tag of a
            # thinking block at the very end may not be followed by a newline.
            thinking_block = re.compile(r"<THINKING>\n(.*?)</THINKING>(?:\n|\Z)", re.DOTALL)

            for marker, body in zip(history_parts[1::2], history_parts[2::2]):
                # A marker with nothing at all after it carries no message.
                if not body:
                    continue

                role = "user" if marker == "<USER>" else "assistant"
                restored = {"role": role, "content": body.strip()}

                # Only assistant messages can carry a <THINKING> section.
                if role == "assistant":
                    thinking_match = thinking_block.search(body)
                    if thinking_match:
                        restored["content"] = thinking_block.sub("", body).strip()
                        restored["thinking"] = thinking_match.group(1).strip()

                st.session_state.messages.append(restored)
            st.rerun()
    
        st.header("Clear History")
        if st.button("Clear Chat History"):
            # Drop the conversation and any stored error, then redraw.
            st.session_state.messages = []
            st.session_state.exception = None
            st.rerun()
        
        st.header("Change API Key")
        # Same normalisation and validation as the initial key prompt:
        # surrounding whitespace is removed and the key must be ASCII.
        new_api_key = st.text_input("Enter new API Key", type="password").strip()
        if st.button("Update API Key"):
            if new_api_key and new_api_key.isascii():
                st.session_state.api_key = new_api_key
                # Rebind the module-level client so the rest of this run
                # already uses the new key.
                client = anthropic.Anthropic(api_key=new_api_key)
                st.success("API Key updated successfully!")
            else:
                st.warning("Please enter a valid API Key.")
    
    with appearance_tab:
        st.header("Font Selection")
        # Maps the label shown in the select box to the CSS font-family name
        # (currently identical).
        font_options = {
            font_name: font_name
            for font_name in ("Zen Maru Gothic", "Noto Sans JP", "Sawarabi Mincho")
        }
        selected_font = st.selectbox("Choose a font", ["Default", *font_options])

        st.header("Change the font size")
        st.session_state.font_size = st.slider(
            "Font size", min_value=16.0, max_value=50.0, value=16.0, step=1.0
        )

        # Both avatar uploaders accept the same image formats.
        avatar_image_types = ["png", "jpg", "jpeg", "webp", "gif", "bmp", "svg"]

        st.header("Change the user's icon")
        st.session_state.user_avatar = st.file_uploader(
            "Choose an image", type=avatar_image_types, key="user_avatar_uploader"
        )

        st.header("Change the assistant's icon")
        st.session_state.assistant_avatar = st.file_uploader(
            "Choose an image", type=avatar_image_types, key="assistant_avatar_uploader"
        )

        st.header("Change the icon size")
        st.session_state.avatar_size = st.slider(
            "Icon size", min_value=2.0, max_value=20.0, value=2.0, step=0.2
        )
        
# After Stop generating
# is_streaming is still set at this point only if get_ai_response() did not
# run to completion; whatever was accumulated is stored as the reply.
if st.session_state.get("is_streaming"):
    interrupted_reply = {"role": "assistant", "content": st.session_state.response}
    if st.session_state.last_thinking:
        interrupted_reply["thinking"] = st.session_state.last_thinking
    st.session_state.messages.append(interrupted_reply)

    st.session_state.is_streaming = False
    # An interrupted retry counts as done: clear the retry request.
    if st.session_state.get("retry_flag"):
        st.session_state.retry_flag = False
        st.session_state.message_continue = ""
    st.rerun()

# Change the font
if selected_font != "Default":
    # Read the stylesheet as UTF-8 explicitly (as api_key.dat is) instead of
    # relying on the platform default encoding.
    with open("style.css", encoding="utf-8") as css:
        st.markdown(f'<style>{css.read()}</style>', unsafe_allow_html=True)
    # Force the chosen family onto every element of the page.
    st.markdown(f'<style>body * {{ font-family: "{font_options[selected_font]}", serif !important; }}</style>', unsafe_allow_html=True)

# Change font size
# (targets a generated CSS class name inside chat messages)
st.markdown(f'<style>[data-testid="stChatMessageContent"] .st-emotion-cache-kj6hex p{{font-size: {st.session_state.font_size}px;}}</style>', unsafe_allow_html=True)

# Change icon size
# (CSS element names may be subject to change.)
# (Contributor: ★31 >>538)
# The avatar containers get the selected size in rem; one inner element is
# scaled down by a factor of 1.6.
avatar_rem = st.session_state.avatar_size
inner_avatar_rem = avatar_rem / 1.6
AVATAR_SIZE_STYLE = f"""
                <style>
                    [data-testid="stChatMessageAvatarUser"] {{
                        width: {avatar_rem}rem;
                        height: {avatar_rem}rem;
                    }}
                    [data-testid="stChatMessageAvatarAssistant"] {{
                        width: {avatar_rem}rem;
                        height: {avatar_rem}rem;
                    }}
                    [data-testid="stChatMessage"] .st-emotion-cache-1pbsqtx {{
                        width: {inner_avatar_rem}rem;
                        height: {inner_avatar_rem}rem;
                    }}
                    [data-testid="stChatMessage"] .st-emotion-cache-p4micv {{
                        width: {avatar_rem}rem;
                        height: {avatar_rem}rem;
                    }}
                </style>
"""
st.markdown(AVATAR_SIZE_STYLE, unsafe_allow_html=True)

display_messages()

# After Retry
# The Retry button removed the last reply and set retry_flag; generate a new
# reply from the remaining history.
if st.session_state.get("retry_flag"):
    has_history = len(st.session_state.messages) > 0

    if has_history:
        regenerated_text = get_ai_response(st.session_state.messages.copy())

        regenerated_reply = {"role": "assistant", "content": regenerated_text}
        if st.session_state.last_thinking:
            regenerated_reply["thinking"] = st.session_state.last_thinking
        st.session_state.messages.append(regenerated_reply)

    # The retry request is consumed whether or not anything was generated.
    st.session_state.retry_flag = False
    st.session_state.message_continue = ""

    if has_history:
        st.rerun()

if prompt := st.chat_input("Enter your message here..."):
    # An inline "@prefill <text>" command (ASCII or full-width @, English or
    # Japanese keyword) sets the prefill and is removed from the prompt.
    prefill_pattern = r"([@＠](prefill|ぷれふぃる|プレフィル)\s?(.*))"
    prefill_match = re.search(prefill_pattern, prompt)
    used_prefill = prefill_match is not None
    # The sidebar prefill is put back afterwards only when the user opted out
    # of saving the command's text.
    restore_prefill = used_prefill and not save_prefill

    if used_prefill:
        command_text, _keyword, inline_prefill = prefill_match.groups()
        if restore_prefill:
            original_prefill = st.session_state.prefill
        st.session_state.prefill = inline_prefill
        prompt = prompt.replace(command_text, '')

    st.session_state.messages.append({"role": "user", "content": prompt})

    # Show the new user message right away, escaped the same way as history.
    with st.chat_message("user", avatar=st.session_state.user_avatar):
        st.write(
            prompt.replace("\n", "  \n")
                  .replace("<", "\\<")
                  .replace(">", "\\>")
        )

    # get_ai_response may append to the list it receives, so pass a copy.
    response = get_ai_response(st.session_state.messages.copy())

    assistant_reply = {"role": "assistant", "content": response}
    if st.session_state.last_thinking:
        assistant_reply["thinking"] = st.session_state.last_thinking
    st.session_state.messages.append(assistant_reply)

    if restore_prefill:
        st.session_state.prefill = original_prefill

    st.rerun()