Spaces:

d221
/

Everyday_Assistant

Sleeping

App Files Files Community

d221 commited on Feb 1, 2025

Commit

e22dcdd

verified ·

1 Parent(s): 2570514

Update app.py

Browse files

Files changed (1) hide show

app.py +154 -92

app.py CHANGED Viewed

@@ -1,139 +1,201 @@
 import os
 import gradio as gr
 from huggingface_hub import InferenceClient
-AVAILABLE_MODELS = [
-    "bigscience/bloom-560m",        # Smaller, faster version of BLOOM
-    "bigscience/bloom",            # Original 176B parameter Bloom (heavy)
-    "openlm-research/open_llama_3b",  # Smaller 3B LLaMA-like model
-    "openlm-research/open_llama_7b",  # 7B LLaMA-like model
-    "tiiuae/falcon-7b-instruct",   # Falcon 7B instruct
-    "OpenAssistant/oasst-sft-4-pythia-12b-epoch-3.5",  # OpenAssistant 12B
-    # Add any other open-source models from HF you like
 ]
 def chat_with_model(
-    user_message,       # The user’s message
-    history,            # Chat history (handled automatically by Gradio ChatInterface)
-    system_message,     # The system message/instructions from the left panel
-    user_api_key,       # Optional user-provided HF API key
-    model_choice,       # The model chosen from the dropdown
-    max_tokens,         # Max new tokens
-    temperature,        # Temperature
-    top_p               # Top-p
 ):
     """
-    Called every time a user sends a new message.
-    Uses either the user’s provided HF API key or
-    does public inference (anonymous) if none is supplied.
     """
-    # Decide which key to use
-    final_api_key = user_api_key.strip() if user_api_key else None  # None -> public/no token
-    # Initialize InferenceClient with the chosen API key
-    client = InferenceClient(token=final_api_key)
-    # Build the prompt or system instruction
-    # You can handle chat format in a variety of ways.
-    # For simplicity, we do a naive approach here:
-    prompt = (
-        f"{system_message.strip()}\n\n"  # System instructions
-        f"User: {user_message}\n"
-        "Assistant:"
-    )
-    # Set generation parameters
-    generation_params = dict(
-        temperature=temperature,
-        max_new_tokens=int(max_tokens),
-        top_p=top_p,
-        # Some open-source models do better with a smaller
-        # repetition_penalty or none at all:
-        repetition_penalty=1.0,
-    )
-    # Perform streaming text generation
     partial_response = ""
-    stream = client.text_generation(
-        prompt=prompt,
-        model=model_choice,    # The user's chosen model
-        stream=True,
-        details=True,
-        **generation_params
-    )
-    for chunk in stream:
-        if chunk.token.special:
-            continue
-        partial_response += chunk.token.text
-        yield partial_response
-with gr.Blocks(theme="soft") as demo:
-    # Title
     gr.Markdown(
         """
-        <h1 style="text-align:center; margin-bottom: 5px;">
-            <b>Open-Source GPT Chatbot</b>
-        </h1>
-        """,
-        elem_id="title"
     )
     with gr.Row():
-        # Left Column: system msg, HF API key, model dropdown, sliders, etc.
-        with gr.Column(scale=1, min_width=270):
             system_message = gr.Textbox(
                 label="System Message",
-                value="You are a helpful open-source AI assistant."
             )
-            user_api_key = gr.Textbox(
-                label="Hugging Face API Key (optional)",
-                type="password",
-                placeholder="Leave blank for public/anonymous usage"
             )
-            model_choice = gr.Dropdown(
-                label="Select Open-Source Model",
-                choices=AVAILABLE_MODELS,
-                value=AVAILABLE_MODELS[0],  # Default to first in list
             )
             max_tokens = gr.Slider(
                 minimum=1,
                 maximum=2000,
-                step=1,
                 value=512,
-                label="Max new tokens"
             )
             temperature = gr.Slider(
-                minimum=0.1,
                 maximum=2.0,
                 value=0.7,
-                step=0.1,
-                label="Temperature"
             )
             top_p = gr.Slider(
                 minimum=0.1,
                 maximum=1.0,
                 value=0.9,
-                step=0.01,
-                label="Top-p (nucleus sampling)"
             )
-        # Right Column: The chat interface
         with gr.Column(scale=3):
             chatbot = gr.ChatInterface(
                 fn=chat_with_model,
-                # Additional inputs needed by chat_with_model:
-                additional_inputs=[system_message, user_api_key, model_choice,
-                                   max_tokens, temperature, top_p],
-                type="messages",  # Use newer messages format
-                title="Open-Source Chatbot"
             )
-    # Launch the Gradio app
     demo.launch()

 import os
 import gradio as gr
+import openai
+import requests
 from huggingface_hub import InferenceClient
+###############################################################################
+# 1. List of Models: Some open-source (HF), some require paid API (OpenAI)
+###############################################################################
+MODEL_OPTIONS = [
+    # Open-Source (Hugging Face)
+    "Open-Source: bigscience/bloom-560m",
+    "Open-Source: tiiuae/falcon-7b-instruct",
+    "Open-Source: openlm-research/open_llama_7b",
+    # Paid (OpenAI) - require a valid OPENAI API key
+    "OpenAI: gpt-3.5-turbo",
+    "OpenAI: gpt-4",
 ]
+###############################################################################
+# 2. Chat function
+###############################################################################
 def chat_with_model(
+    user_message,        # user's text input
+    history,             # chat history (handled by ChatInterface)
+    system_message,      # system instructions
+    chosen_model,        # which model from the dropdown
+    user_model_api_key,  # user-supplied API key for the chosen model
+    max_tokens,
+    temperature,
+    top_p
 ):
     """
+    Depending on the user’s chosen model:
+      - If it starts with "Open-Source:", we call Hugging Face InferenceClient
+      - If it starts with "OpenAI:", we call the OpenAI ChatCompletion endpoint
+    For open-source, the API key can be left blank (anonymous).
+    For paid, an API key must be supplied.
     """
+    # Standard system text (if user left it empty, we provide a default)
+    system_text = system_message.strip() or "You are a helpful AI assistant."
+    # We'll build partial output as we stream
     partial_response = ""
+    ###############################
+    # CASE A: OPEN-SOURCE (HF)
+    ###############################
+    if chosen_model.startswith("Open-Source:"):
+        # Extract the actual HF model name
+        hf_model = chosen_model.split("Open-Source:")[1].strip()
+        # If the user gave an API key, we use it; otherwise None => anonymous
+        hf_token = user_model_api_key.strip() if user_model_api_key else None
+        client = InferenceClient(token=hf_token)
+        # Build a naive prompt
+        prompt = (
+            f"{system_text}\n\n"
+            f"User: {user_message}\n"
+            "Assistant:"
+        )
+        generation_params = dict(
+            temperature=temperature,
+            max_new_tokens=int(max_tokens),
+            top_p=top_p,
+            repetition_penalty=1.0
+        )
+        try:
+            response_stream = client.text_generation(
+                prompt=prompt,
+                model=hf_model,
+                stream=True,
+                details=True,
+                **generation_params
+            )
+            for chunk in response_stream:
+                if chunk.token.special:
+                    continue
+                partial_response += chunk.token.text
+                yield partial_response
+        except Exception as e:
+            yield f"Error calling Hugging Face Inference API: {str(e)}"
+            return
+    ###############################
+    # CASE B: OPENAI
+    ###############################
+    else:
+        # Must have an API key
+        if not user_model_api_key.strip():
+            yield "Error: This model requires a paid API key. Please provide a valid one."
+            return
+        openai.api_key = user_model_api_key.strip()
+        openai_model_name = chosen_model.split("OpenAI:")[1].strip()  # e.g. "gpt-4"
+        # Build OpenAI chat messages
+        messages = [
+            {"role": "system", "content": system_text},
+            {"role": "user", "content": user_message}
+        ]
+        try:
+            response = openai.ChatCompletion.create(
+                model=openai_model_name,
+                messages=messages,
+                temperature=temperature,
+                max_tokens=int(max_tokens),
+                top_p=top_p,
+                stream=True
+            )
+            for chunk in response:
+                if "choices" in chunk and len(chunk["choices"]) > 0:
+                    delta = chunk["choices"][0]["delta"]
+                    if "content" in delta:
+                        partial_response += delta["content"]
+                        yield partial_response
+        except Exception as e:
+            yield f"Error calling OpenAI API: {str(e)}"
+            return
+###############################################################################
+# 3. Build the Gradio Interface
+###############################################################################
+with gr.Blocks() as demo:
     gr.Markdown(
         """
+        # Multi-Model Chatbot
+        Choose from open-source or paid models, and provide an API key if needed.
+        """
     )
     with gr.Row():
+        # Left column for parameters
+        with gr.Column(scale=1, min_width=300):
             system_message = gr.Textbox(
                 label="System Message",
+                value="You are a helpful open-source AI assistant.",
+                lines=3,
             )
+            # Let user pick model first
+            chosen_model = gr.Dropdown(
+                label="Select a Model for Your ChatBot",
+                choices=MODEL_OPTIONS,
+                value=MODEL_OPTIONS[0],  # default to the first
+                info="Open-Source models can be used anonymously. Paid models require a valid API key."
             )
+            # Then the API key tile
+            user_model_api_key = gr.Textbox(
+                label="API Key for the Chosen Model",
+                placeholder="Required if you selected a paid model like GPT-4; optional otherwise",
+                type="password"
             )
             max_tokens = gr.Slider(
+                label="Max Tokens",
                 minimum=1,
                 maximum=2000,
                 value=512,
+                step=1
             )
             temperature = gr.Slider(
+                label="Temperature",
+                minimum=0.0,
                 maximum=2.0,
                 value=0.7,
+                step=0.1
             )
             top_p = gr.Slider(
+                label="Top-p",
                 minimum=0.1,
                 maximum=1.0,
                 value=0.9,
+                step=0.01
             )
+        # Right column for the chat interface
         with gr.Column(scale=3):
             chatbot = gr.ChatInterface(
                 fn=chat_with_model,
+                # extra inputs
+                additional_inputs=[
+                    system_message,
+                    chosen_model,
+                    user_model_api_key,
+                    max_tokens,
+                    temperature,
+                    top_p
+                ],
+                type="messages"
             )
     demo.launch()