Spaces:
Runtime error
Runtime error
Initial commit
Browse files- .gitignore +5 -0
- main.py +35 -0
- requirements.txt +6 -0
- utils.py +238 -0
.gitignore
ADDED
|
@@ -0,0 +1,5 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
__pycache__/
|
| 2 |
+
.idea/
|
| 3 |
+
.env
|
| 4 |
+
|
| 5 |
+
prompts/
|
main.py
ADDED
|
@@ -0,0 +1,35 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
from dotenv import load_dotenv
load_dotenv()

import os
import utils
import gradio as gr


# Gradio app: a password-protected A/B test harness that lets a reviewer pick a
# model ("Model G" = Gemini, "Model C" = ChatGPT 4 — see utils.COMPANIES) and
# chat with it through the shared RAG pipeline in utils.py.
with gr.Blocks() as app:
    # Model-selection row, visible on startup; hidden once a test begins.
    with gr.Row() as selection:
        model = gr.Dropdown(choices=[model for model in utils.MODELS], label='Select Model')
        start_button = gr.Button(value='Start Test')
        # Hidden until a chat is running; brings the user back to model selection.
        restart_button = gr.Button(value='Restart Test', visible=False)
    # Chat column, hidden until a model has been chosen.
    with gr.Column(visible=False) as testing:
        name_model = gr.Markdown()
        chatbot = gr.Chatbot(label='Chatbot')
        message = gr.Text(label='Enter your message')

    # Init the chatbot: hide the selection row, show the restart button and
    # chat column, and render the chosen model name as the title.
    start_button.click(
        utils.start_chat, model, [selection, restart_button, testing, name_model]
    )

    # Select again the model: reverse the visibility toggles and clear both the
    # chat history and the message box.
    restart_button.click(
        utils.restart_chat, None, [selection, restart_button, testing, chatbot, message]
    )

    # Send the messages and get an answer (Enter in the textbox submits).
    message.submit(
        utils.get_answer, [chatbot, message, model], [chatbot, message]
    )

app.queue()
# Basic-auth credentials come from the Space's secrets; if either is unset the
# tuple contains None — NOTE(review): confirm both env vars are configured.
app.launch(debug=True, auth=(os.environ.get('SPACE_USERNAME'), os.environ.get('SPACE_PASSWORD')))
|
requirements.txt
ADDED
|
@@ -0,0 +1,6 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
gradio==4.19.0
|
| 2 |
+
python-dotenv==1.0.1
|
| 3 |
+
pinecone-client==2.2.4
|
| 4 |
+
openai==1.6.1
|
| 5 |
+
google-generativeai==0.3.2
|
| 6 |
+
huggingface_hub==0.20.2
|
utils.py
ADDED
|
@@ -0,0 +1,238 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
import os
|
| 2 |
+
import pinecone
|
| 3 |
+
import gradio as gr
|
| 4 |
+
from openai import OpenAI
|
| 5 |
+
from typing import Callable
|
| 6 |
+
import google.generativeai as genai
|
| 7 |
+
from huggingface_hub import hf_hub_download
|
| 8 |
+
|
| 9 |
+
|
| 10 |
+
def download_prompt(name_prompt: str) -> str:
    """
    Fetches a prompt file from the private HuggingFace Hub dataset and returns its text.
    :param name_prompt: base name of the prompt file (without the .txt extension)
    :return: full contents of the downloaded file
    """
    # Download <name_prompt>.txt from the dataset repo into the local prompts/ dir.
    hf_hub_download(
        repo_id=os.environ.get('DATA'),
        repo_type='dataset',
        filename=f"{name_prompt}.txt",
        token=os.environ.get('HUB_TOKEN'),
        local_dir="prompts",
    )
    # Read back the file that hf_hub_download just placed on disk.
    local_path = f'prompts/{name_prompt}.txt'
    with open(local_path, mode='r', encoding='utf-8') as infile:
        return infile.read()
|
| 23 |
+
|
| 24 |
+
|
| 25 |
+
def start_chat(model: str) -> tuple[dict, dict, dict, dict]:
    """
    Shows the chatbot interface and hides the selection of the model.
    Returns gradio update dicts (gr.update()).

    Fix: the previous return annotation was ``tuple[gr.helpers, ...]`` —
    ``gr.helpers`` is the gradio *module*, not a type; ``gr.update()``
    returns a plain update dict.

    :param model: name of the model to use
    :return: (selection row hidden, restart button shown, testing column shown,
              markdown title set to the model name)
    """
    no_visible = gr.update(visible=False)
    visible = gr.update(visible=True)
    title = gr.update(value=f"# {model}")
    return no_visible, visible, visible, title
|
| 36 |
+
|
| 37 |
+
|
| 38 |
+
def restart_chat() -> tuple[dict, dict, dict, list, str]:
    """
    Shows the selection of the model, hides the chatbot interface and restarts the chatbot.
    Returns gradio update dicts (gr.update()).

    Fix: the previous return annotation used ``gr.helpers`` — the gradio
    *module*, not a type; ``gr.update()`` returns a plain update dict.

    :return: (selection row shown, restart button hidden, testing column hidden,
              empty chat history, empty message box)
    """
    no_visible = gr.update(visible=False)
    visible = gr.update(visible=True)
    return visible, no_visible, no_visible, [], ""
|
| 47 |
+
|
| 48 |
+
|
| 49 |
+
def get_answer(chatbot: list[tuple[str, str]], message: str, model: str) -> tuple[list[tuple[str, str]], str]:
    """
    Runs the full RAG pipeline for one user turn and returns the updated chat.
    :param chatbot: message history as (user, bot) pairs
    :param message: user input
    :param model: name of the model
    :return: updated history plus an empty string to clear the input box
    """
    # Pick the backend call based on the model's real name (Gemini vs. OpenAI).
    is_gemini = COMPANIES[model]['real name'] == 'Gemini'
    call_model = _call_google if is_gemini else _call_openai

    # Condense the follow-up message into a standalone question for retrieval.
    standalone_question = _get_standalone_question(chatbot, message, call_model)

    # Retrieve the supporting context from the vector store.
    context = _get_context(standalone_question)

    # Ask the chosen chatbot, grounding it with the retrieved context.
    prompt = PROMPT_GENERAL.replace('CONTEXT', context)
    answer = call_model(prompt, chatbot, message)

    # Record the exchange in the history and clear the textbox.
    chatbot.append((message, answer))
    return chatbot, ""
|
| 77 |
+
|
| 78 |
+
|
| 79 |
+
def _get_standalone_question(
        chat_history: list[tuple[str, str]], message: str, call_model: Callable[[str, list, str], str]
) -> str:
    """
    To get a better context a standalone question is obtained for each question.
    :param chat_history: message history as (user, bot) pairs
    :param message: user input
    :param call_model: backend function used to rewrite the question
    :return: standalone phrase
    """
    # Render the history as alternating "Human:"/"Assistant:" lines. The very
    # first pair contributes only the assistant side (the opening greeting).
    lines = []
    for turn, (user, bot) in enumerate(chat_history):
        if turn:
            lines.append(f'Human: {user}\n')
        lines.append(f'Assistant: {bot}\n')
    history = ''.join(lines)

    # Inject the rendered history into the standalone-question prompt.
    prompt = PROMPT_STANDALONE.replace('HISTORY', history)
    question = f'Follow-up message: {message}'

    # Ask the model (with no chat history of its own) to rewrite the question.
    return call_model(prompt, [], question)
|
| 103 |
+
|
| 104 |
+
|
| 105 |
+
def _get_embedding(text: str) -> list[float]:
    """
    Embeds the given text with OpenAI's ada-002 model.
    :param text: input text
    :return: embedding vector
    """
    embedding_response = OPENAI_CLIENT.embeddings.create(
        model='text-embedding-ada-002',
        input=text,
    )
    # The API returns a batch; we sent a single input, so take the first item.
    return embedding_response.data[0].embedding
|
| 115 |
+
|
| 116 |
+
|
| 117 |
+
def _get_context(question: str) -> str:
    """
    Get the 10 nearest vectors to the given input.
    :param question: standalone question
    :return: formatted context built from the nearest vectors
    """
    # Query the client-specific namespace of the Pinecone index.
    matches = INDEX.query(
        vector=_get_embedding(question),
        top_k=10,
        include_metadata=True,
        namespace=f'{CLIENT}-context'
    )['matches']

    # Concatenate the stored text snippets, blank-line separated
    # (keeps the trailing separator, like the original loop did).
    return ''.join(match['metadata']['Text'] + '\n\n' for match in matches)
|
| 134 |
+
|
| 135 |
+
|
| 136 |
+
def _call_openai(prompt: str, chat_history: list[tuple[str, str]], question: str) -> str:
    """
    Calls ChatGPT 4.
    :param prompt: prompt with the context or the question (in the case of the standalone one)
    :param chat_history: history of the conversation
    :param question: user input
    :return: chatbot answer
    """
    # Build the OpenAI-style message list: system prompt, then the history.
    # The first pair contributes only its assistant side (opening greeting).
    msg_history = [{'role': 'system', 'content': prompt}]
    for turn, (user, bot) in enumerate(chat_history):
        if turn:
            msg_history.append({'role': 'user', 'content': user})
        msg_history.append({'role': 'assistant', 'content': bot})
    msg_history.append({'role': 'user', 'content': question})

    # Call ChatGPT 4 and return the single generated choice.
    response = OPENAI_CLIENT.chat.completions.create(
        model='gpt-4-turbo-preview',
        temperature=0.5,
        messages=msg_history
    )
    return response.choices[0].message.content
|
| 161 |
+
|
| 162 |
+
|
| 163 |
+
def _call_google(prompt: str, chat_history: list[tuple[str, str]], question: str) -> str:
    """
    Calls Gemini.
    :param prompt: prompt with the context or the question (in the case of the standalone one)
    :param chat_history: history of the conversation
    :param question: user input
    :return: chatbot answer
    """
    # Gemini has no system role, so the prompt goes in as the first user turn,
    # acknowledged by a canned model reply; then replay the conversation.
    # The first history pair contributes only its model side (opening greeting).
    history = [
        {'role': 'user', 'parts': [prompt]},
        {'role': 'model', 'parts': 'Excelente! Estoy super lista para ayudarte en lo que necesites'}
    ]
    for turn, (user, bot) in enumerate(chat_history):
        if turn:
            history.append({'role': 'user', 'parts': user})
        history.append({'role': 'model', 'parts': bot})

    # Call Gemini with the reconstructed conversation and read the last reply.
    convo = GEMINI.start_chat(history=history)
    convo.send_message(question)
    return convo.last.text
|
| 187 |
+
|
| 188 |
+
|
| 189 |
+
# ----------------------------------------- Setup constants and models ------------------------------------------------
# Import-time initialization: all clients and prompts must exist before the
# gradio callbacks above are ever invoked. Order matters — download_prompt()
# needs the prompts/ directory, and _get_embedding/_get_context need the
# OpenAI client and Pinecone index created here.
OPENAI_CLIENT = OpenAI(api_key=os.getenv("OPENAI_API_KEY"))
genai.configure(api_key=os.getenv("GEMINI_API_KEY"))
# pinecone-client 2.x module-level init (the 3.x SDK replaced this with a Pinecone class).
pinecone.init(api_key=os.getenv('PINECONE_API_KEY'), environment=os.getenv("PINECONE_ENVIRONMENT"))
INDEX = pinecone.Index(os.getenv('PINECONE_INDEX'))
# Client identifier; used as the Pinecone namespace prefix in _get_context.
CLIENT = os.getenv('CLIENT')


# Setup Gemini
generation_config = {
    "temperature": 0.9,
    "top_p": 1,
    "top_k": 1,
    "max_output_tokens": 2048,
}
# Moderate blocking on most harm categories; sexually-explicit is looser (BLOCK_ONLY_HIGH).
safety_settings = [
    {
        "category": "HARM_CATEGORY_HARASSMENT",
        "threshold": "BLOCK_MEDIUM_AND_ABOVE"
    },
    {
        "category": "HARM_CATEGORY_HATE_SPEECH",
        "threshold": "BLOCK_MEDIUM_AND_ABOVE"
    },
    {
        "category": "HARM_CATEGORY_SEXUALLY_EXPLICIT",
        "threshold": "BLOCK_ONLY_HIGH"
    },
    {
        "category": "HARM_CATEGORY_DANGEROUS_CONTENT",
        "threshold": "BLOCK_MEDIUM_AND_ABOVE"
    },
]
GEMINI = genai.GenerativeModel(
    model_name="gemini-1.0-pro", generation_config=generation_config, safety_settings=safety_settings
)


# Download and open prompts from HuggingFace Hub
os.makedirs('prompts', exist_ok=True)
# PROMPT_STANDALONE rewrites a follow-up into a standalone question; PROMPT_GENERAL
# is the answering prompt with a CONTEXT placeholder (see get_answer).
PROMPT_STANDALONE = download_prompt('standalone')
PROMPT_GENERAL = download_prompt('general')


# Constants used in the app
# Display names are deliberately anonymized ("Model G"/"Model C") so testers
# compare models blind; 'real name' drives the backend dispatch in get_answer.
COMPANIES = {
    'Model G': {'company': 'Google', 'real name': 'Gemini'},
    'Model C': {'company': 'OpenAI', 'real name': 'ChatGPT 4'},
}
MODELS = list(COMPANIES.keys())
|