coztomate committed on
Commit
4a5fd46
·
1 Parent(s): fceb790

added config

Browse files
Files changed (2) hide show
  1. app.py +68 -81
  2. config_llm.py +15 -0
app.py CHANGED
@@ -5,29 +5,54 @@ import io
5
  from openai import OpenAI
6
  from transformers import AutoTokenizer, AutoModelForSeq2SeqLM
7
  from text_generation import Client
 
 
8
 
9
-
10
- hf_key_mistral = st.secrets["hf_key"]
11
-
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
12
 
13
- from huggingface_hub import InferenceClient
14
- client = InferenceClient(token=hf_key_mistral)
15
 
16
- # load the simplifier model
17
- # Load the tokenizer and model (do this outside the function for efficiency)
18
  tokenizer = AutoTokenizer.from_pretrained("mrm8488/t5-small-finetuned-text-simplification")
19
  model = AutoModelForSeq2SeqLM.from_pretrained("mrm8488/t5-small-finetuned-text-simplification")
20
 
 
21
  def simplify_text(input_text):
22
  # Tokenize and encode the input text
23
  input_ids = tokenizer.encode("simplify: " + input_text, return_tensors="pt")
24
-
25
  # Generate the simplified text
26
  output = model.generate(input_ids, min_length=5, max_length=80, do_sample=True)
27
-
28
  # Decode the simplified text
29
  simplified_text = tokenizer.decode(output[0], skip_special_tokens=True)
30
-
31
  # Post-process to ensure the output ends with a complete sentence
32
  # Find the last period, question mark, or exclamation point
33
  last_valid_ending = max(simplified_text.rfind('.'), simplified_text.rfind('?'), simplified_text.rfind('!'))
@@ -37,10 +62,10 @@ def simplify_text(input_text):
37
  else:
38
  # No sentence ending found; return the whole text or handle as appropriate
39
  cleaned_text = simplified_text
40
-
41
  return cleaned_text
42
 
43
- # Define the path to your example text
 
44
  example_text_path = "example_text.txt"
45
 
46
  # Function to load example text from a file
@@ -60,45 +85,19 @@ def load_image(image_path):
60
  img.load()
61
  return img
62
 
63
- # Initialize session state variables
64
- if 'user_input' not in st.session_state:
65
- st.session_state['user_input'] = ""
66
- if 'simplified_text' not in st.session_state:
67
- st.session_state['simplified_text'] = ''
68
- if 'new_caption' not in st.session_state:
69
- st.session_state['new_caption'] = None
70
- if 'model_clip' not in st.session_state:
71
- st.session_state['model_clip'] = None
72
- if 'transform_clip' not in st.session_state:
73
- st.session_state['transform_clip'] = None
74
- if 'openai_api_key' not in st.session_state:
75
- st.session_state['openai_api_key'] = ''
76
- if 'message_content_from_caption' not in st.session_state:
77
- st.session_state['message_content_from_caption'] = ''
78
- if 'message_content_from_simplified_text' not in st.session_state:
79
- st.session_state['message_content_from_simplified_text'] = ''
80
- if 'mistral_from_caption' not in st.session_state:
81
- st.session_state['mistral_from_caption'] = ''
82
- if 'mistral_from_simplified' not in st.session_state:
83
- st.session_state['mistral_from_simplified'] = ''
84
- if 'image_from_caption' not in st.session_state:
85
- st.session_state['image_from_caption'] = None
86
- if 'image_from_simplified_text' not in st.session_state:
87
- st.session_state['image_from_simplified_text'] = None
88
- if 'image_from_press_text' not in st.session_state:
89
- st.session_state['image_from_press_text'] = None
90
- if 'image_from_press_text_from_caption' not in st.session_state:
91
- st.session_state['image_from_press_text_from_caption'] = None
92
 
93
 
94
- ################################################
95
 
96
  # Create a Streamlit app
97
  st.title("ARTSPEAK > s i m p l i f i e r")
98
 
99
  st.markdown("---")
100
 
101
- # Create a sub-section
102
  with st.expander("Upload Files"):
103
  st.markdown("## Upload Text and Image")
104
  ##### Upload of files
@@ -124,10 +123,11 @@ with st.expander("Upload Files"):
124
 
125
  st.markdown("---")
126
 
127
- #### Simplifier
128
  with st.expander("Simplify Text and Image"):
129
  st.markdown("## 'Simplify' Text and Image")
130
 
 
131
  if st.button("Simplify the Input Text"):
132
  if user_input:
133
  simplified_text = simplify_text(user_input)
@@ -139,8 +139,7 @@ with st.expander("Simplify Text and Image"):
139
  if st.session_state['simplified_text']:
140
  st.write(st.session_state['simplified_text'])
141
 
142
-
143
- ####Get new caption
144
  # Button to get new caption
145
  if st.button("Get New Caption for Image"):
146
  # Initialize image data variable
@@ -164,7 +163,7 @@ with st.expander("Simplify Text and Image"):
164
  caption = client.image_to_text(image_data)
165
  # Update the session state
166
  st.session_state['new_caption'] = caption
167
- st.write(f"New Caption for your Image: {caption}")
168
 
169
  except Exception as e:
170
  st.error(f"An error occurred: {e}")
@@ -182,41 +181,29 @@ with st.expander("Press Text Generation"):
182
  # Define radio button options
183
  option = st.radio(
184
  "Choose a Language Model:",
185
- ('Mistral 8x7B (free)', 'GPT-3.5 Turbo (needs API Key)'))
186
 
187
  # Conditional logic based on radio button choice
188
- if option == 'Mistral 8x7B (free)':
189
  st.header("Mistral 8x7B")
190
 
191
  ############
192
  ###Mistral##
193
  ############
194
 
195
-
196
- #defaults for Mistral
197
- DEFAULT_SYSTEM_PROMPT = "You will be given a very short description of a contemporary artwork. Please create a complex exhibition press text based on the given artwork description using international art english dealing with post-colonialism, military industrial complex, anthropocene, identity politics and queerness through the language of Rancière, Fontane, Paglen, Deleuze, Steyerl, Spivak, Preciado, Žižek, Foucault and Harraway. Avoid excessive namedropping. Just output press text without explaining your actions."
198
- MAX_MAX_NEW_TOKENS = 4096
199
- DEFAULT_MAX_NEW_TOKENS = 1000
200
- EOS_STRING = "</s>"
201
- EOT_STRING = "<EOT>"
202
-
203
- model_id_mistral = "mistralai/Mixtral-8x7B-Instruct-v0.1"
204
-
205
- API_URL = "https://api-inference.huggingface.co/models/" + model_id_mistral
206
- headers = {"Authorization": f"Bearer {hf_key_mistral}"}
207
 
208
  client_mistral = Client(
209
- API_URL,
210
  headers=headers,
211
  )
212
 
213
  def run_single_input(
214
  message: str,
215
- system_prompt: str,
216
- max_new_tokens: int = 2048,
217
- temperature: float = 0.3,
218
- top_p: float = 0.9,
219
- top_k: int = 50,
220
  ) -> str:
221
  """
222
  Run the model for a single input and return a single output.
@@ -227,13 +214,12 @@ with st.expander("Press Text Generation"):
227
  max_new_tokens=max_new_tokens,
228
  do_sample=True,
229
  top_p=top_p,
230
- top_k=top_k,
231
  temperature=temperature,
232
  )
233
  stream = client_mistral.generate_stream(prompt, **generate_kwargs)
234
  output = ""
235
  for response in stream:
236
- if any([end_token in response.token.text for end_token in [EOS_STRING, EOT_STRING]]):
237
  break # Stop at the first end token
238
  else:
239
  output += response.token.text
@@ -245,7 +231,7 @@ with st.expander("Press Text Generation"):
245
  if st.button("Generate Press Text from New Image Caption with Mistral"):
246
  if st.session_state['new_caption']:
247
  try:
248
- st.session_state['mistral_from_caption'] = run_single_input(st.session_state['new_caption'], DEFAULT_SYSTEM_PROMPT)
249
  except Exception as e:
250
  st.error(f"An error occurred: {e}")
251
  else:
@@ -260,7 +246,7 @@ with st.expander("Press Text Generation"):
260
  if st.button("Generate Press Text from Simplified Text with Mistral"):
261
  if st.session_state['simplified_text']:
262
  try:
263
- st.session_state['mistral_from_simplified'] = run_single_input(st.session_state['simplified_text'], DEFAULT_SYSTEM_PROMPT)
264
  except Exception as e:
265
  st.error(f"An error occurred: {e}")
266
  else:
@@ -271,14 +257,12 @@ with st.expander("Press Text Generation"):
271
  st.write("Generated Press Text from Simplified Text:")
272
  st.write(st.session_state['mistral_from_simplified'])
273
 
274
-
275
-
276
- elif option == 'GPT-3.5 Turbo (needs API Key)':
277
  st.header("GPT-3.5")
278
 
279
- #######
280
- #OpenAI API
281
- #######
282
  # Add a text input for the OpenAI API key
283
  api_key_input = st.text_input("Enter your OpenAI API key to continue", type="password")
284
 
@@ -293,8 +277,11 @@ with st.expander("Press Text Generation"):
293
  client = OpenAI(api_key=api_key,)
294
  completion = client.chat.completions.create(
295
  model="gpt-3.5-turbo",
 
 
 
296
  messages=[
297
- {"role": "system", "content": "I give a short description of an artwork. Please create a complex exhibition press text based on the given artwork description using international art english dealing with post-colonialism, military industrial complex, anthropocene, identity politics and queerness through the language of Rancière, Fontane, Paglen, Deleuze, Steyerl, Spivak, Preciado, Žižek, Foucault and Harraway. Avoid excessive namedropping. Just output press text without explaining your actions."},
298
  {"role": "user", "content": prompt_message}
299
  ]
300
  )
@@ -333,9 +320,9 @@ with st.expander("Press Text Generation"):
333
 
334
  st.markdown("---")
335
 
336
- ############
337
- ##Diffusor##
338
- ############
339
 
340
  with st.expander("Image Generation"):
341
  st.markdown("## Generate new Images from Texts")
 
5
  from openai import OpenAI
6
  from transformers import AutoTokenizer, AutoModelForSeq2SeqLM
7
  from text_generation import Client
8
+ from huggingface_hub import InferenceClient
9
+ import config_llm
10
 
11
+ # Initialize session state variables
12
+ if 'user_input' not in st.session_state:
13
+ st.session_state['user_input'] = ""
14
+ if 'simplified_text' not in st.session_state:
15
+ st.session_state['simplified_text'] = ''
16
+ if 'new_caption' not in st.session_state:
17
+ st.session_state['new_caption'] = None
18
+ if 'model_clip' not in st.session_state:
19
+ st.session_state['model_clip'] = None
20
+ if 'transform_clip' not in st.session_state:
21
+ st.session_state['transform_clip'] = None
22
+ if 'openai_api_key' not in st.session_state:
23
+ st.session_state['openai_api_key'] = ''
24
+ if 'huggingface_key' not in st.session_state:
25
+ st.session_state['huggingface_key'] = ''
26
+ if 'message_content_from_caption' not in st.session_state:
27
+ st.session_state['message_content_from_caption'] = ''
28
+ if 'message_content_from_simplified_text' not in st.session_state:
29
+ st.session_state['message_content_from_simplified_text'] = ''
30
+ if 'mistral_from_caption' not in st.session_state:
31
+ st.session_state['mistral_from_caption'] = ''
32
+ if 'mistral_from_simplified' not in st.session_state:
33
+ st.session_state['mistral_from_simplified'] = ''
34
+ if 'image_from_caption' not in st.session_state:
35
+ st.session_state['image_from_caption'] = None
36
+ if 'image_from_simplified_text' not in st.session_state:
37
+ st.session_state['image_from_simplified_text'] = None
38
+ if 'image_from_press_text' not in st.session_state:
39
+ st.session_state['image_from_press_text'] = None
40
+ if 'image_from_press_text_from_caption' not in st.session_state:
41
+ st.session_state['image_from_press_text_from_caption'] = None
42
 
 
 
43
 
44
+ # Load the tokenizer and simplifier model
 
45
  tokenizer = AutoTokenizer.from_pretrained("mrm8488/t5-small-finetuned-text-simplification")
46
  model = AutoModelForSeq2SeqLM.from_pretrained("mrm8488/t5-small-finetuned-text-simplification")
47
 
48
+ # Function to simplify text
49
  def simplify_text(input_text):
50
  # Tokenize and encode the input text
51
  input_ids = tokenizer.encode("simplify: " + input_text, return_tensors="pt")
 
52
  # Generate the simplified text
53
  output = model.generate(input_ids, min_length=5, max_length=80, do_sample=True)
 
54
  # Decode the simplified text
55
  simplified_text = tokenizer.decode(output[0], skip_special_tokens=True)
 
56
  # Post-process to ensure the output ends with a complete sentence
57
  # Find the last period, question mark, or exclamation point
58
  last_valid_ending = max(simplified_text.rfind('.'), simplified_text.rfind('?'), simplified_text.rfind('!'))
 
62
  else:
63
  # No sentence ending found; return the whole text or handle as appropriate
64
  cleaned_text = simplified_text
 
65
  return cleaned_text
66
 
67
+
68
+ # Define the path to example text
69
  example_text_path = "example_text.txt"
70
 
71
  # Function to load example text from a file
 
85
  img.load()
86
  return img
87
 
88
+ #get huggingface key
89
+ st.session_state['huggingface_key'] = st.secrets["hf_key"]
90
+ client = InferenceClient(token=st.session_state['huggingface_key'])
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
91
 
92
 
93
+ ########################################################################
94
 
95
  # Create a Streamlit app
96
  st.title("ARTSPEAK > s i m p l i f i e r")
97
 
98
  st.markdown("---")
99
 
100
+ # Create a sub-section for uploading the files
101
  with st.expander("Upload Files"):
102
  st.markdown("## Upload Text and Image")
103
  ##### Upload of files
 
123
 
124
  st.markdown("---")
125
 
126
+ #### Simplifier and Image Caption
127
  with st.expander("Simplify Text and Image"):
128
  st.markdown("## 'Simplify' Text and Image")
129
 
130
+ ## Text simplifier
131
  if st.button("Simplify the Input Text"):
132
  if user_input:
133
  simplified_text = simplify_text(user_input)
 
139
  if st.session_state['simplified_text']:
140
  st.write(st.session_state['simplified_text'])
141
 
142
+ ## Get new caption
 
143
  # Button to get new caption
144
  if st.button("Get New Caption for Image"):
145
  # Initialize image data variable
 
163
  caption = client.image_to_text(image_data)
164
  # Update the session state
165
  st.session_state['new_caption'] = caption
166
+ st.write(st.session_state['new_caption'])
167
 
168
  except Exception as e:
169
  st.error(f"An error occurred: {e}")
 
181
  # Define radio button options
182
  option = st.radio(
183
  "Choose a Language Model:",
184
+ ('Mistral 8x7B', 'GPT-3.5 Turbo'))
185
 
186
  # Conditional logic based on radio button choice
187
+ if option == 'Mistral 8x7B':
188
  st.header("Mistral 8x7B")
189
 
190
  ############
191
  ###Mistral##
192
  ############
193
 
194
+ headers = {"Authorization": f"Bearer {st.session_state['huggingface_key']}"}
 
 
 
 
 
 
 
 
 
 
 
195
 
196
  client_mistral = Client(
197
+ config_llm.API_URL,
198
  headers=headers,
199
  )
200
 
201
  def run_single_input(
202
  message: str,
203
+ system_prompt: str = config_llm.DEFAULT_SYSTEM_PROMPT,
204
+ max_new_tokens: int = config_llm.MAX_NEW_TOKENS,
205
+ temperature: float = config_llm.TEMPERATURE,
206
+ top_p: float = config_llm.TOP_P
 
207
  ) -> str:
208
  """
209
  Run the model for a single input and return a single output.
 
214
  max_new_tokens=max_new_tokens,
215
  do_sample=True,
216
  top_p=top_p,
 
217
  temperature=temperature,
218
  )
219
  stream = client_mistral.generate_stream(prompt, **generate_kwargs)
220
  output = ""
221
  for response in stream:
222
+ if any([end_token in response.token.text for end_token in [config_llm.EOS_STRING, config_llm.EOT_STRING]]):
223
  break # Stop at the first end token
224
  else:
225
  output += response.token.text
 
231
  if st.button("Generate Press Text from New Image Caption with Mistral"):
232
  if st.session_state['new_caption']:
233
  try:
234
+ st.session_state['mistral_from_caption'] = run_single_input(st.session_state['new_caption'], config_llm.DEFAULT_SYSTEM_PROMPT)
235
  except Exception as e:
236
  st.error(f"An error occurred: {e}")
237
  else:
 
246
  if st.button("Generate Press Text from Simplified Text with Mistral"):
247
  if st.session_state['simplified_text']:
248
  try:
249
+ st.session_state['mistral_from_simplified'] = run_single_input(st.session_state['simplified_text'], config_llm.DEFAULT_SYSTEM_PROMPT)
250
  except Exception as e:
251
  st.error(f"An error occurred: {e}")
252
  else:
 
257
  st.write("Generated Press Text from Simplified Text:")
258
  st.write(st.session_state['mistral_from_simplified'])
259
 
260
+ elif option == 'GPT-3.5 Turbo':
 
 
261
  st.header("GPT-3.5")
262
 
263
+ ##########
264
+ ##OpenAI##
265
+ #########
266
  # Add a text input for the OpenAI API key
267
  api_key_input = st.text_input("Enter your OpenAI API key to continue", type="password")
268
 
 
277
  client = OpenAI(api_key=api_key,)
278
  completion = client.chat.completions.create(
279
  model="gpt-3.5-turbo",
280
+ max_tokens=config_llm.MAX_NEW_TOKENS,
281
+ temperature = config_llm.TEMPERATURE,
282
+ top_p = config_llm.TOP_P,
283
  messages=[
284
+ {"role": "system", "content": config_llm.DEFAULT_SYSTEM_PROMPT},
285
  {"role": "user", "content": prompt_message}
286
  ]
287
  )
 
320
 
321
  st.markdown("---")
322
 
323
+ ########################################################################
324
+
325
+ ## Image Generation Interface
326
 
327
  with st.expander("Image Generation"):
328
  st.markdown("## Generate new Images from Texts")
config_llm.py ADDED
@@ -0,0 +1,15 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ # Configuration and Constants
2
+
3
+ # Defaults for Mistral/OpenAI
4
+ DEFAULT_SYSTEM_PROMPT = "You will be given a very short description of a contemporary artwork. Please create a complex exhibition press text based on the given artwork description using international art english dealing with post-colonialism, military industrial complex, anthropocene, identity politics and queerness through the language of Rancière, Fontane, Paglen, Deleuze, Steyerl, Spivak, Preciado, Žižek, Foucault and Harraway. Avoid excessive namedropping. Just output press text without explaining your actions."
5
+ EOS_STRING = "</s>"
6
+ EOT_STRING = "<EOT>"
7
+
8
+ # Mistral Model Configuration
9
+ model_id_mistral = "mistralai/Mixtral-8x7B-Instruct-v0.1"
10
+ API_URL = f"https://api-inference.huggingface.co/models/{model_id_mistral}"
11
+
12
+ #model parameters
13
+ MAX_NEW_TOKENS = 2048
14
+ TEMPERATURE = 0.7
15
+ TOP_P = 0.8