Kim Adams committed on
Commit
2cd1c76
·
1 Parent(s): a5d5d8d

all of the things

Browse files
Files changed (42) hide show
  1. README.md +1 -1
  2. app.py +11 -10
  3. chat_bot/__pycache__/simple_chat.cpython-311.pyc +0 -0
  4. chat_bot/__pycache__/ui_chat_bot.cpython-311.pyc +0 -0
  5. chat_bot/__pycache__/ui_simple_chat.cpython-311.pyc +0 -0
  6. chat_bot/simple_chat.py +148 -14
  7. chat_bot/ui_chat_bot.py +1 -1
  8. chat_bot/ui_simple_chat.py +5 -5
  9. embedding_tools/__pycache__/create_embedding.cpython-311.pyc +0 -0
  10. embedding_tools/__pycache__/embeddings.cpython-311.pyc +0 -0
  11. embedding_tools/create_embedding.py +12 -0
  12. embedding_tools/embeddings.py +1 -0
  13. image_to_text/__pycache__/image_to_text_translator.cpython-311.pyc +0 -0
  14. image_to_text/image_to_text_translator.py +1 -1
  15. image_to_text/ui_image_to_text.py +1 -1
  16. prompts/__pycache__/ui_prompt_builder.cpython-311.pyc +0 -0
  17. prompts/ui_prompt_builder.py +1 -1
  18. recording_analysis/__pycache__/ui_recording_analysis.cpython-311.pyc +0 -0
  19. recording_analysis/ui_recording_analysis.py +18 -1
  20. requirements.txt +13 -4
  21. slack_sentiment_analysis/__pycache__/ui_sentiment_analysis.cpython-311.pyc +0 -0
  22. slack_sentiment_analysis/ui_sentiment_analysis.py +1 -1
  23. text_analysis/__pycache__/ui_text_analysis.cpython-311.pyc +0 -0
  24. text_analysis/ui_text_analysis.py +1 -2
  25. translators/__pycache__/translate_pdf_to_text.cpython-311.pyc +0 -0
  26. utilities/__pycache__/api_keys.cpython-311.pyc +0 -0
  27. utilities/__pycache__/clean_text.cpython-311.pyc +0 -0
  28. utilities/__pycache__/constants.cpython-311.pyc +0 -0
  29. utilities/__pycache__/date_format.cpython-311.pyc +0 -0
  30. utilities/__pycache__/embeddings.cpython-311.pyc +0 -0
  31. utilities/__pycache__/prompt_constants.cpython-311.pyc +0 -0
  32. utilities/__pycache__/prompts.cpython-311.pyc +0 -0
  33. utilities/__pycache__/system_prompts.cpython-311.pyc +0 -0
  34. utilities/__pycache__/translate_pdf_to_text.cpython-311.pyc +0 -0
  35. utilities/__pycache__/user_prompts.cpython-311.pyc +0 -0
  36. utilities/__pycache__/voice_handling.cpython-311.pyc +0 -0
  37. utilities/constants.py +17 -3
  38. utilities/data/csv/usaa.csv +0 -0
  39. utilities/data/embeddings/hr_asst_embeddings.pkl +1 -1
  40. utilities/data/pkl/usaa.pkl +2 -2
  41. utilities/data/txt/usaa.txt +0 -0
  42. utilities/prompt_constants.py +1 -0
README.md CHANGED
@@ -4,7 +4,7 @@ emoji: 🛠️
4
  colorFrom: red
5
  colorTo: red
6
  sdk: gradio
7
- sdk_version: 3.40.1
8
  app_file: app.py
9
  pinned: false
10
  ---
 
4
  colorFrom: red
5
  colorTo: red
6
  sdk: gradio
7
+ sdk_version: 4.37.2
8
  app_file: app.py
9
  pinned: false
10
  ---
app.py CHANGED
@@ -2,29 +2,30 @@ import gradio as gr
2
  import pandas as pd
3
  import openai
4
  from ui.app_theme import SoftBlue
5
- from image_gen import ui_image_generation
6
- from summarization import ui_summarize
7
  from utilities import constants,api_keys
8
- from recording_analysis import ui_recording_analysis
9
  from prompts import ui_prompt_builder
10
  from chat_bot import ui_simple_chat
 
 
 
 
11
  from slack_sentiment_analysis import ui_sentiment_analysis
12
  from image_to_text import image_to_text_translator as ui_image_to_text
13
- from text_analysis import ui_text_analysis
14
 
15
  openai.api_key = api_keys.APIKeys().get_key('OPENAI_API_KEY')
16
 
17
  prompt_builder=ui_prompt_builder.ui
 
 
18
  summarize=ui_summarize.ui
19
  image_generator=ui_image_generation.ui
20
  video_analysis=ui_recording_analysis.ui
21
  slack_sentiment=ui_sentiment_analysis.ui
22
- usaa_advisor=ui_simple_chat.ui
23
- image_to_text=ui_image_to_text.ui
24
- text_analysis=ui_text_analysis.ui
25
 
26
- ui = gr.TabbedInterface([prompt_builder, text_analysis, image_generator, video_analysis,slack_sentiment, usaa_advisor, summarize],
27
- (constants.UI_1, constants.UI_2, constants.UI_3,constants.UI_4, constants.UI_5,constants.UI_7, constants.UI_8),
28
- theme=SoftBlue())
29
 
30
  ui.launch()
 
2
  import pandas as pd
3
  import openai
4
  from ui.app_theme import SoftBlue
 
 
5
  from utilities import constants,api_keys
 
6
  from prompts import ui_prompt_builder
7
  from chat_bot import ui_simple_chat
8
+ ''' Disabled
9
+ from image_gen import ui_image_generation
10
+ from summarization import ui_summarize
11
+ from recording_analysis import ui_recording_analysis
12
  from slack_sentiment_analysis import ui_sentiment_analysis
13
  from image_to_text import image_to_text_translator as ui_image_to_text
14
+ from text_analysis import ui_text_analysis'''
15
 
16
  openai.api_key = api_keys.APIKeys().get_key('OPENAI_API_KEY')
17
 
18
  prompt_builder=ui_prompt_builder.ui
19
+ usaa_advisor=ui_simple_chat.ui
20
+ ''' Disabled
21
  summarize=ui_summarize.ui
22
  image_generator=ui_image_generation.ui
23
  video_analysis=ui_recording_analysis.ui
24
  slack_sentiment=ui_sentiment_analysis.ui
25
+ #git_advisor=ui_simple_chat_git.ui
26
+ #image_to_text=ui_image_to_text.ui
27
+ #text_analysis=ui_text_analysis.ui'''
28
 
29
+ ui = gr.TabbedInterface([prompt_builder, usaa_advisor], (constants.UI_1, "Policy Chat"),theme=SoftBlue())
 
 
30
 
31
  ui.launch()
chat_bot/__pycache__/simple_chat.cpython-311.pyc DELETED
Binary file (5.34 kB)
 
chat_bot/__pycache__/ui_chat_bot.cpython-311.pyc DELETED
Binary file (7.07 kB)
 
chat_bot/__pycache__/ui_simple_chat.cpython-311.pyc DELETED
Binary file (3.41 kB)
 
chat_bot/simple_chat.py CHANGED
@@ -1,12 +1,158 @@
1
- import os, openai,string,csv
 
 
 
 
2
  import pandas as pd
3
  from utilities import constants, api_keys, clean_text, prompt_constants
4
  from translators import translate_pdf_to_text
5
  from embedding_tools import create_embedding
 
6
 
7
  openai.api_key = api_keys.APIKeys().get_key('OPENAI_API_KEY')
8
  messages=[]
9
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
10
  def CreateCSV(text_chunks):
11
  with open(constants.CSV_PATH, 'w', newline='') as csvfile:
12
  csv_writer = csv.writer(csvfile)
@@ -36,19 +182,6 @@ def CreateChunks(transcript, length):
36
  text_chunks.append(transcript[start_idx:])
37
  return text_chunks
38
 
39
- def CreateEmbeddings(input_path, output_path):
40
- if os.path.exists(constants.PKL_PATH):
41
- df = pd.read_pickle(constants.PKL_PATH)
42
- create_embedding.CreateEmbeddingsFlat(constants.CSV_PATH, constants.PKL_PATH)
43
- return df
44
-
45
- transcript= translate_pdf_to_text.TranslatePdfToText(input_path, output_path)
46
- text_chunks=CreateChunks(transcript, constants.EMBEDDING_CHUNK_LENGTH)
47
- CreateCSV(text_chunks)
48
- create_embedding.CreateEmbeddingsFlat(constants.CSV_PATH, constants.PKL_PATH)
49
- df = pd.read_pickle(constants.PKL_PATH)
50
- return df
51
-
52
  def Completion(messages):
53
  response = openai.ChatCompletion.create(
54
  model="gpt-3.5-turbo",
@@ -58,6 +191,7 @@ def Completion(messages):
58
  return cleaned_text
59
 
60
  def QueryEmbeddingsSimple(query):
 
61
  global messages
62
  best_answer= create_embedding.QueryEmbeddingsFlat(query)
63
  prompt= prompt_constants.USAA_AR_EXPERT_PROMPT
 
1
+ import os
2
+ import openai
3
+ import string
4
+ import csv
5
+ import re
6
  import pandas as pd
7
  from utilities import constants, api_keys, clean_text, prompt_constants
8
  from translators import translate_pdf_to_text
9
  from embedding_tools import create_embedding
10
+ from chat_bot import process_policies
11
 
12
  openai.api_key = api_keys.APIKeys().get_key('OPENAI_API_KEY')
13
  messages=[]
14
 
15
+
16
+
17
+ def flatten_json(json_obj, prefix=''):
18
+ items = []
19
+
20
+ def flatten(json_fragment, current_prefix):
21
+ if isinstance(json_fragment, dict):
22
+ for key, value in json_fragment.items():
23
+ new_key = f'{current_prefix}{key}_' if current_prefix else key
24
+ if isinstance(value, (dict, list)):
25
+ flatten(value, new_key)
26
+ else:
27
+ # Remove newlines from value
28
+ cleaned_value = str(value).replace('\n', ' ')
29
+ items.append((new_key, cleaned_value))
30
+ elif isinstance(json_fragment, list):
31
+ for index, item in enumerate(json_fragment):
32
+ new_key = f'{current_prefix}{index}_'
33
+ if isinstance(item, (dict, list)):
34
+ flatten(item, new_key)
35
+ else:
36
+ # Remove newlines from value
37
+ cleaned_value = str(item).replace('\n', ' ')
38
+ items.append((new_key, cleaned_value))
39
+
40
+ flatten(json_obj, prefix)
41
+ return items
42
+
43
+ def camel_case_to_readable(text):
44
+ text = re.sub(r'(?<!^)(?=[A-Z])', ' ', text)
45
+ text = text.replace('_', ' ')
46
+ text = text.lower()
47
+ text = text.capitalize()
48
+ return text
49
+
50
+ def make_readable_key(key):
51
+ key = key.replace('_', ' ')
52
+ key = re.sub(r'\b0_', '(1) ', key)
53
+ key = re.sub(r'\b1_', '(2) ', key)
54
+ key = re.sub(r'\b2_', '(3) ', key)
55
+ key = ' '.join([word.capitalize() for word in key.split()])
56
+ key = key.replace('Is', 'is').replace('Has a', 'has a')
57
+ return key
58
+
59
+ def process_list(items):
60
+ readable_items = []
61
+ for item in items:
62
+ key, value = item.split(': ', 1)
63
+ readable_key = make_readable_key(key)
64
+ readable_value = value.replace('\n', ' ')
65
+ readable_items.append(f'{readable_key}: {readable_value}')
66
+ return readable_items
67
+
68
+ def convert_flattened_to_readable(flattened_items):
69
+ readable_items = []
70
+ for key, value in flattened_items:
71
+ readable_key = make_readable_key(key)
72
+ readable_items.append(f'{readable_key}: {value}')
73
+ return readable_items
74
+
75
+ def convert_json_to_single_column_csv(json_obj):
76
+ flattened_items = flatten_json(json_obj)
77
+ readable_items = convert_flattened_to_readable(flattened_items)
78
+ flat_text = '\n'.join(readable_items)
79
+ return flat_text
80
+
81
+
82
+ def flatten_json_to_single_column(json_obj, prefix=''):
83
+ print("in flatten_json_to_single_column, json_obj:", json_obj, "prefix:", prefix)
84
+
85
+ items = []
86
+ if isinstance(json_obj, dict):
87
+ for key, value in json_obj.items():
88
+ if isinstance(value, dict):
89
+ items.extend(flatten_json_to_single_column(value, f'{prefix}{key}_'))
90
+ elif isinstance(value, list):
91
+ for index, item in enumerate(value):
92
+ items.extend(flatten_json_to_single_column(item, f'{prefix}{key}_{index}_'))
93
+ else:
94
+ items.append(f'{prefix}{key}: {value}')
95
+ elif isinstance(json_obj, list):
96
+ for index, item in enumerate(json_obj):
97
+ if isinstance(item, dict):
98
+ items.extend(flatten_json_to_single_column(item, f'{prefix}{index}_'))
99
+ else:
100
+ items.append(f'{prefix}{index}: {item}')
101
+ else:
102
+ items.append(f'{prefix[:-1]}: {json_obj}') # Remove trailing underscore
103
+ return items
104
+
105
+ def convert_json_to_single_column_csv_old(json_obj):
106
+ flat_data = flatten_json_to_single_column(json_obj)
107
+ flat_text = '\n'.join(flat_data)
108
+ return flat_text
109
+
110
+ def write_flat_text_to_csv(flat_text, csv_path):
111
+ # Open a CSV file to write the data
112
+ with open(csv_path, 'w', newline='') as csvfile:
113
+ csv_writer = csv.writer(csvfile)
114
+
115
+ # Write each line as a row in the CSV file
116
+ for line in flat_text:
117
+ csv_writer.writerow([line])
118
+
119
+
120
+ ## entry point edited, input=pdf, output=csv
121
+ def CreateEmbeddings(policy_input, policy_output):
122
+ print("in createembeddings, policy_input:", policy_input, "policy_output:", policy_output)
123
+ content=process_policies.convert_pdf_to_text_ocr(policy_input, constants.POLICY_TXT_PATH)
124
+
125
+ print("\n***content after extract policy:", content)
126
+ df=None
127
+ if content:
128
+ print("**content before:", content)
129
+ schema=process_policies.create_schema(content)
130
+ print ("**schema:", schema)
131
+ flat_txt = flatten_json_to_single_column(schema)
132
+ readable= process_list(flat_txt)
133
+ for item in readable:
134
+ print(item)
135
+ write_flat_text_to_csv(readable,policy_output)
136
+ print ("csv writtens")
137
+ create_embedding.CreateEmbeddingsFlatPolicy(policy_output, constants.POLICY_PKL_PATH)
138
+ print("df:", df)
139
+ return df
140
+
141
+ def CreateEmbeddingsOriginal(input_path, output_path):
142
+ print("in createembeddingsoriginal, input_path:", input_path, "output_path:", output_path)
143
+ if os.path.exists(constants.PKL_PATH):
144
+ df = pd.read_pickle(constants.PKL_PATH)
145
+ create_embedding.CreateEmbeddingsFlat(constants.CSV_PATH, constants.PKL_PATH)
146
+ return df
147
+
148
+ transcript= translate_pdf_to_text.TranslatePdfToText(input_path, output_path)
149
+ text_chunks=CreateChunks(transcript, constants.EMBEDDING_CHUNK_LENGTH)
150
+ CreateCSV(text_chunks)
151
+ create_embedding.CreateEmbeddingsFlat(constants.CSV_PATH, constants.PKL_PATH)
152
+ df = pd.read_pickle(constants.PKL_PATH)
153
+ return df
154
+
155
+
156
  def CreateCSV(text_chunks):
157
  with open(constants.CSV_PATH, 'w', newline='') as csvfile:
158
  csv_writer = csv.writer(csvfile)
 
182
  text_chunks.append(transcript[start_idx:])
183
  return text_chunks
184
 
 
 
 
 
 
 
 
 
 
 
 
 
 
185
  def Completion(messages):
186
  response = openai.ChatCompletion.create(
187
  model="gpt-3.5-turbo",
 
191
  return cleaned_text
192
 
193
  def QueryEmbeddingsSimple(query):
194
+ print ("in QueryEmbeddingsSimple")
195
  global messages
196
  best_answer= create_embedding.QueryEmbeddingsFlat(query)
197
  prompt= prompt_constants.USAA_AR_EXPERT_PROMPT
chat_bot/ui_chat_bot.py CHANGED
@@ -66,7 +66,7 @@ with gr.Blocks() as ui:
66
  sentiment=gr.Checkbox(label=constants.SENTIMENT, value=False, info=constants.SENTIMENT_INFO)
67
  emotion=gr.Checkbox(label=constants.EMOTION, value=False, info=constants.EMOTION_INFO)
68
  gr.Markdown(constants.MICROPHONE_MD)
69
- audio = gr.Audio(label=constants.ASK_A_QUESTION, source="microphone", type="filepath")
70
  with gr.Row():
71
  clear=gr.Button(value=constants.CLEAR)
72
  submit=gr.Button(value=constants.SUBMIT, variant="primary")
 
66
  sentiment=gr.Checkbox(label=constants.SENTIMENT, value=False, info=constants.SENTIMENT_INFO)
67
  emotion=gr.Checkbox(label=constants.EMOTION, value=False, info=constants.EMOTION_INFO)
68
  gr.Markdown(constants.MICROPHONE_MD)
69
+ audio = gr.Audio(label=constants.ASK_A_QUESTION)
70
  with gr.Row():
71
  clear=gr.Button(value=constants.CLEAR)
72
  submit=gr.Button(value=constants.SUBMIT, variant="primary")
chat_bot/ui_simple_chat.py CHANGED
@@ -7,9 +7,9 @@ import random
7
  import time
8
 
9
  def InitDF():
10
- global commDF
11
- commDF=pd.DataFrame({"role": [""], "content": [""] })
12
- simple_chat.CreateEmbeddings(constants.PDF_INPUT_PATH, constants.TXT_OUTPUT_PATH)
13
 
14
  def Respond(message, chat_history):
15
  bot_message,df=simple_chat.QueryEmbeddingsSimple(message)
@@ -28,8 +28,8 @@ with gr.Blocks() as ui:
28
  question= gr.Textbox (label=constants.QUESTIONS_PREFIX, value=constants.QUESTIONS_AR_EXPERT)
29
  chatbot = gr.Chatbot(label=constants.CHAT_BOT, height=constants.CHAT_BOT_HEIGHT)
30
  msg = gr.Textbox(label=constants.CHAT_BOT_INPUT)
31
- commDF = gr.DataFrame(type="pandas", value=pd.DataFrame({"role": [""], "content": [""] }), wrap=True, label=constants.OPENAI_LOG)
32
  clear = gr.ClearButton([msg, chatbot])
33
- msg.submit(Respond, [msg, chatbot], [msg, chatbot,commDF])
34
 
35
  InitDF()
 
7
  import time
8
 
9
  def InitDF():
10
+ global gitDF
11
+ gitDF=pd.DataFrame({"role": [""], "content": [""] })
12
+ simple_chat.CreateEmbeddings(constants.POLICY_INPUT, constants.POLICY_OUTPUT)
13
 
14
  def Respond(message, chat_history):
15
  bot_message,df=simple_chat.QueryEmbeddingsSimple(message)
 
28
  question= gr.Textbox (label=constants.QUESTIONS_PREFIX, value=constants.QUESTIONS_AR_EXPERT)
29
  chatbot = gr.Chatbot(label=constants.CHAT_BOT, height=constants.CHAT_BOT_HEIGHT)
30
  msg = gr.Textbox(label=constants.CHAT_BOT_INPUT)
31
+ gitDF = gr.DataFrame(type="pandas", value=pd.DataFrame({"role": [""], "content": [""] }), wrap=True, label=constants.OPENAI_LOG)
32
  clear = gr.ClearButton([msg, chatbot])
33
+ msg.submit(Respond, [msg, chatbot], [msg, chatbot,gitDF])
34
 
35
  InitDF()
embedding_tools/__pycache__/create_embedding.cpython-311.pyc DELETED
Binary file (4.92 kB)
 
embedding_tools/__pycache__/embeddings.cpython-311.pyc DELETED
Binary file (626 Bytes)
 
embedding_tools/create_embedding.py CHANGED
@@ -14,6 +14,18 @@ def CreateEmbeddingsQA(input_path, output_path):
14
  benefit_info['embedding'] = benefit_info['answer'].apply(lambda row: get_embedding(str(row), engine='text-embedding-ada-002'))
15
  benefit_info.to_pickle(output_path)
16
 
 
 
 
 
 
 
 
 
 
 
 
 
17
  def CreateEmbeddingsFlat(input_path, output_path):
18
  global embedding_info
19
  print(" CreateEmbeddingsFlat input_path: "+input_path + " output_path: "+output_path)
 
14
  benefit_info['embedding'] = benefit_info['answer'].apply(lambda row: get_embedding(str(row), engine='text-embedding-ada-002'))
15
  benefit_info.to_pickle(output_path)
16
 
17
+ def CreateEmbeddingsFlatPolicy(input_path, output_path):
18
+ global embedding_info
19
+ print(" CreateEmbeddingsFlat input_path: "+input_path + " output_path: "+output_path)
20
+ embedding_info = pd.read_csv(input_path)
21
+ embedding_info.columns = ['data']
22
+ embedding_info['embedding'] = embedding_info['data'].apply(lambda row: get_embedding(str(row), engine='text-embedding-ada-002'))
23
+ embedding_info.to_pickle(output_path)
24
+ print("Loaded from CSV file.")
25
+
26
+ print(f"embedding_info type: {type(embedding_info)}")
27
+ print(f"embedding_info is None: {embedding_info is None}")
28
+
29
  def CreateEmbeddingsFlat(input_path, output_path):
30
  global embedding_info
31
  print(" CreateEmbeddingsFlat input_path: "+input_path + " output_path: "+output_path)
embedding_tools/embeddings.py CHANGED
@@ -2,6 +2,7 @@ from utilities import constants
2
  import embedding_tools.create_embedding as create_embedding
3
 
4
  def ApplyEmbeddings(message, persona):
 
5
  if(persona==constants.PERSONA_HR_EXPERT):
6
  return create_embedding.QueryEmbeddings(message)
7
  else:
 
2
  import embedding_tools.create_embedding as create_embedding
3
 
4
  def ApplyEmbeddings(message, persona):
5
+ print("persona: ", persona)
6
  if(persona==constants.PERSONA_HR_EXPERT):
7
  return create_embedding.QueryEmbeddings(message)
8
  else:
image_to_text/__pycache__/image_to_text_translator.cpython-311.pyc CHANGED
Binary files a/image_to_text/__pycache__/image_to_text_translator.cpython-311.pyc and b/image_to_text/__pycache__/image_to_text_translator.cpython-311.pyc differ
 
image_to_text/image_to_text_translator.py CHANGED
@@ -53,7 +53,7 @@ with gr.Blocks() as ui:
53
  gr.Markdown(constants.DIRECTIONS_MD)
54
  gr.Markdown(constants.AR_ADVISOR_DIRECTIONS)
55
  with gr.Row():
56
- imageBlock = gr.Image(label=constants.IMAGE_INPUT, source="upload")
57
  summaryBlock= gr.Textbox (label=constants.SUMMARY)
58
  with gr.Row():
59
  submitBtn=gr.Button(value=constants.EXTRACT_SUMMARY, variant="primary")
 
53
  gr.Markdown(constants.DIRECTIONS_MD)
54
  gr.Markdown(constants.AR_ADVISOR_DIRECTIONS)
55
  with gr.Row():
56
+ imageBlock = gr.Image(label=constants.IMAGE_INPUT)
57
  summaryBlock= gr.Textbox (label=constants.SUMMARY)
58
  with gr.Row():
59
  submitBtn=gr.Button(value=constants.EXTRACT_SUMMARY, variant="primary")
image_to_text/ui_image_to_text.py CHANGED
@@ -36,7 +36,7 @@ with gr.Blocks() as ui:
36
  gr.Markdown(value=constants.RECORDING_ANALYSIS_DIRECTIONS)
37
 
38
  with gr.Row():
39
- videoBlock = gr.Video(label=constants.VIDEO_INPUT, source="upload")
40
  summaryBlock= gr.Textbox (label=constants.SUMMARY)
41
  with gr.Column():
42
  gr.Markdown(constants.TOPICS_MD)
 
36
  gr.Markdown(value=constants.RECORDING_ANALYSIS_DIRECTIONS)
37
 
38
  with gr.Row():
39
+ videoBlock = gr.Video(label=constants.VIDEO_INPUT)
40
  summaryBlock= gr.Textbox (label=constants.SUMMARY)
41
  with gr.Column():
42
  gr.Markdown(constants.TOPICS_MD)
prompts/__pycache__/ui_prompt_builder.cpython-311.pyc CHANGED
Binary files a/prompts/__pycache__/ui_prompt_builder.cpython-311.pyc and b/prompts/__pycache__/ui_prompt_builder.cpython-311.pyc differ
 
prompts/ui_prompt_builder.py CHANGED
@@ -79,7 +79,7 @@ with gr.Blocks() as ui:
79
  info=constants.VOICE_INFO)
80
 
81
  gr.Markdown(constants.MICROPHONE_MD)
82
- audio = gr.Audio(label=constants.ASK_A_QUESTION, source="microphone", type="filepath")
83
  with gr.Row():
84
  clear=gr.Button(value=constants.CLEAR)
85
  submit=gr.Button(value=constants.SUBMIT, variant="primary")
 
79
  info=constants.VOICE_INFO)
80
 
81
  gr.Markdown(constants.MICROPHONE_MD)
82
+ audio = gr.Audio(label=constants.ASK_A_QUESTION, type="filepath")
83
  with gr.Row():
84
  clear=gr.Button(value=constants.CLEAR)
85
  submit=gr.Button(value=constants.SUBMIT, variant="primary")
recording_analysis/__pycache__/ui_recording_analysis.cpython-311.pyc CHANGED
Binary files a/recording_analysis/__pycache__/ui_recording_analysis.cpython-311.pyc and b/recording_analysis/__pycache__/ui_recording_analysis.cpython-311.pyc differ
 
recording_analysis/ui_recording_analysis.py CHANGED
@@ -25,6 +25,23 @@ def ClearScreen():
25
  videoBlock=None
26
  return "","",pd.DataFrame({"role": [""], "content": [""] })
27
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
28
  with gr.Blocks() as ui:
29
  label2 = gr.Label(show_label=False, value=constants.RECORDING_ANALYSIS, container=False)
30
  with gr.Row():
@@ -36,7 +53,7 @@ with gr.Blocks() as ui:
36
  gr.Markdown(value=constants.RECORDING_ANALYSIS_DIRECTIONS)
37
 
38
  with gr.Row():
39
- videoBlock = gr.Video(label=constants.VIDEO_INPUT, source="upload")
40
  summaryBlock= gr.Textbox (label=constants.SUMMARY)
41
  with gr.Column():
42
  gr.Markdown(constants.TOPICS_MD)
 
25
  videoBlock=None
26
  return "","",pd.DataFrame({"role": [""], "content": [""] })
27
 
28
+ '''Alternate way to manage source
29
+ def process_video(video):
30
+ # Here you can add any processing you might want to perform on the video
31
+ return video
32
+
33
+ with gr.Blocks() as demo:
34
+ video_input = gr.Video(label="Upload your video")
35
+ submit_button = gr.Button("Submit")
36
+ video_output = gr.Video(label="Processed Video")
37
+
38
+ submit_button.click(
39
+ fn=process_video,
40
+ inputs=video_input,
41
+ outputs=video_output
42
+ )
43
+ '''
44
+
45
  with gr.Blocks() as ui:
46
  label2 = gr.Label(show_label=False, value=constants.RECORDING_ANALYSIS, container=False)
47
  with gr.Row():
 
53
  gr.Markdown(value=constants.RECORDING_ANALYSIS_DIRECTIONS)
54
 
55
  with gr.Row():
56
+ videoBlock = gr.Video(label=constants.VIDEO_INPUT)
57
  summaryBlock= gr.Textbox (label=constants.SUMMARY)
58
  with gr.Column():
59
  gr.Markdown(constants.TOPICS_MD)
requirements.txt CHANGED
@@ -1,4 +1,4 @@
1
- pip>=23.3
2
  requests==2.31.0
3
  pylance==0.5.10
4
  pandas==2.0.3
@@ -9,8 +9,8 @@ scikit-learn==1.2.2
9
  plotly.express==0.4.1
10
  openai==0.27.8
11
  openapi-schema-pydantic==1.2.4
12
- gradio==3.48.0
13
- gradio_client==0.6.1
14
  GitPython==3.1.31
15
  elevenlabs==0.2.18
16
  python-dotenv==1.0.0
@@ -25,4 +25,13 @@ pdfplumber==0.10.2
25
  pytz==2023.3
26
  easyocr==1.7.1
27
  ffmpeg==1.4
28
- spacy==3.7.2
 
 
 
 
 
 
 
 
 
 
1
+ pip>=24.1.1
2
  requests==2.31.0
3
  pylance==0.5.10
4
  pandas==2.0.3
 
9
  plotly.express==0.4.1
10
  openai==0.27.8
11
  openapi-schema-pydantic==1.2.4
12
+ gradio==4.37.2
13
+ gradio_client==1.0.2
14
  GitPython==3.1.31
15
  elevenlabs==0.2.18
16
  python-dotenv==1.0.0
 
25
  pytz==2023.3
26
  easyocr==1.7.1
27
  ffmpeg==1.4
28
+ spacy==3.7.5
29
+ PyMuPDF==1.24.7
30
+ PyMuPDFb==1.24.6
31
+ pytesseract==0.3.10
32
+ pdf2image==1.17.0
33
+ Image==1.5.33
34
+ asgiref==3.8.1
35
+ django==5.0.6
36
+ sqlparse==0.5.0
37
+ weasel==0.4.1
slack_sentiment_analysis/__pycache__/ui_sentiment_analysis.cpython-311.pyc CHANGED
Binary files a/slack_sentiment_analysis/__pycache__/ui_sentiment_analysis.cpython-311.pyc and b/slack_sentiment_analysis/__pycache__/ui_sentiment_analysis.cpython-311.pyc differ
 
slack_sentiment_analysis/ui_sentiment_analysis.py CHANGED
@@ -33,7 +33,7 @@ with gr.Blocks() as ui:
33
  with gr.Column():
34
  gr.Markdown(constants.DIRECTIONS_MD)
35
  gr.Markdown(value=constants.SLACK_SENTIMENT_ANALYSIS_DIRECTIONS)
36
- code=gr.Textbox(label=constants.INITIAL_SLACK, interactive=True, placeholder=constants.SUMMARY_MD_DIRECTIONS, height="500", lines=3)
37
  gr.Markdown(constants.SLACK_EXAMPLES_MD)
38
  with gr.Row():
39
  with gr.Column():
 
33
  with gr.Column():
34
  gr.Markdown(constants.DIRECTIONS_MD)
35
  gr.Markdown(value=constants.SLACK_SENTIMENT_ANALYSIS_DIRECTIONS)
36
+ code=gr.Textbox(label=constants.INITIAL_SLACK, interactive=True, placeholder=constants.SUMMARY_MD_DIRECTIONS, lines=3)
37
  gr.Markdown(constants.SLACK_EXAMPLES_MD)
38
  with gr.Row():
39
  with gr.Column():
text_analysis/__pycache__/ui_text_analysis.cpython-311.pyc CHANGED
Binary files a/text_analysis/__pycache__/ui_text_analysis.cpython-311.pyc and b/text_analysis/__pycache__/ui_text_analysis.cpython-311.pyc differ
 
text_analysis/ui_text_analysis.py CHANGED
@@ -48,8 +48,7 @@ with gr.Blocks() as ui:
48
  with gr.Row():
49
  with gr.Column():
50
  inputString=gr.Textbox(placeholder=constants.NLP_PROMPT,
51
- label="Input Text", lines=3, height="500",
52
- interactive=True)
53
  with gr.Row():
54
  clearBtn=gr.Button(constants.CLEAR, variant="secondary")
55
  submitBtn=gr.Button(constants.SUBMIT, variant="primary")
 
48
  with gr.Row():
49
  with gr.Column():
50
  inputString=gr.Textbox(placeholder=constants.NLP_PROMPT,
51
+ label="Input Text", lines=3,interactive=True)
 
52
  with gr.Row():
53
  clearBtn=gr.Button(constants.CLEAR, variant="secondary")
54
  submitBtn=gr.Button(constants.SUBMIT, variant="primary")
translators/__pycache__/translate_pdf_to_text.cpython-311.pyc CHANGED
Binary files a/translators/__pycache__/translate_pdf_to_text.cpython-311.pyc and b/translators/__pycache__/translate_pdf_to_text.cpython-311.pyc differ
 
utilities/__pycache__/api_keys.cpython-311.pyc DELETED
Binary file (983 Bytes)
 
utilities/__pycache__/clean_text.cpython-311.pyc DELETED
Binary file (2.41 kB)
 
utilities/__pycache__/constants.cpython-311.pyc DELETED
Binary file (12.3 kB)
 
utilities/__pycache__/date_format.cpython-311.pyc DELETED
Binary file (1.54 kB)
 
utilities/__pycache__/embeddings.cpython-311.pyc DELETED
Binary file (677 Bytes)
 
utilities/__pycache__/prompt_constants.cpython-311.pyc DELETED
Binary file (10.9 kB)
 
utilities/__pycache__/prompts.cpython-311.pyc DELETED
Binary file (9.12 kB)
 
utilities/__pycache__/system_prompts.cpython-311.pyc DELETED
Binary file (2.12 kB)
 
utilities/__pycache__/translate_pdf_to_text.cpython-311.pyc DELETED
Binary file (4.65 kB)
 
utilities/__pycache__/user_prompts.cpython-311.pyc DELETED
Binary file (3.95 kB)
 
utilities/__pycache__/voice_handling.cpython-311.pyc DELETED
Binary file (7.7 kB)
 
utilities/constants.py CHANGED
@@ -21,6 +21,7 @@ SLACK_SENTIMENT_ANALYSIS_DIRECTIONS="To get started select one of the slack data
21
  NLP_ANALYSIS_PURPOSE="Natural Language Processing (NLP) enables us to understand the structure and meaning in text. This view provides some understanding of NLP under the hood of Generative AI."
22
  NLP_ANALYSIS_DIRECTIONS="Start by entering a sentence or paragraph in the 'Text' box. Then tap 'Analyze'. You'll see token counts, part-of-speech tags, and a visual representation of the analysis."
23
  NLP_PROMPT="Enter text to analyze..."
 
24
  AR_ADVISOR_PURPOSE = "This component demonstrates how a chatbot can leverage local embeddings to provide context. In this example, embeddings were created from USAA's 2022 Member Report provide organizational context for all interactions. This shows how generative AI enables any dataset to be queried and explored via natural language."
25
  AR_ADVISOR_DIRECTIONS = "To get started, simply start asking questions. This bot has been trainged on USAA's 2022 Member Report and can answer questions about any content from the report. You can ask questions like: 'What's the best thing that happened last year?' or 'What was the biggest obstancle faced in 2022?'"
26
 
@@ -117,9 +118,8 @@ UI_5="Slack Sentiment Analysis"
117
  UI_6="Image to Text"
118
  UI_7="PDF Query Chatbot"
119
  UI_2="NLP Text Analysis"
 
120
 
121
- HR_BENEFIT_PKL = 'utilities/data/embeddings/hr_asst_embeddings.pkl'
122
- HR_BENEFIT_CSV = 'utilities/data/embeddings/hr_asst_data.csv'
123
 
124
  PURPOSE_MD="### Purpose"
125
  DIRECTIONS_MD="### Directions"
@@ -220,7 +220,21 @@ CHUNK_LENGTH=2500
220
  #simple Chatbot
221
  PDF_INPUT_PATH = 'utilities/data/pdfs/usaa.pdf'
222
  TXT_OUTPUT_PATH = 'utilities/data/txt/usaa.txt'
 
223
 
224
  CSV_PATH = 'utilities/data/csv/usaa.csv'
225
  PKL_PATH = 'utilities/data/pkl/usaa.pkl'
226
- EMBEDDING_CHUNK_LENGTH=500
 
 
 
 
 
 
 
 
 
 
 
 
 
 
21
  NLP_ANALYSIS_PURPOSE="Natural Language Processing (NLP) enables us to understand the structure and meaning in text. This view provides some understanding of NLP under the hood of Generative AI."
22
  NLP_ANALYSIS_DIRECTIONS="Start by entering a sentence or paragraph in the 'Text' box. Then tap 'Analyze'. You'll see token counts, part-of-speech tags, and a visual representation of the analysis."
23
  NLP_PROMPT="Enter text to analyze..."
24
+
25
  AR_ADVISOR_PURPOSE = "This component demonstrates how a chatbot can leverage local embeddings to provide context. In this example, embeddings were created from USAA's 2022 Member Report provide organizational context for all interactions. This shows how generative AI enables any dataset to be queried and explored via natural language."
26
  AR_ADVISOR_DIRECTIONS = "To get started, simply start asking questions. This bot has been trainged on USAA's 2022 Member Report and can answer questions about any content from the report. You can ask questions like: 'What's the best thing that happened last year?' or 'What was the biggest obstancle faced in 2022?'"
27
 
 
118
  UI_6="Image to Text"
119
  UI_7="PDF Query Chatbot"
120
  UI_2="NLP Text Analysis"
121
+ UI_9="AI Browser"
122
 
 
 
123
 
124
  PURPOSE_MD="### Purpose"
125
  DIRECTIONS_MD="### Directions"
 
220
  #simple Chatbot
221
  PDF_INPUT_PATH = 'utilities/data/pdfs/usaa.pdf'
222
  TXT_OUTPUT_PATH = 'utilities/data/txt/usaa.txt'
223
+ GIT_TXT_OUTPUT_PATH = 'utilities/data/txt/git.txt'
224
 
225
  CSV_PATH = 'utilities/data/csv/usaa.csv'
226
  PKL_PATH = 'utilities/data/pkl/usaa.pkl'
227
+ ZIP_INPUT_PATH='utilities/data/zip/main.zip'
228
+ GIT_CSV_PATH = 'utilities/data/csv/git.csv'
229
+ GIT_PKL_PATH = 'utilities/data/pkl/git.pkl'
230
+ EMBEDDING_CHUNK_LENGTH=500
231
+
232
+
233
+ HR_BENEFIT_PKL = 'utilities/data/embeddings/hr_asst_embeddings.pkl'
234
+ HR_BENEFIT_CSV = 'utilities/data/embeddings/hr_asst_data.csv'
235
+
236
+ POLICY_INPUT='utilities/data/pdfs/policy.pdf'
237
+ POLICY_OUTPUT='utilities/data/csv/policy.csv'
238
+
239
+ POLICY_TXT_PATH = 'utilities/data/txt/policy.txt'
240
+ POLICY_PKL_PATH='utilities/data/pkl/policy.pkl'
utilities/data/csv/usaa.csv CHANGED
The diff for this file is too large to render. See raw diff
 
utilities/data/embeddings/hr_asst_embeddings.pkl CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:2fc7f21f90a8b7805ce45ed06780f97133cbf95faaf92d7655ee87de1ef8d16b
3
  size 514467
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:6fbf6b6d88ea054dbd573a77207596b97f6e1274088d1ee005f9f55def73e714
3
  size 514467
utilities/data/pkl/usaa.pkl CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:20bb2d36fe68b373ae234dc80ecd96a2f1bdd458034b80403cebef5865c2c65a
3
- size 1677861
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:05815a4f9f1f7156b85cc1880995c9ceb5eb71730c78d703962b7bef388579d9
3
+ size 1362488
utilities/data/txt/usaa.txt CHANGED
The diff for this file is too large to render. See raw diff
 
utilities/prompt_constants.py CHANGED
@@ -6,6 +6,7 @@ IT_EXPERT_PROMPT= "You are an IT support person. You are impatient and bored. Do
6
  INSURANCE_AGENT_PROMPT= "You are an insurance agent. Don't say your an AI language model and don't specify role in response. Your purpose is to ask questions in a turn-by-turn style to understand the situation. Ask for documents and policy numbers, simulate consulting insurance plans,keep customers informed with coverage and recovery option details. Along the way provide things like damage estimates, repair vendors, etc. Your responses are short and precise to gather information and provide information. Keep your responses short."
7
  INVESTIGATOR_PROMPT= "You are an investigator like Sherlock Holmes. Don't say your an AI language model and don't specify role in response. You job is solve a mystery. You do this by encouraging users to provide details you need. As you investigate, ask only one question at a time. You want to find things like witnesses, times of day, key locations, and event details. You should be professional and stoic, ask or answer one question at a time. Keep answers short."
8
  USAA_AR_EXPERT_PROMPT= "You represent USAA. Don't say your an AI language model and don't specify role. Provide answers to questions with kindness and respect. Be professional and warm, keep answers short."
 
9
 
10
  #language presets
11
  SPANISH_PROMPT="Provide responses entirely in Spanish."
 
6
  INSURANCE_AGENT_PROMPT= "You are an insurance agent. Don't say your an AI language model and don't specify role in response. Your purpose is to ask questions in a turn-by-turn style to understand the situation. Ask for documents and policy numbers, simulate consulting insurance plans,keep customers informed with coverage and recovery option details. Along the way provide things like damage estimates, repair vendors, etc. Your responses are short and precise to gather information and provide information. Keep your responses short."
7
  INVESTIGATOR_PROMPT= "You are an investigator like Sherlock Holmes. Don't say your an AI language model and don't specify role in response. You job is solve a mystery. You do this by encouraging users to provide details you need. As you investigate, ask only one question at a time. You want to find things like witnesses, times of day, key locations, and event details. You should be professional and stoic, ask or answer one question at a time. Keep answers short."
8
  USAA_AR_EXPERT_PROMPT= "You represent USAA. Don't say your an AI language model and don't specify role. Provide answers to questions with kindness and respect. Be professional and warm, keep answers short."
9
+ GIT_EXPERT_PROMPT= "You are a code anayzer. Don't say your an AI language model and don't specify role. Assume questions are computer science/software engineering in nature."
10
 
11
  #language presets
12
  SPANISH_PROMPT="Provide responses entirely in Spanish."