Spaces:

RonsonChau
/

talicchatbot

Sleeping

App Files Files Community

RonsonChau commited on Feb 27, 2024

Commit

5e918fe

verified ·

1 Parent(s): 25605d2

initial commit

Browse files

Files changed (1) hide show

app.py +130 -0

app.py ADDED Viewed

	@@ -0,0 +1,130 @@

+import gradio as gr
+import random
+import time
+import openai
+import os
+openai.api_type = os.environ['OPENAI_API_TYPE']
+openai.api_key = os.environ['OPENAI_API_KEY']
+openai.api_base =  os.environ['OPENAI_API_BASE']
+openai.api_version = os.environ['OPENAI_API_VERSION']
+######################## Input TASK 1A  ########################
+from langchain.document_loaders import PyPDFLoader, OnlinePDFLoader
+from langchain.embeddings.sentence_transformer import SentenceTransformerEmbeddings
+from langchain.text_splitter import CharacterTextSplitter
+linkToPDF = os.environ['ONLINE_PDF_URL']
+loader = OnlinePDFLoader(linkToPDF)
+documents = loader.load()
+chuck_size = 1000
+chuck_overlap = 200
+text_splitter = CharacterTextSplitter(chunk_size=chuck_size, chunk_overlap=chuck_overlap)
+docs = text_splitter.split_documents(documents)
+###########################END OF TASK 1A ##################################
+######################## Input TASK 1B  ######3##############################
+from langchain.vectorstores import Chroma
+# create the open-source embedding function
+embedding_function = SentenceTransformerEmbeddings(model_name="all-MiniLM-L6-v2")
+# create simple ids - Index
+ids = [str(i) for i in range(1, len(docs) + 1)]
+# load it into Chroma
+db = Chroma.from_documents(docs, embedding_function, ids=ids, collection_metadata={"hnsw:space": "cosine"} )
+###########################END OF TASK 1B ##################################
+###########################INPUT OF TASK 3B ##################################
+# We try to limit the number of characters for the context
+contextCharsLimit = 3072
+promptStart = "Answer questions truthfully based on the information in sources provided below. \n If you cannot find the answer to a question based on the sources below, respond by saying “I apologize, but I am unable to provide an answer to your question, which is out of the scope of the document uploaded. Thank you! \n Sources:\n"
+# We try to construct a function which can return the system prompt based on user query and fit in context into system prompt
+def construct_system_prompt_chromadb (userQuery):
+  ### find the number of relevant documents
+  docs = db.similarity_search(userQuery)
+  context = []
+  ### append all relevant documents pagecontent into the context array
+  for match in docs:
+    context.append(match.page_content)
+  ### loop for the context, check if the chars of context > limit, if not insert the pagecontent into the prompt with "-" or "\n" separator
+  for i in range(1, len(context)):
+    if len("-".join(context[:i])) >= contextCharsLimit:
+      responsePrompt = promptStart + "-".join(context[:i-1])
+    elif i == len(context)-1:
+      responsePrompt = promptStart + "-".join(context)
+  ## return the response rpompt
+  return responsePrompt
+########################### END OF TASK 3B ##################################
+systemMessageContent = "" # System prompt we talked before - e.g., "You are a teaching assistant of a programming course CS1117. Try to answer student's question on python only"
+systemMessage = {"role": "system", "content": systemMessageContent}
+userMessageContent = "" # place holder
+chatbotMessageContent = ""  # place holder
+temperature = 0.8
+top_p = 0.95
+max_tokens = 800
+numOfHistory = 5 # Add in the number history windows here
+with gr.Blocks() as simpleChatDemo:
+    inputMessages = gr.State([systemMessage])
+#    inputMessages.append(systemMessage)
+    # Chatbot interface
+    chatbot = gr.Chatbot()
+    # Message is a Text Box
+    msg = gr.Textbox()
+    # Clear Button on to clear up the msg and chatbot
+    clear = gr.ClearButton([msg, chatbot])
+    def respond(userMessageInput, inputMessagesHistory, chatbot_history):
+        ## Construct the system message content based on the prompt function -- i.e., the input messages [0] will change based on system message now
+        systemMessageContent = construct_system_prompt_chromadb(userMessageInput) # Change the system content to the function
+        systemMessage = {"role": "system", "content": systemMessageContent}
+        inputMessagesHistory[0] = systemMessage
+        userMessageContent = userMessageInput
+        userMessage = {"role": "user", "content": userMessageContent}
+        inputMessagesHistory.append(userMessage)
+        if len(inputMessagesHistory)  > numOfHistory + 1:
+          numOutstandingMessages = len(inputMessagesHistory) - (numOfHistory + 1)
+          inputMessagesHistory = [inputMessagesHistory[0], *inputMessagesHistory[1+numOutstandingMessages :]]
+        print(inputMessages)
+        completion = openai.ChatCompletion.create(engine="chatgpt", messages=inputMessagesHistory, temperature=temperature, top_p = top_p, max_tokens = max_tokens)
+        chatbotMessageContent =  completion.choices[0].message.content
+        chatbotMessage = {"role": "assistant", "content": chatbotMessageContent }
+        inputMessagesHistory.append(chatbotMessage)
+        # chat history is main list of [(user message string, bot message string)]
+        chatbot_history.append((userMessageContent, chatbotMessageContent))
+        time.sleep(2)
+        # return with clear up the message box, and put the new messages into the chat_history
+        return "", inputMessagesHistory, chatbot_history,
+    # when the textbox click submit, i.e., enter, the function will be called (function, [input parameters], [output response])
+    msg.submit(respond, [msg, inputMessages, chatbot], [msg, inputMessages, chatbot])
+simpleChatDemo.launch(share=True)