Spaces:

danieldager
/

rag-llm

Runtime error

App Files Files Community

danieldager committed on Jul 5, 2024

Commit

b28439c

verified ·

1 Parent(s): b5f0bd1

Update app.py

Browse files

Files changed (1) hide show

app.py +200 -49

app.py CHANGED Viewed

@@ -1,63 +1,214 @@
-import gradio as gr
-from huggingface_hub import InferenceClient
 """
-For more information on `huggingface_hub` Inference API support, please check the docs: https://huggingface.co/docs/huggingface_hub/v0.22.2/en/guides/inference
 """
-client = InferenceClient("HuggingFaceH4/zephyr-7b-beta")
-def respond(
-    message,
-    history: list[tuple[str, str]],
-    system_message,
-    max_tokens,
-    temperature,
-    top_p,
-):
-    messages = [{"role": "system", "content": system_message}]
-    for val in history:
-        if val[0]:
-            messages.append({"role": "user", "content": val[0]})
-        if val[1]:
-            messages.append({"role": "assistant", "content": val[1]})
-    messages.append({"role": "user", "content": message})
-    response = ""
-    for message in client.chat_completion(
-        messages,
-        max_tokens=max_tokens,
-        stream=True,
-        temperature=temperature,
-        top_p=top_p,
-    ):
-        token = message.choices[0].delta.content
-        response += token
-        yield response
-"""
-For information on how to customize the ChatInterface, peruse the gradio docs: https://www.gradio.app/docs/chatinterface
-"""
-demo = gr.ChatInterface(
-    respond,
-    additional_inputs=[
-        gr.Textbox(value="You are a friendly Chatbot.", label="System message"),
-        gr.Slider(minimum=1, maximum=2048, value=512, step=1, label="Max new tokens"),
-        gr.Slider(minimum=0.1, maximum=4.0, value=0.7, step=0.1, label="Temperature"),
-        gr.Slider(
-            minimum=0.1,
-            maximum=1.0,
-            value=0.95,
-            step=0.05,
-            label="Top-p (nucleus sampling)",
-        ),
-    ],
 )
-if __name__ == "__main__":
-    demo.launch()

+"""
+This code uses the PyMuPDF package.
+PyMuPDF is AGPL licensed, please refer to:
+https://pymupdf.readthedocs.io/en/latest/about.html#license-and-copyright
+https://github.com/pymupdf/RAG
+https://medium.com/@pymupdf/building-a-rag-chatbot-gui-with-the-chatgpt-api-and-pymupdf-9ea8c7fc4ab5
 """
 """
+Code below is based on an implementation by Sunil Kumar Dash:
+MIT License
+Copyright (c) 2023 Sunil Kumar Dash
+Permission is hereby granted, free of charge, to any person obtaining a copy
+of this software and associated documentation files (the "Software"), to deal
+in the Software without restriction, including without limitation the rights
+to use, copy, modify, merge, publish, distribute, sublicense, and/or sell
+copies of the Software, and to permit persons to whom the Software is
+furnished to do so, subject to the following conditions:
+The above copyright notice and this permission notice shall be included in all
+copies or substantial portions of the Software.
+THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
+IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
+FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL THE
+AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
+LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM,
+OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN THE
+SOFTWARE.
+"""
+import os, re
+import pymupdf
+import gradio as gr
+from PIL import Image
+from typing import Any
+from dotenv import load_dotenv
+from langchain_openai import ChatOpenAI
+from langchain_openai import OpenAIEmbeddings
+from langchain_community.vectorstores import Chroma
+from langchain.chains import ConversationalRetrievalChain
+from langchain_community.document_loaders import PyMuPDFLoader
+# Load variables from a local .env file (if any) into the process environment.
+load_dotenv()
+# Key read from the environment; os.getenv returns None when it is not set.
+OPENAI_API_KEY = os.getenv("OPENAI_API_KEY")
+# Editable textbox handed back by enable_api_box().
+enable_box = gr.Textbox(
+    value=None, placeholder="Upload your OpenAI API key", interactive=True
 )
+# Read-only textbox handed back by set_apikey() after a key has been stored.
+disable_box = gr.Textbox(value="OpenAI API key is set", interactive=False)
+def set_apikey(api_key: str):
+    """Store the OpenAI API key typed into the UI on the shared ``app`` object.
+
+    Args:
+        api_key: Text submitted from the API-key textbox.
+
+    Returns:
+        The read-only ``disable_box`` textbox, used as the new state of the
+        output component.
+
+    Raises:
+        gr.Error: If the submitted text is empty or only whitespace.
+    """
+    # Pasted keys frequently carry stray spaces or newlines; strip them so the
+    # stored value is exactly the key.
+    api_key = (api_key or "").strip()
+    if not api_key:
+        # Do not report "key is set" when nothing usable was entered.
+        raise gr.Error("enter a valid OpenAI API key")
+    print("API Key set")
+    app.OPENAI_API_KEY = api_key
+    return disable_box
+def enable_api_box():
+    """Return the editable API-key textbox (``enable_box``)."""
+    editable_box = enable_box
+    return editable_box
+def add_text(history, text: str):
+    """Append the user's message to the chat history with an empty reply slot.
+
+    Args:
+        history: Current chatbot history (a list of message pairs).
+        text: Message entered by the user.
+
+    Returns:
+        A new list: ``history`` followed by ``(text, "")``.
+
+    Raises:
+        gr.Error: If ``text`` is empty.
+    """
+    if text:
+        # Build a fresh list rather than mutating the caller's history.
+        return history + [(text, "")]
+    raise gr.Error("enter text")
+class my_app:
+    """Hold the state shared by the Gradio callbacks for one PDF chat session.
+
+    The instance keeps the OpenAI key, the lazily built retrieval chain, the
+    running chat history, the page number of the most recent source document
+    (``N``) and a flag-like counter (``count``) telling whether a chain has
+    already been built for the current document.
+    """
+    def __init__(self, OPENAI_API_KEY: str = None) -> None:
+        self.OPENAI_API_KEY: str = OPENAI_API_KEY
+        self.chain = None
+        self.chat_history: list = []
+        # Page number of the last retrieved source; render_file uses it as an
+        # index into the opened document.
+        self.N: int = 0
+        # 0 means "no chain built yet"; callers reset it to force a rebuild.
+        self.count: int = 0
+    def __call__(self, file: Any) -> Any:
+        """Return the retrieval chain, building it on first use.
+
+        Args:
+            file: Uploaded file object exposing the path as ``file.name``.
+
+        Returns:
+            The chain produced by ``build_chain`` (cached in ``self.chain``).
+        """
+        if self.count == 0:
+            self.chain = self.build_chain(file)
+            self.count += 1
+        return self.chain
+    def process_file(self, file: Any):
+        """Load the uploaded PDF and derive its base file name.
+
+        Args:
+            file: Uploaded file object exposing the path as ``file.name``.
+
+        Returns:
+            A ``(documents, file_name)`` tuple: the documents produced by
+            ``PyMuPDFLoader`` and the last component of the file path.
+        """
+        loader = PyMuPDFLoader(file.name)
+        documents = loader.load()
+        # basename handles paths with or without a directory part, so no
+        # regex and no catch-all fallback is needed.
+        file_name = os.path.basename(file.name)
+        return documents, file_name
+    @staticmethod
+    def _collection_name(file_name: str) -> str:
+        """Turn a file name into a name Chroma accepts for a collection.
+
+        Chroma documents these rules: 3-63 characters, alphanumeric first and
+        last character, only ``[A-Za-z0-9._-]`` in between, and no two
+        consecutive dots. Arbitrary upload names (spaces, long titles) break
+        them.
+        """
+        name = re.sub(r"[^A-Za-z0-9._-]", "_", file_name)
+        name = re.sub(r"\.{2,}", ".", name)
+        # Truncate first, then trim, so the final character is alphanumeric.
+        name = re.sub(r"^[^A-Za-z0-9]+|[^A-Za-z0-9]+$", "", name[:63])
+        if len(name) < 3:
+            name = f"pdf{name}"
+        return name
+    def build_chain(self, file: Any):
+        """Index the PDF in Chroma and build a conversational retrieval chain.
+
+        Args:
+            file: Uploaded file object exposing the path as ``file.name``.
+
+        Returns:
+            A ``ConversationalRetrievalChain`` that retrieves one document per
+            query (``k=1``) and returns its source documents.
+        """
+        documents, file_name = self.process_file(file)
+        # Load embeddings model
+        embeddings = OpenAIEmbeddings(openai_api_key=self.OPENAI_API_KEY)
+        pdfsearch = Chroma.from_documents(
+            documents,
+            embeddings,
+            collection_name=self._collection_name(file_name),
+        )
+        chain = ConversationalRetrievalChain.from_llm(
+            ChatOpenAI(temperature=0.0, openai_api_key=self.OPENAI_API_KEY),
+            retriever=pdfsearch.as_retriever(search_kwargs={"k": 1}),
+            return_source_documents=True,
+        )
+        return chain
+def get_response(history, query, file):
+    """Answer ``query`` against the uploaded PDF and stream the reply.
+
+    Args:
+        history: Chatbot history whose last entry holds the pending question
+            and an empty answer slot.
+        query: The user's question.
+        file: Uploaded PDF file object.
+
+    Yields:
+        ``(history, "")`` after each character is appended to the last answer,
+        so the chatbot fills in progressively and the textbox is cleared.
+
+    Raises:
+        gr.Error: If no PDF has been uploaded.
+    """
+    if not file:
+        raise gr.Error(message="Upload a PDF")
+    chain = app(file)
+    result = chain(
+        {"question": query, "chat_history": app.chat_history}, return_only_outputs=True
+    )
+    answer = result["answer"]
+    app.chat_history += [(query, answer)]
+    # Read the page from the document's metadata attribute instead of relying
+    # on the iteration order of the Document's fields; keep the previous page
+    # when the retriever returned nothing.
+    sources = result.get("source_documents") or []
+    if sources:
+        app.N = sources[0].metadata.get("page", 0)
+    for char in answer:
+        history[-1][-1] += char
+        yield history, ""
+def render_file(file):
+    """Render page ``app.N`` of the uploaded PDF as a PIL image.
+
+    Args:
+        file: Uploaded PDF file object exposing the path as ``file.name``.
+
+    Returns:
+        An RGB ``PIL.Image`` of the page rendered at 150 DPI.
+    """
+    # The context manager closes the document even if rendering fails, so the
+    # file handle is not leaked on every answer.
+    with pymupdf.open(file.name) as doc:
+        page = doc[app.N]
+        # Rasterise the page at a resolution of 150 DPI
+        pix = page.get_pixmap(dpi=150)
+        # frombytes copies the pixel data, so the image outlives the document.
+        image = Image.frombytes("RGB", [pix.width, pix.height], pix.samples)
+    return image
+def purge_chat_and_render_first(file):
+    """Reset the chat state for a new upload and render the PDF's first page.
+
+    Args:
+        file: Uploaded PDF file object exposing the path as ``file.name``.
+
+    Returns:
+        ``(image, [])``: the first page as an RGB ``PIL.Image`` rendered at
+        150 DPI, and an empty chatbot history.
+    """
+    print("purge_chat_and_render_first")
+    # Purges the previous chat session so that the bot has no concept of previous documents
+    app.chat_history = []
+    app.count = 0
+    # Drop the page number remembered from the previous document as well.
+    app.N = 0
+    # Use PyMuPDF to render the first page of the uploaded document; the
+    # context manager closes the document once the image has been built.
+    with pymupdf.open(file.name) as doc:
+        page = doc[0]
+        # Rasterise the page at a resolution of 150 DPI
+        pix = page.get_pixmap(dpi=150)
+        image = Image.frombytes("RGB", [pix.width, pix.height], pix.samples)
+    return image, []
+# Shared application state; seed it with the key loaded from the environment
+# so a key configured via .env is used without typing it into the UI.
+app = my_app(OPENAI_API_KEY)
+# Layout: API-key box on top, chat column (scale 2) next to the PDF preview
+# column (scale 1).
+with gr.Blocks() as demo:
+    with gr.Column():
+        with gr.Row():
+            with gr.Column(scale=1):
+                api_key = gr.Textbox(
+                    placeholder="Enter OpenAI API key and hit <RETURN>",
+                    show_label=False,
+                    interactive=True
+                )
+        with gr.Row():
+            with gr.Column(scale=2):
+                with gr.Row():
+                    chatbot = gr.Chatbot(value=[], elem_id="chatbot")
+                with gr.Row():
+                    txt = gr.Textbox(
+                        show_label=False,
+                        placeholder="Enter text and press submit",
+                        scale=2
+                    )
+                    submit_btn = gr.Button("submit", scale=1)
+            with gr.Column(scale=1):
+                with gr.Row():
+                    show_img = gr.Image(label="Upload PDF")
+                with gr.Row():
+                    btn = gr.UploadButton("📁 upload a PDF", file_types=[".pdf"])
+    # Pressing <RETURN> in the key box stores the key and swaps in the
+    # read-only textbox returned by set_apikey.
+    api_key.submit(
+        fn=set_apikey,
+        inputs=[api_key],
+        outputs=[
+            api_key,
+        ],
+    )
+    # A new upload clears the chat and previews the first page.
+    btn.upload(
+        fn=purge_chat_and_render_first,
+        inputs=[btn],
+        outputs=[show_img, chatbot],
+    )
+    # Submit pipeline: record the question, stream the answer, then show the
+    # page the answer was sourced from. Each step runs only if the previous
+    # one succeeded.
+    submit_btn.click(
+        fn=add_text,
+        inputs=[chatbot, txt],
+        outputs=[
+            chatbot,
+        ],
+        queue=False,
+    ).success(
+        fn=get_response, inputs=[chatbot, txt, btn], outputs=[chatbot, txt]
+    ).success(
+        fn=render_file, inputs=[btn], outputs=[show_img]
+    )
+demo.queue()
+# Only start the server when run as a script, so importing this module does
+# not block on launch().
+if __name__ == "__main__":
+    demo.launch()