Spaces:

gerasdf
/

summarizer

Sleeping

App Files Community

gera committed on Apr 22, 2024

Commit

e46e576

1 Parent(s): 3a09f3c

added questions to first prompt to save money.

Browse files

Files changed (1) hide show

app.py +43 -22

app.py CHANGED Viewed

@@ -13,12 +13,18 @@ LIMIT = 125000 # some space for answer
 api_key = os_getenv("OPENAI_APIKEY")
 client = OpenAI(api_key=api_key)
 def get_prompt(books, question = None):
     prompt = (
         f"Read the following books.\n" +
         f"Each book may have some pages at the beggining with data about the book, an index, or table of content, etc. " +
         f"Pages may have a header and/or a footer. Consider all this maybe present." +
-        f"Please answer, for each book, all below in the suggested format, in the language of the book:\n"+
         f"**Title**: ...\n"
         f"**Author**: ...\n"
         f"**Chapter Names**: ...\n"
@@ -29,24 +35,37 @@ def get_prompt(books, question = None):
     return prompt
-def chat(message, history, files):
     history_openai_format = []
-    if len(history) == 0:
-        raise gr.Error("Primero hay que subir un libro")
-    if len(history) == 1:
-        if message:
-            raise gr.Error("First message must be empty")
-        message = history[0][0]
     else:
-        for human, assistant in history:
-            if human:
-                history_openai_format.append({"role": "user", "content": human })
-            if assistant:
-                history_openai_format.append({"role": "assistant", "content":assistant})
-    history_openai_format.append({"role": "user", "content": message})
     response = client.chat.completions.create(
         model=MODEL,
@@ -70,7 +89,7 @@ def get_text(filename):
         answer = open(filename).read()
     return answer
-def files_ready(filenames):
     encoder = encoding = tiktoken.encoding_for_model('gpt-4-turbo')
     books = ''
     for i, name in enumerate(filenames):
@@ -80,18 +99,20 @@ def files_ready(filenames):
     prompt = get_prompt(books)
     tokens = len(encoder.encode(prompt))
     cost = tokens * PRICE_PER_M / 1000000 * 2 # * 2 is too much for an answer
     if tokens > LIMIT:
         raise gr.Error(f"Book is too long. It's {tokens} tokens long and can't be more than {LIMIT}.")
-    return len(prompt), tokens, f"${cost}", [[prompt, None]]
-def files_changed(filenames):
     if filenames:
-        return "-", "-"
     else:
-        return 0, 0, "$0"
 with gr.Blocks(title="Book summarization and more") as demo:
     with gr.Row():
         files = gr.Files(file_types=["txt","doc","docx","pdf"] )
         with gr.Column():
@@ -102,12 +123,12 @@ with gr.Blocks(title="Book summarization and more") as demo:
     chat = gr.ChatInterface(
         fn=chat,
         title="Summarization and more",
-        additional_inputs=[files],
         multimodal=False)
     other = gr.Button(interactive=False)
-    files.upload(files_ready, [files], [letters, tokens, cost, chat.chatbot_state])
-    files.change(files_changed, files, [letters, tokens, cost])
 auth=os_getenv("APP_USERS", "null")

 api_key = os_getenv("OPENAI_APIKEY")
 client = OpenAI(api_key=api_key)
+def new_state():
+    return gr.State({
+        "prompt": "",
+    })
 def get_prompt(books, question = None):
     prompt = (
         f"Read the following books.\n" +
         f"Each book may have some pages at the beggining with data about the book, an index, or table of content, etc. " +
         f"Pages may have a header and/or a footer. Consider all this maybe present." +
+        f"For each book, please answer, all below in the suggested format and also answer all the questions at the end in detail, if present.\n"
+        f"Answer in the language of the book:\n"+
         f"**Title**: ...\n"
         f"**Author**: ...\n"
         f"**Chapter Names**: ...\n"
     return prompt
+def chat(message, history, files, state):
     history_openai_format = []
+    prompt    = state["prompt"]
+    if not message:
+        if len(history) > 0:
+            gr.Error("You sent an empty question. It's expensive, don't do it")
+            return ''
+    if not prompt:
+        gr.Error("First upload a book")
+        return ''
+    if (not history) and message:
+        prompt += f"**Questions**:{message}"
+        state["prompt"] = prompt
+    if history:
+        history[0] = (prompt, history[0][1])
     else:
+        message = prompt
+    for human, assistant in history:
+        if human:
+            history_openai_format.append({"role": "user", "content": human })
+        if assistant:
+            history_openai_format.append({"role": "assistant", "content":assistant})
+    if message:
+        history_openai_format.append({"role": "user", "content": message})
     response = client.chat.completions.create(
         model=MODEL,
         answer = open(filename).read()
     return answer
+def files_ready(filenames, state):
     encoder = encoding = tiktoken.encoding_for_model('gpt-4-turbo')
     books = ''
     for i, name in enumerate(filenames):
     prompt = get_prompt(books)
     tokens = len(encoder.encode(prompt))
     cost = tokens * PRICE_PER_M / 1000000 * 2 # * 2 is too much for an answer
+    state["prompt"] = prompt
     if tokens > LIMIT:
         raise gr.Error(f"Book is too long. It's {tokens} tokens long and can't be more than {LIMIT}.")
+    return len(prompt), tokens, f"${cost}", state
+def files_changed(filenames, state):
     if filenames:
+        return "-", "-", "-", state
     else:
+        return 0, 0, "$0", new_state()
 with gr.Blocks(title="Book summarization and more") as demo:
+    state = new_state()
     with gr.Row():
         files = gr.Files(file_types=["txt","doc","docx","pdf"] )
         with gr.Column():
     chat = gr.ChatInterface(
         fn=chat,
         title="Summarization and more",
+        additional_inputs=[files, state],
         multimodal=False)
     other = gr.Button(interactive=False)
+    files.upload(files_ready, [files, state], [letters, tokens, cost, state])
+    files.change(files_changed, [files, state], [letters, tokens, cost, state])
 auth=os_getenv("APP_USERS", "null")