RAGDEV

Runtime error

App Files Files Community

alexkueck committed on Feb 9, 2024

Commit

623c3af

verified ·

1 Parent(s): e54927d

Update app.py

Browse files

Files changed (1) hide show

app.py +44 -12

app.py CHANGED Viewed

@@ -154,7 +154,16 @@ general_assistant_suche= openai_assistant_suche(client)
 def clear_all(history, uploaded_file_paths, chats):
     dic_history = {schluessel: wert for schluessel, wert in history}
     #später wird die summary auf 50 tokens verkürzt, um die Anfrage nicht so teuer werden zu lassen
     summary = "\n\n".join(f'{schluessel}: \n  {wert}' for schluessel, wert in dic_history.items())
     #falls file mit summary für download existiert hat: das zunächst löschen
     #cleanup(file_path_download)
@@ -162,9 +171,9 @@ def clear_all(history, uploaded_file_paths, chats):
     #den aktuellen Chatverlauf zum Download bereitstellen:
     if chats != {} :
         id_neu = len(chats)+1
-        chats[id_neu]=summary
     else:
-        chats[0]=summary
     #Eine Überschrift zu dem jeweiligen Chatverlauf finden - abhängig vom Inhalt
     #file_path_download = save_and_download(summary)
@@ -180,16 +189,39 @@ def clear_all(history, uploaded_file_paths, chats):
     else:
         file_path_download = "data/" + str(len(chats)) + "_" + result + ".pdf"
-    #summary in ein File laden
-    """
-    with open(file_path_download, 'w') as file:
-            # String in die Datei schreiben
-            file.write(summary)
-    """
     # Erzeuge einen Bytestream
     memoryFile = io.BytesIO()
     # Erstelle eine Canvas-Instanz im Bytestream
     c = canvas.Canvas(memoryFile, pagesize=letter)  #oder A4
     # Setze die Schriftart und -grösse
     c.setFont("Helvetica", 12)
     # Fülle die Canvas mit dem Inhalt der Textdatei
@@ -443,7 +475,7 @@ def generate_text_zu_bild(file, prompt, k, rag_option, chatbot, history, db):
 def generate_text_zu_doc(file, prompt, k, rag_option, chatbot, history, db):
     global splittet
     print("text mit doc ..............................")
     prompt_neu = generate_prompt_with_history(prompt, history)
     if (rag_option == "An"):
         print("Doc mit RAG..............................")
@@ -500,8 +532,8 @@ def generate_text (prompt, chatbot, history, rag_option, model_option, openai_ap
                 #oder an Hugging Face --------------------------
                 print("HF Anfrage.......................")
                 model_kwargs={"temperature": 0.5, "max_length": 512, "num_return_sequences": 1, "top_k": top_k, "top_p": top_p, "repetition_penalty": repetition_penalty}
-                llm = HuggingFaceHub(repo_id=repo_id, model_kwargs=model_kwargs)
-                #llm = HuggingFaceChain(model=MODEL_NAME_HF, model_kwargs={"temperature": 0.5, "max_length": 128})
                 #llm = HuggingFaceHub(url_??? = "https://wdgsjd6zf201mufn.us-east-1.aws.endpoints.huggingface.cloud", model_kwargs={"temperature": 0.5, "max_length": 64})
                 #llm = HuggingFaceTextGenInference( inference_server_url="http://localhost:8010/", max_new_tokens=max_new_tokens,top_k=10,top_p=top_p,typical_p=0.95,temperature=temperature,repetition_penalty=repetition_penalty,)
                 #llm via HuggingChat
@@ -739,7 +771,7 @@ with gr.Blocks(css=custom_css(), theme=themeAlex) as demo:
                     with gr.Tab(label="Parameter"):
                         #gr.Markdown("# Parameters")
                         rag_option = gr.Radio(["Aus", "An"], label="LI Erweiterungen (RAG)", value = "Aus")
-                        model_option = gr.Radio(["OpenAI", "HuggingFace"], label="Modellauswahl", value = "OpenAI")
                         websuche = gr.Radio(["Aus", "An"], label="Web-Suche", value = "Aus")

 def clear_all(history, uploaded_file_paths, chats):
     dic_history = {schluessel: wert for schluessel, wert in history}
     #später wird die summary auf 50 tokens verkürzt, um die Anfrage nicht so teuer werden zu lassen
+    #summary wird gebraucht für die Anfrage beim NN, um eine Überschrift des Eintrages zu generieren
     summary = "\n\n".join(f'{schluessel}: \n  {wert}' for schluessel, wert in dic_history.items())
+    # um den Chatverlauf für das PDF vorzubereiten:
+    for key, value in dic_history.items():
+        if key == 'timestamp':
+            chat_history[key] = value
+        elif key == 'user':
+            chat_history[key] = value
+        elif key == 'assistant':
+            chat_history[key] = value
     #falls file mit summary für download existiert hat: das zunächst löschen
     #cleanup(file_path_download)
     #den aktuellen Chatverlauf zum Download bereitstellen:
     if chats != {} :
         id_neu = len(chats)+1
+        chats[id_neu]= summary
     else:
+        chats[0]= summary
     #Eine Überschrift zu dem jeweiligen Chatverlauf finden - abhängig vom Inhalt
     #file_path_download = save_and_download(summary)
     else:
         file_path_download = "data/" + str(len(chats)) + "_" + result + ".pdf"
+    #chat_history in ein File laden
     # Erzeuge einen Bytestream
     memoryFile = io.BytesIO()
     # Erstelle eine Canvas-Instanz im Bytestream
     c = canvas.Canvas(memoryFile, pagesize=letter)  #oder A4
+    #Inhalt des PDF formatieren:
+    # Schriftarten
+    TITLE_FONT = Font(Family="Times-Bold", Size=14)
+    TEXT_FONT = Font(Family="Courier", Size=12)
+    CODE_FONT = Font(Family="Monaco", Size=12)
+    # Breite und Höhe für Spalten
+    COLUMN_WIDTH = 150
+    ROW_HEIGHT = 20
+    # Bereiche für Spalten
+    TIMESTAMP_X = 50
+    USER_X = TIMESTAMP_X + COLUMN_WIDTH
+    ASSISTANT_X = USER_X + COLUMN_WIDTH
+    # Rand und Abstand zwischen Zeilen
+    MARGIN = 50
+    LINE_SPACING = 10
+    # Zeitstempel
+    c.setFillColorRGB(0, 0, 0)
+    c.setFont(TITLE_FONT)
+    c.drawCentredString(TIMESTAMP_X + COLUMN_WIDTH / 2, MARGIN, chat_history["timestamp"])
+    # User und Assistant
+    c.setFont(TEXT_FONT)
+    c.drawString(USER_X, MARGIN + LINE_SPACING, chat_history["user"] + ": ")
+    c.setFont(CODE_FONT)
+    c.drawString(USER_X + COLUMN_WIDTH, MARGIN + LINE_SPACING, chat_history["assistant"])
+    # Linie trennen
+    c.line(TIMESTAMP_X, MARGIN + LINE_SPACING + ROW_HEIGHT, ASSISTANT_X + COLUMN_WIDTH, MARGIN + LINE_SPACING + ROW_HEIGHT)
     # Setze die Schriftart und -grösse
     c.setFont("Helvetica", 12)
     # Fülle die Canvas mit dem Inhalt der Textdatei
 def generate_text_zu_doc(file, prompt, k, rag_option, chatbot, history, db):
     global splittet
     print("text mit doc ..............................")
     prompt_neu = generate_prompt_with_history(prompt, history)
     if (rag_option == "An"):
         print("Doc mit RAG..............................")
                 #oder an Hugging Face --------------------------
                 print("HF Anfrage.......................")
                 model_kwargs={"temperature": 0.5, "max_length": 512, "num_return_sequences": 1, "top_k": top_k, "top_p": top_p, "repetition_penalty": repetition_penalty}
+                #llm = HuggingFaceHub(repo_id=repo_id, model_kwargs=model_kwargs)
+                llm = HuggingFaceChain(model=MODEL_NAME_HF, model_kwargs={"temperature": 0.5, "max_length": 128})
                 #llm = HuggingFaceHub(url_??? = "https://wdgsjd6zf201mufn.us-east-1.aws.endpoints.huggingface.cloud", model_kwargs={"temperature": 0.5, "max_length": 64})
                 #llm = HuggingFaceTextGenInference( inference_server_url="http://localhost:8010/", max_new_tokens=max_new_tokens,top_k=10,top_p=top_p,typical_p=0.95,temperature=temperature,repetition_penalty=repetition_penalty,)
                 #llm via HuggingChat
                     with gr.Tab(label="Parameter"):
                         #gr.Markdown("# Parameters")
                         rag_option = gr.Radio(["Aus", "An"], label="LI Erweiterungen (RAG)", value = "Aus")
+                        model_option = gr.Radio(["OpenAI", "HuggingFace"], label="Modellauswahl", value = "HuggingFace")
                         websuche = gr.Radio(["Aus", "An"], label="Web-Suche", value = "Aus")