Spaces:

FelipeErmeson
/

projeto-rag

Running on Zero

Felipe Silva committed on Sep 17

Commit

b9e4562

1 Parent(s): aa32ce9

Ajustando github

Files changed (2) hide show

app.py CHANGED Viewed

@@ -3,7 +3,7 @@ import spaces
 import torch
 import os
 from huggingface_hub import snapshot_download
-from utils import read_file_pdf, fix_type, extract_content_in_pdf, doc_converter, EXTENSIONS_FILES, EXTENSIONS_IMG_FILES
 from rag_utils import create_split_doc, store_docs, create_rag_chain
 import config
@@ -26,7 +26,7 @@ config.local_emb_path = snapshot_download(
 def process_file(file):
     if file is None:
-        return "Nenhum arquivo enviado."
     file_size = os.path.getsize(file)
     if file_size > MAX_FILE_SIZE:
@@ -34,7 +34,7 @@ def process_file(file):
     texto_extraido = doc_converter(file)
     if texto_extraido is None:
-        return "Não foi possível extrair o texto."
     return texto_extraido
@@ -54,7 +54,7 @@ def ask_question(texto_extraido, question):
     return resposta, docs_text
 def update_ask_button(extracted_text, question):
-    if extracted_text and question.strip():
         return gr.update(interactive=True)
     return gr.update(interactive=False)
@@ -63,7 +63,7 @@ def launch_app():
         gr.Markdown("# 🚀 Retrieval Augmented Generation - RAG")
         gr.Markdown("### ⚙️ Pergunte qualquer coisa para seu arquivo.")
         gr.Markdown(
-            "🐶 Faça o upload do seu arquivo e pergunte qualquer coisa a ele! Este código é open source e disponível [aqui](https://github.com/FelipeErmeson) no GitHub. 😁"
         )
         with gr.Row():

 import torch
 import os
 from huggingface_hub import snapshot_download
+from utils import read_file_pdf, fix_type, extract_content_in_pdf, doc_converter, EXTENSIONS_FILES, EXTENSIONS_IMG_FILES, MSG_NENHUM_ARQUIVO_ENVIADO, MSG_TEXTO_NAO_EXTRAIDO
 from rag_utils import create_split_doc, store_docs, create_rag_chain
 import config
 def process_file(file):
     if file is None:
+        return MSG_NENHUM_ARQUIVO_ENVIADO
     file_size = os.path.getsize(file)
     if file_size > MAX_FILE_SIZE:
     texto_extraido = doc_converter(file)
     if texto_extraido is None:
+        return MSG_TEXTO_NAO_EXTRAIDO
     return texto_extraido
     return resposta, docs_text
 def update_ask_button(extracted_text, question):
+    if extracted_text and MSG_NENHUM_ARQUIVO_ENVIADO not in extracted_text and MSG_TEXTO_NAO_EXTRAIDO not in extracted_text and question.strip():
         return gr.update(interactive=True)
     return gr.update(interactive=False)
         gr.Markdown("# 🚀 Retrieval Augmented Generation - RAG")
         gr.Markdown("### ⚙️ Pergunte qualquer coisa para seu arquivo.")
         gr.Markdown(
+            "🐶 Faça o upload do seu arquivo e pergunte qualquer coisa a ele! Este código é open source e disponível [aqui](https://github.com/FelipeErmeson/General-RAG) no GitHub. 😁"
         )
         with gr.Row():

utils.py CHANGED Viewed

@@ -8,6 +8,9 @@ EXTENSIONS_IMG_FILES = ['jpeg', 'jpg', 'png']
 EXTENSIONS_FILES = ['pdf']
 EXTENSIONS_ALLOWED = EXTENSIONS_IMG_FILES + EXTENSIONS_FILES
 # Max dimensions for processing
 MAX_IMAGE_SIZE = 2000  # pixels

 EXTENSIONS_FILES = ['pdf']
 EXTENSIONS_ALLOWED = EXTENSIONS_IMG_FILES + EXTENSIONS_FILES
+MSG_NENHUM_ARQUIVO_ENVIADO = 'Nenhum arquivo enviado.'
+MSG_TEXTO_NAO_EXTRAIDO = "Não foi possível extrair o texto."
 # Max dimensions for processing
 MAX_IMAGE_SIZE = 2000  # pixels