Spaces:

mateoluksenberg
/

chat

Sleeping

App Files Community

mateoluksenberg committed on Aug 7, 2024

Commit

befd71c

verified ·

1 Parent(s): 340ee67

Update app.py

Browse files

Files changed (1) hide show

app.py +55 -50

app.py CHANGED Viewed

@@ -91,62 +91,62 @@ def extract_pptx(path):
     return text
-# def mode_load(path):
-#     choice = ""
-#     file_type = path.split(".")[-1]
-#     print(file_type)
-#     if file_type in ["pdf", "txt", "py", "docx", "pptx", "json", "cpp", "md"]:
-#         if file_type.endswith("pdf"):
-#             content = extract_pdf(path)
-#         elif file_type.endswith("docx"):
-#             content = extract_docx(path)
-#         elif file_type.endswith("pptx"):
-#             content = extract_pptx(path)
-#         else:
-#             content = extract_text(path)
-#         choice = "doc"
-#         print(content[:100])
-#         return choice, content[:5000]
-#     elif file_type in ["png", "jpg", "jpeg", "bmp", "tiff", "webp"]:
-#         content = Image.open(path).convert('RGB')
-#         choice = "image"
-#         return choice, content
-#     else:
-#         raise gr.Error("Oops, unsupported files.")
-def mode_load(file_obj):
-    try:
-        file_obj.seek(0)  # Asegúrate de que el puntero esté al inicio del archivo
-        # Detecta el tipo de archivo basándote en los primeros bytes si es posible
-        file_header = file_obj.read(4)
-        file_obj.seek(0)  # Vuelve al inicio del archivo para procesamiento completo
-        if file_header.startswith(b'%PDF'):
-            content = extract_pdf(file_obj)
-            choice = "doc"
-        elif file_obj.name.endswith(".docx"):
-            content = extract_docx(file_obj)
-            choice = "doc"
-        elif file_obj.name.endswith(".pptx"):
-            content = extract_pptx(file_obj)
-            choice = "doc"
-        elif file_obj.name.endswith(".txt") or file_obj.name.endswith(".py") or file_obj.name.endswith(".json") or file_obj.name.endswith(".cpp") or file_obj.name.endswith(".md"):
-            content = file_obj.read().decode('utf-8', errors='ignore')
-            choice = "doc"
-        elif file_obj.name.endswith((".png", ".jpg", ".jpeg", ".bmp", ".tiff", ".webp")):
-            content = Image.open(file_obj).convert('RGB')
-            choice = "image"
-        else:
-            raise ValueError("Unsupported file type.")
-        return choice, content
-    except Exception as e:
-        raise ValueError(f"Error processing file: {str(e)}")
 @spaces.GPU()
@@ -324,6 +324,11 @@ def simple_chat(message: dict, temperature: float = 0.8, max_length: int = 4096,
                 conversation.append({"role": "user", "content": message['text']})
         input_ids = tokenizer.apply_chat_template(conversation, tokenize=True, add_generation_prompt=True, return_tensors="pt", return_dict=True).to(model.device)
         generate_kwargs = dict(
             max_length=max_length,

     return text
+def mode_load(path):
+    choice = ""
+    file_type = path.split(".")[-1]
+    print(file_type)
+    if file_type in ["pdf", "txt", "py", "docx", "pptx", "json", "cpp", "md"]:
+        if file_type.endswith("pdf"):
+            content = extract_pdf(path)
+        elif file_type.endswith("docx"):
+            content = extract_docx(path)
+        elif file_type.endswith("pptx"):
+            content = extract_pptx(path)
+        else:
+            content = extract_text(path)
+        choice = "doc"
+        print(content[:100])
+        return choice, content[:5000]
+    elif file_type in ["png", "jpg", "jpeg", "bmp", "tiff", "webp"]:
+        content = Image.open(path).convert('RGB')
+        choice = "image"
+        return choice, content
+    else:
+        raise gr.Error("Oops, unsupported files.")
+# def mode_load(file_obj):
+#     try:
+#         file_obj.seek(0)  # Asegúrate de que el puntero esté al inicio del archivo
+#         # Detecta el tipo de archivo basándote en los primeros bytes si es posible
+#         file_header = file_obj.read(4)
+#         file_obj.seek(0)  # Vuelve al inicio del archivo para procesamiento completo
+#         if file_header.startswith(b'%PDF'):
+#             content = extract_pdf(file_obj)
+#             choice = "doc"
+#         elif file_obj.name.endswith(".docx"):
+#             content = extract_docx(file_obj)
+#             choice = "doc"
+#         elif file_obj.name.endswith(".pptx"):
+#             content = extract_pptx(file_obj)
+#             choice = "doc"
+#         elif file_obj.name.endswith(".txt") or file_obj.name.endswith(".py") or file_obj.name.endswith(".json") or file_obj.name.endswith(".cpp") or file_obj.name.endswith(".md"):
+#             content = file_obj.read().decode('utf-8', errors='ignore')
+#             choice = "doc"
+#         elif file_obj.name.endswith((".png", ".jpg", ".jpeg", ".bmp", ".tiff", ".webp")):
+#             content = Image.open(file_obj).convert('RGB')
+#             choice = "image"
+#         else:
+#             raise ValueError("Unsupported file type.")
+#         return choice, content
+#     except Exception as e:
+#         raise ValueError(f"Error processing file: {str(e)}")
 @spaces.GPU()
                 conversation.append({"role": "user", "content": message['text']})
         input_ids = tokenizer.apply_chat_template(conversation, tokenize=True, add_generation_prompt=True, return_tensors="pt", return_dict=True).to(model.device)
+        print("   ")
+        print("Conv: ")
+        print(conversation)
+        print("   ")
         generate_kwargs = dict(
             max_length=max_length,