Spaces:

DaniFera
/

PDFree

Sleeping

App Files Community

DaniFera committed on Jan 16

Commit

6c7cf36

verified ·

1 Parent(s): 25d0b92

Update core.py

Browse files

Files changed (1) hide show

core.py +118 -30

core.py CHANGED Viewed

@@ -1,4 +1,4 @@
-# Versión 1.8: Core Completo con Compresión Ghostscript
 # Autor: Gemini (AI Assistant)
 # Descripción: Motor lógico de manipulación de PDFs. Independiente de la interfaz gráfica.
@@ -6,6 +6,8 @@ import os
 import zipfile
 import uuid
 import subprocess
 from pypdf import PdfWriter, PdfReader
 from pdf2image import convert_from_path
 from pdf2docx import Converter
@@ -134,7 +136,7 @@ class PDFEngine:
                 except ValueError: continue
         return sorted(list(set(key_pages)))
-    # --- FUNCIONALIDADES CORE ---
     def merge_pdfs(self, file_paths: list, order_indices: list = None) -> str:
         """Une múltiples PDFs respetando el orden indicado."""
@@ -201,15 +203,45 @@ class PDFEngine:
         return zip_path
     def compress_pdf(self, file_path: str, power: int = 2) -> str:
         """
         Comprime PDF usando Ghostscript.
         power:
-            0: /default (casi nada)
-            1: /prepress (alta calidad, poco tamaño)
-            2: /printer (calidad media-alta)
-            3: /ebook (calidad media, buena compresión - RECOMENDADO)
-            4: /screen (calidad baja, máxima compresión 72dpi)
         """
         if not file_path: raise ValueError("Falta archivo.")
@@ -284,6 +316,32 @@ class PDFEngine:
         except Exception as e:
             raise RuntimeError(f"Error al rotar: {e}")
     # --- CONVERSIONES ---
     def pdf_to_images_zip(self, file_path: str) -> str:
@@ -372,28 +430,58 @@ class PDFEngine:
         except Exception as e:
             raise RuntimeError(f"Error extrayendo texto: {e}")
-    def update_metadata(self, file_path: str, title: str, author: str, subject: str) -> str:
-        """Actualiza título, autor y asunto."""
-        if not file_path: raise ValueError("Falta archivo.")
         try:
-            reader = PdfReader(file_path)
-            writer = PdfWriter()
-            for page in reader.pages:
-                writer.add_page(page)
-            new_meta = {
-                "/Title": title,
-                "/Author": author,
-                "/Subject": subject,
-                "/Producer": "OpenPDF Tools (Libre)"
-            }
-            writer.add_metadata(new_meta)
-            output_path = self._get_output_path("editado_meta.pdf")
-            with open(output_path, "wb") as f:
-                writer.write(f)
-            return output_path
         except Exception as e:
-            raise RuntimeError(f"Error actualizando metadatos: {e}")

+# Versión 1.9: Core Completo (Todas las herramientas integradas)
 # Autor: Gemini (AI Assistant)
 # Descripción: Motor lógico de manipulación de PDFs. Independiente de la interfaz gráfica.
 import zipfile
 import uuid
 import subprocess
+import cv2
+import numpy as np
 from pypdf import PdfWriter, PdfReader
 from pdf2image import convert_from_path
 from pdf2docx import Converter
                 except ValueError: continue
         return sorted(list(set(key_pages)))
+    # --- FUNCIONALIDADES DE GESTIÓN DE PÁGINAS ---
     def merge_pdfs(self, file_paths: list, order_indices: list = None) -> str:
         """Une múltiples PDFs respetando el orden indicado."""
         return zip_path
+    def reorder_pages(self, file_path: str, order_str: str) -> str:
+        """
+        Create a new PDF with the pages in the specified order.
+
+        order_str example: "3, 1, 2, 4-6"
+
+        The string is parsed by self._parse_range_groups(order_str, total_pages);
+        the "indices" list of every returned group is concatenated, in group
+        order, and each value is used directly as an index into reader.pages
+        (presumably 0-based; confirm against _parse_range_groups).
+
+        Returns the path given by self._get_output_path("reordenado.pdf"),
+        where the reordered PDF is written.
+
+        Raises ValueError if file_path is falsy or if the parser returns no
+        groups. Errors from reading or writing the PDF are not wrapped here.
+        """
+        if not file_path: raise ValueError("Falta archivo.")
+        reader = PdfReader(file_path)
+        total_pages = len(reader.pages)
+        # Reuse the range parser to obtain the list of page indices
+        groups = self._parse_range_groups(order_str, total_pages)
+        if not groups: raise ValueError("Orden inválido.")
+        flat_indices = []  # page indices in final output order
+        for g in groups:
+            flat_indices.extend(g["indices"])
+        writer = PdfWriter()
+        for idx in flat_indices:
+            writer.add_page(reader.pages[idx])  # a page is added once per occurrence of its index
+        output_path = self._get_output_path("reordenado.pdf")
+        with open(output_path, "wb") as f:
+            writer.write(f)
+        return output_path
+    # --- EDICIÓN Y SEGURIDAD ---
     def compress_pdf(self, file_path: str, power: int = 2) -> str:
         """
         Comprime PDF usando Ghostscript.
         power:
+            0: /default
+            1: /prepress
+            2: /printer
+            3: /ebook (Recomendado)
+            4: /screen
         """
         if not file_path: raise ValueError("Falta archivo.")
         except Exception as e:
             raise RuntimeError(f"Error al rotar: {e}")
+    def update_metadata(self, file_path: str, title: str, author: str, subject: str) -> str:
+        """
+        Update the title, author and subject of a PDF.
+
+        Every page of the input is added to a fresh PdfWriter, the metadata
+        entries /Title, /Author and /Subject are set from the arguments, and
+        /Producer is set to a fixed string. The result is written to the path
+        given by self._get_output_path("editado_meta.pdf"), which is returned.
+
+        Raises ValueError if file_path is falsy (checked before the try block,
+        so it is not wrapped). Any exception raised while reading, building or
+        writing the PDF is re-raised as RuntimeError.
+        """
+        if not file_path: raise ValueError("Falta archivo.")
+        try:
+            reader = PdfReader(file_path)
+            writer = PdfWriter()
+            for page in reader.pages:
+                writer.add_page(page)  # only pages are copied; NOTE(review): confirm nothing else from the source needs carrying over
+            new_meta = {
+                "/Title": title,
+                "/Author": author,
+                "/Subject": subject,
+                "/Producer": "OpenPDF Tools (Libre)"
+            }
+            writer.add_metadata(new_meta)
+            output_path = self._get_output_path("editado_meta.pdf")
+            with open(output_path, "wb") as f:
+                writer.write(f)
+            return output_path
+        except Exception as e:
+            raise RuntimeError(f"Error actualizando metadatos: {e}")
     # --- CONVERSIONES ---
     def pdf_to_images_zip(self, file_path: str) -> str:
         except Exception as e:
             raise RuntimeError(f"Error extrayendo texto: {e}")
+    # --- ANÁLISIS Y COMPARACIÓN ---
+    def compare_pdfs_visual(self, path_a: str, path_b: str) -> str:
+        """
+        Visually compare two PDFs page by page and highlight the differences.
+
+        Both files are rendered with convert_from_path at dpi=100. Only the
+        first min(len(A), len(B)) pages are compared; extra pages of the longer
+        document are ignored. For each compared page, B is resized to A's
+        dimensions when the array shapes differ, both are converted to
+        grayscale, and pixels whose absolute difference exceeds 30 are
+        thresholded. A rectangle is drawn on a copy of page A around the
+        bounding box of every external contour of the thresholded image.
+
+        Returns the path given by
+        self._get_output_path("comparativa_diferencias.pdf"), a multi-page PDF
+        made of the annotated images of document A.
+
+        Raises ValueError if either path is falsy or no page could be compared,
+        and RuntimeError if rendering either PDF fails.
+        """
+        if not path_a or not path_b: raise ValueError("Se requieren dos archivos.")
         try:
+            imgs_a = convert_from_path(path_a, dpi=100)
+            imgs_b = convert_from_path(path_b, dpi=100)
         except Exception as e:
+            raise RuntimeError(f"Error leyendo PDFs para comparar: {e}")
+        min_pages = min(len(imgs_a), len(imgs_b))  # pages beyond this count are not compared
+        diff_pages = []
+        for i in range(min_pages):
+            # Convert the PIL image to a NumPy array (RGB)
+            arr_a = np.array(imgs_a[i])
+            arr_b = np.array(imgs_b[i])
+            # Ensure both arrays have the same size
+            if arr_a.shape != arr_b.shape:
+                h, w = arr_a.shape[:2]
+                arr_b = cv2.resize(arr_b, (w, h))  # cv2.resize takes the target size as (width, height)
+            # Compute the difference
+            gray_a = cv2.cvtColor(arr_a, cv2.COLOR_RGB2GRAY)
+            gray_b = cv2.cvtColor(arr_b, cv2.COLOR_RGB2GRAY)
+            diff = cv2.absdiff(gray_a, gray_b)
+            _, thresh = cv2.threshold(diff, 30, 255, cv2.THRESH_BINARY)
+            contours, _ = cv2.findContours(thresh, cv2.RETR_EXTERNAL, cv2.CHAIN_APPROX_SIMPLE)
+            result_img = arr_a.copy()  # annotate a copy so arr_a itself is left untouched
+            for cnt in contours:
+                x, y, w, h = cv2.boundingRect(cnt)  # rebinds w and h from the resize step above
+                cv2.rectangle(result_img, (x, y), (x + w, y + h), (255, 0, 255), 2)
+            diff_pages.append(Image.fromarray(result_img))  # NOTE(review): Image (presumably PIL.Image) is not among the imports visible in this diff; confirm it is imported
+        if not diff_pages:
+            raise ValueError("No se pudieron generar páginas de comparación o no hay páginas comunes.")
+        output_path = self._get_output_path("comparativa_diferencias.pdf")
+        diff_pages[0].save(
+            output_path, "PDF",
+            resolution=100.0,
+            save_all=True,
+            append_images=diff_pages[1:]
+        )
+        return output_path