Spaces:
Runtime error
Runtime error
Commit ·
c8c1181
1
Parent(s): a2537f9
Update app.py
Browse files
app.py
CHANGED
|
@@ -13,11 +13,9 @@ from pathlib import Path
|
|
| 13 |
import pytesseract
|
| 14 |
from pdf2image import convert_from_path
|
| 15 |
from PIL import Image
|
|
|
|
| 16 |
|
| 17 |
-
|
| 18 |
-
|
| 19 |
-
#pytesseract.pytesseract.tesseract_cmd = r"./lib/Tesseract-OCR/tesseract.exe"
|
| 20 |
-
#path_to_poppler_exe = r"./lib/poppler-0.68.0/bin"
|
| 21 |
|
| 22 |
def ocrtotext(filename):
|
| 23 |
# Almacena todas las páginas del PDF en una variable
|
|
@@ -26,7 +24,6 @@ def ocrtotext(filename):
|
|
| 26 |
text_file = (f'{filename}.txt') # Nombre del archivo de texto de salida
|
| 27 |
|
| 28 |
# Parte #1: Convirtiendo el PDF a imágenes
|
| 29 |
-
#pdf_pages = convert_from_path(PDF_file, 300, poppler_path=path_to_poppler_exe)
|
| 30 |
pdf_pages = convert_from_path(PDF_file, 300)
|
| 31 |
# Lee el archivo PDF a 300 DPI
|
| 32 |
|
|
@@ -124,7 +121,13 @@ def predict(file):
|
|
| 124 |
if chunks2[i] not in chunks_removable2 or model.predict([chunks2[i]]).item() == 1:
|
| 125 |
recorte_final += chunks2[i] + " "
|
| 126 |
print(100, '%')
|
| 127 |
-
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 128 |
|
| 129 |
# Crear una interfaz Gradio
|
| 130 |
iface = gr.Interface(
|
|
|
|
| 13 |
import pytesseract
|
| 14 |
from pdf2image import convert_from_path
|
| 15 |
from PIL import Image
|
| 16 |
+
from gradio_client import Client
|
| 17 |
|
| 18 |
+
# Module-level gradio_client handle used to forward text to a remote Gradio app.
# NOTE(review): the address below is a *.gradio.live share link. Gradio
# describes share links as temporary, so this endpoint is expected to stop
# responding once the link expires -- confirm, and consider a stable endpoint.
# NOTE(review): because this runs at module level, the Client is constructed
# when the file is imported; presumably an unreachable endpoint fails here,
# before the UI is built -- verify against the gradio_client documentation.
client = Client("https://e564a63b1e689a45ef.gradio.live/")
|
|
|
|
|
|
|
|
|
|
| 19 |
|
| 20 |
def ocrtotext(filename):
|
| 21 |
# Almacena todas las páginas del PDF en una variable
|
|
|
|
| 24 |
text_file = (f'{filename}.txt') # Nombre del archivo de texto de salida
|
| 25 |
|
| 26 |
# Parte #1: Convirtiendo el PDF a imágenes
|
|
|
|
| 27 |
pdf_pages = convert_from_path(PDF_file, 300)
|
| 28 |
# Lee el archivo PDF a 300 DPI
|
| 29 |
|
|
|
|
| 121 |
if chunks2[i] not in chunks_removable2 or model.predict([chunks2[i]]).item() == 1:
|
| 122 |
recorte_final += chunks2[i] + " "
|
| 123 |
print(100, '%')
|
| 124 |
+
|
| 125 |
+
result = client.predict(
|
| 126 |
+
recorte_final, # str in 'text' Textbox component
|
| 127 |
+
api_name="/predict"
|
| 128 |
+
)
|
| 129 |
+
return result
|
| 130 |
+
|
| 131 |
|
| 132 |
# Crear una interfaz Gradio
|
| 133 |
iface = gr.Interface(
|