yousbek committed on
Commit
aab9edf
·
verified ·
1 Parent(s): 798dc7e

Upload 8 files

Browse files
Files changed (2) hide show
  1. app/main.py +2 -1
  2. requirements.txt +0 -0
app/main.py CHANGED
@@ -5,6 +5,7 @@ from fastapi.staticfiles import StaticFiles
5
  import pytesseract
6
  from PIL import Image
7
  import PyPDF2
 
8
  from transformers import pipeline
9
  import docx
10
  import pandas as pd
@@ -34,7 +35,7 @@ def extract_text_from_pdf(file):
34
  from io import BytesIO
35
  pdf_file = BytesIO(file_content)
36
  # Passer l'objet fichier à PyPDF2
37
- reader = PyPDF2.PdfFileReader(pdf_file)
38
  text = ""
39
  for page_num in range(reader.numPages):
40
  text += reader.getPage(page_num).extract_text()
 
5
  import pytesseract
6
  from PIL import Image
7
  import PyPDF2
8
+ from PyPDF2 import PdfFileReader
9
  from transformers import pipeline
10
  import docx
11
  import pandas as pd
 
35
  from io import BytesIO
36
  pdf_file = BytesIO(file_content)
37
  # Passer l'objet fichier à PyPDF2
38
+ reader = PyPDF2.PdfReader(pdf_file)
39
  text = ""
40
  for page_num in range(reader.numPages):
41
  text += reader.getPage(page_num).extract_text()
requirements.txt CHANGED
Binary files a/requirements.txt and b/requirements.txt differ