anhkhoiphan committed on
Commit
1be4594
·
1 Parent(s): cea056c

Thử giảm kích thước image

Browse files
Files changed (2) hide show
  1. data_processing.py +1 -1
  2. requirements.txt +2 -4
data_processing.py CHANGED
@@ -17,7 +17,7 @@ import docling
17
  from docling.document_converter import DocumentConverter, PdfFormatOption
18
  from docling.datamodel.base_models import InputFormat
19
  from docling.datamodel.pipeline_options import PdfPipelineOptions
20
- from docling.backend.pypdfium2_backend import PyPdfiumDocumentBackend
21
  import pandas as pd
22
  import gradio as gr
23
  from pymongo import MongoClient, UpdateOne
 
17
  from docling.document_converter import DocumentConverter, PdfFormatOption
18
  from docling.datamodel.base_models import InputFormat
19
  from docling.datamodel.pipeline_options import PdfPipelineOptions
20
+ # from docling.backend.pypdfium2_backend import PyPdfiumDocumentBackend
21
  import pandas as pd
22
  import gradio as gr
23
  from pymongo import MongoClient, UpdateOne
requirements.txt CHANGED
@@ -1,4 +1,4 @@
1
- torch
2
  transformers
3
  sentence-transformers
4
  FlagEmbedding
@@ -11,6 +11,4 @@ requests
11
  gradio
12
  python-dotenv
13
  docling
14
- pandas
15
- openpyxl
16
- pypdfium2
 
1
+ # torch
2
  transformers
3
  sentence-transformers
4
  FlagEmbedding
 
11
  gradio
12
  python-dotenv
13
  docling
14
+ openpyxl