Aqdas committed on
Commit
3bc760b
·
verified ·
1 Parent(s): 1a7455e

Update app.py

Browse files
Files changed (1) hide show
  1. app.py +21 -21
app.py CHANGED
@@ -26,26 +26,26 @@ st.title("Gen AI Invoice Extraction")
26
  uploaded_files = st.file_uploader("Choose PDF files", accept_multiple_files=True, type="pdf")
27
  if uploaded_files:
28
  # st.write(f'This is {uploaded_files}')
29
-
30
- for pdf_path in uploaded_files:
31
- convert_image = pdf_to_image(pdf_path)
32
- convert_image.save_image(f'{pdf_path}image')
33
- print('one_pdf_converted')
34
-
35
- all_images = glob.glob(os.path.join(folder_name, '*.jpg'))
36
- all_texts = []
37
- for image_path in all_images:
38
- text = image_to_text(image_path)
39
- all_texts.append(text)
40
- print('one text appended')
 
 
 
 
 
 
 
 
41
 
42
- empty_df = pd.DataFrame()
43
 
44
- for text in all_texts:
45
- extracted_text = extractor(text)
46
- task_details_dict = extracted_text.dict()
47
- df = pd.DataFrame([task_details_dict])
48
- empty_df = pd.concat([empty_df, df])
49
-
50
-
51
- empty_df.to_csv('extracted_data.csv')
 
26
  uploaded_files = st.file_uploader("Choose PDF files", accept_multiple_files=True, type="pdf")
27
  if uploaded_files:
28
  # st.write(f'This is {uploaded_files}')
29
+ if st.button('Extract'):
30
+ for pdf_path in uploaded_files:
31
+ convert_image = pdf_to_image(pdf_path)
32
+ convert_image.save_image(f'{pdf_path}image')
33
+ print('one_pdf_converted')
34
+
35
+ all_images = glob.glob(os.path.join(folder_name, '*.jpg'))
36
+ all_texts = []
37
+ for image_path in all_images:
38
+ text = image_to_text(image_path)
39
+ all_texts.append(text)
40
+ print('one text appended')
41
+
42
+ empty_df = pd.DataFrame()
43
+
44
+ for text in all_texts:
45
+ extracted_text = extractor(text)
46
+ task_details_dict = extracted_text.dict()
47
+ df = pd.DataFrame([task_details_dict])
48
+ empty_df = pd.concat([empty_df, df])
49
 
 
50
 
51
+ empty_df.to_csv('extracted_data.csv')