chrissoria committed on
Commit
a9678de
·
1 Parent(s): 09f46a9

Replace temp PDF paths with original filenames in results

Browse files
Files changed (1) hide show
  1. app.py +17 -0
app.py CHANGED
@@ -753,10 +753,13 @@ with col_input:
753
 
754
  if pdf_files:
755
  input_data = []
 
756
  for f in pdf_files:
757
  with tempfile.NamedTemporaryFile(delete=False, suffix='.pdf') as tmp:
758
  tmp.write(f.read())
759
  input_data.append(tmp.name)
 
 
760
  description = pdf_description or "document"
761
  original_filename = "pdf_files"
762
  st.success(f"Uploaded {len(pdf_files)} PDF file(s)")
@@ -1053,6 +1056,20 @@ with col_input:
1053
  # Combine results
1054
  result_df = pd.concat(all_results, ignore_index=True)
1055
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1056
  # Save CSV
1057
  with tempfile.NamedTemporaryFile(mode='w', suffix='_classified.csv', delete=False) as f:
1058
  result_df.to_csv(f.name, index=False)
 
753
 
754
  if pdf_files:
755
  input_data = []
756
+ pdf_name_map = {} # Map temp paths to original filenames
757
  for f in pdf_files:
758
  with tempfile.NamedTemporaryFile(delete=False, suffix='.pdf') as tmp:
759
  tmp.write(f.read())
760
  input_data.append(tmp.name)
761
+ pdf_name_map[tmp.name] = f.name.replace('.pdf', '') # Store original name without extension
762
+ st.session_state.pdf_name_map = pdf_name_map
763
  description = pdf_description or "document"
764
  original_filename = "pdf_files"
765
  st.success(f"Uploaded {len(pdf_files)} PDF file(s)")
 
1056
  # Combine results
1057
  result_df = pd.concat(all_results, ignore_index=True)
1058
 
1059
+ # For PDFs, replace temp file paths with original filenames
1060
+ if input_type_selected == "pdf" and 'pdf_input' in result_df.columns:
1061
+ pdf_name_map = st.session_state.get('pdf_name_map', {})
1062
+ def replace_temp_path(val):
1063
+ if pd.isna(val):
1064
+ return val
1065
+ val_str = str(val)
1066
+ for temp_path, orig_name in pdf_name_map.items():
1067
+ if temp_path in val_str:
1068
+ # Replace temp path with original name, keep page suffix
1069
+ return val_str.replace(temp_path, orig_name)
1070
+ return val_str
1071
+ result_df['pdf_input'] = result_df['pdf_input'].apply(replace_temp_path)
1072
+
1073
  # Save CSV
1074
  with tempfile.NamedTemporaryFile(mode='w', suffix='_classified.csv', delete=False) as f:
1075
  result_df.to_csv(f.name, index=False)