Spaces:
Running
Running
Commit
·
a9678de
1
Parent(s):
09f46a9
Replace temp PDF paths with original filenames in results
Browse files
app.py
CHANGED
|
@@ -753,10 +753,13 @@ with col_input:
|
|
| 753 |
|
| 754 |
if pdf_files:
|
| 755 |
input_data = []
|
|
|
|
| 756 |
for f in pdf_files:
|
| 757 |
with tempfile.NamedTemporaryFile(delete=False, suffix='.pdf') as tmp:
|
| 758 |
tmp.write(f.read())
|
| 759 |
input_data.append(tmp.name)
|
|
|
|
|
|
|
| 760 |
description = pdf_description or "document"
|
| 761 |
original_filename = "pdf_files"
|
| 762 |
st.success(f"Uploaded {len(pdf_files)} PDF file(s)")
|
|
@@ -1053,6 +1056,20 @@ with col_input:
|
|
| 1053 |
# Combine results
|
| 1054 |
result_df = pd.concat(all_results, ignore_index=True)
|
| 1055 |
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1056 |
# Save CSV
|
| 1057 |
with tempfile.NamedTemporaryFile(mode='w', suffix='_classified.csv', delete=False) as f:
|
| 1058 |
result_df.to_csv(f.name, index=False)
|
|
|
|
| 753 |
|
| 754 |
if pdf_files:
|
| 755 |
input_data = []
|
| 756 |
+
pdf_name_map = {} # Map temp paths to original filenames
|
| 757 |
for f in pdf_files:
|
| 758 |
with tempfile.NamedTemporaryFile(delete=False, suffix='.pdf') as tmp:
|
| 759 |
tmp.write(f.read())
|
| 760 |
input_data.append(tmp.name)
|
| 761 |
+
pdf_name_map[tmp.name] = f.name.replace('.pdf', '') # Store original name without extension
|
| 762 |
+
st.session_state.pdf_name_map = pdf_name_map
|
| 763 |
description = pdf_description or "document"
|
| 764 |
original_filename = "pdf_files"
|
| 765 |
st.success(f"Uploaded {len(pdf_files)} PDF file(s)")
|
|
|
|
| 1056 |
# Combine results
|
| 1057 |
result_df = pd.concat(all_results, ignore_index=True)
|
| 1058 |
|
| 1059 |
+
# For PDFs, replace temp file paths with original filenames
|
| 1060 |
+
if input_type_selected == "pdf" and 'pdf_input' in result_df.columns:
|
| 1061 |
+
pdf_name_map = st.session_state.get('pdf_name_map', {})
|
| 1062 |
+
def replace_temp_path(val):
|
| 1063 |
+
if pd.isna(val):
|
| 1064 |
+
return val
|
| 1065 |
+
val_str = str(val)
|
| 1066 |
+
for temp_path, orig_name in pdf_name_map.items():
|
| 1067 |
+
if temp_path in val_str:
|
| 1068 |
+
# Replace temp path with original name, keep page suffix
|
| 1069 |
+
return val_str.replace(temp_path, orig_name)
|
| 1070 |
+
return val_str
|
| 1071 |
+
result_df['pdf_input'] = result_df['pdf_input'].apply(replace_temp_path)
|
| 1072 |
+
|
| 1073 |
# Save CSV
|
| 1074 |
with tempfile.NamedTemporaryFile(mode='w', suffix='_classified.csv', delete=False) as f:
|
| 1075 |
result_df.to_csv(f.name, index=False)
|