Spaces:
Sleeping
Sleeping
File size: 8,100 Bytes
099275d 26632cd 1510e20 099275d 1510e20 9c87ed0 099275d 9c87ed0 1ab2895 9c87ed0 1ab2895 099275d 883e33e 099275d 883e33e 099275d 883e33e 099275d 883e33e 099275d 6ceb267 1510e20 099275d 1510e20 099275d 6ceb267 1510e20 099275d 6ceb267 1510e20 099275d 1510e20 099275d c1e25dc 099275d 1510e20 |
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24 25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48 49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65 66 67 68 69 70 71 72 73 74 75 76 77 78 79 80 81 82 83 84 85 86 87 88 89 90 91 92 93 94 95 96 97 98 99 100 101 102 103 104 105 106 107 108 109 110 111 112 113 114 115 116 117 118 119 120 121 122 123 124 125 126 127 128 129 130 131 132 133 134 135 136 137 138 139 140 141 142 143 144 145 146 147 148 149 150 151 152 153 154 155 156 157 158 159 160 161 162 163 164 165 166 167 168 169 170 171 172 173 174 175 176 177 178 179 180 181 182 183 184 185 186 187 188 189 190 191 192 193 194 195 196 197 |
import gradio as gr
import os
import json
from utils import (
get_salesforce_client, get_salesforce_objects, get_object_fields,
extract_text_from_pdf, extract_key_value_pairs, map_fields,
create_record, attach_pdf, log_failure
)
# Ensure uploads directory exists
os.makedirs("uploads", exist_ok=True)
# --- Gradio Interface Functions ---
def upload_pdfs(files):
uploaded_files = []
if isinstance(files, list):
for file in files:
if file is not None:
file_name = os.path.basename(file.name)
file_path = f"uploads/{file_name}"
try:
if hasattr(file, 'read'):
content = file.read()
else:
content = str(file).encode('utf-8')
with open(file_path, "wb") as f:
f.write(content)
uploaded_files.append(file_path)
except Exception as e:
return f"Error processing {file_name}: {str(e)}"
else:
if files is not None:
file_name = os.path.basename(files.name)
file_path = f"uploads/{file_name}"
try:
if hasattr(files, 'read'):
content = files.read()
else:
content = str(files).encode('utf-8')
with open(file_path, "wb") as f:
f.write(content)
uploaded_files.append(file_path)
except Exception as e:
return f"Error processing {file_name}: {str(e)}"
return f"Uploaded {len(uploaded_files)} PDF(s): {', '.join(uploaded_files)}"
def fetch_objects():
sf, error = get_salesforce_client()
if error:
return gr.update(choices=[]), f"Error: {error}"
objects, error = get_salesforce_objects(sf)
if error:
return gr.update(choices=[]), f"Error: {error}"
return gr.update(choices=objects), "Objects fetched successfully"
def fetch_fields(object_name):
sf, error = get_salesforce_client()
if error:
return gr.update(choices=[]), f"Error: {error}"
fields, error = get_object_fields(sf, object_name)
if error:
return gr.update(choices=[]), f"Error: {error}"
return gr.update(choices=fields), "Fields fetched successfully"
def process_pdf(pdf_paths):
if not pdf_paths or not isinstance(pdf_paths, list) or not pdf_paths[0]:
return "Error: No valid PDF file provided"
pdf_path = pdf_paths[0]
text_data, error = extract_text_from_pdf(pdf_path)
if error:
return f"Error: {error}"
kv_pairs, error = extract_key_value_pairs(pdf_path)
if error:
return f"Error: {error}"
return f"Text:\n{text_data}\n\nKey-Value Pairs:\n{kv_pairs}"
def display_mappings(pdf_paths, object_name):
if not pdf_paths or not isinstance(pdf_paths, list) or not pdf_paths[0]:
return "Error: No valid PDF file provided"
pdf_path = pdf_paths[0]
sf, error = get_salesforce_client()
if error:
return f"Error: {error}"
fields, error = get_object_fields(sf, object_name)
if error:
return f"Error: {error}"
extracted_data, error = extract_key_value_pairs(pdf_path)
if error:
return f"Error: {error}"
mappings, confidence_scores, error = map_fields(extracted_data, fields)
if error:
return f"Error: {error}"
output = ""
for key, field in mappings.items():
output += f"{key} -> {field} (Confidence: {confidence_scores[key]})\n"
return output
def migrate_to_salesforce(pdf_paths, object_name):
if not pdf_paths or not isinstance(pdf_paths, list) or not pdf_paths[0]:
return "Error: No valid PDF file provided"
pdf_path = pdf_paths[0]
sf, error = get_salesforce_client()
if error:
log_failure(pdf_path, object_name, error)
return f"Error: {error}"
extracted_data, error = extract_key_value_pairs(pdf_path)
if error:
log_failure(pdf_path, object_name, error)
return f"Error: {error}"
fields, error = get_object_fields(sf, object_name)
if error:
log_failure(pdf_path, object_name, error)
return f"Error: {error}"
mappings, _, error = map_fields(extracted_data, fields)
if error:
log_failure(pdf_path, object_name, error)
return f"Error: {error}"
data = {mappings[key]: value for key, value in zip(extracted_data[0]["keys"], extracted_data[0]["values"])}
record_id, error = create_record(sf, object_name, data)
if error:
log_failure(pdf_path, object_name, error)
return f"Error: {error}"
attach_status, error = attach_pdf(sf, record_id, pdf_path)
if error:
log_failure(pdf_path, object_name, error)
return f"Error: {error}"
return f"β
Record Created: {record_id}\nπ Attachment: {attach_status}"
def display_failures():
try:
with open("failures.json", "r") as f:
failures = [json.loads(line) for line in f]
output = ""
for idx, failure in enumerate(failures):
output += f"Failure {idx + 1}: PDF={failure['pdf']}, Object={failure['object']}, Error={failure['error']}\n"
return output
except FileNotFoundError:
return "No failures logged"
def retry_migration(pdf_path, object_name):
return migrate_to_salesforce([pdf_path], object_name)
# --- Gradio App Layout ---
with gr.Blocks(css="footer {display: none !important;}") as app:
gr.Markdown("# π§ Smart Contract Migrator")
with gr.Tab("π Upload & Process PDF"):
with gr.Row():
pdf_upload = gr.File(label="Upload Contract PDFs", file_count="multiple", file_types=[".pdf"])
upload_status = gr.Textbox(label="Status", interactive=False)
pdf_upload.change(upload_pdfs, inputs=pdf_upload, outputs=upload_status)
with gr.Row():
process_button = gr.Button("Extract Info")
process_output = gr.Textbox(label="Text & Key-Value Output", lines=6, interactive=False)
process_button.click(process_pdf, inputs=pdf_upload, outputs=process_output)
with gr.Tab("π Salesforce Integration"):
with gr.Row():
fetch_objects_button = gr.Button("π Get Objects")
object_dropdown = gr.Dropdown(label="Salesforce Object")
object_status = gr.Textbox(label="Status", interactive=False)
fetch_objects_button.click(fetch_objects, outputs=[object_dropdown, object_status])
with gr.Row():
fetch_fields_button = gr.Button("π Get Fields")
field_checkboxes = gr.CheckboxGroup(label="Fields")
field_status = gr.Textbox(label="Status", interactive=False)
fetch_fields_button.click(fetch_fields, inputs=object_dropdown, outputs=[field_checkboxes, field_status])
with gr.Row():
map_button = gr.Button("π Map Fields")
mapping_output = gr.Textbox(label="Mappings", lines=6, interactive=False)
map_button.click(display_mappings, inputs=[pdf_upload, object_dropdown], outputs=mapping_output)
with gr.Row():
migrate_button = gr.Button("π Migrate to Salesforce")
migrate_output = gr.Textbox(label="Migration Result", lines=4, interactive=False)
migrate_button.click(migrate_to_salesforce, inputs=[pdf_upload, object_dropdown], outputs=migrate_output)
with gr.Tab("π§Ύ Reconciliation"):
with gr.Row():
show_failures_button = gr.Button("π Show Failures")
failures_output = gr.Textbox(label="Failures", lines=6, interactive=False)
show_failures_button.click(display_failures, outputs=failures_output)
with gr.Row():
pdf_path_input = gr.Textbox(label="PDF Path to Retry")
retry_button = gr.Button("π Retry")
retry_output = gr.Textbox(label="Retry Status", interactive=False)
retry_button.click(retry_migration, inputs=[pdf_path_input, object_dropdown], outputs=retry_output)
# --- Launch App ---
app.launch()
|