"""Gradio viewer that overlays paragraph and date annotation boxes on PDF pages.

The user uploads a PDF and a JSON annotation file.  Each page is rasterised
at 300 DPI (the resolution the JSON bounding boxes are expressed in), the
boxes are drawn on top of it, and the paragraph texts are listed in a side
panel next to the image.
"""

import html
import json
import os
import tempfile

import gradio as gr
from pdf2image import convert_from_path
from PIL import Image, ImageDraw, ImageFont

# Colors for annotations
PARA_COLOR = (255, 0, 0)      # Red
DATE_COLOR = (0, 255, 0)      # Green
HOVER_COLOR = (255, 165, 0)   # Orange

POPLER_PATH = "/usr/bin"

# Label font: candidates are tried in order before falling back to Pillow's
# built-in font.
_FONT_SIZE = 32
_FONT_CANDIDATES = (
    "/usr/share/fonts/truetype/dejavu/DejaVuSans.ttf",
    "arial.ttf",
)

# NOTE(review): the text this file was restored from had the HTML tags inside
# its string literals stripped.  The tags and the panel/message styles below
# are a minimal reconstruction guided by the surviving comments ("scrollable
# container", "all text in black", "fixed height to match image") -- confirm
# against the intended design.  The two paragraph styles are the original ones.
_PANEL_STYLE = "height: 600px; overflow-y: auto; color: black;"
_MESSAGE_STYLE = "padding: 10px; color: black;"
_HIGHLIGHT_STYLE = (
    "background-color: #fff3cd; padding: 10px; margin: 5px; "
    "border-left: 4px solid #ffc107;"
)
_NORMAL_STYLE = (
    "background-color: #f8f9fa; padding: 10px; margin: 5px; "
    "border-left: 2px solid #ddd;"
)


def _load_font(size=_FONT_SIZE):
    """Return the first loadable label font at *size*, else Pillow's default."""
    for candidate in _FONT_CANDIDATES:
        try:
            return ImageFont.truetype(candidate, size)
        except (OSError, ImportError):
            # OSError: font file not found/unreadable.
            # ImportError: Pillow was built without FreeType.
            continue
    try:
        # Older Pillow releases do not accept ``size`` here (TypeError).
        return ImageFont.load_default(size=size)
    except (TypeError, OSError, ImportError):
        return ImageFont.load_default()


def _int_bbox(item):
    """Return *item*'s ``bbox`` as ``(left, top, right, bottom)`` integers.

    A missing or null box becomes ``(0, 0, 0, 0)``.  Corners are reordered so
    that left <= right and top <= bottom, because recent Pillow versions
    reject inverted rectangles.
    """
    x1, y1, x2, y2 = map(int, item.get("bbox") or [0, 0, 0, 0])
    return min(x1, x2), min(y1, y2), max(x1, x2), max(y1, y2)


def annotate_image(page_img, paragraphs, highlight_id=None):
    """Draw paragraph and date boxes on *page_img* and return it.

    The image is modified in place.  Box coordinates are used as given, i.e.
    they are assumed to already be in the pixel space of *page_img*.

    Args:
        page_img: PIL image of the page.
        paragraphs: iterable of dicts with optional ``bbox``,
            ``paragraph_id`` and ``dates`` (each date having ``bbox`` and
            ``date_id``).
        highlight_id: paragraph id to draw in the highlight colour with a
            thicker outline; compared as strings.

    Returns:
        The same *page_img* object, annotated.
    """
    draw = ImageDraw.Draw(page_img)
    font = _load_font()

    for para in paragraphs:
        x1, y1, x2, y2 = _int_bbox(para)
        para_id = para.get("paragraph_id", "")

        if str(para_id) == str(highlight_id):
            color, width = HOVER_COLOR, 3
        else:
            color, width = PARA_COLOR, 2

        draw.rectangle([x1, y1, x2, y2], outline=color, width=width)
        # The label uses the same colour as its box.
        draw.text((x1 + 5, y1 + 5), str(para_id), fill=color, font=font)

        for date in para.get("dates") or []:
            dx1, dy1, dx2, dy2 = _int_bbox(date)
            date_id = date.get("date_id", "")
            draw.rectangle([dx1, dy1, dx2, dy2], outline=DATE_COLOR, width=2)
            draw.text(
                (dx1 + 5, dy1 + 5), str(date_id), fill=DATE_COLOR, font=font
            )

    return page_img


def _message_html(text):
    """Wrap a plain-text status message for display in the side panel."""
    return f'<div style="{_MESSAGE_STYLE}">{html.escape(str(text))}</div>'


def _format_confidence(value):
    """Format *value* as a percentage; fall back to its escaped text form."""
    try:
        return f"{float(value):.1%}"
    except (TypeError, ValueError):
        return html.escape(str(value))


def _render_side_panel(paragraphs, page_num, highlight_id):
    """Build the side-panel HTML listing each paragraph's text and dates.

    All values taken from the annotation JSON are HTML-escaped, since that
    file is user supplied.
    """
    parts = [f'<div style="{_PANEL_STYLE}">', f"<h3>Page {page_num}</h3>"]

    for para in paragraphs:
        para_id = para.get("paragraph_id", "")
        llm_text = para.get("llm_text", "No text")
        highlighted = str(para_id) == str(highlight_id)
        style = _HIGHLIGHT_STYLE if highlighted else _NORMAL_STYLE

        parts.append(f'<div style="{style}">')
        parts.append(f"<strong>Paragraph {html.escape(str(para_id))}</strong>")
        parts.append(f"<p>{html.escape(str(llm_text))}</p>")

        dates = para.get("dates") or []
        if dates:
            parts.append("<div><strong>Dates:</strong>")
            for date in dates:
                date_id = html.escape(str(date.get("date_id", "")))
                transcription = html.escape(
                    str(date.get("transcription", "N/A"))
                )
                confidence = _format_confidence(date.get("confidence", 0))
                parts.append(
                    f"<div>Date {date_id}: {transcription} ({confidence})</div>"
                )
            parts.append("</div>")

        parts.append("</div>")  # close paragraph

    parts.append("</div>")  # close scrollable container
    return "\n".join(parts)


def process_documents(pdf_path, json_path, page_num=1, highlight_id=None):
    """Render one annotated PDF page plus its side-panel HTML.

    The page is converted at 300 DPI to match the JSON annotations.
    Annotations are looked up under the key ``"<pdf basename>_page_<n>"``.

    Args:
        pdf_path: path to the PDF file.
        json_path: path to the annotation JSON file.
        page_num: 1-based page number; converted with ``int``.
        highlight_id: paragraph id to highlight, or None.

    Returns:
        A 4-tuple ``(image_path, html, page_num, marker)``.  ``image_path``
        is a PNG temp file, or None when the page has no content or an error
        occurred (``html`` then carries the message).  The callers in this
        file ignore the last element; its values are kept as they were.
    """
    try:
        page = int(page_num)

        with open(json_path, "r", encoding="utf-8") as f:
            data = json.load(f)

        pages = convert_from_path(
            pdf_path,
            dpi=300,
            first_page=page,
            last_page=page,
            poppler_path=POPLER_PATH,
        )
        if not pages:
            return None, "No content", 1, "1"

        pdf_name = os.path.splitext(os.path.basename(pdf_path))[0]
        page_key = f"{pdf_name}_page_{page}"
        paragraphs = data.get(page_key, {}).get("paragraphs", [])

        # The rendered page is local to this call, so it is annotated
        # directly instead of copying a full 300 DPI image first.
        annotated_img = annotate_image(pages[0], paragraphs, highlight_id)

        # Write through the handle and close it; the file itself is kept
        # (delete=False) because the UI reads it after this function returns.
        # NOTE: nothing removes these files afterwards.
        with tempfile.NamedTemporaryFile(delete=False, suffix=".png") as tmp:
            annotated_img.save(tmp, format="PNG")
            image_path = tmp.name

        text_content = _render_side_panel(paragraphs, page, highlight_id)
        return image_path, text_content, page, "?"

    except Exception as e:
        # UI boundary: report any failure in the side panel instead of
        # raising into the event handler.
        return None, _message_html(f"Error: {e}"), page_num, "1"


def get_total_pages(pdf_path):
    """Return the page count of *pdf_path*, or 1 if it cannot be determined."""
    try:
        from pdf2image import pdfinfo_from_path

        info = pdfinfo_from_path(pdf_path, poppler_path=POPLER_PATH)
        return info["Pages"]
    except Exception as e:
        print("PDF info error:", e)
        return 1


# ---------------- GRADIO INTERFACE ---------------- #
with gr.Blocks() as demo:
    gr.Markdown("# PDF Annotation Viewer")
    gr.Markdown("Upload a PDF and JSON file to view annotations")

    current_page = gr.State(1)
    current_pdf = gr.State(None)
    current_json = gr.State(None)
    total_pages = gr.State(1)

    with gr.Row():
        pdf_input = gr.File(label="PDF File", file_types=[".pdf"])
        json_input = gr.File(label="JSON File", file_types=[".json"])

    with gr.Row():
        with gr.Column(scale=2):
            with gr.Row():
                prev_btn = gr.Button("← Prev")
                page_display = gr.Number(
                    value=1, label="Page", minimum=1, interactive=True
                )
                next_btn = gr.Button("Next →")
                total_display = gr.Textbox("?", label="of", interactive=False)

            image_output = gr.Image(
                label="Annotated Page", type="filepath", height=600
            )

        with gr.Column(scale=1):
            text_output = gr.HTML(
                label="Text Content",
                value=_message_html("Upload files to begin"),
            )

    highlight_input = gr.Textbox(visible=False)

    # ----------------- FUNCTIONS ----------------- #
    def load_files(pdf_file, json_file):
        """Render page 1 once both files are present and store them in state."""
        if not pdf_file or not json_file:
            return None, "Please upload both files", 1, "?", None, None, 1

        try:
            total = get_total_pages(pdf_file.name)
            image_path, text, _, _ = process_documents(
                pdf_file.name, json_file.name, 1
            )
            return image_path, text, 1, str(total), pdf_file, json_file, total
        except Exception as e:
            return (
                None, f"Error loading files: {str(e)}", 1, "?", None, None, 1
            )

    def update_page(page_num, pdf_file, json_file, highlight=None):
        """Render *page_num*; the last returned value resets the highlight box."""
        if not pdf_file or not json_file:
            return None, "Files not loaded", page_num, ""

        image_path, text, _, _ = process_documents(
            pdf_file.name, json_file.name, page_num, highlight
        )
        return image_path, text, page_num, ""

    def navigate(direction, current, total, pdf_file, json_file, highlight):
        """Step one page in *direction* ("next"/"prev"), staying in range."""
        current = int(current)
        total = int(total)

        if direction == "next" and current < total:
            new_page = current + 1
        elif direction == "prev" and current > 1:
            new_page = current - 1
        else:
            new_page = current

        return update_page(new_page, pdf_file, json_file, highlight)

    def go_prev(current, total, pdf_file, json_file, highlight):
        """Button handler: go to the previous page."""
        return navigate("prev", current, total, pdf_file, json_file, highlight)

    def go_next(current, total, pdf_file, json_file, highlight):
        """Button handler: go to the next page."""
        return navigate("next", current, total, pdf_file, json_file, highlight)

    def text_click(evt: gr.SelectData):
        """Turn a selection event into the highlight id string."""
        # NOTE(review): a falsy index (e.g. 0) yields "" -- confirm intended.
        return str(evt.index) if evt.index else ""

    # ----------------- EVENTS ----------------- #
    load_outputs = [
        image_output,
        text_output,
        current_page,
        total_display,
        current_pdf,
        current_json,
        total_pages,
    ]
    nav_inputs = [
        current_page, total_pages, current_pdf, current_json, highlight_input
    ]
    nav_outputs = [image_output, text_output, page_display, highlight_input]

    pdf_input.change(
        load_files, inputs=[pdf_input, json_input], outputs=load_outputs
    )
    json_input.change(
        load_files, inputs=[pdf_input, json_input], outputs=load_outputs
    )

    text_output.select(
        text_click,
        None,
        highlight_input,
    ).then(
        update_page,
        [current_page, current_pdf, current_json, highlight_input],
        [image_output, text_output, page_display, highlight_input],
    )

    prev_btn.click(go_prev, inputs=nav_inputs, outputs=nav_outputs)
    next_btn.click(go_next, inputs=nav_inputs, outputs=nav_outputs)

    page_display.change(
        update_page,
        inputs=[page_display, current_pdf, current_json, highlight_input],
        outputs=[image_output, text_output, current_page, highlight_input],
    )

if __name__ == "__main__":
    demo.launch()