Spaces:

doeqoth
/

pdfk

Running

App Files Files Community

PISAN committed on Jun 7, 2025

Commit

c5d7fde

verified ·

1 Parent(s): 057c155

Update app.py

Browse files

Files changed (1) hide show

app.py +384 -441

app.py CHANGED Viewed

@@ -1,3 +1,4 @@
 import gradio as gr
 import pandas as pd
 import json
@@ -7,35 +8,62 @@ from datetime import datetime
 import traceback
 import tempfile
 import os
-# ติดตั้ง dependencies ที่จำเป็น
 try:
     from PyPDF2 import PdfReader, PdfWriter
     from reportlab.pdfgen import canvas
     from reportlab.lib.pagesizes import letter
     from reportlab.pdfbase import pdfmetrics
     from reportlab.pdfbase.ttfonts import TTFont
-except ImportError as e:
-    print(f"กำลังติดตั้ง dependencies: {e}")
-    import subprocess
-    import sys
     subprocess.check_call([sys.executable, "-m", "pip", "install", "PyPDF2", "reportlab", "pandas"])
     from PyPDF2 import PdfReader, PdfWriter
     from reportlab.pdfgen import canvas
     from reportlab.lib.pagesizes import letter
 def analyze_pdf_fields(pdf_path):
-    """วิเคราะห์ฟิลด์ใน PDF"""
     try:
         reader = PdfReader(pdf_path)
         all_fields = {}
         # ตรวจสอบจาก AcroForm
         if reader.trailer.get("/Root") and reader.trailer["/Root"].get("/AcroForm"):
             acro_form = reader.trailer["/Root"]["/AcroForm"]
             if "/Fields" in acro_form:
-                fields = acro_form["/Fields"]
-                for field in fields:
                     field_obj = field.get_object()
                     if "/T" in field_obj:
                         field_name = str(field_obj["/T"]).strip("()")
@@ -46,28 +74,22 @@ def analyze_pdf_fields(pdf_path):
                             'default_value': field_value,
                             'method': 'AcroForm'
                         }
-        # ตรวจสอบจาก Annotations
         for page_num, page in enumerate(reader.pages):
             if "/Annots" in page:
-                try:
-                    annotations = page["/Annots"]
-                    for annotation in annotations:
-                        annot_obj = annotation.get_object()
-                        if annot_obj.get("/Subtype") == "/Widget":
-                            if "/T" in annot_obj:
-                                field_name = str(annot_obj["/T"]).strip("()")
-                                field_type = str(annot_obj.get("/FT", "Widget"))
-                                field_value = str(annot_obj.get("/V", "")).strip("()")
-                                all_fields[field_name] = {
-                                    'type': field_type,
-                                    'default_value': field_value,
-                                    'page': page_num + 1,
-                                    'method': 'Annotation'
-                                }
-                except Exception:
-                    continue
         return all_fields
     except Exception as e:
         return {"error": str(e)}
@@ -76,42 +98,12 @@ def generate_csv_template(pdf_fields, num_rows=5):
     """สร้าง CSV template จาก PDF fields"""
     if not pdf_fields or "error" in pdf_fields:
         return None, "ไม่สามารถสร้าง CSV template ได้"
-    # สร้าง DataFrame ว่าง
-    template_data = {}
-    # เพิ่มคอลัมน์ ID
-    template_data['id'] = list(range(1, num_rows + 1))
-    # เพิ่มคอลัมน์จาก PDF fields
-    for field_name, field_info in pdf_fields.items():
         if field_name and field_name.strip():
             clean_name = field_name.strip()
-            # ใส่ค่าตัวอย่าง
-            if field_info.get('default_value') and field_info['default_value'].strip():
-                sample_value = field_info['default_value']
-            else:
-                # สร้างค่าตัวอย่าง
-                if 'name' in clean_name.lower():
-                    sample_value = f"ชื่อตัวอย่าง {{}}"
-                elif 'date' in clean_name.lower() or 'วันที่' in clean_name:
-                    sample_value = "2024-01-01"
-                elif 'email' in clean_name.lower():
-                    sample_value = "example{}@email.com"
-                elif 'phone' in clean_name.lower() or 'เบอร์' in clean_name:
-                    sample_value = "08-1234-567{}"
-                elif 'address' in clean_name.lower() or 'ที่อยู่' in clean_name:
-                    sample_value = "123 ถนนตัวอย่าง กรุงเทพ {}"
-                else:
-                    sample_value = f"ข้อมูลตัวอย่าง {{}}"
-            # สร้างข้อมูลตัวอย่าง
-            template_data[clean_name] = [
-                sample_value.format(i) if '{}' in sample_value else sample_value
-                for i in range(1, num_rows + 1)
-            ]
-    # สร้าง DataFrame
     df = pd.DataFrame(template_data)
     return df, "สร้าง CSV template สำเร็จ"
@@ -119,503 +111,454 @@ def generate_json_template(pdf_fields):
     """สร้าง JSON template จาก PDF fields"""
     if not pdf_fields or "error" in pdf_fields:
         return None, "ไม่สามารถสร้าง JSON template ได้"
     template = {
-        "pdf_info": {
-            "total_fields": len(pdf_fields),
-            "generation_time": datetime.now().isoformat()
-        },
         "fields": {},
         "sample_data": []
     }
-    # เพิ่มข้อมูล fields
     for field_name, field_info in pdf_fields.items():
         if field_name and field_name.strip():
-            clean_name = field_name.strip()
-            template["fields"][clean_name] = {
-                "type": field_info.get('type', 'Unknown'),
-                "default_value": field_info.get('default_value', ''),
-                "page": field_info.get('page', 1),
-                "method": field_info.get('method', 'Unknown')
-            }
-    # สร้างข้อมูลตัวอย่าง
-    for i in range(1, 4):  # 3 ตัวอย่าง
         sample_record = {"id": i}
         for field_name in template["fields"].keys():
-            if 'name' in field_name.lower():
-                sample_record[field_name] = f"ชื่อตัวอย่าง {i}"
-            elif 'date' in field_name.lower() or 'วันที่' in field_name:
-                sample_record[field_name] = f"2024-0{i}-01"
-            elif 'email' in field_name.lower():
-                sample_record[field_name] = f"example{i}@email.com"
-            else:
-                sample_record[field_name] = f"ข้อมูลตัวอย่าง {i}"
         template["sample_data"].append(sample_record)
     return template, "สร้าง JSON template สำเร็จ"
-def create_template_files(pdf_file, num_rows=5):
-    """สร้างไฟล์ template ทั้งหมด"""
     if pdf_file is None:
-        return None, None, "❌ กรุณาอัพโหลดไฟล์ PDF"
     try:
-        # วิเคราะห์ PDF
-        pdf_fields = analyze_pdf_fields(pdf_file)
         if not pdf_fields or "error" in pdf_fields:
-            return None, None, "❌ ไม่พบ form fields ใน PDF หรือไม่สามารถอ่านได้"
-        # สร้าง CSV template
-        csv_df, csv_msg = generate_csv_template(pdf_fields, num_rows)
-        # สร้าง JSON template
-        json_template, json_msg = generate_json_template(pdf_fields)
         if csv_df is None or json_template is None:
-            return None, None, "❌ ไม่สามารถสร้าง template ได้"
-        # สร้าง ZIP file
         zip_buffer = io.BytesIO()
         timestamp = datetime.now().strftime("%Y%m%d_%H%M%S")
-        with zipfile.ZipFile(zip_buffer, 'w', zipfile.ZIP_DEFLATED) as zip_file:
-            # เพิ่ม CSV
             csv_buffer = io.StringIO()
             csv_df.to_csv(csv_buffer, index=False, encoding='utf-8-sig')
-            zip_file.writestr(f"template_{timestamp}.csv", csv_buffer.getvalue())
-            # เพิ่ม JSON
             json_str = json.dumps(json_template, ensure_ascii=False, indent=2)
-            zip_file.writestr(f"template_{timestamp}.json", json_str)
-            # เพิ่ม README
             readme_content = f"""# PDF Form Template Files
 Generated on: {datetime.now().strftime('%Y-%m-%d %H:%M:%S')}
-## Files included:
-1. template_{timestamp}.csv - CSV template with sample data
-2. template_{timestamp}.json - JSON template with field information
-## PDF Fields Found: {len(pdf_fields)}
-{chr(10).join([f"- {name}: {info.get('type', 'Unknown')}" for name, info in pdf_fields.items()])}
-## How to use:
-1. Edit the CSV file with your actual data
-2. Use the CSV file with the original PDF form filler
-3. The JSON file contains detailed field information for reference
-## Note:
-- Make sure column names in CSV match the field names in PDF
-- You can add more rows to the CSV as needed
-- Keep the column headers exactly as shown
 """
-            zip_file.writestr("README.txt", readme_content)
         zip_buffer.seek(0)
-        # บันทึกไฟล์ชั่วคราว
-        temp_zip_path = os.path.join(tempfile.gettempdir(), f"pdf_templates_{timestamp}.zip")
-        with open(temp_zip_path, 'wb') as f:
             f.write(zip_buffer.getvalue())
-        result_msg = f"✅ สร้าง template สำเร็จ!\n"
-        result_msg += f"🔍 พบ {len(pdf_fields)} fields ใน PDF\n"
-        result_msg += f"📄 CSV template: {num_rows} แถวตัวอย่าง\n"
-        result_msg += f"📋 JSON template: รายละเอียดครบถ้วน\n"
-        result_msg += f"📁 README: คำแนะนำการใช้งาน"
-        return temp_zip_path, pdf_fields, result_msg
     except Exception as e:
-        return None, None, f"❌ เกิดข้อผิดพลาด: {str(e)}"
 def fill_pdf_form(pdf_path, field_data):
-    """เติมข้อมูลในฟอร์ม PDF"""
-    try:
-        reader = PdfReader(pdf_path)
-        writer = PdfWriter()
-        # คัดลอกหน้าทั้งหมด
-        for page in reader.pages:
-            writer.add_page(page)
-        # เติมข้อมูลในฟอร์ม
-        if hasattr(writer, 'update_page_form_field_values'):
-            for page_num, page in enumerate(writer.pages):
-                try:
-                    writer.update_page_form_field_values(page, field_data)
-                except Exception:
-                    pass
-        # ลองวิธีอื่น
-        elif "/AcroForm" in reader.trailer.get("/Root", {}):
-            try:
-                acro_form = reader.trailer["/Root"]["/AcroForm"]
-                if "/Fields" in acro_form:
-                    fields = acro_form["/Fields"]
-                    for field in fields:
-                        field_obj = field.get_object()
-                        if "/T" in field_obj:
-                            field_name = str(field_obj["/T"]).strip("()")
-                            if field_name in field_data:
-                                try:
-                                    field_obj.update({"/V": field_data[field_name]})
-                                except Exception:
-                                    pass
-            except Exception:
-                pass
-        return writer
-    except Exception as e:
-        raise Exception(f"ไม่สามารถเติมฟอร์มได้: {str(e)}")
 def create_simple_pdf(data_row, filename):
-    """สร้าง PDF ใหม่แบบง่าย"""
     buffer = io.BytesIO()
     p = canvas.Canvas(buffer, pagesize=letter)
     width, height = letter
-    # ตั้งค่า font
-    p.setFont("Helvetica", 12)
-    # หัวเรื่อง
-    p.setFont("Helvetica-Bold", 16)
-    title = f"Document: {filename.replace('.pdf', '')}"
-    p.drawString(50, height - 50, title)
     p.line(50, height - 60, 550, height - 60)
-    # เนื้อหา
-    y_position = height - 100
-    p.setFont("Helvetica", 12)
     for column, value in data_row.items():
         if pd.notna(value) and str(value).strip():
-            clean_column = str(column).strip()
-            clean_value = str(value).strip()
-            if len(clean_value) > 80:
-                clean_value = clean_value[:77] + "..."
-            text = f"{clean_column}: {clean_value}"
             try:
                 p.drawString(50, y_position, text)
             except:
-                safe_text = text.encode('ascii', errors='ignore').decode('ascii')
                 p.drawString(50, y_position, safe_text)
-            y_position -= 25
             if y_position < 50:
                 p.showPage()
-                p.setFont("Helvetica", 12)
                 y_position = height - 50
-    # เวลาที่สร้าง
-    p.setFont("Helvetica", 8)
-    timestamp = datetime.now().strftime("%Y-%m-%d %H:%M:%S")
-    p.drawString(50, 30, f"Created: {timestamp}")
     p.save()
     buffer.seek(0)
     return buffer.getvalue()
-def process_single_row(pdf_path, row_data, filename, use_form=True):
-    """ประมวลผลแถวเดียว"""
-    try:
-        # เตรียมข้อมูลฟิลด์
-        field_data = {}
-        for column, value in row_data.items():
-            if pd.notna(value) and str(value).strip():
-                clean_value = str(value).strip()
-                clean_column = str(column).strip()
-                # ลองหลายรูปแบบของชื่อฟิลด์
-                field_variations = [
-                    clean_column,
-                    clean_column.lower(),
-                    clean_column.upper(),
-                    clean_column.replace('_', ' '),
-                    clean_column.replace(' ', '_'),
-                    clean_column.replace('-', '_'),
-                    clean_column.replace('_', '')
-                ]
-                for variation in field_variations:
-                    field_data[variation] = clean_value
-        if use_form:
-            try:
-                # ลองเติมฟอร์ม
-                writer = fill_pdf_form(pdf_path, field_data)
-                output_buffer = io.BytesIO()
-                writer.write(output_buffer)
-                output_buffer.seek(0)
-                return output_buffer.getvalue(), "form_filled"
-            except Exception as e:
-                # ถ้าไม่ได้ ให้สร้างใหม่
-                pdf_content = create_simple_pdf(row_data, filename)
-                return pdf_content, f"new_pdf_created: {str(e)}"
-        else:
-            # สร้าง PDF ใหม่
-            pdf_content = create_simple_pdf(row_data, filename)
-            return pdf_content, "new_pdf_created"
-    except Exception as e:
-        return None, f"error: {str(e)}"
 def read_csv_safe(csv_file):
-    """อ่าน CSV อย่างปลอดภัย"""
-    encodings = ['utf-8', 'utf-8-sig', 'cp874', 'tis-620', 'iso-8859-1', 'cp1252']
-    separators = [',', ';', '\t', '|']
     for encoding in encodings:
         for sep in separators:
             try:
-                df = pd.read_csv(csv_file, encoding=encoding, sep=sep, engine='python')
-                if len(df.columns) > 1 and len(df) > 0:
                     return df, None
             except Exception:
                 continue
-    try:
-        df = pd.read_csv(csv_file)
-        return df, None
-    except Exception as e:
-        return None, str(e)
 def process_pdf_csv(pdf_file, csv_file, filename_column, file_prefix, use_form_fields, progress=gr.Progress()):
     """ฟังก์ชันหลักสำหรับประมวลผล PDF และ CSV"""
-    if pdf_file is None or csv_file is None:
-        return None, "❌ กรุณาอัพโหลดไฟล์ PDF และ CSV"
     try:
-        # อ่าน CSV
         df, csv_error = read_csv_safe(csv_file)
         if df is None:
             return None, f"❌ ไม่สามารถอ่าน CSV ได้: {csv_error}"
-        # วิเคราะห์ PDF
-        pdf_fields = analyze_pdf_fields(pdf_file)
-        has_form_fields = bool(pdf_fields and "error" not in pdf_fields and pdf_fields)
-        # เก็บ PDF ที่สร้าง
         generated_pdfs = {}
-        success_count = 0
-        error_count = 0
-        processing_log = []
-        # ประมวลผลแต่ละแถว
-        for index, (_, row) in enumerate(df.iterrows()):
-            progress((index + 1) / len(df), f"ประมวลผล {index + 1}/{len(df)}")
             try:
-                # สร้างชื่อไฟล์
-                if filename_column and filename_column in df.columns and pd.notna(row[filename_column]):
-                    safe_name = str(row[filename_column]).strip()
-                    safe_name = "".join(c for c in safe_name if c.isalnum() or c in (' ', '-', '_')).strip()
-                    filename = f"{file_prefix}_{safe_name}.pdf"
                 else:
-                    filename = f"{file_prefix}_{index + 1:03d}.pdf"
-                filename = filename.replace('  ', ' ').replace(' ', '_')
-                if not filename.endswith('.pdf'):
-                    filename += '.pdf'
-                # ประมวลผล
-                pdf_content, status = process_single_row(
-                    pdf_file,
-                    row,
-                    filename,
-                    use_form_fields and has_form_fields
-                )
-                if pdf_content is not None:
-                    generated_pdfs[filename] = pdf_content
-                    success_count += 1
-                    processing_log.append(f"✅ {filename}: {status}")
-                else:
-                    error_count += 1
-                    processing_log.append(f"❌ {filename}: {status}")
             except Exception as e:
-                error_count += 1
-                processing_log.append(f"💥 แถว {index + 1}: {str(e)}")
-        # สร้าง ZIP
-        if generated_pdfs:
-            zip_buffer = io.BytesIO()
-            with zipfile.ZipFile(zip_buffer, 'w', zipfile.ZIP_DEFLATED) as zip_file:
-                for filename, pdf_content in generated_pdfs.items():
-                    zip_file.writestr(filename, pdf_content)
-            zip_buffer.seek(0)
-            # สร้างชื่อไฟล์ ZIP
-            timestamp = datetime.now().strftime("%Y%m%d_%H%M%S")
-            zip_filename = f"generated_pdfs_{timestamp}.zip"
-            # บันทึกไฟล์ชั่วคราว
-            temp_zip_path = os.path.join(tempfile.gettempdir(), zip_filename)
-            with open(temp_zip_path, 'wb') as f:
-                f.write(zip_buffer.getvalue())
-            result_message = f"✅ สร้าง PDF สำเร็จ {success_count} ไฟล์!"
-            if error_count > 0:
-                result_message += f"\n⚠️ มีข้อผิดพลาด {error_count} ไฟล์"
-            result_message += f"\n\n📋 รายละเอียด:\n" + "\n".join(processing_log[:10])
-            if len(processing_log) > 10:
-                result_message += f"\n... และอีก {len(processing_log) - 10} รายการ"
-            return temp_zip_path, result_message
-        else:
-            return None, "❌ ไม่สามารถสร้าง PDF ได้เลย"
     except Exception as e:
-        return None, f"❌ เกิดข้อผิดพลาด: {str(e)}\n{traceback.format_exc()}"
 def analyze_pdf_info(pdf_file):
-    """วิเคราะห์ข้อมูล PDF"""
     if pdf_file is None:
         return "ยังไม่มีไฟล์ PDF"
     try:
-        reader = PdfReader(pdf_file)
-        info = f"📄 **ข้อมูล PDF:**\n"
-        info += f"- จำนวนหน้า: {len(reader.pages)}\n"
-        # ตรวจสอบฟิลด์
-        pdf_fields = analyze_pdf_fields(pdf_file)
-        if pdf_fields and "error" not in pdf_fields and pdf_fields:
-            info += f"- จำนวน Form Fields: {len(pdf_fields)}\n"
-            info += f"\n🏷️ **รายชื่อ Fields:**\n"
-            for name, details in list(pdf_fields.items())[:10]:  # แสดงแค่ 10 ตัวแรก
-                info += f"  - {name} ({details.get('type', 'Unknown')})\n"
             if len(pdf_fields) > 10:
                 info += f"  - ... และอีก {len(pdf_fields) - 10} fields\n"
         else:
-            info += "- Form Fields: ไม่พบหรือไม่สามารถอ่านได้\n"
-            info += "- หมายเหตุ: จะสร้าง PDF ใหม่แทน\n"
         return info
     except Exception as e:
-        return f"❌ ไม่สามารถวิเคราะห์ PDF ได้: {str(e)}"
 def analyze_csv_info(csv_file):
-    """วิเคราะห์ข้อมูล CSV"""
     if csv_file is None:
-        return "ยังไม่มีไฟล์ CSV"
     try:
         df, error = read_csv_safe(csv_file)
         if df is None:
-            return f"❌ ไม่สามารถอ่าน CSV ได้: {error}"
-        info = f"📋 **ข้อมูล CSV:**\n"
-        info += f"- จำนวนแถว: {len(df)}\n"
-        info += f"- จำนวนคอลัมน์: {len(df.columns)}\n"
-        info += f"\n📝 **รายชื่อคอลัมน์:**\n"
-        for col in df.columns[:15]:  # แสดงแค่ 15 คอลัมน์แรก
-            info += f"  - {col}\n"
         if len(df.columns) > 15:
             info += f"  - ... และอีก {len(df.columns) - 15} คอลัมน์\n"
-        # ตรวจสอบข้อมูลที่ขาด
-        missing_data = df.isnull().sum()
-        if missing_data.any():
-            missing_cols = missing_data[missing_data > 0]
-            if len(missing_cols) > 0:
-                info += f"\n⚠️ **ข้อมูลที่ขาดหาย:**\n"
-                for col, count in missing_cols.head(5).items():
-                    info += f"  - {col}: {count} แถว\n"
-        return info
     except Exception as e:
-        return f"❌ ไม่สามารถวิเคราะห์ CSV ได้: {str(e)}"
-# สร้าง Gradio Interface
 def create_interface():
     with gr.Blocks(title="PDF Form Filler & Template Generator", theme=gr.themes.Soft()) as app:
-        gr.Markdown("""
-        # 📄 เครื่องมือเติมข้อมูล PDF จาก CSV + สร้าง Template
-        **เครื่องมือนี้สามารถ:**
-        - 🔄 **สร้าง CSV/JSON Template จาก PDF** (Reverse Engineering)
-        - 📝 เติมข้อมูลลงในฟอร์ม PDF ที่มี form fields
-        - 🆕 สร้าง PDF ใหม่หากไม่มี form fields หรือเติมไม่ได้
-        - 🌐 รองรับ CSV หลาย encoding (UTF-8, TIS-620, CP874, etc.)
-        - 📦 ส่งออกเป็นไฟล์ ZIP
-        """)
         with gr.Tabs():
-            # Tab 1: Template Generator
-            with gr.TabItem("🔄 สร้าง Template"):
-                gr.Markdown("""
-                ## 🔄 สร้าง CSV/JSON Template จาก PDF
-                **อัพโหลด PDF ที่มี form fields แล้วสร้าง template ให้อัตโนมัติ**
-                """)
                 with gr.Row():
                     with gr.Column(scale=1):
-                        template_pdf = gr.File(
-                            label="📄 PDF ที่ต้องการสร้าง Template",
-                            file_types=[".pdf"],
-                            type="filepath"
-                        )
-                        num_sample_rows = gr.Slider(
-                            label="จำนวนแถวตัวอย่างใน CSV",
-                            minimum=1,
-                            maximum=20,
-                            value=5,
-                            step=1
-                        )
-                        generate_template_btn = gr.Button(
-                            "🔄 สร้าง Template",
-                            variant="primary",
-                            size="lg"
-                        )
                     with gr.Column(scale=2):
-                        template_pdf_info = gr.Markdown("ยังไม่มีไฟล์ PDF")
-                        template_result_file = gr.File(
-                            label="📦 ไฟล์ Template (ZIP)",
-                            visible=False
-                        )
-                        template_result_message = gr.Markdown("")
-            # Tab 2: PDF Form Filler
-            with gr.TabItem("📝 เติมข้อมูล PDF"):
-                gr.Markdown("""
-                ## 📝 เติมข้อมูล PDF จาก CSV
-                **ใช้ CSV ที่สร้างจาก Template หรือ CSV ของคุณเอง**
-                """)
                 with gr.Row():
                     with gr.Column(scale=1):
-                        gr.Markdown("### 📁 อัพโหลดไฟล์")
-                        pdf_file = gr.File(
-                            label="PDF Template",
-                            file_types=[".pdf"],
-                            type="filepath"
-                        )
-                        csv_file = gr.File(
-                            label="CSV Data",
-                            file_types=[".csv"],
-                            type="filepath"
-                        )
-                        gr.Markdown("### ⚙️ ตั้งค่

 import gradio as gr
 import pandas as pd
 import json
 import traceback
 import tempfile
 import os
+import sys
+import subprocess
+# --- ตรวจสอบและติดตั้ง Dependencies ---
 try:
     from PyPDF2 import PdfReader, PdfWriter
     from reportlab.pdfgen import canvas
     from reportlab.lib.pagesizes import letter
     from reportlab.pdfbase import pdfmetrics
     from reportlab.pdfbase.ttfonts import TTFont
+    print("Dependencies หลักถูกติดตั้งเรียบร้อยแล้ว")
+except ImportError:
+    print("กำลังติดตั้ง dependencies ที่จำเป็น: PyPDF2, reportlab, pandas")
     subprocess.check_call([sys.executable, "-m", "pip", "install", "PyPDF2", "reportlab", "pandas"])
     from PyPDF2 import PdfReader, PdfWriter
     from reportlab.pdfgen import canvas
     from reportlab.lib.pagesizes import letter
+# --- Dependencies เสริมสำหรับ AI และ OCR (จะแจ้งเตือนถ้าไม่มี) ---
+try:
+    from PIL import Image
+    import numpy as np
+    import cv2
+    import pytesseract
+    AI_OCR_ENABLED = True
+    print("Dependencies สำหรับ AI/OCR พร้อมใช้งาน")
+except ImportError:
+    AI_OCR_ENABLED = False
+    print("คำเตือน: ไม่พบ Dependencies สำหรับ AI/OCR (Pillow, numpy, opencv-python, pytesseract)")
+    print("ฟังก์ชันที่เกี่ยวกับรูปภาพและ OCR จะไม่สามารถใช้งานได้")
+    print("ติดตั้งด้วย: pip install Pillow numpy opencv-python pytesseract และติดตั้ง Tesseract engine")
+try:
+    from gradio_client import Client
+    SAMBANOVA_AI_ENABLED = True
+    print("Dependencies สำหรับ SambaNova AI พร้อมใช้งาน")
+except ImportError:
+    SAMBANOVA_AI_ENABLED = False
+    print("คำเตือน: ไม่พบ Gradio Client (pip install 'gradio_client>=0.12.0')")
+    print("ฟังก์ชันที่ต้องใช้ AI Model จะไม่สามารถใช้งานได้")
+# ==============================================================================
+# ส่วนของฟังก์ชันหลัก (Core Functions)
+# ==============================================================================
 def analyze_pdf_fields(pdf_path):
+    """วิเคราะห์ฟิลด์ใน PDF และคืนค่าเป็น Dictionary"""
     try:
         reader = PdfReader(pdf_path)
         all_fields = {}
         # ตรวจสอบจาก AcroForm
         if reader.trailer.get("/Root") and reader.trailer["/Root"].get("/AcroForm"):
             acro_form = reader.trailer["/Root"]["/AcroForm"]
             if "/Fields" in acro_form:
+                for field in acro_form["/Fields"]:
                     field_obj = field.get_object()
                     if "/T" in field_obj:
                         field_name = str(field_obj["/T"]).strip("()")
                             'default_value': field_value,
                             'method': 'AcroForm'
                         }
+        # ตรวจสอบจาก Annotations ในแต่ละหน้า
         for page_num, page in enumerate(reader.pages):
             if "/Annots" in page:
+                for annotation in page["/Annots"]:
+                    annot_obj = annotation.get_object()
+                    if annot_obj.get("/Subtype") == "/Widget" and "/T" in annot_obj:
+                        field_name = str(annot_obj["/T"]).strip("()")
+                        if field_name not in all_fields: # เพิ่มเฉพาะที่ยังไม่มี
+                            field_type = str(annot_obj.get("/FT", "Widget"))
+                            field_value = str(annot_obj.get("/V", "")).strip("()")
+                            all_fields[field_name] = {
+                                'type': field_type,
+                                'default_value': field_value,
+                                'page': page_num + 1,
+                                'method': 'Annotation'
+                            }
         return all_fields
     except Exception as e:
         return {"error": str(e)}
     """สร้าง CSV template จาก PDF fields"""
     if not pdf_fields or "error" in pdf_fields:
         return None, "ไม่สามารถสร้าง CSV template ได้"
+    template_data = {'id': list(range(1, num_rows + 1))}
+    for field_name in pdf_fields.keys():
         if field_name and field_name.strip():
             clean_name = field_name.strip()
+            sample_value = f"ข้อมูลสำหรับ {clean_name} {{}}"
+            template_data[clean_name] = [sample_value.format(i) for i in range(1, num_rows + 1)]
     df = pd.DataFrame(template_data)
     return df, "สร้าง CSV template สำเร็จ"
     """สร้าง JSON template จาก PDF fields"""
     if not pdf_fields or "error" in pdf_fields:
         return None, "ไม่สามารถสร้าง JSON template ได้"
     template = {
+        "pdf_info": {"total_fields": len(pdf_fields), "generation_time": datetime.now().isoformat()},
         "fields": {},
         "sample_data": []
     }
     for field_name, field_info in pdf_fields.items():
         if field_name and field_name.strip():
+            template["fields"][field_name.strip()] = field_info
+    for i in range(1, 4):
         sample_record = {"id": i}
         for field_name in template["fields"].keys():
+            sample_record[field_name] = f"ข้อมูลตัวอย่าง {i}"
         template["sample_data"].append(sample_record)
     return template, "สร้าง JSON template สำเร็จ"
+def create_template_files(pdf_file, num_rows, progress=gr.Progress()):
+    """สร้างไฟล์ template (CSV, JSON, README) และรวมเป็น ZIP"""
     if pdf_file is None:
+        return None, "❌ กรุณาอัพโหลดไฟล์ PDF ก่อน"
+    progress(0, desc="กำลังวิเคราะห์ PDF...")
     try:
+        pdf_fields = analyze_pdf_fields(pdf_file.name)
         if not pdf_fields or "error" in pdf_fields:
+            return None, "❌ ไม่พบ Form Fields ใน PDF หรือไฟล์เสียหาย"
+        progress(0.3, desc="กำลังสร้าง CSV template...")
+        csv_df, _ = generate_csv_template(pdf_fields, num_rows)
+        progress(0.6, desc="กำลังสร้าง JSON template...")
+        json_template, _ = generate_json_template(pdf_fields)
         if csv_df is None or json_template is None:
+            return None, "❌ ไม่สามารถสร้างไฟล์ template ได้"
+        progress(0.8, desc="กำลังบีบอัดไฟล์เป็น ZIP...")
         zip_buffer = io.BytesIO()
         timestamp = datetime.now().strftime("%Y%m%d_%H%M%S")
+        with zipfile.ZipFile(zip_buffer, 'w', zipfile.ZIP_DEFLATED) as zip_f:
             csv_buffer = io.StringIO()
             csv_df.to_csv(csv_buffer, index=False, encoding='utf-8-sig')
+            zip_f.writestr(f"template_{timestamp}.csv", csv_buffer.getvalue())
             json_str = json.dumps(json_template, ensure_ascii=False, indent=2)
+            zip_f.writestr(f"template_{timestamp}.json", json_str)
             readme_content = f"""# PDF Form Template Files
 Generated on: {datetime.now().strftime('%Y-%m-%d %H:%M:%S')}
+PDF Fields Found: {len(pdf_fields)}
+{chr(10).join([f"- {name}" for name in pdf_fields.keys()])}
 """
+            zip_f.writestr("README.txt", readme_content)
         zip_buffer.seek(0)
+        # บันทึกไฟล์ ZIP ชั่วคราวเพื่อให้ Gradio ส่งให้ผู้ใช้ได้
+        temp_dir = tempfile.gettempdir()
+        zip_filename = f"pdf_templates_{timestamp}.zip"
+        temp_zip_path = os.path.join(temp_dir, zip_filename)
+        with open(temp_zip_path, "wb") as f:
             f.write(zip_buffer.getvalue())
+        progress(1, desc="สร้างไฟล์สำเร็จ!")
+        result_msg = f"✅ สร้าง template สำเร็จ!\n- พบ {len(pdf_fields)} fields\n- CSV มี {num_rows} แถวตัวอย่าง"
+        return temp_zip_path, result_msg
     except Exception as e:
+        return None, f"❌ เกิดข้อผิดพลาด: {e}\n{traceback.format_exc()}"
 def fill_pdf_form(pdf_path, field_data):
+    """เติมข้อมูลลงในฟอร์มของ PDF"""
+    reader = PdfReader(pdf_path)
+    writer = PdfWriter()
+    writer.append_pages_from_reader(reader)
+    # เติมข้อมูลในฟอร์ม
+    for page in writer.pages:
+        try:
+            writer.update_page_form_field_values(page, field_data, auto_regenerate=False)
+        except Exception:
+            # บางครั้ง field อยู่ในระดับ root
+            pass
+    try: # ลองเติมที่ root อีกครั้ง
+        writer.update_page_form_field_values(writer.pages[0], field_data)
+    except:
+        pass
+    output_buffer = io.BytesIO()
+    writer.write(output_buffer)
+    output_buffer.seek(0)
+    return output_buffer.getvalue()
 def create_simple_pdf(data_row, filename):
     """Render one data row as a plain text PDF and return its bytes.

     Used when the source PDF has no form fields. Each non-empty value is
     written as a ``column: value`` line below a title derived from
     ``filename``; a new page is started when the cursor drops below the
     bottom margin.

     Args:
         data_row: Mapping of column name to cell value.
         filename: Output file name; ``.pdf`` is removed for the title.

     Returns:
         bytes: The generated PDF document.
     """
     # Prefer the Thai-capable font. Reuse it when it is already registered
     # (e.g. at application start-up) instead of re-loading it on every call
     # and falling back to Helvetica just because the local file is missing.
     font_name = 'THSarabunNew'
     if font_name not in pdfmetrics.getRegisteredFontNames():
         try:
             pdfmetrics.registerFont(TTFont(font_name, 'THSarabunNew.ttf'))
         except Exception:
             font_name = 'Helvetica'  # Fallback
     buffer = io.BytesIO()
     p = canvas.Canvas(buffer, pagesize=letter)
     _, height = letter
     # Title and separator line.
     p.setFont(font_name, 16)
     p.drawString(50, height - 50, f"เอกสาร: {filename.replace('.pdf', '')}")
     p.line(50, height - 60, 550, height - 60)
     y_position = height - 90
     p.setFont(font_name, 12)
     for column, value in data_row.items():
         # Skip missing and whitespace-only cells.
         if not pd.notna(value) or not str(value).strip():
             continue
         text = f"{str(column).strip()}: {str(value).strip()}"
         try:
             p.drawString(50, y_position, text)
         except Exception:
             # Last resort: replace characters the font cannot encode.
             safe_text = text.encode('latin-1', 'replace').decode('latin-1')
             p.drawString(50, y_position, safe_text)
         y_position -= 20
         if y_position < 50:
             # Bottom margin reached: continue on a fresh page. The font has
             # to be set again because showPage resets the drawing state.
             p.showPage()
             p.setFont(font_name, 12)
             y_position = height - 50
     p.save()
     return buffer.getvalue()
 def read_csv_safe(csv_file):
     """Read a CSV file, trying several encodings and separators.

     Args:
         csv_file: Either a path string or an upload object exposing the
             path through a ``.name`` attribute (as Gradio provides).

     Returns:
         tuple: ``(DataFrame, None)`` on success, ``(None, error_message)``
         when no encoding/separator combination could parse the file.
     """
     encodings = ('utf-8-sig', 'utf-8', 'cp874', 'tis-620')
     separators = (',', ';', '\t')
     # Accept both upload objects (path in .name) and plain path strings.
     filepath = getattr(csv_file, "name", csv_file)
     single_column = None
     for encoding in encodings:
         for sep in separators:
             try:
                 df = pd.read_csv(filepath, encoding=encoding, sep=sep, engine='python')
             except Exception:
                 continue
             # More than one column means the separator guess was right.
             if len(df.columns) > 1:
                 return df, None
             # Remember the first single-column parse: a file that really has
             # only one column is valid and must not be rejected.
             if single_column is None and len(df.columns) == 1:
                 single_column = df
     if single_column is not None:
         return single_column, None
     return None, "ไม่สามารถอ่านไฟล์ CSV ได้ ลองตรวจสอบ Encoding (ควรเป็น UTF-8) และ Separator (ควรเป็น ,)"
 def process_pdf_csv(pdf_file, csv_file, filename_column, file_prefix, use_form_fields, progress=gr.Progress()):
     """Generate one PDF per CSV row and bundle the results into a ZIP file.

     Args:
         pdf_file: Uploaded PDF (path available through ``.name``).
         csv_file: Uploaded CSV, read with ``read_csv_safe``.
         filename_column: Optional CSV column whose value names each output.
         file_prefix: Prefix placed in front of every generated file name.
         use_form_fields: When true and the PDF has form fields, the form is
             filled; otherwise a simple text PDF is created for each row.
         progress: Gradio progress reporter.

     Returns:
         tuple: ``(zip_path, message)`` on success, ``(None, message)`` on
         failure.
     """
     if not pdf_file or not csv_file:
         return None, "❌ กรุณาอัพโหลดทั้งไฟล์ PDF และ CSV"
     try:
         df, csv_error = read_csv_safe(csv_file)
         if df is None:
             return None, f"❌ ไม่สามารถอ่าน CSV ได้: {csv_error}"
         pdf_path = pdf_file.name
         pdf_fields = analyze_pdf_fields(pdf_path)
         has_form_fields = bool(pdf_fields and "error" not in pdf_fields)
         use_name_column = bool(filename_column) and filename_column in df.columns
         generated_pdfs = {}
         used_names = set()
         log = []
         total_rows = len(df)
         # Count rows by position so progress and numbering stay correct even
         # when the DataFrame index is not 0..n-1.
         for position, (_, row) in enumerate(df.iterrows(), start=1):
             progress(position / total_rows, f"ประมวลผลแถวที่ {position}/{total_rows}")
             # Build the output name; fall back to the row number when the
             # chosen column is empty or contains no usable characters.
             safe_name = ""
             if use_name_column and pd.notna(row[filename_column]):
                 safe_name = "".join(
                     c for c in str(row[filename_column]) if c.isalnum() or c in (' ', '-', '_')
                 ).strip()
             stem = f"{file_prefix}_{safe_name}" if safe_name else f"{file_prefix}_{position:03d}"
             filename = f"{stem}.pdf"
             # Two rows may map to the same name; add a counter instead of
             # silently overwriting the earlier document.
             duplicate = 2
             while filename in used_names:
                 filename = f"{stem}_{duplicate}.pdf"
                 duplicate += 1
             used_names.add(filename)
             row_data = row.to_dict()
             try:
                 if use_form_fields and has_form_fields:
                     # Fill the existing PDF form.
                     pdf_content = fill_pdf_form(pdf_path, row_data)
                     status = "เติมฟอร์มสำเร็จ"
                 else:
                     # Create a new PDF from scratch.
                     pdf_content = create_simple_pdf(row_data, filename)
                     status = "สร้าง PDF ใหม่" if not has_form_fields else "สร้าง PDF ใหม่ (Fallback)"
                 generated_pdfs[filename] = pdf_content
                 log.append(f"✅ {filename}: {status}")
             except Exception as e:
                 # One bad row must not abort the whole batch.
                 log.append(f"❌ {filename}: เกิดข้อผิดพลาด - {e}")
         if not generated_pdfs:
             return None, "❌ ไม่สามารถสร้าง PDF ได้เลย\n" + "\n".join(log)
         # Write the ZIP straight to a uniquely named temp file so concurrent
         # requests within the same second cannot clobber each other.
         timestamp = datetime.now().strftime("%Y%m%d_%H%M%S")
         fd, temp_zip_path = tempfile.mkstemp(prefix=f"generated_pdfs_{timestamp}_", suffix=".zip")
         os.close(fd)
         with zipfile.ZipFile(temp_zip_path, 'w', zipfile.ZIP_DEFLATED) as zip_f:
             for filename, pdf_content in generated_pdfs.items():
                 zip_f.writestr(filename, pdf_content)
             zip_f.writestr("processing_log.txt", "\n".join(log))
         result_message = f"✅ สร้าง PDF สำเร็จ {len(generated_pdfs)} ไฟล์!\nดูรายละเอียดใน processing_log.txt"
         return temp_zip_path, result_message
     except Exception as e:
         return None, f"❌ เกิดข้อผิดพลาดร้ายแรง: {e}\n{traceback.format_exc()}"
+# ==============================================================================
+# ส่วนของฟังก์ชัน AI และ OCR (ทางเลือก)
+# ==============================================================================
def init_sambanova_ai():
    """Initialize the SambaNova AI model client.

    The Hugging Face token is read from the ``HF_TOKEN`` environment variable
    instead of being hard-coded; when it is not set the client is created
    without a token.

    Returns:
        The ``Client`` instance, or ``None`` when the feature is disabled or
        the client could not be created.
    """
    if not SAMBANOVA_AI_ENABLED:
        print("SambaNova AI is disabled.")
        return None
    # Credentials must not live in source code; an empty value means "no token".
    hf_token = os.environ.get("HF_TOKEN") or None
    try:
        # gradio_client.Client is used here rather than gr.load (original note:
        # gr.load may be problematic).
        client = Client("sambanova/Llama-3-8B-Instruct", hf_token=hf_token)
        print("SambaNova AI client initialized successfully.")
        return client
    except Exception as e:
        print(f"Error initializing SambaNova AI: {e}")
        return None
def extract_text_from_image(image_file):
    """Extract text from an image file using Tesseract OCR.

    Args:
        image_file: Uploaded image (path available through ``.name``).

    Returns:
        tuple: ``(text, status_message)``; ``text`` is empty when OCR is
        unavailable, no image was given, or OCR failed.
    """
    if not AI_OCR_ENABLED or image_file is None:
        return "", "OCR is not available or no image provided."
    try:
        # Configure Tesseract to detect both Thai and English.
        custom_config = r'--oem 3 --psm 6 -l tha+eng'
        # The context manager closes the image file handle after OCR.
        with Image.open(image_file.name) as image:
            text = pytesseract.image_to_string(image, config=custom_config)
        return text.strip(), "Text extracted successfully."
    except Exception as e:
        return "", f"OCR Error: {e}. ตรวจสอบว่าติดตั้ง Tesseract Engine ถูกต้อง"
def image_to_csv_with_ai(image_file, progress=gr.Progress()):
    """Convert data from an image to a CSV file using OCR and AI structuring.

    The image is read with OCR, the raw text is sent to the AI client with a
    prompt asking for ``key: value`` lines, and the parsed pairs are written
    as a one-row CSV (keys become the column headers).

    Args:
        image_file: Uploaded image (path available through ``.name``).
        progress: Gradio progress reporter.

    Returns:
        tuple: ``(csv_path, message)`` on success, ``(None, message)`` on
        failure.
    """
    if not AI_OCR_ENABLED:
        return None, "❌ ฟังก์ชันนี้ต้องการ AI/OCR dependencies"
    if image_file is None:
        return None, "❌ กรุณาอัพโหลดรูปภาพ"
    progress(0.2, desc="กำลังอ่านข้อความจากรูปภาพ (OCR)...")
    raw_text, ocr_status = extract_text_from_image(image_file)
    if not raw_text:
        return None, f"❌ ไม่พบข้อความในรูปภาพ: {ocr_status}"
    progress(0.5, desc="กำลังใช้ AI จัดโครงสร้างข้อมูล...")
    ai_client = init_sambanova_ai()
    if not ai_client:
        return None, "❌ ไม่สามารถเชื่อมต่อ AI Model ได้"
    prompt = f"""
From the following text, extract key-value pairs. The output should be only the data in 'key: value' format, one per line.
Example:
Name: John Doe
Address: 123 Main St
Date: 2024-01-15
Text to process:
---
{raw_text}
---
"""
    try:
        # Call the model through the gradio_client API.
        result = ai_client.predict(message=prompt, api_name="/chat")
        progress(0.8, desc="กำลังสร้างไฟล์ CSV...")
        # Split each line on the first colon only (values may contain colons)
        # and trim both sides so headers and cells carry no stray whitespace.
        data = []
        for line in result.strip().splitlines():
            key, colon, value = line.partition(':')
            if colon and key.strip():
                data.append((key.strip(), value.strip()))
        if not data:
            return None, "AI ไม่สามารถจัดโครงสร้างข้อมูลได้"
        df = pd.DataFrame(data, columns=['Field', 'Value']).set_index('Field').T
        # Let pandas write the file itself: this applies the BOM encoding and
        # avoids doubled line endings from re-writing buffered text in text mode.
        timestamp = datetime.now().strftime("%Y%m%d_%H%M%S")
        fd, temp_csv_path = tempfile.mkstemp(prefix=f"extracted_data_{timestamp}_", suffix=".csv")
        os.close(fd)
        df.to_csv(temp_csv_path, index=False, encoding='utf-8-sig')
        return temp_csv_path, "✅ แปลงรูปภาพเป็น CSV สำเร็จ"
    except Exception as e:
        return None, f"❌ เกิดข้อผิดพลาดระหว่างประมวลผลด้วย AI: {e}"
+# ==============================================================================
+# ส่วนของ UI Analysis Functions
+# ==============================================================================
 def analyze_pdf_info(pdf_file):
     """Build the Markdown summary of an uploaded PDF shown in the UI.

     Reports the page count and, when form fields are found, how many there
     are together with up to ten of their names. Returns a placeholder text
     when no file is given and an error text when the PDF cannot be read.
     """
     if pdf_file is None:
         return "ยังไม่มีไฟล์ PDF"
     try:
         page_count = len(PdfReader(pdf_file.name).pages)
         parts = [f"📄 **ข้อมูล PDF:**\n- จำนวนหน้า: {page_count}\n"]
         fields = analyze_pdf_fields(pdf_file.name)
         if not fields or "error" in fields:
             # No usable form: the tool will generate new PDFs instead.
             parts.append("- **ไม่พบ Form Fields** (จะใช้วิธีสร้าง PDF ใหม่ทับลงบนกระดาษเปล่า)\n")
         else:
             field_total = len(fields)
             parts.append(f"- **พบ Form Fields: {field_total} ช่อง** (จะใช้วิธีเติมฟอร์ม)\n")
             parts.append("\n🏷️ **ตัวอย่างชื่อ Fields:**\n")
             # Only the first ten names are listed; the rest are summarised.
             parts.extend(f"  - `{name}`\n" for name in list(fields)[:10])
             if field_total > 10:
                 parts.append(f"  - ... และอีก {field_total - 10} fields\n")
         return "".join(parts)
     except Exception as exc:
         return f"❌ ไม่สามารถวิเคราะห์ PDF: {exc}"
 def analyze_csv_info(csv_file):
     """Summarise an uploaded CSV and refresh the filename-column dropdown.

     Returns a pair: the Markdown summary (row count, column count and up to
     fifteen column names) and a ``gr.update`` carrying the dropdown choices.
     The choices are emptied when there is no file or it cannot be read.
     """
     if csv_file is None:
         return "ยังไม่มีไฟล์ CSV", gr.update(choices=[], value=None)
     try:
         df, error = read_csv_safe(csv_file)
         if df is None:
             return f"❌ ไม่สามารถอ่าน CSV: {error}", gr.update(choices=[], value=None)
         columns = df.columns
         column_total = len(columns)
         parts = [
             f"📋 **ข้อมูล CSV:**\n- จำนวนแถว: {len(df)}\n- จำนวนคอลัมน์: {column_total}\n",
             "\n📝 **รายชื่อคอลัมน์:**\n",
         ]
         # Show at most fifteen column names, then summarise the remainder.
         parts.extend(f"  - `{col}`\n" for col in columns[:15])
         if column_total > 15:
             parts.append(f"  - ... และอีก {column_total - 15} คอลัมน์\n")
         # Offer every column as a possible source for output file names.
         return "".join(parts), gr.update(choices=columns.tolist(), value=None)
     except Exception as exc:
         return f"❌ ไม่สามารถวิเคราะห์ CSV: {exc}", gr.update(choices=[], value=None)
+# ==============================================================================
+# ส่วนของการสร้าง Gradio Interface
+# ==============================================================================
 def create_interface():
     """Build the Gradio Blocks application and wire its event handlers.

     The UI has three tabs: template generation from a PDF, filling PDFs from
     a CSV, and image-to-CSV conversion (active only when ``AI_OCR_ENABLED``
     is true).

     Returns:
         The configured ``gr.Blocks`` application (not yet launched).
     """
     with gr.Blocks(title="PDF Form Filler & Template Generator", theme=gr.themes.Soft()) as app:
         gr.Markdown("# 📄 เครื่องมือจัดการ PDF จากข้อมูล CSV")
         gr.Markdown("รองรับการ **สร้าง Template** จาก PDF, **เติมข้อมูล** จาก CSV, และ **แปลงรูปภาพเป็น CSV** ด้วย AI")
         with gr.Tabs():
             # --- Tab 1: create a template ---
             with gr.TabItem("🔄 1. สร้าง Template"):
                 gr.Markdown("## สร้าง CSV/JSON Template จาก PDF ที่มี Form Fields")
                 with gr.Row():
                     with gr.Column(scale=1):
                         template_pdf = gr.File(label="📄 อัพโหลด PDF ต้นฉบับ", file_types=[".pdf"])
                         num_sample_rows = gr.Slider(label="จำนวนแถวตัวอย่างใน CSV", minimum=1, maximum=50, value=5, step=1)
                         generate_template_btn = gr.Button("🚀 สร้าง Template", variant="primary")
                     with gr.Column(scale=2):
                         template_pdf_info = gr.Markdown("อัพโหลด PDF เพื่อดูข้อมูล...")
                         template_result_file = gr.File(label="📦 ดาวน์โหลดไฟล์ Template (ZIP)", interactive=False)
                         template_result_message = gr.Markdown()
             # --- Tab 2: fill PDFs from CSV data ---
             with gr.TabItem("📝 2. เติมข้อมูล PDF"):
                 # Heading text repaired: the original literal contained
                 # corrupted characters in the middle of the word.
                 gr.Markdown("## เติมข้อมูลลงใน PDF จากไฟล์ CSV")
                 with gr.Row():
                     with gr.Column(scale=1):
                         gr.Markdown("### 📂 1. อัพโหลดไฟล์")
                         pdf_file = gr.File(label="📄 PDF Form ต้นฉบับ", file_types=[".pdf"])
                         csv_file = gr.File(label="📊 CSV ข้อมูล", file_types=[".csv"])
                         gr.Markdown("### ⚙️ 2. ตั้งค่า")
                         use_form_fields = gr.Checkbox(label="พยายามเติมข้อมูลลงใน Form Fields ที่มีอยู่", value=True)
                         file_prefix = gr.Textbox(label="คำนำหน้าชื่อไฟล์ (Prefix)", value="Document")
                         filename_column = gr.Dropdown(label="เลือกคอลัมน์ที่จะใช้เป็นชื่อไฟล์ (ถ้ามี)", interactive=True)
                         fill_form_btn = gr.Button("🚀 เริ่มเติมข้อมูล", variant="primary")
                     with gr.Column(scale=2):
                         pdf_info = gr.Markdown("อัพโหลด PDF เพื่อดูข้อมูล...")
                         csv_info = gr.Markdown("อัพโหลด CSV เพื่อดูข้อมูล...")
                         gr.Markdown("---")
                         filled_result_file = gr.File(label="📦 ดาวน์โหลด PDF ทั้งหมด (ZIP)", interactive=False)
                         filled_result_message = gr.Markdown()
             # --- Tab 3: Image to CSV (AI) ---
             with gr.TabItem("🖼️ 3. แปลงรูปภาพเป็น CSV (AI)"):
                 gr.Markdown("## ใช้ OCR และ AI เพื่อดึงข้อมูลจากรูปภาพและสร้างเป็นไฟล์ CSV")
                 with gr.Row():
                     with gr.Column(scale=1):
                         image_upload = gr.File(label="🖼️ อัพโหลดรูปภาพ (บิล, เอกสาร, ฯลฯ)", file_types=["image"])
                         # The button is hidden when the OCR/AI libraries are missing.
                         image_to_csv_btn = gr.Button("🤖 แปลงเป็น CSV", variant="primary", visible=AI_OCR_ENABLED)
                         if not AI_OCR_ENABLED:
                             gr.Markdown("⚠️ *ฟังก์ชันนี้ถูกปิดใช้งานเนื่องจากไม่พบ Library ที่จำเป็น (Pillow, OpenCV, Pytesseract)*")
                     with gr.Column(scale=2):
                         image_csv_output = gr.File(label="📄 ดาวน์โหลดไฟล์ CSV ที่ได้", interactive=False)
                         image_csv_message = gr.Markdown()
         # --- Event handlers ---
         # Uploading a file refreshes the matching summary panel.
         template_pdf.change(fn=analyze_pdf_info, inputs=template_pdf, outputs=template_pdf_info)
         generate_template_btn.click(
             fn=create_template_files,
             inputs=[template_pdf, num_sample_rows],
             outputs=[template_result_file, template_result_message]
         )
         pdf_file.change(fn=analyze_pdf_info, inputs=pdf_file, outputs=pdf_info)
         # A new CSV also repopulates the filename-column dropdown.
         csv_file.change(fn=analyze_csv_info, inputs=csv_file, outputs=[csv_info, filename_column])
         fill_form_btn.click(
             fn=process_pdf_csv,
             inputs=[pdf_file, csv_file, filename_column, file_prefix, use_form_fields],
             outputs=[filled_result_file, filled_result_message]
         )
         # The image handler is only wired when the feature is available.
         if AI_OCR_ENABLED:
             image_to_csv_btn.click(
                 fn=image_to_csv_with_ai,
                 inputs=[image_upload],
                 outputs=[image_csv_output, image_csv_message]
             )
     return app
+# --- Launch the application ---
if __name__ == "__main__":
    # Register a Thai-capable font up front so PDF generation can use it.
    # Candidates are tried in order: the Windows system font first, then a
    # font file placed next to the application.
    font_candidates = ('C:/Windows/Fonts/THSARI.TTF', 'THSarabunNew.ttf')
    font_registered = False
    try:
        from reportlab.pdfbase import pdfmetrics
        from reportlab.pdfbase.ttfonts import TTFont
    except ImportError:
        font_candidates = ()
    for font_path in font_candidates:
        try:
            pdfmetrics.registerFont(TTFont('THSarabunNew', font_path))
        except Exception:
            # Missing or unreadable font file: try the next candidate.
            continue
        font_registered = True
        break
    if font_registered:
        print("ลงทะเบียน Font 'THSarabunNew' สำหรับ ReportLab สำเร็จ")
    else:
        print("คำเตือน: ไม่พบ Font 'THSarabunNew' ในระบบ อาจทำให้การสร้าง PDF ภาษาไทยมีปัญหา")
        print("แนะนำให้ติดตั้งฟอนต์ TH SarabunPSK หรือปรับแก้ path ของฟอนต์ในโค้ด")
    app = create_interface()
    app.launch(debug=True)