Spaces:

ABDALLALSWAITI
/

htmlpdf

Sleeping

App Files Files Community

ABDALLALSWAITI committed on Oct 16, 2025

Commit

e0bb645

verified ·

1 Parent(s): 1fce321

Update src/streamlit_app.py

Browse files

Files changed (1) hide show

src/streamlit_app.py +48 -37

src/streamlit_app.py CHANGED Viewed

@@ -20,8 +20,9 @@ def convert_html_to_pdf(html_content, aspect_ratio):
         aspect_ratio: One of "16:9", "1:1", or "9:16"
     Returns:
-        Path to generated PDF file or error message
     """
     try:
         # Create temporary directory for processing
         temp_dir = tempfile.mkdtemp()
@@ -31,12 +32,17 @@ def convert_html_to_pdf(html_content, aspect_ratio):
         with open(html_file, 'w', encoding='utf-8') as f:
             f.write(html_content)
         # Run Node.js script to convert HTML to PDF
         result = subprocess.run(
-            ['node', 'puppeteer_pdf.js', html_file, aspect_ratio],
             capture_output=True,
             text=True,
-            timeout=60
         )
         if result.returncode != 0:
@@ -48,18 +54,22 @@ def convert_html_to_pdf(html_content, aspect_ratio):
         if not os.path.exists(pdf_file):
             return None, "PDF file was not generated"
-        # Copy PDF to a permanent location
-        output_pdf = os.path.join(tempfile.gettempdir(), f"output_{os.getpid()}.pdf")
-        shutil.copy(pdf_file, output_pdf)
         # Clean up temporary directory
         shutil.rmtree(temp_dir, ignore_errors=True)
-        return output_pdf, None
     except subprocess.TimeoutExpired:
         return None, "Error: PDF conversion timed out (60 seconds)"
     except Exception as e:
         return None, f"Error: {str(e)}"
 # Page header
@@ -80,7 +90,8 @@ with tab1:
         uploaded_file = st.file_uploader(
             "Choose an HTML file",
             type=['html', 'htm'],
-            key="file_uploader"
         )
         aspect_ratio_file = st.radio(
@@ -96,30 +107,34 @@ with tab1:
     with col2:
         if convert_file_btn:
             if uploaded_file is not None:
-                with st.spinner("Converting HTML to PDF..."):
-                    # Read uploaded file
-                    html_content = uploaded_file.read().decode('utf-8')
-                    # Convert to PDF
-                    pdf_path, error = convert_html_to_pdf(html_content, aspect_ratio_file)
-                    if error:
-                        st.error(error)
-                    else:
-                        st.success("✅ PDF generated successfully!")
-                        # Read PDF file
-                        with open(pdf_path, 'rb') as f:
-                            pdf_data = f.read()
-                        # Download button
-                        st.download_button(
-                            label="⬇️ Download PDF",
-                            data=pdf_data,
-                            file_name="converted.pdf",
-                            mime="application/pdf",
-                            use_container_width=True
-                        )
             else:
                 st.warning("Please upload an HTML file first.")
@@ -176,21 +191,17 @@ with tab2:
             if html_code and html_code.strip():
                 with st.spinner("Converting HTML to PDF..."):
                     # Convert to PDF
-                    pdf_path, error = convert_html_to_pdf(html_code, aspect_ratio_text)
                     if error:
                         st.error(error)
                     else:
                         st.success("✅ PDF generated successfully!")
-                        # Read PDF file
-                        with open(pdf_path, 'rb') as f:
-                            pdf_data = f.read()
-                        # Download button
                         st.download_button(
                             label="⬇️ Download PDF",
-                            data=pdf_data,
                             file_name="converted.pdf",
                             mime="application/pdf",
                             use_container_width=True

         aspect_ratio: One of "16:9", "1:1", or "9:16"
     Returns:
+        Tuple of (pdf_bytes, error_message)
     """
+    temp_dir = None
     try:
         # Create temporary directory for processing
         temp_dir = tempfile.mkdtemp()
         with open(html_file, 'w', encoding='utf-8') as f:
             f.write(html_content)
+        # Get the path to puppeteer_pdf.js (it's in parent directory)
+        script_dir = os.path.dirname(os.path.abspath(__file__))
+        puppeteer_script = os.path.join(os.path.dirname(script_dir), 'puppeteer_pdf.js')
         # Run Node.js script to convert HTML to PDF
         result = subprocess.run(
+            ['node', puppeteer_script, html_file, aspect_ratio],
             capture_output=True,
             text=True,
+            timeout=60,
+            cwd=os.path.dirname(script_dir)
         )
         if result.returncode != 0:
         if not os.path.exists(pdf_file):
             return None, "PDF file was not generated"
+        # Read PDF file into memory
+        with open(pdf_file, 'rb') as f:
+            pdf_bytes = f.read()
         # Clean up temporary directory
         shutil.rmtree(temp_dir, ignore_errors=True)
+        return pdf_bytes, None
     except subprocess.TimeoutExpired:
+        if temp_dir:
+            shutil.rmtree(temp_dir, ignore_errors=True)
         return None, "Error: PDF conversion timed out (60 seconds)"
     except Exception as e:
+        if temp_dir:
+            shutil.rmtree(temp_dir, ignore_errors=True)
         return None, f"Error: {str(e)}"
 # Page header
         uploaded_file = st.file_uploader(
             "Choose an HTML file",
             type=['html', 'htm'],
+            key="file_uploader",
+            help="Upload an HTML file (max 200MB)"
         )
         aspect_ratio_file = st.radio(
     with col2:
         if convert_file_btn:
             if uploaded_file is not None:
+                try:
+                    with st.spinner("Converting HTML to PDF..."):
+                        # Read uploaded file with proper encoding handling
+                        try:
+                            html_content = uploaded_file.read().decode('utf-8')
+                        except UnicodeDecodeError:
+                            # Try with latin-1 encoding if utf-8 fails
+                            uploaded_file.seek(0)
+                            html_content = uploaded_file.read().decode('latin-1')
+                        # Convert to PDF
+                        pdf_bytes, error = convert_html_to_pdf(html_content, aspect_ratio_file)
+                        if error:
+                            st.error(error)
+                        else:
+                            st.success("✅ PDF generated successfully!")
+                            # Download button with PDF bytes
+                            st.download_button(
+                                label="⬇️ Download PDF",
+                                data=pdf_bytes,
+                                file_name=f"{uploaded_file.name.replace('.html', '.pdf').replace('.htm', '.pdf')}",
+                                mime="application/pdf",
+                                use_container_width=True
+                            )
+                except Exception as e:
+                    st.error(f"Error processing file: {str(e)}")
             else:
                 st.warning("Please upload an HTML file first.")
             if html_code and html_code.strip():
                 with st.spinner("Converting HTML to PDF..."):
                     # Convert to PDF
+                    pdf_bytes, error = convert_html_to_pdf(html_code, aspect_ratio_text)
                     if error:
                         st.error(error)
                     else:
                         st.success("✅ PDF generated successfully!")
+                        # Download button with PDF bytes
                         st.download_button(
                             label="⬇️ Download PDF",
+                            data=pdf_bytes,
                             file_name="converted.pdf",
                             mime="application/pdf",
                             use_container_width=True