Spaces:

arithescientist
/

text2speech

Runtime error

arithescientist commited on Jun 3, 2022

Commit

5cddb5b

1 Parent(s): 0f029ca

Create app.py

Files changed (1) hide show

app.py ADDED Viewed

+#**************** IMPORT PACKAGES ********************
+import gradio as gr
+import numpy as np
+import pytesseract as pt
+import pdf2image
+import os
+import tempfile
+from fpdf import FPDF
+import re
+import pdfkit
+import yake
+from zipfile import ZipFile
+from gtts import gTTS
+from pdfminer.high_level import extract_text
+def pdf_to_text(text, PDF):
+   if text == "":
+      # The setup of huggingface.co
+      file_obj = PDF
+      #n = int(Percent.replace('%', ''))
+      text = extract_text(file_obj.name)
+      outpit_text = text
+   else:
+      output_text = text
+      # Generate Summary
+      summary_ids = model.generate(inputs["input_ids"], num_beams=2,min_length=Min, max_length=Min+1000)
+      output_text  = tokenizer.batch_decode(summary_ids, skip_special_tokens=True, clean_up_tokenization_spaces=False)[0]
+   pdf = FPDF()
+   pdf.add_page()
+   pdf.set_font("Times", size = 12)
+  # open the text file in read mode
+   f = output_text
+  # insert the texts in pdf
+   pdf.multi_cell(190, 10, txt = f, align = 'C')
+  # save the pdf with name .pdf
+   pdf.output("text.pdf")
+   myobj = gTTS(text=output_text, lang='en', slow=False)
+   myobj.save("audio.wav")
+   return  "audio.wav", output_text, "text.pdf"
+  #  return path
+    #pageObject.extractText()
+iface = gr.Interface(fn = pdf_to_text,
+   inputs =["text", "file"], outputs=["audio","text", "file"] )
+if __name__ == "__main__":
+    iface.launch(share=True)