Spaces:

JaishnaCodz
/

BlogReviewer

Sleeping

JaishnaCodz committed on Jul 15, 2025

Commit

2c83941

verified ·

1 Parent(s): 16e02f2

Update app.py

Files changed (1) hide show

app.py CHANGED Viewed

@@ -1,5 +1,5 @@
 import gradio as gr
-from newspaper import Article
 from transformers import pipeline
 import pytesseract
 from PIL import Image
@@ -20,14 +20,13 @@ def extract_text_from_image_url(img_url):
         return f"❌ OCR Error: {e}"
 # Extract blog
-def extract_text_from_url(url):
-    try:
-        article = Article(url)
-        article.download()
-        article.parse()
-        return article.text
-    except Exception as e:
-        return f"❌ Blog Error: {e}"
 # Review line-by-line
 def review_lines(text):

 import gradio as gr
+import trafilatura
 from transformers import pipeline
 import pytesseract
 from PIL import Image
         return f"❌ OCR Error: {e}"
 # Extract blog
+def extract_text_from_url(url):
+    """Fetch the page at *url* and return its main text.
+
+    Never raises and never returns None: every failure is reported as a
+    "❌ Blog Error: ..." string, mirroring the error-string convention of
+    the OCR helper in this file.
+    """
+    try:
+        downloaded = trafilatura.fetch_url(url)
+        if not downloaded:
+            return "❌ Blog Error: Could not fetch content from the URL."
+        # extract() yields None when it cannot find any main text, so the
+        # result must be checked before it is handed to the caller.
+        text = trafilatura.extract(downloaded)
+    except Exception as e:
+        # Top-level UI boundary: surface the failure as a message instead
+        # of crashing the app, as the previous implementation did.
+        return f"❌ Blog Error: {e}"
+    if not text:
+        return "❌ Blog Error: Could not extract text from the page."
+    return text
 # Review line-by-line
 def review_lines(text):