Spaces:

orgoflu
/

moro_text

Sleeping

orgoflu committed on Sep 10, 2025

Commit

908d904

verified ·

1 Parent(s): 3bd5481

app.py

Files changed (1) hide show

app.py ADDED Viewed

+import gradio as gr
+import trafilatura
+import requests
+def extract(url):
+    headers = {"User-Agent": "Mozilla/5.0"}
+    try:
+        r = requests.get(url, headers=headers, timeout=10)
+        r.raise_for_status()
+        text = trafilatura.extract(r.text)
+        return text or "본문을 추출할 수 없습니다."
+    except requests.exceptions.Timeout:
+        return "요청이 시간 초과되었습니다."
+    except requests.exceptions.RequestException as e:
+        return f"요청 실패: {e}"
+    except Exception as e:
+        return f"에러 발생: {e}"
+iface = gr.Interface(
+    fn=extract,
+    inputs=gr.Textbox(label="URL 입력", placeholder="https://example.com"),
+    outputs=gr.Textbox(label="추출된 본문", lines=20),
+    title="본문 추출기",
+    description="웹페이지 URL을 입력하면 본문만 추출합니다."
+)
+if __name__ == "__main__":
+    iface.launch()