Spaces:
Sleeping
Sleeping
Update app.py
Browse files
app.py
CHANGED
|
@@ -12,15 +12,15 @@ import re
|
|
| 12 |
import torch
|
| 13 |
from transformers import AutoModelForCausalLM, AutoTokenizer, pipeline
|
| 14 |
|
| 15 |
-
# =====
|
| 16 |
MODEL_OPTIONS = {
|
| 17 |
-
"Qwen2.5-1.5B-Instruct (
|
| 18 |
-
"
|
| 19 |
-
"
|
| 20 |
-
"
|
| 21 |
}
|
| 22 |
|
| 23 |
-
# ===== 모델 로드
|
| 24 |
def load_model(model_name):
|
| 25 |
tokenizer = AutoTokenizer.from_pretrained(model_name)
|
| 26 |
model = AutoModelForCausalLM.from_pretrained(
|
|
@@ -42,7 +42,7 @@ def remove_duplicates(sentences):
|
|
| 42 |
result.append(s_clean)
|
| 43 |
return result
|
| 44 |
|
| 45 |
-
# ===== 자동요약
|
| 46 |
def summarize_text(text):
|
| 47 |
text = clean_text(text)
|
| 48 |
length = len(text)
|
|
@@ -75,7 +75,7 @@ def summarize_text(text):
|
|
| 75 |
summary_list.sort(key=lambda s: text.find(s))
|
| 76 |
return summary_list
|
| 77 |
|
| 78 |
-
# ===== LLM
|
| 79 |
def rewrite_with_llm(sentences, model_choice):
|
| 80 |
model_name = MODEL_OPTIONS[model_choice]
|
| 81 |
llm_pipeline = load_model(model_name)
|
|
@@ -129,14 +129,14 @@ iface = gr.Interface(
|
|
| 129 |
fn=extract_summarize_paraphrase,
|
| 130 |
inputs=[
|
| 131 |
gr.Textbox(label="URL 입력", placeholder="https://example.com"),
|
| 132 |
-
gr.Dropdown(choices=list(MODEL_OPTIONS.keys()), value="Qwen2.5-
|
| 133 |
],
|
| 134 |
outputs=[
|
| 135 |
gr.Markdown(label="추출된 본문"),
|
| 136 |
gr.Textbox(label="자동 요약", lines=5),
|
| 137 |
gr.Textbox(label="자동 재작성 (LLM)", lines=5)
|
| 138 |
],
|
| 139 |
-
title="한국어 본문 추출 + 자동 요약 + LLM 재작성 (모델
|
| 140 |
description="본문을 TextRank로 요약하고, 재작성은 선택한 Hugging Face Hub LLM으로 처리합니다."
|
| 141 |
)
|
| 142 |
|
|
|
|
| 12 |
import torch
|
| 13 |
from transformers import AutoModelForCausalLM, AutoTokenizer, pipeline
|
| 14 |
|
| 15 |
+
# ===== 비교용 모델 목록 =====
|
| 16 |
MODEL_OPTIONS = {
|
| 17 |
+
"Qwen2.5-1.5B-Instruct (기본)": "Qwen/Qwen2.5-1.5B-Instruct",
|
| 18 |
+
"DeepSeek-R1-Distill-Qwen-1.5B": "deepseek-ai/DeepSeek-R1-Distill-Qwen-1.5B",
|
| 19 |
+
"SOLAR-1.5B-Instruct": "upstage/SOLAR-1.5B-Instruct",
|
| 20 |
+
"Gemma-2-2B-it": "google/gemma-2-2b-it"
|
| 21 |
}
|
| 22 |
|
| 23 |
+
# ===== 모델 로드 =====
|
| 24 |
def load_model(model_name):
|
| 25 |
tokenizer = AutoTokenizer.from_pretrained(model_name)
|
| 26 |
model = AutoModelForCausalLM.from_pretrained(
|
|
|
|
| 42 |
result.append(s_clean)
|
| 43 |
return result
|
| 44 |
|
| 45 |
+
# ===== 자동요약 =====
|
| 46 |
def summarize_text(text):
|
| 47 |
text = clean_text(text)
|
| 48 |
length = len(text)
|
|
|
|
| 75 |
summary_list.sort(key=lambda s: text.find(s))
|
| 76 |
return summary_list
|
| 77 |
|
| 78 |
+
# ===== LLM 재작성 =====
|
| 79 |
def rewrite_with_llm(sentences, model_choice):
|
| 80 |
model_name = MODEL_OPTIONS[model_choice]
|
| 81 |
llm_pipeline = load_model(model_name)
|
|
|
|
| 129 |
fn=extract_summarize_paraphrase,
|
| 130 |
inputs=[
|
| 131 |
gr.Textbox(label="URL 입력", placeholder="https://example.com"),
|
| 132 |
+
gr.Dropdown(choices=list(MODEL_OPTIONS.keys()), value="Qwen2.5-1.5B-Instruct (기본)", label="재작성 모델 선택")
|
| 133 |
],
|
| 134 |
outputs=[
|
| 135 |
gr.Markdown(label="추출된 본문"),
|
| 136 |
gr.Textbox(label="자동 요약", lines=5),
|
| 137 |
gr.Textbox(label="자동 재작성 (LLM)", lines=5)
|
| 138 |
],
|
| 139 |
+
title="한국어 본문 추출 + 자동 요약 + LLM 재작성 (모델 비교)",
|
| 140 |
description="본문을 TextRank로 요약하고, 재작성은 선택한 Hugging Face Hub LLM으로 처리합니다."
|
| 141 |
)
|
| 142 |
|