Spaces:

ZORYE
/

CPS

Sleeping

App Files Community

ZORYE committed on Apr 27, 2025

Commit

f00ed24

verified ·

1 Parent(s): 2901036

Update app.py

Browse files

Files changed (1) hide show

app.py +25 -19

app.py CHANGED Viewed

@@ -45,37 +45,40 @@ def add_watermark(image, text="gooditem gooditem gooditem gooditem gooditem"):
     combined = Image.alpha_composite(image.convert('RGBA'), watermark)
     return combined
-# 프로그램/아이템 정보 블록 추출
 def extract_info_block(article_text):
     pattern = r'(KBS2.*?<모델명>.*?)(?:\n\n|$)'
     match = re.search(pattern, article_text, re.DOTALL)
     if match:
         return match.group(1).strip()
     else:
         return None
-# 브랜드/모델명 여러 개 추출
 def extract_product_info(article_text):
     brand_match = re.search(r'<브랜드>[ \t]*([^\n]+)', article_text)
-    model_matches = re.findall(r'<모델명>[ \t]*([^\n]+)', article_text)
     brand = brand_match.group(1).strip() if brand_match else None
-    models = [m.strip() for m in model_matches] if model_matches else []
     result = []
-    if brand and models:
         brand_words = re.findall(r'[A-Za-z]+', brand)
-        selected_brand = ' '.join(brand_words[:2])  # 앞 2단어만
-        for model in models:
             search_query = f"{selected_brand} {model}"
             search_url = f"https://www.coupang.com/np/search?component=&q={search_query.replace(' ', '+')}"
             result.append((model, search_url))
     return result
-# 메인 처리 함수
 def process_url(tistory_url, output_dir):
     result = []
     try:
@@ -85,6 +88,7 @@ def process_url(tistory_url, output_dir):
         img_tags = soup.find_all('img')
         img_urls = [img['src'] for img in img_tags if 'src' in img.attrs]
         for idx, img_url in enumerate(img_urls):
             base_name = os.path.basename(img_url).split('?')[0]
             if base_name.startswith('new_ico'):
@@ -104,31 +108,33 @@ def process_url(tistory_url, output_dir):
             name, ext = os.path.splitext(base_name)
             save_path = os.path.join(output_dir, f"{name}_{idx+1}_processed.png")
             final_img.save(save_path)
-            # 다운로드 링크 추가
-            relative_path = save_path.replace("./", "/")
-            result.append(f"🖼️ [이미지 다운로드]({relative_path})")
         article_text = soup.get_text()
         info_block = extract_info_block(article_text)
-        product_infos = extract_product_info(article_text)
         if info_block:
             result.append("\n===== 프로그램 정보 블록 =====")
             result.append(info_block)
             result.append("================================\n")
-        if product_infos:
-            for model_name, search_url in product_infos:
-                result.append(f"🛍️ 아이템 : {model_name}")
-                result.append(f"🔗 쿠팡 링크: {search_url}")
     except Exception as e:
         result.append(f"❌ URL 처리 실패: {tistory_url} / 에러: {e}")
     return result
 # 여러 URL 처리
 def process_multiple_urls(urls_text, output_dir):
     urls = [url.strip() for url in urls_text.strip().splitlines() if url.strip()]

     combined = Image.alpha_composite(image.convert('RGBA'), watermark)
     return combined
 def extract_info_block(article_text):
     pattern = r'(KBS2.*?<모델명>.*?)(?:\n\n|$)'
     match = re.search(pattern, article_text, re.DOTALL)
     if match:
         return match.group(1).strip()
     else:
         return None
+# 제품명 추출 함수 수정 (여러 모델명 처리)
 def extract_product_info(article_text):
     brand_match = re.search(r'<브랜드>[ \t]*([^\n]+)', article_text)
     brand = brand_match.group(1).strip() if brand_match else None
+    model_matches = re.findall(r'<모델명>[ \t]*([^\n]+)', article_text)
     result = []
+    if brand and model_matches:
         brand_words = re.findall(r'[A-Za-z]+', brand)
+        selected_brand = ' '.join(brand_words[:2])
+        for model in model_matches:
+            model = model.strip()
             search_query = f"{selected_brand} {model}"
             search_url = f"https://www.coupang.com/np/search?component=&q={search_query.replace(' ', '+')}"
             result.append((model, search_url))
     return result
+# process_url 함수 수정 (모델명 여러개 대응)
 def process_url(tistory_url, output_dir):
     result = []
     try:
         img_tags = soup.find_all('img')
         img_urls = [img['src'] for img in img_tags if 'src' in img.attrs]
+        # 이미지 처리
         for idx, img_url in enumerate(img_urls):
             base_name = os.path.basename(img_url).split('?')[0]
             if base_name.startswith('new_ico'):
             name, ext = os.path.splitext(base_name)
             save_path = os.path.join(output_dir, f"{name}_{idx+1}_processed.png")
             final_img.save(save_path)
+            result.append(f"✔️ 저장 완료: {save_path}")
+        # 텍스트 추출
         article_text = soup.get_text()
+        # 프로그램 정보 블록 추출
         info_block = extract_info_block(article_text)
+        # 제품 정보 추출 (여러 모델명 처리)
+        item_info_list = extract_product_info(article_text)
+        # 정리된 출력 포맷
         if info_block:
             result.append("\n===== 프로그램 정보 블록 =====")
             result.append(info_block)
             result.append("================================\n")
+        for model_name, search_url in item_info_list:
+            result.append(f"🛍️ 아이템 : {model_name}")
+            result.append(f"🔗 쿠팡 링크: {search_url}")
     except Exception as e:
         result.append(f"❌ URL 처리 실패: {tistory_url} / 에러: {e}")
     return result
 # 여러 URL 처리
 def process_multiple_urls(urls_text, output_dir):
     urls = [url.strip() for url in urls_text.strip().splitlines() if url.strip()]