Spaces:

Hyounggoo
/

kairo

Runtime error

App Files Community

Hyounggoo committed on Jun 3, 2025

Commit

0dff0c6

verified ·

1 Parent(s): f38f577

Upload 4 files

Browse files

Files changed (4) hide show

KAIRO_Checklist_Config.json +28 -0
README.md +4 -4
app.py +41 -108
requirements.txt +3 -4

KAIRO_Checklist_Config.json ADDED Viewed

	@@ -0,0 +1,28 @@

+{
+  "checklist_korean": [
+    "맞춤법 (Orthography)",
+    "띄어쓰기 (Spacing Rules)",
+    "문법 오류 (Grammatical Errors)",
+    "표준어 규정 위반 (Standard Language Regulation)",
+    "외래어 표기법 위반 (Loanword Orthography)",
+    "문장 구조 오류 (Sentence Structure Error)",
+    "어휘 적절성 (Lexical Appropriateness)",
+    "중복어/군더더기 제거 (Redundancy Elimination)",
+    "오탈자 (Typographical Errors)",
+    "문장 부호 사용 (Punctuation Usage)",
+    "어법 오류 (Usage Error)",
+    "논리적 일관성 (Logical Coherence)",
+    "형식적 오류 (Formatting Consistency)"
+  ],
+  "checklist_english": [
+    "Spelling (철자 오류)",
+    "Grammar (문법 오류)",
+    "Capitalization (대소문자 오류)",
+    "Subject-Verb Agreement (주어-동사 일치)",
+    "Article Usage (관사의 적절성)",
+    "Tense Consistency (시제 일관성)",
+    "Word Choice (어휘 선택)",
+    "Redundancy (중복 표현)",
+    "Tone (문체 및 일관성)"
+  ]
+}

README.md CHANGED Viewed

@@ -1,3 +1,4 @@
 ---
 title: "KAIRO.ai"
 emoji: "🧠"
@@ -9,7 +10,6 @@ app_file: app.py
 pinned: false
 ---
-# KAIRO.ai - 다중 OCR 정확도 비교 및 병합
-- 여러 OCR 엔진 결과 비교
-- 유사도 점수 표시
-- 최적 후보 자동 선택

 ---
 title: "KAIRO.ai"
 emoji: "🧠"
 pinned: false
 ---
+# KAIRO.ai
+AI 기반 PNG 이미지 교정 (OCR + GPT-4 Turbo + PPT 생성) 시스템입니다.

app.py CHANGED Viewed

@@ -1,119 +1,52 @@
 import streamlit as st
 from PIL import Image
-import pytesseract
-import easyocr
-from paddleocr import PaddleOCR
-import numpy as np
-from pptx import Presentation
-from pptx.util import Inches, Pt
-import os
 import io
-import tempfile
-import zipfile
-from difflib import SequenceMatcher
-st.set_page_config(layout="centered")
-st.markdown("<h1 style='text-align: center; font-size: 48px;'>🧠 KAIRO.ai - OCR 정확도 비교 & 병합</h1>", unsafe_allow_html=True)
-st.sidebar.header("OCR 엔진 선택")
-ocr_engines = st.sidebar.multiselect("사용할 OCR 엔진을 선택하세요", ["Tesseract", "EasyOCR", "PaddleOCR"], default=["Tesseract", "EasyOCR"])
-uploaded_files = st.file_uploader("PNG 또는 ZIP 파일 업로드", type=["png", "zip"], accept_multiple_files=True)
-def normalize(text):
-    return text.replace(" ", "").replace("\n", "").lower()
-def score_similarity(a, b):
-    return SequenceMatcher(None, a, b).ratio()
-def extract_images(file):
-    images = []
-    if file.name.endswith(".zip"):
-        with tempfile.TemporaryDirectory() as tmpdir:
-            zip_path = os.path.join(tmpdir, file.name)
-            with open(zip_path, "wb") as f:
-                f.write(file.getbuffer())
-            with zipfile.ZipFile(zip_path, 'r') as zip_ref:
-                zip_ref.extractall(tmpdir)
-            for root, _, files in os.walk(tmpdir):
-                for name in files:
-                    if name.lower().endswith(".png"):
-                        images.append(Image.open(os.path.join(root, name)).convert("RGB"))
-    else:
-        images = [Image.open(file).convert("RGB")]
-    return images
-def run_tesseract(img):
-    return pytesseract.image_to_string(img, lang="kor+eng")
-def run_easyocr(img):
-    reader = easyocr.Reader(['ko', 'en'], gpu=False)
-    result = reader.readtext(np.array(img), detail=0)
-    return "\n".join(result)
-def run_paddleocr(img):
-    ocr = PaddleOCR(use_angle_cls=True, lang='korean')
-    result = ocr.ocr(np.array(img), cls=True)
-    return "\n".join([line[1][0] for block in result for line in block])
-def create_ppt(results):
-    prs = Presentation()
-    for idx, (img, all_texts, best_text, best_engine) in enumerate(results):
-        slide = prs.slides.add_slide(prs.slide_layouts[5])
-        title = slide.shapes.title
-        title.text = f"파일 {idx+1} (최적 엔진: {best_engine})"
-        left = Inches(0.5)
-        top = Inches(1.0)
-        width = Inches(8.5)
-        height = Inches(5.5)
-        txBox = slide.shapes.add_textbox(left, top, width, height)
-        tf = txBox.text_frame
-        for engine, text in all_texts.items():
-            p = tf.add_paragraph()
-            p.text = f"[{engine}]\n{text}\n"
-            p.font.size = Pt(14)
-        p = tf.add_paragraph()
-        p.text = f"[최종 선택 결과]\n{best_text}"
-        p.font.size = Pt(16)
-    return prs
 if uploaded_files:
-    results = []
-    for file in uploaded_files:
-        images = extract_images(file)
-        for img in images:
-            ocr_texts = {}
-            if "Tesseract" in ocr_engines:
-                ocr_texts["Tesseract"] = run_tesseract(img)
-            if "EasyOCR" in ocr_engines:
-                ocr_texts["EasyOCR"] = run_easyocr(img)
-            if "PaddleOCR" in ocr_engines:
-                ocr_texts["PaddleOCR"] = run_paddleocr(img)
-            st.image(img, caption="업로드 이미지", use_column_width=True)
-            # 비교 기준: 첫 엔진을 기준으로 유사도 계산
-            base_engine = list(ocr_texts.keys())[0]
-            base_text = normalize(ocr_texts[base_engine])
-            scores = {engine: score_similarity(base_text, normalize(txt)) for engine, txt in ocr_texts.items()}
-            best_engine = max(scores, key=scores.get)
-            best_text = ocr_texts[best_engine]
-            st.markdown("#### OCR 결과 비교")
-            for engine, text in ocr_texts.items():
-                st.text_area(f"{engine} 결과", text, height=150)
-            st.markdown("#### 유사도 점수")
-            for engine, score in scores.items():
-                st.write(f"{engine}: {round(score*100, 2)}%")
-            st.success(f"✅ 최적 후보: {best_engine}")
-            results.append((img, ocr_texts, best_text, best_engine))
-    ppt = create_ppt(results)
-    ppt_path = "/mnt/data/KAIRO_OCR_최적결과.pptx"
-    ppt.save(ppt_path)
-    with open(ppt_path, "rb") as f:
-        st.download_button("📥 PPT 다운로드", data=f.read(), file_name="KAIRO_OCR_최적결과.pptx")

 import streamlit as st
 from PIL import Image
 import io
+st.set_page_config(page_title="KAIRO.ai", layout="wide")
+# 다크모드 토글 (우측 상단)
+col1, col2 = st.columns([8, 1])
+with col2:
+    dark_mode = st.toggle("🌙", help="다크 모드 전환")
+# 중앙 정렬 타이틀, 확대
+st.markdown(
+    "<h1 style='text-align: center; font-size: 3em;'>🧠 KAIRO.ai</h1>",
+    unsafe_allow_html=True
+)
+# 다크모드 스타일 적용
+if dark_mode:
+    st.markdown("""
+        <style>
+        html, body, .stApp {
+            background-color: #1e1e1e;
+            color: #f0f0f0;
+        }
+        </style>
+    """, unsafe_allow_html=True)
+ocr_engines = st.multiselect("🧠 OCR 엔진 선택 (중복 가능)", ["Tesseract", "EasyOCR", "PaddleOCR"], default=["Tesseract"])
+checklist = st.multiselect("🔍 검수 항목 선택", ["오탈자", "띄어쓰기", "문법", "어휘"], default=["오탈자", "띄어쓰기"])
+uploaded_files = st.file_uploader("📎 PNG 업로드 (제한 없음)", type=["png"], accept_multiple_files=True)
+api_key = st.text_input("🔐 OpenAI API Key", type="password")
+st.markdown("---")
 if uploaded_files:
+    st.success(f"{len(uploaded_files)}장 업로드 완료 ✅")
+    estimated_tokens_per_file = 400
+    total_tokens = estimated_tokens_per_file * len(uploaded_files)
+    cost_estimate = total_tokens * 0.01 / 1000
+    st.markdown("### 💰 예상 비용 안내 (GPT-4 Turbo 기준)")
+    st.markdown(f"- 예상 토큰 수: **{total_tokens} tokens**")
+    st.markdown(f"- 예상 비용: **${cost_estimate:.4f}**")
+    st.info("👉 OCR 실행 중...")
+    st.info("👉 GPT 교정 진행 중...")
+    st.info("👉 PPT 생성 중...")
+    st.warning("※ 이 기능은 데모용이며 실제 OCR/GPT 연동은 다음 버전에서 작동합니다.")

requirements.txt CHANGED Viewed

@@ -1,7 +1,6 @@
 streamlit
 pytesseract
-easyocr
-paddleocr
-python-pptx
 Pillow
-numpy

 streamlit
 pytesseract
 Pillow
+python-pptx
+openai