Spaces:

Heartsync
/

EXAM-GEN

Running

App Files Files Community

seawolf2357 committed on Jan 15

Commit

ff48136

verified ·

1 Parent(s): 78bdfe0

Update app.py

Browse files

Files changed (1) hide show

app.py +218 -32

app.py CHANGED Viewed

@@ -135,6 +135,30 @@ footer, .footer, .gradio-container footer, .built-with, [class*="footer"], .grad
     box-shadow: 2px 2px 0 #1F2937;
 }
 .gr-panel, .gr-box, .gr-form, .block, .gr-group {
     background: #FFF !important;
     border: 3px solid #1F2937 !important;
@@ -225,6 +249,58 @@ textarea:focus, input[type="text"]:focus {
     font-size: 1.5rem;
 }
 label, .gr-input-label, .gr-block-label {
     color: #1F2937 !important;
     font-family: 'Comic Neue', cursive !important;
@@ -799,14 +875,14 @@ def convert_hwp_to_markdown(input_path: str) -> tuple:
 # ============== LLM API ==============
 def call_groq_api_stream(messages: List[Dict], api_key: str) -> Generator[str, None, None]:
     if not api_key:
-        yield "❌ Groq API 키가 설정되지 않았습니다."
         return
     try:
         response = requests.post(
             "https://api.groq.com/openai/v1/chat/completions",
             headers={"Authorization": f"Bearer {api_key}", "Content-Type": "application/json"},
             json={
-                "model": "meta-llama/llama-4-scout-17b-16e-instruct",
                 "messages": messages,
                 "temperature": 0.7,
                 "max_tokens": 8192,
@@ -833,7 +909,7 @@ def call_groq_api_stream(messages: List[Dict], api_key: str) -> Generator[str, N
 def call_fireworks_api_stream(messages: List[Dict], image_base64: str, mime_type: str, api_key: str) -> Generator[str, None, None]:
     if not api_key:
-        yield "❌ Fireworks API 키가 설정되지 않았습니다."
         return
     try:
         formatted_messages = [{"role": m["role"], "content": m["content"]} for m in messages[:-1]]
@@ -849,7 +925,7 @@ def call_fireworks_api_stream(messages: List[Dict], image_base64: str, mime_type
             headers={"Authorization": f"Bearer {api_key}", "Content-Type": "application/json"},
             json={
                 "model": "accounts/fireworks/models/qwen3-vl-235b-a22b-thinking",
-                "max_tokens": 4096,
                 "temperature": 0.6,
                 "messages": formatted_messages,
                 "stream": True
@@ -885,25 +961,28 @@ def process_file(file_path: str) -> tuple:
     if is_hwp_file(file_path) or is_hwpx_file(file_path):
         text, error = extract_text_from_hwp_or_hwpx(file_path)
         if text and len(text.strip()) > 20:
-            return "text", f"[📄 한글 문서: {filename}]\n\n{text}", None
         return "error", f"한글 문서 추출 실패: {error}", None
     if is_pdf_file(file_path):
         text = extract_text_from_pdf(file_path)
         if text:
-            return "text", f"[📑 PDF 문서: {filename}]\n\n{text}", None
         return "error", "PDF 추출 실패", None
     if is_text_file(file_path):
         text = extract_text_from_txt(file_path)
         if text:
-            return "text", f"[📝 텍스트 파일: {filename}]\n\n{text}", None
         return "error", "텍스트 읽기 실패", None
     return "unsupported", f"지원하지 않는 형식: {filename}", None
 def chat_response(message: str, history: List[Dict], file: Optional[str],
-                  session_id: str, groq_key: str, fireworks_key: str) -> Generator[tuple, None, None]:
     if history is None:
         history = []
     if not message.strip() and not file:
@@ -914,10 +993,12 @@ def chat_response(message: str, history: List[Dict], file: Optional[str],
     file_type, file_content, file_mime = None, None, None
     file_info = None
     if file:
         file_type, file_content, file_mime = process_file(file)
-        file_info = json.dumps({"type": file_type, "filename": os.path.basename(file)})
         if file_type == "error":
             history = history + [
@@ -934,41 +1015,104 @@ def chat_response(message: str, history: List[Dict], file: Optional[str],
             yield history, session_id
             return
     user_msg = message
     if file:
-        filename = os.path.basename(file)
         user_msg = f"📎 {filename}\n\n{message}" if message else f"📎 {filename}"
     history = history + [{"role": "user", "content": user_msg}, {"role": "assistant", "content": ""}]
     yield history, session_id
     db_messages = get_session_messages(session_id, limit=10)
-    api_messages = [{
-        "role": "system",
-        "content": "당신은 도움이 되는 AI 어시스턴트입니다. 한국어로 자연스럽게 대화하며, 파일이 첨부되면 내용을 상세히 분석하여 답변합니다. 문서의 핵심 내용을 파악하고, 사용자의 질문에 정확하게 답변하세요."
-    }]
     for m in db_messages:
         api_messages.append({"role": m["role"], "content": m["content"]})
-    current_content = message or ""
     if file_type == "text" and file_content:
-        current_content = f"{file_content}\n\n사용자 질문: {message}" if message else f"{file_content}\n\n위 문서 내용을 요약해주세요."
     api_messages.append({"role": "user", "content": current_content})
     full_response = ""
     if file_type == "image":
-        for chunk in call_fireworks_api_stream(api_messages, file_content, file_mime, fireworks_key):
             full_response += chunk
             history[-1] = {"role": "assistant", "content": full_response}
             yield history, session_id
     else:
-        for chunk in call_groq_api_stream(api_messages, groq_key):
             full_response += chunk
             history[-1] = {"role": "assistant", "content": full_response}
             yield history, session_id
     save_message(session_id, "user", current_content, file_info)
     save_message(session_id, "assistant", full_response)
@@ -1056,7 +1200,7 @@ def convert_hwp(file, output_format, progress=gr.Progress()):
                     f.write(text)
             ext = ".txt"
-        elif output_format == "Markdown":
             text, error = convert_hwp_to_markdown(input_path)
             if text:
                 output_path = os.path.join(tmp_dir, "output.md")
@@ -1146,6 +1290,14 @@ with gr.Blocks(title="HWP AI 어시스턴트", css=COMIC_CSS, delete_cache=(60,
     </div>
     """)
     session_state = gr.State("")
     with gr.Tabs():
@@ -1167,12 +1319,6 @@ with gr.Blocks(title="HWP AI 어시스턴트", css=COMIC_CSS, delete_cache=(60,
             with gr.Row():
                 with gr.Column(scale=1):
-                    gr.HTML('<div class="info-box">⚙️ <b>설정</b></div>')
-                    with gr.Accordion("🔑 API 키 설정", open=True):
-                        groq_key = gr.Textbox(label="Groq API Key", type="password", value=GROQ_API_KEY, placeholder="gsk_...")
-                        fireworks_key = gr.Textbox(label="Fireworks API Key", type="password", value=FIREWORKS_API_KEY, placeholder="fw_...")
                     gr.HTML("""
                     <div class="info-box">
                         📁 <b>지원 파일 형식</b><br><br>
@@ -1220,6 +1366,45 @@ with gr.Blocks(title="HWP AI 어시스턴트", css=COMIC_CSS, delete_cache=(60,
             </div>
             """)
             with gr.Row():
                 with gr.Column():
                     gr.HTML('<div class="info-box">📤 <b>파일 업로드</b></div>')
@@ -1229,8 +1414,8 @@ with gr.Blocks(title="HWP AI 어시스턴트", css=COMIC_CSS, delete_cache=(60,
                         elem_classes=["upload-box"]
                     )
                     format_select = gr.Radio(
-                        ["HTML", "ODT (OpenDocument)", "TXT (텍스트)", "Markdown", "XML"],
-                        value="TXT (텍스트)",
                         label="📋 변환 형식"
                     )
                     convert_btn = gr.Button("🔄 변환하기", variant="primary", size="lg")
@@ -1245,7 +1430,7 @@ with gr.Blocks(title="HWP AI 어시스턴트", css=COMIC_CSS, delete_cache=(60,
             gr.HTML("""
             <div class="info-box">
-                ℹ️ <b>안내</b>: HWPX 파일은 TXT, Markdown, XML 변환만 지원됩니다.
             </div>
             """)
@@ -1255,20 +1440,21 @@ with gr.Blocks(title="HWP AI 어시스턴트", css=COMIC_CSS, delete_cache=(60,
         <p style="font-family:'Bangers',cursive;font-size:1.8rem;letter-spacing:2px">📄 HWP AI 어시스턴트 🤖</p>
         <p>AI가 HWP 파일을 읽고, 보고, 말하며, 생각하고 기억합니다!</p>
         <p>📖 READ • 👁️ SEE • 💬 SPEAK • 🧠 THINK • 💾 MEMORY</p>
         <p style="margin-top:10px"><a href="https://www.humangen.ai" target="_blank" style="color:#FACC15;text-decoration:none;font-weight:bold;">🏠 www.humangen.ai</a></p>
     </div>
     """)
     # ============== 이벤트 핸들러 ==============
-    def on_submit(msg, hist, f, sid, gk, fk):
         if hist is None:
             hist = []
-        for r in chat_response(msg, hist, f, sid, gk, fk):
             yield r[0], r[1], "", None
-    submit_btn.click(on_submit, [msg_input, chatbot, file_upload, session_state, groq_key, fireworks_key],
                      [chatbot, session_state, msg_input, file_upload])
-    msg_input.submit(on_submit, [msg_input, chatbot, file_upload, session_state, groq_key, fireworks_key],
                      [chatbot, session_state, msg_input, file_upload])
     new_btn.click(lambda: ([], create_session(), None, ""), outputs=[chatbot, session_state, file_upload, msg_input])

     box-shadow: 2px 2px 0 #1F2937;
 }
+/* 무료 서비스 안내 박스 */
+.free-service-notice {
+    text-align: center;
+    padding: 10px 15px;
+    background: linear-gradient(135deg, #FEE2E2 0%, #FECACA 100%);
+    border: 3px solid #1F2937;
+    border-radius: 8px;
+    margin: 10px 0;
+    box-shadow: 4px 4px 0 #1F2937;
+    font-family: 'Comic Neue', cursive;
+    font-weight: 700;
+    color: #991B1B;
+}
+.free-service-notice a {
+    color: #1D4ED8;
+    text-decoration: none;
+    font-weight: 700;
+}
+.free-service-notice a:hover {
+    text-decoration: underline;
+}
 .gr-panel, .gr-box, .gr-form, .block, .gr-group {
     background: #FFF !important;
     border: 3px solid #1F2937 !important;
     font-size: 1.5rem;
 }
+/* Markdown 강조 박스 */
+.markdown-highlight-box {
+    background: linear-gradient(135deg, #EC4899 0%, #F472B6 100%) !important;
+    border: 4px solid #1F2937 !important;
+    border-radius: 12px !important;
+    padding: 20px !important;
+    margin: 15px 0 !important;
+    box-shadow: 6px 6px 0 #1F2937 !important;
+    animation: pulse-glow 2s ease-in-out infinite;
+}
+@keyframes pulse-glow {
+    0%, 100% { box-shadow: 6px 6px 0 #1F2937; }
+    50% { box-shadow: 8px 8px 0 #1F2937, 0 0 20px rgba(236, 72, 153, 0.5); }
+}
+.markdown-title {
+    font-family: 'Bangers', cursive !important;
+    font-size: 2rem !important;
+    color: #FFF !important;
+    text-shadow: 3px 3px 0 #1F2937 !important;
+    letter-spacing: 2px !important;
+    margin-bottom: 15px !important;
+    text-align: center !important;
+}
+.markdown-benefits {
+    display: grid;
+    grid-template-columns: repeat(auto-fit, minmax(180px, 1fr));
+    gap: 12px;
+    margin-top: 10px;
+}
+.markdown-benefit-item {
+    background: rgba(255,255,255,0.95) !important;
+    border: 3px solid #1F2937 !important;
+    border-radius: 8px !important;
+    padding: 12px !important;
+    box-shadow: 3px 3px 0 #1F2937 !important;
+    font-family: 'Comic Neue', cursive !important;
+    font-weight: 700 !important;
+    font-size: 0.95rem !important;
+    color: #1F2937 !important;
+    text-align: center !important;
+}
+.markdown-benefit-icon {
+    font-size: 1.8rem !important;
+    display: block !important;
+    margin-bottom: 5px !important;
+}
 label, .gr-input-label, .gr-block-label {
     color: #1F2937 !important;
     font-family: 'Comic Neue', cursive !important;
 # ============== LLM API ==============
 def call_groq_api_stream(messages: List[Dict], api_key: str) -> Generator[str, None, None]:
     if not api_key:
+        yield "❌ Groq API 키가 설정되지 않았습니다. 환경변수 GROQ_API_KEY를 설정해주세요."
         return
     try:
         response = requests.post(
             "https://api.groq.com/openai/v1/chat/completions",
             headers={"Authorization": f"Bearer {api_key}", "Content-Type": "application/json"},
             json={
+                "model": "openai/gpt-oss-120b",
                 "messages": messages,
                 "temperature": 0.7,
                 "max_tokens": 8192,
 def call_fireworks_api_stream(messages: List[Dict], image_base64: str, mime_type: str, api_key: str) -> Generator[str, None, None]:
     if not api_key:
+        yield "❌ Fireworks API 키가 설정되지 않았습니다. 환경변수 FIREWORKS_API_KEY를 설정해주세요."
         return
     try:
         formatted_messages = [{"role": m["role"], "content": m["content"]} for m in messages[:-1]]
             headers={"Authorization": f"Bearer {api_key}", "Content-Type": "application/json"},
             json={
                 "model": "accounts/fireworks/models/qwen3-vl-235b-a22b-thinking",
+                "max_tokens": 8000,
                 "temperature": 0.6,
                 "messages": formatted_messages,
                 "stream": True
     if is_hwp_file(file_path) or is_hwpx_file(file_path):
         text, error = extract_text_from_hwp_or_hwpx(file_path)
         if text and len(text.strip()) > 20:
+            print(f"📄 [문서 내용 추출 완료] {len(text)} 글자")
+            print(f"📄 [문서 미리보기] {text[:500]}...")
+            return "text", text, None
         return "error", f"한글 문서 추출 실패: {error}", None
     if is_pdf_file(file_path):
         text = extract_text_from_pdf(file_path)
         if text:
+            print(f"📄 [PDF 내용 추출 완료] {len(text)} 글자")
+            return "text", text, None
         return "error", "PDF 추출 실패", None
     if is_text_file(file_path):
         text = extract_text_from_txt(file_path)
         if text:
+            return "text", text, None
         return "error", "텍스트 읽기 실패", None
     return "unsupported", f"지원하지 않는 형식: {filename}", None
 def chat_response(message: str, history: List[Dict], file: Optional[str],
+                  session_id: str) -> Generator[tuple, None, None]:
     if history is None:
         history = []
     if not message.strip() and not file:
     file_type, file_content, file_mime = None, None, None
     file_info = None
+    filename = None
     if file:
+        filename = os.path.basename(file)
         file_type, file_content, file_mime = process_file(file)
+        file_info = json.dumps({"type": file_type, "filename": filename})
         if file_type == "error":
             history = history + [
             yield history, session_id
             return
+    # 사용자 메시지 표시
     user_msg = message
     if file:
         user_msg = f"📎 {filename}\n\n{message}" if message else f"📎 {filename}"
     history = history + [{"role": "user", "content": user_msg}, {"role": "assistant", "content": ""}]
     yield history, session_id
+    # 이전 대화 불러오기
     db_messages = get_session_messages(session_id, limit=10)
+    # 시스템 프롬프트 - 문서 분석 강화
+    system_prompt = """당신은 문서 분석 전문 AI 어시스턴트입니다.
+## 핵심 역할
+- 사용자가 업로드한 문서의 내용을 **정확하게 분석**하고 **구체적으로 답변**합니다.
+- 문서에 있는 **실제 내용**을 기반으로만 답변합니다.
+- 문서에 없는 내용은 추측하지 않습니다.
+## 문서 분석 방법
+1. **문서가 제공되면**: 문서 전체 내용을 꼼꼼히 읽고 핵심 정보를 파악합니다.
+2. **요약 요청 시**: 문서의 주제, 목적, 핵심 내용, 주요 항목을 구조화하여 요약합니다.
+3. **질문 응답 시**: 문서에서 관련 내용을 찾아 **직접 인용하거나 구체적으로 설명**합니다.
+## 답변 형식
+- 한국어로 자연스럽고 명확하게 답변합니다.
+- 문서 내용을 인용할 때는 구체적으로 언급합니다.
+- 긴 문서는 섹션별로 나누어 정리합니다.
+## 주의사항
+- 문서에 **실제로 있는 내용만** 답변에 포함합니다.
+- 불확실한 내용은 "문서에서 확인되지 않습니다"라고 명시합니다."""
+    api_messages = [{"role": "system", "content": system_prompt}]
+    # 이전 대화 추가
     for m in db_messages:
         api_messages.append({"role": m["role"], "content": m["content"]})
+    # 현재 메시지 구성 - 문서 내용을 명확하게 구분
     if file_type == "text" and file_content:
+        if message:
+            current_content = f"""## 📄 업로드된 문서 내용 ({filename})
+다음은 사용자가 업로드한 문서의 전체 내용입니다:
+---
+{file_content}
+---
+## 💬 사용자 질문
+{message}
+위 문서 내용을 바탕으로 사용자의 질문에 **구체적이고 정확하게** 답변해주세요."""
+        else:
+            current_content = f"""## 📄 업로드된 문서 내용 ({filename})
+다음은 사용자가 업로드한 문서의 전체 내용입니다:
+---
+{file_content}
+---
+## 📋 요청사항
+위 문서의 내용을 다음 형식으로 **상세하게 요약**해주세요:
+1. **문서 제목/주제**: 문서가 다루는 주요 주제
+2. **문서 목적**: 이 문서의 작성 목적
+3. **핵심 내용**: 가장 중요한 내용 3-5가지
+4. **세부 항목**: 문서에 포함된 주요 섹션이나 항목
+5. **결론/요약**: 문서의 핵심 메시지"""
+    else:
+        current_content = message or ""
     api_messages.append({"role": "user", "content": current_content})
+    # 디버그 로그
+    print(f"\n🤖 [API 요청]")
+    print(f"  - 메시지 수: {len(api_messages)}")
+    print(f"  - 파일 타입: {file_type}")
+    print(f"  - 문서 길이: {len(file_content) if file_content else 0} 글자")
+    if file_content:
+        print(f"  - 문서 미리보기: {file_content[:200]}...")
+    # 응답 생성
     full_response = ""
     if file_type == "image":
+        for chunk in call_fireworks_api_stream(api_messages, file_content, file_mime, FIREWORKS_API_KEY):
             full_response += chunk
             history[-1] = {"role": "assistant", "content": full_response}
             yield history, session_id
     else:
+        for chunk in call_groq_api_stream(api_messages, GROQ_API_KEY):
             full_response += chunk
             history[-1] = {"role": "assistant", "content": full_response}
             yield history, session_id
+    # DB 저장
     save_message(session_id, "user", current_content, file_info)
     save_message(session_id, "assistant", full_response)
                     f.write(text)
             ext = ".txt"
+        elif output_format == "⭐ MARKDOWN (추천)":
             text, error = convert_hwp_to_markdown(input_path)
             if text:
                 output_path = os.path.join(tmp_dir, "output.md")
     </div>
     """)
+    # 무료 서비스 안내
+    gr.HTML("""
+    <div class="free-service-notice">
+        🆓 본 서비스는 <b>무료 버전</b>으로 일부 기능에 제약이 있습니다.<br>
+        📧 문의: <a href="mailto:arxivgpt@gmail.com">arxivgpt@gmail.com</a>
+    </div>
+    """)
     session_state = gr.State("")
     with gr.Tabs():
             with gr.Row():
                 with gr.Column(scale=1):
                     gr.HTML("""
                     <div class="info-box">
                         📁 <b>지원 파일 형식</b><br><br>
             </div>
             """)
+            # Markdown 강조 박스
+            gr.HTML("""
+            <div class="markdown-highlight-box">
+                <div class="markdown-title">⭐ MARKDOWN 변환 추천! ⭐</div>
+                <div class="markdown-benefits">
+                    <div class="markdown-benefit-item">
+                        <span class="markdown-benefit-icon">🤖</span>
+                        <b>AI/LLM 최적화</b><br>
+                        ChatGPT, Claude 등 AI에 바로 입력 가능
+                    </div>
+                    <div class="markdown-benefit-item">
+                        <span class="markdown-benefit-icon">📝</span>
+                        <b>범용 포맷</b><br>
+                        GitHub, Notion, 블로그 등 어디서나 사용
+                    </div>
+                    <div class="markdown-benefit-item">
+                        <span class="markdown-benefit-icon">🔍</span>
+                        <b>구조 유지</b><br>
+                        제목, 목록, 표 등 문서 구조 보존
+                    </div>
+                    <div class="markdown-benefit-item">
+                        <span class="markdown-benefit-icon">⚡</span>
+                        <b>가볍고 빠름</b><br>
+                        용량이 작고 처리 속도 빠름
+                    </div>
+                    <div class="markdown-benefit-item">
+                        <span class="markdown-benefit-icon">🔄</span>
+                        <b>변환 용이</b><br>
+                        HTML, PDF, Word 등으로 재변환 가능
+                    </div>
+                    <div class="markdown-benefit-item">
+                        <span class="markdown-benefit-icon">✏️</span>
+                        <b>편집 간편</b><br>
+                        메모장으로도 바로 수정 가능
+                    </div>
+                </div>
+            </div>
+            """)
             with gr.Row():
                 with gr.Column():
                     gr.HTML('<div class="info-box">📤 <b>파일 업로드</b></div>')
                         elem_classes=["upload-box"]
                     )
                     format_select = gr.Radio(
+                        ["⭐ MARKDOWN (추천)", "TXT (텍스트)", "HTML", "ODT (OpenDocument)", "XML"],
+                        value="⭐ MARKDOWN (추천)",
                         label="📋 변환 형식"
                     )
                     convert_btn = gr.Button("🔄 변환하기", variant="primary", size="lg")
             gr.HTML("""
             <div class="info-box">
+                ℹ️ <b>안내</b>: HWPX 파일은 MARKDOWN, TXT, XML 변환만 지원됩니다.
             </div>
             """)
         <p style="font-family:'Bangers',cursive;font-size:1.8rem;letter-spacing:2px">📄 HWP AI 어시스턴트 🤖</p>
         <p>AI가 HWP 파일을 읽고, 보고, 말하며, 생각하고 기억합니다!</p>
         <p>📖 READ • 👁️ SEE • 💬 SPEAK • 🧠 THINK • 💾 MEMORY</p>
+        <p style="margin-top:8px;font-size:0.9rem;">🆓 무료 서비스 (일부 기능 제한) | 📧 arxivgpt@gmail.com</p>
         <p style="margin-top:10px"><a href="https://www.humangen.ai" target="_blank" style="color:#FACC15;text-decoration:none;font-weight:bold;">🏠 www.humangen.ai</a></p>
     </div>
     """)
     # ============== 이벤트 핸들러 ==============
+    def on_submit(msg, hist, f, sid):
         if hist is None:
             hist = []
+        for r in chat_response(msg, hist, f, sid):
             yield r[0], r[1], "", None
+    submit_btn.click(on_submit, [msg_input, chatbot, file_upload, session_state],
                      [chatbot, session_state, msg_input, file_upload])
+    msg_input.submit(on_submit, [msg_input, chatbot, file_upload, session_state],
                      [chatbot, session_state, msg_input, file_upload])
     new_btn.click(lambda: ([], create_session(), None, ""), outputs=[chatbot, session_state, file_upload, msg_input])