File size: 11,712 Bytes
52a881a
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
134
135
136
137
138
139
140
141
142
143
144
145
146
147
148
149
150
151
152
153
154
155
156
157
158
159
160
161
162
163
164
165
166
167
168
169
170
171
172
173
174
175
176
177
178
179
180
181
182
183
184
185
186
187
188
189
190
191
192
193
194
195
196
197
198
199
200
201
202
203
204
205
206
207
208
209
210
211
212
213
214
215
216
217
218
219
220
221
222
223
224
225
226
227
228
229
230
231
232
233
234
235
236
237
238
239
240
241
242
243
244
245
246
247
248
249
250
251
252
253
254
255
256
257
258
259
260
261
262
263
264
265
266
267
268
269
270
271
272
from __future__ import annotations

import os
import re
from typing import Optional

from openai import AsyncOpenAI


class DeepSeekService:
    """OpenAI-compatible DeepSeek refinement service."""

    def __init__(self, api_key: Optional[str] = None):
        self.api_key = api_key or os.environ.get("DEEPSEEK_API_KEY")
        self.base_url = "https://api.deepseek.com"
        self.model = "deepseek-chat"
        self.client = None
        self.is_loaded = False

        print("DeepSeek API service initializing...")
        print(f"API Base URL: {self.base_url}")

    async def load(self):
        try:
            if not self.api_key:
                print("DeepSeek API key not provided")
                self.is_loaded = False
                return

            self.client = AsyncOpenAI(api_key=self.api_key, base_url=self.base_url)
            self.is_loaded = True
            print("DeepSeek API service is ready!")
        except Exception as exc:
            print(f"DeepSeek API service initialization failed: {exc}")
            self.is_loaded = False

    async def refine_diagnosis(
        self,
        raw_answer: str,
        raw_thinking: Optional[str] = None,
        language: str = "zh",
    ) -> dict:
        if not self.is_loaded or self.client is None:
            error_msg = (
                "API not initialized, cannot generate analysis"
                if language == "en"
                else "API未初始化,无法生成分析过程"
            )
            print("DeepSeek API not initialized, returning original result")
            return {
                "success": False,
                "description": "",
                "analysis_process": raw_thinking or error_msg,
                "diagnosis_result": raw_answer,
                "original_diagnosis": raw_answer,
                "error": "DeepSeek API not initialized",
            }

        try:
            prompt = self._build_refine_prompt(raw_answer, raw_thinking, language)
            system_content = (
                "You are a professional medical text editor. Your task is to polish and organize "
                "medical diagnostic text to make it flow smoothly while preserving the original "
                "meaning. Output ONLY the formatted result. Do NOT add any explanations, comments, "
                "or thoughts. Just follow the format exactly."
                if language == "en"
                else "你是医学文本整理专家,按照用户要求将用户输入的文本整理成用户想要的格式,不要改写或总结。"
            )

            response = await self.client.chat.completions.create(
                model=self.model,
                messages=[
                    {"role": "system", "content": system_content},
                    {"role": "user", "content": prompt},
                ],
                temperature=0.1,
                max_tokens=2048,
                top_p=0.8,
            )

            generated_text = response.choices[0].message.content
            parsed = self._parse_refined_output(generated_text, raw_answer, raw_thinking, language)

            return {
                "success": True,
                "description": parsed["description"],
                "analysis_process": parsed["analysis_process"],
                "diagnosis_result": parsed["diagnosis_result"],
                "original_diagnosis": raw_answer,
                "raw_refined": generated_text,
            }
        except Exception as exc:
            print(f"DeepSeek API call failed: {exc}")
            error_msg = (
                "API call failed, cannot generate analysis"
                if language == "en"
                else "API调用失败,无法生成分析过程"
            )
            return {
                "success": False,
                "description": "",
                "analysis_process": raw_thinking or error_msg,
                "diagnosis_result": raw_answer,
                "original_diagnosis": raw_answer,
                "error": str(exc),
            }

    def _build_refine_prompt(
        self,
        raw_answer: str,
        raw_thinking: Optional[str] = None,
        language: str = "zh",
    ) -> str:
        thinking_text = raw_thinking if raw_thinking else "No analysis process available."
        if language == "en":
            return f"""You are a text organization expert. There are two texts that need to be organized. Text 1 is the thinking process of the SkinGPT model, and Text 2 is the diagnosis result given by SkinGPT.

【Requirements】
- Preserve the original tone and expression style
- Text 1 contains the thinking process, Text 2 contains the diagnosis result
- Extract the image observation part from the thinking process as Description. This should include all factual observations about what was seen in the image, not just a brief summary.
- For Diagnostic Reasoning: refine and condense the remaining thinking content. Remove redundancies, self-doubt, circular reasoning, and unnecessary repetition. Keep it concise and not too long. Keep the logical chain clear and enhance readability. IMPORTANT: DO NOT include any image description or visual observations in Diagnostic Reasoning. Only include reasoning, analysis, and diagnostic thought process.
- If [Text 1] content is NOT: No analysis process available. Then organize [Text 1] content accordingly, DO NOT confuse [Text 1] and [Text 2]
- If [Text 1] content IS: No analysis process available. Then extract the analysis process and description from [Text 2]
- DO NOT infer or add new medical information, DO NOT output any meta-commentary
- You may adjust unreasonable statements or remove redundant content to improve clarity

[Text 1]
{thinking_text}

[Text 2]
{raw_answer}

【Output】Only output three sections, do not output anything else:
## Description
(Extract all image observation content from the thinking process - include all factual descriptions of what was seen)

## Analysis Process
(Refined and condensed diagnostic reasoning: remove self-doubt, circular logic, and redundancies. Keep it concise and not too long. Keep logical flow clear. Do NOT include image observations)

## Diagnosis Result
(The organized diagnosis result from Text 2)
"""

        return f"""你是一个文本整理专家。有两段文本需要整理,文本1是SkinGPT模型的思考过程的文本,文本2是SkinGPT给出的诊断结果的文本。

【要求】
- 保留原文的语气和表达方式
- 文本1是思考过程,文本2是诊断结果
- 从思考过程中提取图像观察部分作为图像描述。需要包含所有关于图片中观察到的事实内容,不要简化或缩短。
- 对于分析过程:提炼并精简剩余的思考内容,去除冗余、自我怀疑、兜圈子的内容。保持简洁,不要太长。保持逻辑链条清晰,增强可读性。重要:分析过程中不要包含任何图像描述或视觉观察内容,只包含推理、分析和诊断思考过程。
- 如果【文本1】内容不是:No analysis process available.那么按要求整理【文本1】的内容,不要混淆【文本1】和【文本2】。
- 如果【文本1】内容是:No analysis process available.那么从【文本2】提炼分析过程和描述。
- 【文本1】和【文本2】需要翻译成简体中文
- 禁止推断或添加新的医学信息,禁止输出任何元评论
- 可以调整不合理的语句或去除冗余内容以提高清晰度

【文本1】
{thinking_text}

【文本2】
{raw_answer}

【输出】只输出三个部分,不要输出其他任何内容:
## 图像描述
(从思考过程中提取所有图像观察内容,包含所有关于图片的事实描述)

## 分析过程
(提炼并精简后的诊断推理:去除自我怀疑、兜圈逻辑和冗余内容。保持简洁,不要太长。保持逻辑流畅。不包含图像观察)

## 诊断结果
(整理后的诊断结果)
"""

    def _parse_refined_output(
        self,
        generated_text: str,
        raw_answer: str,
        raw_thinking: Optional[str] = None,
        language: str = "zh",
    ) -> dict:
        description = ""
        analysis_process = None
        diagnosis_result = None

        if language == "en":
            desc_match = re.search(
                r"##\s*Description\s*\n([\s\S]*?)(?=##\s*Analysis\s*Process|$)",
                generated_text,
                re.IGNORECASE,
            )
            analysis_match = re.search(
                r"##\s*Analysis\s*Process\s*\n([\s\S]*?)(?=##\s*Diagnosis\s*Result|$)",
                generated_text,
                re.IGNORECASE,
            )
            result_match = re.search(
                r"##\s*Diagnosis\s*Result\s*\n([\s\S]*?)$",
                generated_text,
                re.IGNORECASE,
            )
            desc_header = "## Description"
            analysis_header = "## Analysis Process"
            result_header = "## Diagnosis Result"
        else:
            desc_match = re.search(r"##\s*图像描述\s*\n([\s\S]*?)(?=##\s*分析过程|$)", generated_text)
            analysis_match = re.search(r"##\s*分析过程\s*\n([\s\S]*?)(?=##\s*诊断结果|$)", generated_text)
            result_match = re.search(r"##\s*诊断结果\s*\n([\s\S]*?)$", generated_text)
            desc_header = "## 图像描述"
            analysis_header = "## 分析过程"
            result_header = "## 诊断结果"

        if desc_match:
            description = desc_match.group(1).strip()
        else:
            description = ""

        if analysis_match:
            analysis_process = analysis_match.group(1).strip()
        else:
            result_pos = generated_text.find(result_header)
            if result_pos > 0:
                analysis_process = generated_text[:result_pos].strip()
                for header in [desc_header, analysis_header]:
                    analysis_process = re.sub(f"{re.escape(header)}\\s*\\n?", "", analysis_process).strip()
            else:
                analysis_process = generated_text[: len(generated_text) // 2].strip()
            if not analysis_process and raw_thinking:
                analysis_process = raw_thinking

        if result_match:
            diagnosis_result = result_match.group(1).strip()
        else:
            result_pos = generated_text.find(result_header)
            if result_pos > 0:
                diagnosis_result = generated_text[result_pos:].strip()
                diagnosis_result = re.sub(
                    f"^{re.escape(result_header)}\\s*\\n?",
                    "",
                    diagnosis_result,
                ).strip()
            else:
                diagnosis_result = generated_text[len(generated_text) // 2 :].strip()
            if not diagnosis_result:
                diagnosis_result = raw_answer

        return {
            "description": description,
            "analysis_process": analysis_process,
            "diagnosis_result": diagnosis_result,
        }


_deepseek_service: Optional[DeepSeekService] = None


async def get_deepseek_service(api_key: Optional[str] = None) -> Optional[DeepSeekService]:
    global _deepseek_service

    if _deepseek_service is None:
        try:
            _deepseek_service = DeepSeekService(api_key=api_key)
            await _deepseek_service.load()
            if not _deepseek_service.is_loaded:
                print("DeepSeek API service initialization failed, will use fallback mode")
                return _deepseek_service
        except Exception as exc:
            print(f"DeepSeek service initialization failed: {exc}")
            return None

    return _deepseek_service