Spaces:

Corin1998
/

Score

Sleeping

App Files Files Community

Corin1998 committed on Aug 28, 2025

Commit

83f8482

verified ·

1 Parent(s): e582bdf

Update core/extract.py

Browse files

Files changed (1) hide show

core/extract.py +17 -9

core/extract.py CHANGED Viewed

@@ -2,7 +2,6 @@ from __future__ import annotations
 import json
 from typing import Any, Dict, List, Optional
 from .openai_client import get_client, VISION_MODEL, TEXT_MODEL
-from .pdf_io import b64
 SYSTEM_JSON = """あなたは有能な財務アナリストです。
 与えられた決算書（画像またはテキスト）から、次の厳密な JSON 構造のみを日本語の単位なし・半角数値で返してください。分からない項目は null。
@@ -27,19 +26,28 @@ SYSTEM_JSON = """あなたは有能な財務アナリストです。
 def extract_financials(images: Optional[List[bytes]], text_blob: Optional[str], company_hint: str="") -> Dict[str, Any]:
     client = get_client()
-    if images and len(images) > 0:
         content = [{"type": "text", "text": SYSTEM_JSON}]
         if company_hint:
             content.append({"type": "text", "text": f"会社名の候補: {company_hint}"})
         for im in images:
-            content.append({"type": "input_image", "image_url": f"data:image/png;base64,{b64(im)}"})
         resp = client.chat.completions.create(
             model=VISION_MODEL,
             messages=[
-                {"role": "system", "content": "返答は必ず有効な JSON オブジェクトのみ。説明は不要。"},
-                {"role": "user", "content": content},
             ],
-            response_format={"type": "json_object"},
             temperature=0.1,
         )
         return json.loads(resp.choices[0].message.content)
@@ -48,10 +56,10 @@ def extract_financials(images: Optional[List[bytes]], text_blob: Optional[str],
         resp = client.chat.completions.create(
             model=TEXT_MODEL,
             messages=[
-                {"role": "system", "content": "返答は必ず有効な JSON オブジェクトのみ。説明は不要。"},
-                {"role": "user", "content": prompt},
             ],
-            response_format={"type": "json_object"},
             temperature=0.1,
         )
         return json.loads(resp.choices[0].message.content)

 import json
 from typing import Any, Dict, List, Optional
 from .openai_client import get_client, VISION_MODEL, TEXT_MODEL
 SYSTEM_JSON = """あなたは有能な財務アナリストです。
 与えられた決算書（画像またはテキスト）から、次の厳密な JSON 構造のみを日本語の単位なし・半角数値で返してください。分からない項目は null。
 def extract_financials(images: Optional[List[bytes]], text_blob: Optional[str], company_hint: str="") -> Dict[str, Any]:
     client = get_client()
+    if images:
         content = [{"type": "text", "text": SYSTEM_JSON}]
         if company_hint:
             content.append({"type": "text", "text": f"会社名の候補: {company_hint}"})
         for im in images:
+            content.append({"type": "input_image", "image_url": f"data:image/png;base64,{im.decode('latin1') if isinstance(im, str) else 'data'}"})
+        # 上のデータ URI 生成は UI 側で行うためここでは未使用
+        # （UIでdata:image/png;base64,xxxを組む実装に合わせる場合は差し替え）
+        pass
+    # 実運用では UI 側で Vision を呼ぶ形にせず、ここで共通化
+    if images:
+        content = [{"type":"text","text":SYSTEM_JSON}]
+        for im in images:
+            import base64
+            content.append({"type":"input_image","image_url":f"data:image/png;base64,{base64.b64encode(im).decode('utf-8')}"})
         resp = client.chat.completions.create(
             model=VISION_MODEL,
             messages=[
+                {"role":"system","content":"返答は必ず有効な JSON オブジェクトのみ。説明は不要。"},
+                {"role":"user","content":content},
             ],
+            response_format={"type":"json_object"},
             temperature=0.1,
         )
         return json.loads(resp.choices[0].message.content)
         resp = client.chat.completions.create(
             model=TEXT_MODEL,
             messages=[
+                {"role":"system","content":"返答は必ず有効な JSON オブジェクトのみ。説明は不要。"},
+                {"role":"user","content":prompt},
             ],
+            response_format={"type":"json_object"},
             temperature=0.1,
         )
         return json.loads(resp.choices[0].message.content)