Spaces:

Corin1998
/

HFResumeIntakeSystem

Runtime error

App Files Community

Corin1998 committed on Nov 23, 2025

Commit

2ad7640

verified ·

1 Parent(s): 44d16b3

Update pipelines/openai_ingest.py

Browse files

Files changed (1) hide show

pipelines/openai_ingest.py +4 -16

pipelines/openai_ingest.py CHANGED Viewed

@@ -14,7 +14,7 @@ _client = None
 def _client_lazy():
     global _client
     if _client is None:
-        key = os.environ.get("OPENAI_API_KEY") or os.environ.get("OPENAI_APIKEY")
         if not key:
             raise RuntimeError(
                 "OPENAI_API_KEY (または OPENAI_APIKEY) が未設定です。Spaces > Settings > Variables and secrets で追加してください。"
@@ -38,7 +38,6 @@ def extract_text_with_openai(payload: bytes, filename: str, filetype: str) -> st
     """画像/PDFは画像化してVisionに渡す。テキストは整形依頼してきれいな本文を返す。"""
     client = _client_lazy()
-    # 画像群を構築
     images: List[Image.Image] = []
     if filetype == "pdf":
         images = _pdf_to_images(payload)
@@ -81,9 +80,7 @@ def structure_with_openai(text: str) -> dict:
         " JSONキー: work_experience_raw, education_raw, certifications_raw, skills_list。"
         " skills_list は重複除去済み配列。work_experience_raw等は原文抜粋で良い。"
     )
-    user = (
-        "以下のテキストを解析し、指定のJSONキーで返してください。\n\n" + text
-    )
     resp = client.responses.create(
         model=MODEL_TEXT,
         input=[
@@ -105,9 +102,7 @@ def structure_with_openai(text: str) -> dict:
 def summarize_with_openai(text: str) -> dict:
     client = _client_lazy()
-    prompt = (
-        "以下の候補者レジュメ本文を、(1)300字、(2)100字、(3)1文 の3粒度で日本語要約してください。余計な記号は避け、事実を簡潔に。"
-    )
     resp = client.responses.create(
         model=MODEL_TEXT,
         input=[
@@ -116,15 +111,8 @@ def summarize_with_openai(text: str) -> dict:
         ],
     )
     full = resp.output_text
-    # 簡易パース（区切り語で抽出）。失敗時は同文を複写
-    def _slice(full_txt, marker, fallback):
-        import re
-        m = re.search(marker + r"[\s\S]*?\n", full_txt)
-        return (m.group(0).split("\n")[0] if m else fallback).strip()
     return {
-        "300chars": full[:300*2] if len(full) > 0 else "",
         "100chars": full[:120] if len(full) > 0 else "",
         "onesent": full.split("。")[0] + "。" if "。" in full else full,
     }

 def _client_lazy():
     global _client
     if _client is None:
+        key = os.environ.get("OPENAI_API_KEY") or os.environ.get("OPENAI_APIKEY")  # ← フォールバック追加
         if not key:
             raise RuntimeError(
                 "OPENAI_API_KEY (または OPENAI_APIKEY) が未設定です。Spaces > Settings > Variables and secrets で追加してください。"
     """画像/PDFは画像化してVisionに渡す。テキストは整形依頼してきれいな本文を返す。"""
     client = _client_lazy()
     images: List[Image.Image] = []
     if filetype == "pdf":
         images = _pdf_to_images(payload)
         " JSONキー: work_experience_raw, education_raw, certifications_raw, skills_list。"
         " skills_list は重複除去済み配列。work_experience_raw等は原文抜粋で良い。"
     )
+    user = "以下のテキストを解析し、指定のJSONキーで返してください。\n\n" + text
     resp = client.responses.create(
         model=MODEL_TEXT,
         input=[
 def summarize_with_openai(text: str) -> dict:
     client = _client_lazy()
+    prompt = "以下の候補者レジュメ本文を、(1)300字、(2)100字、(3)1文 の3粒度で日本語要約してください。余計な記号は避け、事実を簡潔に。"
     resp = client.responses.create(
         model=MODEL_TEXT,
         input=[
         ],
     )
     full = resp.output_text
     return {
+        "300chars": full[:600] if len(full) > 0 else "",
         "100chars": full[:120] if len(full) > 0 else "",
         "onesent": full.split("。")[0] + "。" if "。" in full else full,
     }