Spaces:

Slicelayers
/

live2d-image-test

Sleeping

App Files Files Community

Slicelayers committed on Oct 19, 2025

Commit

ca28d65

verified ·

1 Parent(s): c7396ab

Update app.py

Browse files

Files changed (1) hide show

app.py +62 -45

app.py CHANGED Viewed

@@ -9,7 +9,8 @@ import json
 import time
 import asyncio
 import os
-import cv2 # ★★★ 変更点1: OpenCVを追加
 # --- 定数とAPI設定 (Constants and API Configuration) ---
@@ -29,12 +30,14 @@ def pil_to_base64(img: Image.Image) -> str:
     img.save(buffered, format="PNG")
     return base64.b64encode(buffered.getvalue()).decode("utf-8")
 async def nano_banana_completion_api(base_image: Image.Image, prompt: str) -> Image.Image:
     """
-    Nano Banana (gemini-2.5-flash-image-preview) APIを呼び出し、画像補完をシミュレートします。
-    (この関数はモックのままです)
     """
     # Base64エンコード
     base64_image = pil_to_base64(base_image)
@@ -42,13 +45,17 @@ async def nano_banana_completion_api(base_image: Image.Image, prompt: str) -> Im
     payload = {
         "contents": [
             {
-                "text": f"画像を編集・補完してください。この画像はLive2D素材の一部です。マスクされた（透明な）領域にプロンプトに従った内容を生成し、画像を自然に完成させてください。プロンプト: {prompt}"
-            },
-            {
-                "inlineData": {
-                    "mimeType": "image/png",
-                    "data": base64_image
-                }
             }
         ],
         "generationConfig": {
@@ -58,40 +65,49 @@ async def nano_banana_completion_api(base_image: Image.Image, prompt: str) -> Im
     print(f"--- API呼び出しペイロードを構築しました。プロンプト: {prompt} ---")
-    # --- 実際のAPI呼び出しのシミュレーションと代替処理 ---
-    # APIキーが設定されている場合は、ここでhttpxなどを使った非同期APIコールを行う
-    # if API_KEY:
-    #     async with httpx.AsyncClient() as client:
-    #         response = await client.post(API_URL + API_KEY, json=payload, timeout=60)
-    #         # ... (レスポンス処理と画像デコード) ...
-    # else:
-    await asyncio.sleep(4) # 処理時間をシミュレート
-    # 補完処理が成功したと仮定し、モック画像を作成
-    completed_image = base_image.copy()
-    draw = ImageDraw.Draw(completed_image)
-    try:
-        # WindowsやLinux環境で一般的なフォントを指定
-        font_path = "/usr/share/fonts/truetype/dejavu/DejaVuSans-Bold.ttf" if os.path.exists("/usr/share/fonts/truetype/dejavu/DejaVuSans-Bold.ttf") else "arial.ttf"
-        font = ImageFont.truetype(font_path, 40)
-    except IOError:
-        font = ImageFont.load_default()
-    text = "AI補完済み (MOCK)"
-    text_color = (255, 0, 0, 200) # 半透明の赤
-    w, h = completed_image.size
-    # ImageDraw.textbbox を使用してテキストの境界ボックスを取得
-    text_bbox = draw.textbbox((0, 0), text, font=font)
-    tw, th = text_bbox[2] - text_bbox[0], text_bbox[3] - text_bbox[1]
-    draw.text(((w - tw) / 2, (h - th) / 2), text, font=font, fill=text_color)
-    print("--- AI補完処理をモック完了しました ---")
-    return completed_image
 # --- メイン処理ロジック (Main Processing Logic) ---
@@ -128,9 +144,10 @@ async def segment_and_inpaint(original_image: Image.Image, inpaint_prompt: str):
     )
     # 境界を滑らかにするためのぼかし処理 (アンチエイリアス/フェザー処理のシミュレーション)
-    hair_mask_np = cv2.GaussianBlur(hair_mask_np, (35, 35), 0)
-    # 2値化は行わず、ぼかし後のグレースケール値をそのまま透明度として使用 (よりリアルなフェザー)
     # NumPy配列からPIL Imageに変換
     hair_mask = Image.fromarray(hair_mask_np, mode='L') # Lモード（グレースケール）
@@ -221,8 +238,8 @@ with gr.Blocks(theme=theme, title="Live2D素材自動分割・補完アプリ")
         """
         <div style='text-align: center; margin-bottom: 20px; padding: 10px; background: #E0F7FA; border-radius: 12px;'>
             <h1 style='color: #00796B; font-size: 2.5em; font-weight: 700;'>🎨 Live2D 素材 自動分割・補完アプリ 🤖</h1>
-            <p style='color: #004D40; font-size: 1.1em;'>一枚絵をアップロードするだけで、AIによるパーツ分割と欠損部分の自動補完（Nano Banana API利用）をシミュレートします。</p>
-            <p style='color: #004D40; font-size: 1.0em;'>💡 **CV2 (OpenCV) を使用し、楕円形のぼかしたマスクでより自然なパーツ分割をシミュレートしています。**</p>
         </div>
         """
     )

 import time
 import asyncio
 import os
+import cv2
+import httpx # ★★★ 変更点: httpx を追加
 # --- 定数とAPI設定 (Constants and API Configuration) ---
     img.save(buffered, format="PNG")
     return base64.b64encode(buffered.getvalue()).decode("utf-8")
+# ★★★ 変更点: APIモックから実APIコールへ変更 ★★★
 async def nano_banana_completion_api(base_image: Image.Image, prompt: str) -> Image.Image:
     """
+    Nano Banana (gemini-2.5-flash-image-preview) APIを呼び出し、画像補完を実行します。
     """
+    if not API_KEY:
+        raise gr.Error("エラー: APIキーが設定されていません。Hugging Face Secretsで 'NANO_BANANA_API' を設定してください。")
     # Base64エンコード
     base64_image = pil_to_base64(base_image)
     payload = {
         "contents": [
             {
+                "parts": [
+                    {
+                        "text": f"画像を編集・補完してください。この画像はLive2D素材の一部です。マスクされた（透明な）領域にプロンプトに従った内容を生成し、画像を自然に完成させてください。プロンプト: {prompt}"
+                    },
+                    {
+                        "inlineData": {
+                            "mimeType": "image/png",
+                            "data": base64_image
+                        }
+                    }
+                ]
             }
         ],
         "generationConfig": {
     print(f"--- API呼び出しペイロードを構築しました。プロンプト: {prompt} ---")
+    # --- 実際のAPI呼び出しロジック (httpxを使用) ---
+    final_api_url = API_URL + API_KEY
+    # 指数バックオフ付きリトライロジック
+    max_retries = 3
+    delay = 1
+    for attempt in range(max_retries):
+        try:
+            async with httpx.AsyncClient(timeout=30.0) as client:
+                response = await client.post(final_api_url, json=payload)
+                response.raise_for_status()  # 200番台以外のステータスコードで例外を発生させる
+            result = response.json()
+            candidate = result.get('candidates', [{}])[0]
+            # Base64画像データの抽出
+            base64_data = None
+            for part in candidate.get('content', {}).get('parts', []):
+                if 'inlineData' in part and part['inlineData']['mimeType'].startswith('image/'):
+                    base64_data = part['inlineData']['data']
+                    break
+            if base64_data:
+                # Base64データをデコードしてPIL Imageに変換
+                image_data = base64.b64decode(base64_data)
+                completed_image = Image.open(io.BytesIO(image_data)).convert('RGBA')
+                print("--- AI補完処理を完了しました (実API) ---")
+                return completed_image
+            else:
+                raise ValueError("APIレスポンスから画像データが抽出できませんでした。")
+        except httpx.HTTPStatusError as e:
+            if e.response.status_code in [429, 503] and attempt < max_retries - 1:
+                print(f"APIレート制限/サーバーエラー (429/503)。{delay}秒待機後にリトライします...")
+                await asyncio.sleep(delay)
+                delay *= 2  # 指数バックオフ
+            else:
+                raise gr.Error(f"API呼び出しエラー: {e}")
+        except Exception as e:
+            raise gr.Error(f"予期せぬエラーが発生しました: {e}")
+    raise gr.Error("APIリクエストが最大リトライ回数を超えて失敗しました。")
 # --- メイン処理ロジック (Main Processing Logic) ---
     )
     # 境界を滑らかにするためのぼかし処理 (アンチエイリアス/フェザー処理のシミュレーション)
+    # ぼかしの強度を調整
+    kernel_size = min(W, H) // 30
+    kernel_size = kernel_size if kernel_size % 2 == 1 else kernel_size + 1 # カーネルサイズは奇数にする
+    hair_mask_np = cv2.GaussianBlur(hair_mask_np, (kernel_size, kernel_size), 0)
     # NumPy配列からPIL Imageに変換
     hair_mask = Image.fromarray(hair_mask_np, mode='L') # Lモード（グレースケール）
         """
         <div style='text-align: center; margin-bottom: 20px; padding: 10px; background: #E0F7FA; border-radius: 12px;'>
             <h1 style='color: #00796B; font-size: 2.5em; font-weight: 700;'>🎨 Live2D 素材 自動分割・補完アプリ 🤖</h1>
+            <p style='color: #004D40; font-size: 1.1em;'>一枚絵をアップロードするだけで、AIによるパーツ分割と欠損部分の自動補完（Nano Banana API利用）を**実稼働**させます。</p>
+            <p style='color: #004D40; font-size: 1.0em;'>💡 **注意:** AI補完機能を利用するには、Hugging Face Secretsに `NANO_BANANA_API` キーを設定する必要があります。</p>
         </div>
         """
     )