PoseMaker

Running

App Files Files Community

aiqtech committed on Aug 31, 2025

Commit

94ded05

verified ·

1 Parent(s): 8d84d68

Update app.py

Browse files

Files changed (1) hide show

app.py +533 -205

app.py CHANGED Viewed

@@ -1,205 +1,533 @@
-import gradio as gr
-import numpy as np
-import cv2
-from fastapi import FastAPI, Request, Response
-from src.body import Body
-import json as js
-body_estimation = Body('model/body_pose_model.pth')
-def pil2cv(image):
-    ''' PIL型 -> OpenCV型 '''
-    new_image = np.array(image, dtype=np.uint8)
-    if new_image.ndim == 2:  # モノクロ
-        pass
-    elif new_image.shape[2] == 3:  # カラー
-        new_image = cv2.cvtColor(new_image, cv2.COLOR_RGB2BGR)
-    elif new_image.shape[2] == 4:  # 透過
-        new_image = cv2.cvtColor(new_image, cv2.COLOR_RGBA2BGRA)
-    return new_image
-with open("static/poseEditor.js", "r") as f:
-    file_contents = f.read()
-app = FastAPI()
-@app.middleware("http")
-async def some_fastapi_middleware(request: Request, call_next):
-    path = request.scope['path']  # get the request route
-    response = await call_next(request)
-    if path == "/":
-        response_body = ""
-        async for chunk in response.body_iterator:
-            response_body += chunk.decode()
-        some_javascript = f"""
-        <script type="text/javascript" defer>
-{file_contents}
-        </script>
-        """
-        response_body = response_body.replace("</body>", some_javascript + "</body>")
-        del response.headers["content-length"]
-        return Response(
-            content=response_body,
-            status_code=response.status_code,
-            headers=dict(response.headers),
-            media_type=response.media_type
-        )
-    return response
-# make cndidate to json
-def candidate_to_json_string(arr):
-    a = [f'[{x:.2f}, {y:.2f}]' for x, y, *_ in arr]
-    return '[' + ', '.join(a) + ']'
-# make subset to json
-def subset_to_json_string(arr):
-    arr_str = ','.join(['[' + ','.join([f'{num:.2f}' for num in row]) + ']' for row in arr])
-    return '[' + arr_str + ']'
-def estimate_body(source):
-    if source == None:
-      return None
-    candidate, subset = body_estimation(pil2cv(source))
-    return "{ \"candidate\": " + candidate_to_json_string(candidate) + ", \"subset\": " + subset_to_json_string(subset) + " }"
-def image_changed(image):
-  if image == None:
-    return "estimation", {}
-  if 'openpose' in image.info:
-    print("pose found")
-    jsonText = image.info['openpose']
-    jsonObj = js.loads(jsonText)
-    subset = jsonObj['subset']
-    return f"""{image.width}px x {image.height}px, {len(subset)} indivisual(s)""", jsonText
-  else:
-    print("pose not found")
-    candidate, subset = body_estimation(pil2cv(image))
-    jsonText = "{ \"candidate\": " + candidate_to_json_string(candidate) + ", \"subset\": " + subset_to_json_string(subset) + " }"
-    return f"""{image.width}px x {image.height}px, {subset.shape[0]} indivisual(s)""", jsonText
-html_text = f"""
-    <canvas id="canvas" width="512" height="512"></canvas>
-    <script type="text/javascript" defer>{file_contents}</script>
-    """
-with gr.Blocks(css="""button { min-width: 80px; }""") as demo:
-  gr.Markdown(f"""
-## This project is no longer being updated. Please use [PoseMaker2](https://huggingface.co/spaces/jonigata/PoseMaker2) instead.
-### (That project uses MMPose for pose estimation.)
-""")
-  with gr.Row():
-    with gr.Column(scale=1):
-      width = gr.Slider(label="Width", minimum=512, maximum=1024, step=64, value=512, interactive=True)
-      height = gr.Slider(label="Height", minimum=512, maximum=1024, step=64, value=512, interactive=True)
-      with gr.Accordion(label="Pose estimation", open=False):
-        source = gr.Image(type="pil")
-        estimationResult = gr.Markdown("""estimation""")
-        with gr.Row():
-          with gr.Column(min_width=80):
-            applySizeBtn = gr.Button(value="Apply size")
-          with gr.Column(min_width=80):
-            replaceBtn = gr.Button(value="Replace")
-          with gr.Column(min_width=80):
-            importBtn = gr.Button(value="Import")
-      with gr.Accordion(label="Json", open=False):
-        with gr.Row():
-          with gr.Column(min_width=80):
-            replaceWithJsonBtn = gr.Button(value="Replace")
-          with gr.Column(min_width=80):
-            importJsonBtn = gr.Button(value="Import")
-        gr.Markdown("""
-| inout            | how to                                                                               |
-| -----------------| ----------------------------------------------------------------------------------------- |
-| Import | Paste json to "Json source" and click "Read", edit the width/height, then click "Replace" or "Import". |
-| Export | click "Save" and "Copy to clipboard" of "Json" section.                                             |
-""")
-        json = gr.JSON(label="Json")
-        jsonSource = gr.Textbox(label="Json source", lines=10)
-      with gr.Accordion(label="Notes", open=False):
-        gr.Markdown("""
-#### How to bring pose to ControlNet
-1. Press **Save** button
-2. **Drag** the file placed at the bottom left corder of browser
-3. **Drop** the file into ControlNet
-#### Points to note for pseudo-3D rotation
-When performing pseudo-3D rotation on the X and Y axes, the projection is converted to 2D and Z-axis information is lost when the mouse button is released. This means that if you finish dragging while the shape is collapsed, you may not be able to restore it to its original state. In such a case, please use the "undo" function.
-#### Reuse pose image
-Pose image generated by this tool has pose data in the image itself. You can reuse pose information by loading it as the image source instead of a regular image.
-""")
-    with gr.Column(scale=2):
-      html = gr.HTML(html_text)
-      with gr.Row():
-        with gr.Column(scale=1, min_width=60):
-          saveBtn = gr.Button(value="Save")
-        with gr.Column(scale=7):
-          gr.Markdown("""
-- "ctrl + drag" to **scale**
-- "alt + drag" to **move**
-- "shift + drag" to **rotate** (move right first, release shift, then up or down)
-- "space + drag" to **range-move**
-- "[", "]" or "Alt + wheel" or "Space + wheel" to shrink or expand **range**
-- "ctrl + Z", "shift + ctrl + Z" to **undo**, **redo**
-- "ctrl + E" **add** new person
-- "D + click" to **delete** person
-- "Q + click" to **cut off** limb
-- "X + drag" to **x-axis** pseudo-3D rotation
-- "C + drag" to **y-axis** pseudo-3D rotation
-- "R + click" to **repair**
-When using Q, X, C, R, pressing and dont release until the operation is complete.
-[Contact us for feature requests or bug reports (anonymous)](https://t.co/UC3jJOJJtS)
-""")
-  width.change(fn=None, inputs=[width], _js="(w) => { resizeCanvas(w,null); }")
-  height.change(fn=None, inputs=[height], _js="(h) => { resizeCanvas(null,h); }")
-  source.change(
-    fn = image_changed,
-    inputs = [source],
-    outputs = [estimationResult, json])
-  applySizeBtn.click(
-    fn = lambda x: (x.width, x.height),
-    inputs = [source],
-    outputs = [width, height])
-  replaceBtn.click(
-    fn = None,
-    inputs = [json],
-    outputs = [],
-    _js="(json) => { initializeEditor(); importPose(json); return []; }")
-  importBtn.click(
-    fn = None,
-    inputs = [json],
-    outputs = [],
-    _js="(json) => { importPose(json); return []; }")
-  saveBtn.click(
-    fn = None,
-    inputs = [], outputs = [json],
-    _js="() => { return [savePose()]; }")
-  jsonSource.change(
-    fn = lambda x: x,
-    inputs = [jsonSource], outputs = [json])
-  replaceWithJsonBtn.click(
-    fn = None,
-    inputs = [json],
-    outputs = [],
-    _js="(json) => { initializeEditor(); importPose(json); return []; }")
-  importJsonBtn.click(
-    fn = None,
-    inputs = [json],
-    outputs = [],
-    _js="(json) => { importPose(json); return []; }")
-  demo.load(fn=None, inputs=[], outputs=[], _js="() => { initializeEditor(); importPose(); return []; }")
-gr.mount_gradio_app(app, demo, path="/")

+import gradio as gr
+import numpy as np
+import cv2
+from fastapi import FastAPI, Request, Response
+from src.body import Body
+import json as js
+import requests
+import os
+from typing import Dict, List, Tuple
+import asyncio
+import aiohttp
+# Initialize body estimation model
+# Built once at import time; estimate_body and image_changed both call it.
+body_estimation = Body('model/body_pose_model.pth')
+# Fireworks AI configuration
+# The literal "YOUR_API_KEY_HERE" doubles as the "not configured" sentinel that
+# later code compares against before contacting the LLM.
+FIREWORKS_API_KEY = os.getenv("FIREWORKS_API_KEY", "YOUR_API_KEY_HERE")
+FIREWORKS_API_URL = "https://api.fireworks.ai/inference/v1/chat/completions"
+# OpenPose keypoint definitions
+# Maps each body-part name to its keypoint index (0-17).
+BODY_PARTS = {
+    "Nose": 0, "Neck": 1, "RShoulder": 2, "RElbow": 3, "RWrist": 4,
+    "LShoulder": 5, "LElbow": 6, "LWrist": 7, "RHip": 8, "RKnee": 9,
+    "RAnkle": 10, "LHip": 11, "LKnee": 12, "LAnkle": 13, "REye": 14,
+    "LEye": 15, "REar": 16, "LEar": 17
+}
+# Pose templates for common positions
+# Keyed by pose name; each entry maps a BODY_PARTS name to an [x, y] position.
+# Only Neck, arms and legs are listed: Nose, eyes and ears have no entry here.
+# NOTE(review): coordinates appear to target the default 512x512 canvas - confirm.
+POSE_TEMPLATES = {
+    "standing": {
+        "keypoints": {
+            "Neck": [256, 120],
+            "RShoulder": [220, 140], "RElbow": [200, 200], "RWrist": [190, 260],
+            "LShoulder": [292, 140], "LElbow": [312, 200], "LWrist": [322, 260],
+            "RHip": [230, 280], "RKnee": [225, 380], "RAnkle": [220, 480],
+            "LHip": [282, 280], "LKnee": [287, 380], "LAnkle": [292, 480]
+        }
+    },
+    "sitting": {
+        "keypoints": {
+            "Neck": [256, 180],
+            "RShoulder": [220, 200], "RElbow": [200, 260], "RWrist": [190, 320],
+            "LShoulder": [292, 200], "LElbow": [312, 260], "LWrist": [322, 320],
+            "RHip": [230, 340], "RKnee": [225, 400], "RAnkle": [280, 420],
+            "LHip": [282, 340], "LKnee": [287, 400], "LAnkle": [232, 420]
+        }
+    },
+    "running": {
+        "keypoints": {
+            "Neck": [256, 120],
+            "RShoulder": [220, 140], "RElbow": [180, 180], "RWrist": [150, 220],
+            "LShoulder": [292, 140], "LElbow": [332, 180], "LWrist": [362, 140],
+            "RHip": [230, 280], "RKnee": [260, 380], "RAnkle": [290, 470],
+            "LHip": [282, 280], "LKnee": [252, 360], "LAnkle": [222, 440]
+        }
+    }
+}
+def pil2cv(image):
+    """Convert a PIL image into an OpenCV-style uint8 array.
+    Two-dimensional (monochrome) data is returned as converted, three-channel
+    data is reordered RGB -> BGR and four-channel data RGBA -> BGRA.
+    """
+    pixels = np.array(image, dtype=np.uint8)
+    if pixels.ndim != 2:
+        channel_count = pixels.shape[2]
+        if channel_count == 3:  # colour
+            pixels = cv2.cvtColor(pixels, cv2.COLOR_RGB2BGR)
+        elif channel_count == 4:  # colour with transparency
+            pixels = cv2.cvtColor(pixels, cv2.COLOR_RGBA2BGRA)
+    return pixels
+# Upper bound, in seconds, for one complete LLM request.
+_LLM_REQUEST_TIMEOUT_SECONDS = 60
+def _extract_pose_json(content: str):
+    """Parse the pose object embedded in an LLM reply.
+    The span from the first "{" to the last "}" is decoded as JSON.
+    Returns:
+        The decoded dict when it has list-valued "candidate" and "subset"
+        entries, otherwise None.
+    """
+    import re
+    json_match = re.search(r'\{.*\}', content, re.DOTALL)
+    if json_match is None:
+        return None
+    try:
+        pose_data = js.loads(json_match.group())
+    except ValueError:
+        # Covers json.JSONDecodeError: the reply contained braces but not JSON.
+        return None
+    if not isinstance(pose_data, dict):
+        return None
+    if not isinstance(pose_data.get("candidate"), list):
+        return None
+    if not isinstance(pose_data.get("subset"), list):
+        return None
+    return pose_data
+async def generate_pose_from_llm(prompt: str) -> Dict:
+    """Generate pose data from a text prompt using the LLM.
+    Best-effort: on an HTTP error, a timeout, or a reply without usable pose
+    JSON, the problem is logged and generate_template_pose(prompt) is returned.
+    Args:
+        prompt: Natural-language description of the desired pose.
+    Returns:
+        A dict with "candidate" and "subset" entries.
+    """
+    system_prompt = """You are an expert in human pose generation. Given a description, generate precise OpenPose keypoint coordinates.
+    Rules:
+    1. Canvas size is 512x512 pixels
+    2. Return JSON with 18 keypoints (0-17)
+    3. Each keypoint has [x, y, confidence] where confidence is always 1.0
+    4. Maintain anatomically correct proportions
+    5. Center the pose in the canvas
+    Keypoint indices:
+    0: Nose, 1: Neck, 2: Right Shoulder, 3: Right Elbow, 4: Right Wrist,
+    5: Left Shoulder, 6: Left Elbow, 7: Left Wrist, 8: Right Hip, 9: Right Knee,
+    10: Right Ankle, 11: Left Hip, 12: Left Knee, 13: Left Ankle, 14: Right Eye,
+    15: Left Eye, 16: Right Ear, 17: Left Ear
+    Return ONLY valid JSON in this format:
+    {
+        "candidate": [[x, y, confidence], ...],
+        "subset": [[indices of connected keypoints, score, number of keypoints]]
+    }"""
+    headers = {
+        "Accept": "application/json",
+        "Content-Type": "application/json",
+        "Authorization": f"Bearer {FIREWORKS_API_KEY}"
+    }
+    payload = {
+        "model": "accounts/fireworks/models/qwen3-235b-a22b-instruct-2507",
+        "max_tokens": 2048,
+        "temperature": 0.3,
+        "messages": [
+            {"role": "system", "content": system_prompt},
+            {"role": "user", "content": f"Generate OpenPose keypoints for: {prompt}"}
+        ]
+    }
+    try:
+        # Explicit bound so a stalled request falls back to the template promptly.
+        timeout = aiohttp.ClientTimeout(total=_LLM_REQUEST_TIMEOUT_SECONDS)
+        async with aiohttp.ClientSession(timeout=timeout) as session:
+            async with session.post(FIREWORKS_API_URL, headers=headers, json=payload) as response:
+                if response.status != 200:
+                    print(f"LLM Error: HTTP {response.status}")
+                    return generate_template_pose(prompt)
+                data = await response.json()
+        content = data['choices'][0]['message']['content']
+        pose_data = _extract_pose_json(content)
+        if pose_data is not None:
+            return pose_data
+        print("LLM Error: reply did not contain usable pose JSON")
+    except Exception as e:
+        # Deliberate best-effort boundary: every failure falls back to a template.
+        print(f"LLM Error: {e}")
+    return generate_template_pose(prompt)
+def generate_template_pose(prompt: str) -> Dict:
+    """Build a pose from a built-in template (fallback when the LLM is unavailable).
+    The prompt is lower-cased and searched for sitting/running keywords; any
+    other prompt gets the standing template.
+    Args:
+        prompt: Natural-language description of the desired pose.
+    Returns:
+        A dict with
+        "candidate": 18 rows of [x, y, confidence], one per keypoint index, and
+        "subset": one row of 20 values - for each keypoint its candidate index,
+        or -1 when the template has no position for it, followed by the score
+        and the number of keypoints present.
+    """
+    prompt_lower = prompt.lower()
+    # Detect pose type from prompt
+    if any(word in prompt_lower for word in ["sit", "sitting", "seated", "chair"]):
+        template = POSE_TEMPLATES["sitting"]
+    elif any(word in prompt_lower for word in ["run", "running", "jog", "sprint"]):
+        template = POSE_TEMPLATES["running"]
+    else:
+        template = POSE_TEMPLATES["standing"]
+    keypoints = template["keypoints"]
+    # Invert the name -> index table once instead of scanning it per keypoint.
+    part_names = {index: name for name, index in BODY_PARTS.items()}
+    nose_index = BODY_PARTS["Nose"]
+    # Convert template to OpenPose format
+    candidate = []
+    for i in range(18):
+        part_name = part_names.get(i)
+        if part_name in keypoints:
+            x, y = keypoints[part_name]
+            candidate.append([x, y, 1.0])
+        elif i == nose_index and "Neck" in keypoints:
+            # Templates carry no nose; place it 20px above the neck so the head
+            # follows the torso (same result as the old fixed [256, 100] for the
+            # standing and running templates, and a sane one for sitting).
+            neck_x, neck_y = keypoints["Neck"]
+            candidate.append([neck_x, neck_y - 20, 1.0])
+        else:
+            # Placeholder row with zero confidence; subset marks it as missing.
+            candidate.append([256, 256, 0.0])
+    # Create subset (connection information): keep one slot per keypoint so the
+    # positions stay aligned with the keypoint indices, using -1 for missing ones.
+    indices = [i if row[2] > 0 else -1 for i, row in enumerate(candidate)]
+    present_count = sum(1 for index in indices if index >= 0)
+    subset = [indices + [float(present_count), present_count]]
+    return {"candidate": candidate, "subset": subset}
+def refine_pose_with_llm(current_pose: Dict, refinement_prompt: str) -> Dict:
+    """Ask the LLM to adjust an existing pose according to text instructions.
+    Best-effort: any failure (API key not configured, HTTP error, timeout,
+    unparsable reply) is logged and the unmodified ``current_pose`` object is
+    returned.
+    Args:
+        current_pose: Pose data to refine; it is JSON-serialized into the request.
+        refinement_prompt: Natural-language description of the adjustment.
+    Returns:
+        The pose parsed from the LLM reply, or ``current_pose`` itself on failure.
+    """
+    import re
+    if FIREWORKS_API_KEY == "YOUR_API_KEY_HERE":
+        # Same "not configured" sentinel the generation path checks; do not send
+        # a request that can only be rejected.
+        print("Refinement error: LLM API key not configured")
+        return current_pose
+    system_prompt = """You are an expert in pose refinement. Given current pose data and adjustment instructions,
+    modify the keypoints precisely while maintaining anatomical correctness.
+    Return the modified pose in the same JSON format."""
+    headers = {
+        "Accept": "application/json",
+        "Content-Type": "application/json",
+        "Authorization": f"Bearer {FIREWORKS_API_KEY}"
+    }
+    payload = {
+        "model": "accounts/fireworks/models/qwen3-235b-a22b-instruct-2507",
+        "max_tokens": 2048,
+        "temperature": 0.2,
+        "messages": [
+            {"role": "system", "content": system_prompt},
+            {"role": "user", "content": f"Current pose: {js.dumps(current_pose)}\nAdjustment needed: {refinement_prompt}"}
+        ]
+    }
+    try:
+        # requests waits forever unless told otherwise; bound the wait so a
+        # stalled connection cannot hang the caller.
+        response = requests.post(FIREWORKS_API_URL, headers=headers, json=payload, timeout=60)
+        if response.status_code != 200:
+            print(f"Refinement error: HTTP {response.status_code}")
+            return current_pose
+        data = response.json()
+        content = data['choices'][0]['message']['content']
+        json_match = re.search(r'\{.*\}', content, re.DOTALL)
+        if json_match:
+            return js.loads(json_match.group())
+        print("Refinement error: reply did not contain a pose object")
+    except Exception as e:
+        # Deliberate best-effort boundary: keep the current pose on any failure.
+        print(f"Refinement error: {e}")
+    return current_pose
+# FastAPI setup
+# Read the pose-editor script once at import time; it is embedded into the page
+# further down. The encoding is explicit so the result does not depend on the
+# host's locale.
+with open("static/poseEditor.js", "r", encoding="utf-8") as f:
+    file_contents = f.read()
+app = FastAPI()
+@app.middleware("http")
+async def some_fastapi_middleware(request: Request, call_next):
+    """Inject the pose-editor script into the page served at "/".
+    Responses for every other path are passed through untouched. For "/", the
+    body is read in full, a <script> element holding ``file_contents`` is
+    inserted before each "</body>", and a new Response is returned.
+    Args:
+        request: Incoming request; only its scope path is inspected.
+        call_next: Callable that produces the downstream response.
+    Returns:
+        The downstream response, or a rebuilt Response for the root path.
+    """
+    path = request.scope['path']
+    response = await call_next(request)
+    if path == "/":
+        # Join the raw chunks and decode once: a multi-byte character may be
+        # split across two chunks, which per-chunk decoding cannot handle.
+        body_chunks = [chunk async for chunk in response.body_iterator]
+        response_body = b"".join(body_chunks).decode()
+        some_javascript = f"""
+        <script type="text/javascript" defer>
+{file_contents}
+        </script>
+        """
+        response_body = response_body.replace("</body>", some_javascript + "</body>")
+        # The body length changed, so the old header would be wrong.
+        del response.headers["content-length"]
+        return Response(
+            content=response_body,
+            status_code=response.status_code,
+            headers=dict(response.headers),
+            media_type=response.media_type
+        )
+    return response
+def candidate_to_json_string(arr):
+    """Serialize candidate rows as a JSON array of [x, y] pairs.
+    Only the first two values of each row are written, with two decimals;
+    anything after them is dropped.
+    """
+    pairs = []
+    for x, y, *_ in arr:
+        pairs.append(f'[{x:.2f}, {y:.2f}]')
+    return "[%s]" % ', '.join(pairs)
+def subset_to_json_string(arr):
+    """Serialize subset rows as a JSON array of arrays with two-decimal numbers."""
+    rows = []
+    for row in arr:
+        cells = ','.join(format(num, '.2f') for num in row)
+        rows.append(f'[{cells}]')
+    return "[%s]" % ','.join(rows)
+def estimate_body(source):
+    """Run body estimation on an image and return the pose as JSON text.
+    Args:
+        source: Image to analyse, or None.
+    Returns:
+        None when ``source`` is None, otherwise a JSON string with "candidate"
+        and "subset" entries.
+    """
+    # Identity test: "== None" would dispatch to the image type's own __eq__.
+    if source is None:
+        return None
+    candidate, subset = body_estimation(pil2cv(source))
+    return "{ \"candidate\": " + candidate_to_json_string(candidate) + ", \"subset\": " + subset_to_json_string(subset) + " }"
+def image_changed(image):
+    """Produce the status text and pose JSON for a newly selected source image.
+    A pose stored in the image's ``info["openpose"]`` entry is reused as-is when
+    it parses; otherwise the pose is estimated from the pixels.
+    Args:
+        image: Image with ``info``, ``width`` and ``height`` attributes, or None.
+    Returns:
+        A (status text, pose JSON) pair; ("estimation", {}) when ``image`` is None.
+    """
+    if image is None:
+        return "estimation", {}
+    if 'openpose' in image.info:
+        jsonText = image.info['openpose']
+        try:
+            person_count = len(js.loads(jsonText)['subset'])
+        except (ValueError, KeyError, TypeError):
+            # Metadata comes from an uploaded file and may be damaged; fall
+            # through to estimation instead of failing the handler.
+            print("pose metadata is malformed")
+        else:
+            print("pose found")
+            return f"""{image.width}px x {image.height}px, {person_count} individual(s)""", jsonText
+    print("pose not found")
+    candidate, subset = body_estimation(pil2cv(image))
+    jsonText = "{ \"candidate\": " + candidate_to_json_string(candidate) + ", \"subset\": " + subset_to_json_string(subset) + " }"
+    return f"""{image.width}px x {image.height}px, {subset.shape[0]} individual(s)""", jsonText
+def _pose_to_editor_json(pose_data) -> str:
+    """Format a pose dict as the JSON text the pose editor imports.
+    List values go through the two-decimal formatters; anything else is dumped
+    as plain JSON. Raises KeyError, TypeError or ValueError when the data does
+    not have the expected shape.
+    """
+    if isinstance(pose_data['candidate'], list):
+        candidate_str = candidate_to_json_string(pose_data['candidate'])
+    else:
+        candidate_str = js.dumps(pose_data['candidate'])
+    if isinstance(pose_data['subset'], list):
+        subset_str = subset_to_json_string(pose_data['subset'])
+    else:
+        subset_str = js.dumps(pose_data['subset'])
+    return "{ \"candidate\": " + candidate_str + ", \"subset\": " + subset_str + " }"
+async def generate_pose_from_text(prompt: str, use_llm: bool = True):
+    """Generate a pose from a text prompt.
+    The LLM is used only when ``use_llm`` is true and an API key is configured.
+    If its answer cannot be formatted (missing keys, non-numeric rows), the
+    built-in template is used instead of raising.
+    Args:
+        prompt: Natural-language description of the desired pose.
+        use_llm: Whether to try the LLM before the templates.
+    Returns:
+        JSON text with "candidate" and "subset" entries for the pose editor.
+    """
+    if use_llm and FIREWORKS_API_KEY != "YOUR_API_KEY_HERE":
+        pose_data = await generate_pose_from_llm(prompt)
+        try:
+            return _pose_to_editor_json(pose_data)
+        except (KeyError, TypeError, ValueError) as e:
+            # The LLM reply parsed as JSON but is not a usable pose.
+            print(f"LLM Error: unusable pose data ({e})")
+    return _pose_to_editor_json(generate_template_pose(prompt))
+# Markup for the editor pane: a 512x512 canvas followed by an inline copy of
+# the script text held in file_contents.
+html_text = f"""
+    <canvas id="canvas" width="512" height="512"></canvas>
+    <script type="text/javascript" defer>{file_contents}</script>
+    """
+# Gradio interface
+# Layout: the left column holds the size sliders and four accordions (AI
+# generation, image-based estimation, raw JSON, notes); the right column holds
+# the editor canvas, the Save button and the status line.
+with gr.Blocks(css="""
+    button { min-width: 80px; }
+    .prompt-box { border: 2px solid #667eea; border-radius: 8px; padding: 10px; }
+    .llm-status { color: #667eea; font-weight: bold; }
+    """) as demo:
+    gr.Markdown("""
+    # 🎨 AI-Powered Pose Generator with LLM
+    ### Generate precise line art poses from text descriptions using advanced AI
+    """)
+    with gr.Row():
+        with gr.Column(scale=1):
+            # Canvas size controls.
+            width = gr.Slider(label="Width", minimum=512, maximum=1024, step=64, value=512, interactive=True)
+            height = gr.Slider(label="Height", minimum=512, maximum=1024, step=64, value=512, interactive=True)
+            # LLM Pose Generation Section
+            with gr.Accordion(label="🤖 AI Pose Generation", open=True):
+                prompt_input = gr.Textbox(
+                    label="Describe the pose",
+                    placeholder="e.g., 'A person sitting cross-legged in meditation pose' or 'Someone running with arms pumping'",
+                    lines=3,
+                    elem_classes=["prompt-box"]
+                )
+                with gr.Row():
+                    use_llm_checkbox = gr.Checkbox(label="Use Advanced LLM", value=True)
+                    llm_status = gr.Markdown("", elem_classes=["llm-status"])
+                with gr.Row():
+                    generate_btn = gr.Button("🎯 Generate Pose", variant="primary")
+                    refine_btn = gr.Button("✨ Refine Current", variant="secondary")
+                # Created hidden; the "Refine Current" button makes it visible.
+                refinement_prompt = gr.Textbox(
+                    label="Refinement instructions",
+                    placeholder="e.g., 'Raise the left arm higher' or 'Bend the knees more'",
+                    lines=2,
+                    visible=False
+                )
+                gr.Examples(
+                    examples=[
+                        "A person standing with arms raised in victory",
+                        "Someone sitting at a desk typing on a keyboard",
+                        "A dancer in arabesque position with one leg extended",
+                        "A person doing a yoga warrior pose",
+                        "Someone crouching in a ready position",
+                        "A person walking casually with relaxed posture"
+                    ],
+                    inputs=prompt_input
+                )
+            with gr.Accordion(label="📸 Pose Estimation from Image", open=False):
+                source = gr.Image(type="pil")
+                estimationResult = gr.Markdown("""estimation""")
+                with gr.Row():
+                    with gr.Column(min_width=80):
+                        applySizeBtn = gr.Button(value="Apply size")
+                    with gr.Column(min_width=80):
+                        replaceBtn = gr.Button(value="Replace")
+                    with gr.Column(min_width=80):
+                        importBtn = gr.Button(value="Import")
+            with gr.Accordion(label="📋 Json Data", open=False):
+                with gr.Row():
+                    with gr.Column(min_width=80):
+                        replaceWithJsonBtn = gr.Button(value="Replace")
+                    with gr.Column(min_width=80):
+                        importJsonBtn = gr.Button(value="Import")
+                gr.Markdown("""
+                | Action   | Instructions |
+                |----------|-------------|
+                | Import   | Paste JSON and click "Replace" or "Import" |
+                | Export   | Click "Save" to get pose data |
+                """)
+                # "json" holds the pose exchanged with the editor; text entered in
+                # "jsonSource" is copied into it by the change handler below.
+                json = gr.JSON(label="Json")
+                jsonSource = gr.Textbox(label="Json source", lines=10)
+            with gr.Accordion(label="📝 Notes & Controls", open=False):
+                gr.Markdown("""
+                #### Keyboard Controls
+                - **Ctrl + Drag**: Scale
+                - **Alt + Drag**: Move
+                - **Shift + Drag**: Rotate
+                - **Space + Drag**: Range move
+                - **Ctrl + Z/Shift + Ctrl + Z**: Undo/Redo
+                - **Ctrl + E**: Add person
+                - **D + Click**: Delete person
+                - **Q + Click**: Cut off limb
+                - **X/C + Drag**: 3D rotation
+                - **R + Click**: Repair
+                #### LLM Features
+                - Generate complex poses from natural language
+                - Refine existing poses with specific instructions
+                - Anatomically accurate keypoint generation
+                """)
+        with gr.Column(scale=2):
+            # Editor canvas plus its inline script.
+            html = gr.HTML(html_text)
+            with gr.Row():
+                with gr.Column(scale=1, min_width=60):
+                    saveBtn = gr.Button(value="💾 Save")
+                with gr.Column(scale=7):
+                    generation_status = gr.Markdown("Ready to generate poses...")
+    # Event handlers
+    # Slider changes are handled purely in the browser (fn=None).
+    width.change(fn=None, inputs=[width], _js="(w) => { resizeCanvas(w,null); }")
+    height.change(fn=None, inputs=[height], _js="(h) => { resizeCanvas(null,h); }")
+    source.change(
+        fn=image_changed,
+        inputs=[source],
+        outputs=[estimationResult, json]
+    )
+    def apply_source_size(image):
+        """Return the source image's (width, height) for the two size sliders."""
+        if image is None:
+            # No image loaded yet: leave both sliders unchanged instead of
+            # failing on a missing attribute.
+            return gr.update(), gr.update()
+        return image.width, image.height
+    applySizeBtn.click(
+        fn=apply_source_size,
+        inputs=[source],
+        outputs=[width, height]
+    )
+    replaceBtn.click(
+        fn=None,
+        inputs=[json],
+        outputs=[],
+        _js="(json) => { initializeEditor(); importPose(json); return []; }"
+    )
+    importBtn.click(
+        fn=None,
+        inputs=[json],
+        outputs=[],
+        _js="(json) => { importPose(json); return []; }"
+    )
+    # LLM generation events
+    async def handle_generate(prompt, use_llm):
+        """Stream (pose JSON, status text) updates while a pose is generated.
+        Yields a progress message first, then either the generated pose with a
+        success message or None with an error message.
+        Args:
+            prompt: Pose description typed by the user.
+            use_llm: Whether the LLM should be tried before the templates.
+        """
+        if not prompt:
+            # This is an async generator: "return <value>" is a SyntaxError
+            # here, so the warning is yielded and the generator then stops.
+            yield None, "⚠️ Please enter a pose description"
+            return
+        try:
+            status = "🔄 Generating pose with AI..." if use_llm else "🔄 Using template..."
+            yield None, status
+            pose_json = await generate_pose_from_text(prompt, use_llm)
+            yield pose_json, "✅ Pose generated successfully!"
+        except Exception as e:
+            yield None, f"❌ Error: {str(e)}"
+    # After the handler finishes, load the new pose into a freshly reset editor.
+    generate_btn.click(
+        fn=handle_generate,
+        inputs=[prompt_input, use_llm_checkbox],
+        outputs=[json, generation_status]
+    ).then(
+        fn=None,
+        inputs=[json],
+        outputs=[],
+        _js="(json) => { if(json) { initializeEditor(); importPose(json); } return []; }"
+    )
+    def toggle_refinement():
+        """Make the refinement instructions box visible."""
+        reveal_update = gr.update(visible=True)
+        return reveal_update
+    refine_btn.click(fn=toggle_refinement, outputs=[refinement_prompt])
+    async def handle_refine(current_json, refinement):
+        """Refine the current pose with the LLM and report the outcome.
+        Args:
+            current_json: Pose currently held by the JSON panel.
+            refinement: Adjustment instructions typed by the user.
+        Returns:
+            A (pose, status text) pair for the JSON panel and the status line.
+        """
+        if not current_json or not refinement:
+            return None, "⚠️ Need current pose and refinement instructions"
+        try:
+            # refine_pose_with_llm performs a blocking HTTP request; run it on a
+            # worker thread so this coroutine does not stall the event loop.
+            loop = asyncio.get_running_loop()
+            refined = await loop.run_in_executor(None, refine_pose_with_llm, current_json, refinement)
+        except Exception as e:
+            return current_json, f"❌ Refinement error: {str(e)}"
+        if refined is current_json:
+            # The helper hands back the very same object when it could not
+            # refine, so do not claim success.
+            return current_json, "⚠️ Refinement failed - pose unchanged"
+        return refined, "✅ Pose refined!"
+    # NOTE(review): unlike the generate flow, the follow-up script does not call
+    # initializeEditor() before importPose() - confirm that is intended.
+    refinement_prompt.submit(
+        fn=handle_refine,
+        inputs=[json, refinement_prompt],
+        outputs=[json, generation_status]
+    ).then(
+        fn=None,
+        inputs=[json],
+        outputs=[],
+        _js="(json) => { if(json) { importPose(json); } return []; }"
+    )
+    # Save: the browser-side savePose() result becomes the JSON panel's value.
+    saveBtn.click(
+        fn=None,
+        inputs=[],
+        outputs=[json],
+        _js="() => { return [savePose()]; }"
+    )
+    # Mirror whatever is typed into the "Json source" box into the JSON panel.
+    jsonSource.change(
+        fn=lambda x: x,
+        inputs=[jsonSource],
+        outputs=[json]
+    )
+    # "Replace" resets the editor before importing; "Import" imports without resetting.
+    replaceWithJsonBtn.click(
+        fn=None,
+        inputs=[json],
+        outputs=[],
+        _js="(json) => { initializeEditor(); importPose(json); return []; }"
+    )
+    importJsonBtn.click(
+        fn=None,
+        inputs=[json],
+        outputs=[],
+        _js="(json) => { importPose(json); return []; }"
+    )
+    # On page load, initialise the editor and call importPose() with no argument.
+    demo.load(
+        fn=None,
+        inputs=[],
+        outputs=[],
+        _js="() => { initializeEditor(); importPose(); return []; }"
+    )
+    # Check API key status on load
+    def check_api_status():
+        """Return the status line telling whether the LLM API key is configured."""
+        key_configured = FIREWORKS_API_KEY != "YOUR_API_KEY_HERE"
+        if key_configured:
+            return "✅ LLM ready"
+        return "⚠️ LLM API key not configured - using templates"
+    demo.load(fn=check_api_status, outputs=[llm_status])
+# Attach the Gradio UI to the FastAPI app at the root path.
+gr.mount_gradio_app(app, demo, path="/")