Spaces:

stepfun-ai
/

Step3-VL-10B

Running

App Files Files Community

Kangheng committed on Jan 19

Commit

0cd9e2d

verified ·

1 Parent(s): bbbfa1c

update app

Browse files

Files changed (1) hide show

app.py +6 -19

app.py CHANGED Viewed

@@ -239,14 +239,9 @@ def _extract_text_content(content) -> Optional[str]:
     return None
-def format_messages(system, history, user_text, image: Optional[Image.Image] = None):
     """Format message list for Step3-VL-10B."""
     messages: List[dict] = []
-    if system:
-        messages.append({
-            "role": "system",
-            "content": [{"type": "text", "text": system}]
-        })
     if not history:
         history = []
@@ -311,7 +306,7 @@ def build_user_display(image_url: Optional[str], user_text: Optional[str]) -> st
 @spaces.GPU
-def chat(system_prompt, user_text, image_file, history, max_tokens, temperature, top_p, show_thinking=True, model_name=None):
     """Chat function for Step3-VL-10B."""
     if model_name is None:
         model_name = MODEL_NAME
@@ -334,7 +329,7 @@ def chat(system_prompt, user_text, image_file, history, max_tokens, temperature,
     image = load_image(image_file)
     image_url = image_to_data_url(image) if image is not None else None
-    messages = format_messages(system_prompt, history, user_text, image)
     if not messages:
         yield history or [], "", None
         return
@@ -661,14 +656,6 @@ with gr.Blocks(title="Step3-VL-10B", css=custom_css, theme=gr.themes.Soft()) as
         with gr.Column(scale=1, min_width=350):
             # Configuration
             with gr.Accordion("⚙️ Configuration", open=False):
-                system_prompt = gr.Textbox(
-                    label="System Prompt",
-                    lines=2,
-                    value="You are a multimodal assistant with strong visual perception and reasoning.",
-                    placeholder="Enter system prompt...",
-                    elem_classes=["input-box"]
-                )
                 max_tokens = gr.Slider(
                     1, 56000,
                     value=16384,
@@ -677,13 +664,13 @@ with gr.Blocks(title="Step3-VL-10B", css=custom_css, theme=gr.themes.Soft()) as
                 )
                 temperature = gr.Slider(
                     0.0, 2.0,
-                    value=0.7,
                     label="Temperature",
                     info="Higher = more random"
                 )
                 top_p = gr.Slider(
                     0.0, 1.0,
-                    value=0.9,
                     label="Top P",
                     info="Nucleus sampling"
                 )
@@ -749,7 +736,7 @@ with gr.Blocks(title="Step3-VL-10B", css=custom_css, theme=gr.themes.Soft()) as
     submit_btn.click(
         fn=chat,
-        inputs=[system_prompt, user_text, image_file, chatbot, max_tokens, temperature, top_p, show_thinking],
         outputs=[chatbot, user_text, image_file]
     )

     return None
+def format_messages(history, user_text, image: Optional[Image.Image] = None):
     """Format message list for Step3-VL-10B."""
     messages: List[dict] = []
     if not history:
         history = []
 @spaces.GPU
+def chat(user_text, image_file, history, max_tokens, temperature, top_p, show_thinking=True, model_name=None):
     """Chat function for Step3-VL-10B."""
     if model_name is None:
         model_name = MODEL_NAME
     image = load_image(image_file)
     image_url = image_to_data_url(image) if image is not None else None
+    messages = format_messages(history, user_text, image)
     if not messages:
         yield history or [], "", None
         return
         with gr.Column(scale=1, min_width=350):
             # Configuration
             with gr.Accordion("⚙️ Configuration", open=False):
                 max_tokens = gr.Slider(
                     1, 56000,
                     value=16384,
                 )
                 temperature = gr.Slider(
                     0.0, 2.0,
+                    value=1.0,
                     label="Temperature",
                     info="Higher = more random"
                 )
                 top_p = gr.Slider(
                     0.0, 1.0,
+                    value=1.0,
                     label="Top P",
                     info="Nucleus sampling"
                 )
     submit_btn.click(
         fn=chat,
+        inputs=[user_text, image_file, chatbot, max_tokens, temperature, top_p, show_thinking],
         outputs=[chatbot, user_text, image_file]
     )