Spaces:

shenyugan
/

111

Sleeping

App Files Community

shenyugan committed on Apr 22, 2025

Commit

bb5a9dc

verified ·

1 Parent(s): 9a172c5

Update app.py

Browse files

Files changed (1) hide show

app.py +22 -28

app.py CHANGED Viewed

@@ -246,24 +246,30 @@ with gr.Blocks(theme=gr.themes.Soft()) as app:
         * 语音输入优先于文本输入。如果同时提供了两者，将使用语音输入。
         * 模型加载和图像生成可能需要一些时间，尤其是在 CPU 或免费 Hugging Face Spaces 上。
         * 请确保已在 Space Secrets 中配置 OpenAI API Key (`OPENAI_API_KEY`)。
         """
-    )
     with gr.Row():
         with gr.Column(scale=1):
             # 输入控件
-            inp_short_prompt_text = gr.Textbox(label="输入简短描述 (例如：空中的魔法树屋)", info="如果使用语音输入，此项将被忽略")
-            inp_short_prompt_audio = gr.Audio(sources=["microphone"], type="filepath", label="或者，使用麦克风说出描述", info="优先于文本输入")
             # Gradio 控件使用要求 (至少三种)
             # 1. Textbox (上面已有)
             # 2. Audio (上面已有)
             # 3. Slider
-            inp_steps = gr.Slider(minimum=10, maximum=100, value=30, step=1, label="生成步数 (Steps)", info="步数越多细节可能越好，但耗时越长")
             # 4. Slider (另一个)
-            inp_scale = gr.Slider(minimum=1.0, maximum=20.0, value=7.5, step=0.5, label="引导系数 (Guidance Scale)", info="值越高，图像越贴合提示词，但可能降低创造性")
             # 5. Textbox (负面提示词)
-            inp_negative_prompt = gr.Textbox(label="负面提示词 (Negative Prompt)", value="ugly, blurry, low quality, deformed, text, words, signature", info="描述你不希望在图像中看到的内容")
             generate_button = gr.Button("✨ 生成图像", variant="primary")
@@ -277,42 +283,30 @@ with gr.Blocks(theme=gr.themes.Soft()) as app:
             out_image = gr.Image(label="生成的图像", type="pil", interactive=False) # 使用 PIL 格式
     # 将按钮点击连接到处理函数
-    # 使用 .then() 来链式调用，允许 UI 逐步更新
     generate_button.click(
         fn=process_input_and_generate,
         inputs=[inp_short_prompt_text, inp_short_prompt_audio, inp_negative_prompt, inp_steps, inp_scale],
         outputs=[out_final_short_prompt, out_detailed_prompt, out_image, status_output]
     )
-    # 添加一些示例
     gr.Examples(
         examples=[
             ["a magical treehouse in the sky", None, "blurry, low quality", 30, 7.5],
             ["photo of a cute cat wearing sunglasses", None, "cartoon, drawing, sketch", 35, 8.0],
             ["cyberpunk city street at night, raining", None, "daytime, bright sun", 40, 7.0],
         ],
         inputs=[inp_short_prompt_text, inp_short_prompt_audio, inp_negative_prompt, inp_steps, inp_scale],
-        outputs=[out_final_short_prompt, out_detailed_prompt, out_image, status_output], # Outputs should match the main function
-        fn=process_input_and_generate, # Use the main processing function
-        cache_examples=False, # Caching might be complex with generator functions
     )
 # --- 启动 Gradio 应用 ---
-if __name__ == "__main__":
-    # 如果没有配置 API Key，可能需要提示用户或退出
-    if not client:
-         print("\n错误：OpenAI API Key 未配置。请设置 OPENAI_API_KEY 环境变量或在代码中直接设置（不推荐）。")
-         print("程序将在 10 秒后退出...")
-         # time.sleep(10) # Optional delay
-         # exit() # Or let it run and show error in Gradio UI
-    # 检查模型是否加载成功
-    if not asr_pipeline:
-        print("\n警告：语音识别模型加载失败，语音输入功能将不可用。")
-    if not sd_pipeline:
-        print("\n警告：Stable Diffusion 模型加载失败，图像生成功能将不可用。")
-    # share=True 会创建一个公开链接（如果在本地运行）
-    # 在 Hugging Face Spaces 上运行时不需要 share=True
-    app.launch()

         * 语音输入优先于文本输入。如果同时提供了两者，将使用语音输入。
         * 模型加载和图像生成可能需要一些时间，尤其是在 CPU 或免费 Hugging Face Spaces 上。
         * 请确保已在 Space Secrets 中配置 OpenAI API Key (`OPENAI_API_KEY`)。
+        * **提示**: 语音输入优先于文本；生成步数影响细节和时间；引导系数控制与提示词的符合度；负面提示词排除不想要的内容。
         """
+    ) # Added essential info to the main markdown
     with gr.Row():
         with gr.Column(scale=1):
             # 输入控件
+            # REMOVED info argument
+            inp_short_prompt_text = gr.Textbox(label="输入简短描述 (例如：空中的魔法树屋)")
+            # REMOVED info argument
+            inp_short_prompt_audio = gr.Audio(sources=["microphone"], type="filepath", label="或者，使用麦克风说出描述")
             # Gradio 控件使用要求 (至少三种)
             # 1. Textbox (上面已有)
             # 2. Audio (上面已有)
             # 3. Slider
+            # REMOVED info argument
+            inp_steps = gr.Slider(minimum=10, maximum=100, value=30, step=1, label="生成步数 (Steps)")
             # 4. Slider (另一个)
+            # REMOVED info argument
+            inp_scale = gr.Slider(minimum=1.0, maximum=20.0, value=7.5, step=0.5, label="引导系数 (Guidance Scale)")
             # 5. Textbox (负面提示词)
+            # REMOVED info argument
+            inp_negative_prompt = gr.Textbox(label="负面提示词 (Negative Prompt)", value="ugly, blurry, low quality, deformed, text, words, signature")
             generate_button = gr.Button("✨ 生成图像", variant="primary")
             out_image = gr.Image(label="生成的图像", type="pil", interactive=False) # 使用 PIL 格式
     # 将按钮点击连接到处理函数
     generate_button.click(
         fn=process_input_and_generate,
         inputs=[inp_short_prompt_text, inp_short_prompt_audio, inp_negative_prompt, inp_steps, inp_scale],
         outputs=[out_final_short_prompt, out_detailed_prompt, out_image, status_output]
     )
+    # 添加一些示例 (确保 inputs/outputs 匹配修改后的组件)
     gr.Examples(
         examples=[
             ["a magical treehouse in the sky", None, "blurry, low quality", 30, 7.5],
             ["photo of a cute cat wearing sunglasses", None, "cartoon, drawing, sketch", 35, 8.0],
             ["cyberpunk city street at night, raining", None, "daytime, bright sun", 40, 7.0],
         ],
+        # Ensure the order of inputs here matches the inputs list in the .click() call
         inputs=[inp_short_prompt_text, inp_short_prompt_audio, inp_negative_prompt, inp_steps, inp_scale],
+        # Ensure the order of outputs here matches the outputs list in the .click() call
+        outputs=[out_final_short_prompt, out_detailed_prompt, out_image, status_output],
+        fn=process_input_and_generate,
+        cache_examples=False,
     )
 # --- 启动 Gradio 应用 ---
+# (Placeholder: the rest of the file should remain the same -- keep the original launch block below instead of these comments)
+# if __name__ == "__main__":
+#    ... rest of the code ...
+#    app.launch()