hasanbasbunar committed on
Commit
2f5cada
·
verified ·
1 Parent(s): 4083450

Update app.py

Browse files
Files changed (1) hide show
  1. app.py +21 -9
app.py CHANGED
@@ -138,7 +138,7 @@ def generate_studio(prompt, model_ui, ratio, resolution, grounding, user_api_key
138
  except Exception as e:
139
  raise gr.Error(f"API Error: {str(e)}")
140
 
141
- def generate_composition(prompt, files, model_ui, ratio, resolution, user_api_key):
142
  """Composition I2I (Supporte jusqu'à 14 images selon la doc)"""
143
  cli = get_client(user_api_key)
144
  model_name = MODELS[model_ui]
@@ -158,6 +158,9 @@ def generate_composition(prompt, files, model_ui, ratio, resolution, user_api_ke
158
  img_conf["image_size"] = resolution
159
  # <--- AJOUT : Activation du Thinking Mode aussi ici par sécurité
160
  gen_conf["thinking_config"] = types.ThinkingConfig(include_thoughts=True)
 
 
 
161
 
162
  gen_conf["image_config"] = types.ImageConfig(**img_conf)
163
 
@@ -182,7 +185,7 @@ def generate_composition(prompt, files, model_ui, ratio, resolution, user_api_ke
182
 
183
  # --- CHAT LOGIC ---
184
 
185
- def chat_respond(message, history, chat_history_data, img_input, model_ui, grounding, user_api_key):
186
  """Gestion du chat 'Stateless' conforme aux types Google GenAI"""
187
 
188
  if not user_api_key: raise gr.Error("API Key manquante")
@@ -193,7 +196,11 @@ def chat_respond(message, history, chat_history_data, img_input, model_ui, groun
193
  tools = None
194
  thinking_conf = None # <--- AJOUT variable
195
 
 
 
 
196
  if "gemini-3" in model_name:
 
197
  # <--- AJOUT : Config Thinking
198
  thinking_conf = types.ThinkingConfig(include_thoughts=True)
199
  if grounding:
@@ -205,7 +212,8 @@ def chat_respond(message, history, chat_history_data, img_input, model_ui, groun
205
  config=types.GenerateContentConfig(
206
  response_modalities=['TEXT', 'IMAGE'],
207
  tools=tools,
208
- thinking_config=thinking_conf # <--- AJOUT
 
209
  ),
210
  history=chat_history_data
211
  )
@@ -269,12 +277,12 @@ def chat_respond(message, history, chat_history_data, img_input, model_ui, groun
269
 
270
  new_ui_history = history + [user_message_obj] + bot_messages
271
 
272
- return "", new_ui_history, new_gemini_history, f_imgs
273
 
274
  except Exception as e:
275
  err_msg = f"❌ Error: {str(e)}"
276
  bot_err_obj = {"role": "assistant", "content": err_msg}
277
- return "", history + [user_message_obj, bot_err_obj], chat_history_data, []
278
 
279
  def clear_chat():
280
  return [], None, []
@@ -328,7 +336,7 @@ with gr.Blocks(title="Nano Vision Studio") as demo:
328
  t1_text = gr.Markdown(label="Generated Text")
329
  with gr.Accordion("🧠 Thought Process", open=False):
330
  t1_thought_imgs = gr.Gallery(label="Visual Drafts", columns=4, height=150)
331
- # t1_thought_txt = gr.Textbox(label="Thought Stream", interactive=False, lines=4)
332
  t1_thought_txt = gr.Markdown(label="Thought Stream")
333
 
334
  t1_btn.click(
@@ -348,6 +356,7 @@ with gr.Blocks(title="Nano Vision Studio") as demo:
348
  with gr.Row():
349
  t2_ratio = gr.Dropdown(RATIOS, value="1:1", label="Aspect Ratio")
350
  t2_res = gr.Dropdown(RESOLUTIONS, value="1K", label="Output Resolution")
 
351
  t2_btn = gr.Button("Run", variant="primary")
352
 
353
  with gr.Column(scale=2):
@@ -356,7 +365,7 @@ with gr.Blocks(title="Nano Vision Studio") as demo:
356
 
357
  t2_btn.click(
358
  generate_composition,
359
- inputs=[t2_prompt, t2_files, t2_model, t2_ratio, t2_res, user_api_key_state],
360
  outputs=[t2_gallery, t2_text]
361
  )
362
 
@@ -374,6 +383,9 @@ with gr.Blocks(title="Nano Vision Studio") as demo:
374
  clear_btn = gr.Button("🗑️ New Session")
375
  with gr.Accordion("Chat Options", open=False):
376
  c_model = gr.Dropdown(list(MODELS.keys()), value="🧠 Gemini 3 Pro Preview (Recommended)", label="Model")
 
 
 
377
  c_grounding = gr.Checkbox(label="Grounding")
378
 
379
  with gr.Column(scale=1):
@@ -381,8 +393,8 @@ with gr.Blocks(title="Nano Vision Studio") as demo:
381
 
382
  chat_btn.click(
383
  chat_respond,
384
- inputs=[chat_input, chat_history, chat_state, chat_img, c_model, c_grounding, user_api_key_state],
385
- outputs=[chat_input, chat_history, chat_state, chat_gallery_zoom]
386
  )
387
  clear_btn.click(
388
  clear_chat,
 
138
  except Exception as e:
139
  raise gr.Error(f"API Error: {str(e)}")
140
 
141
+ def generate_composition(prompt, files, model_ui, ratio, resolution, grounding, user_api_key):
142
  """Composition I2I (Supporte jusqu'à 14 images selon la doc)"""
143
  cli = get_client(user_api_key)
144
  model_name = MODELS[model_ui]
 
158
  img_conf["image_size"] = resolution
159
  # <--- AJOUT : Activation du Thinking Mode aussi ici par sécurité
160
  gen_conf["thinking_config"] = types.ThinkingConfig(include_thoughts=True)
161
+ # <--- AJOUT : Grounding
162
+ if grounding:
163
+ gen_conf["tools"] = [{"google_search": {}}]
164
 
165
  gen_conf["image_config"] = types.ImageConfig(**img_conf)
166
 
 
185
 
186
  # --- CHAT LOGIC ---
187
 
188
+ def chat_respond(message, history, chat_history_data, img_input, model_ui, grounding, ratio, resolution, user_api_key):
189
  """Gestion du chat 'Stateless' conforme aux types Google GenAI"""
190
 
191
  if not user_api_key: raise gr.Error("API Key manquante")
 
196
  tools = None
197
  thinking_conf = None # <--- AJOUT variable
198
 
199
+ # Configuration Image
200
+ img_conf = {"aspect_ratio": ratio}
201
+
202
  if "gemini-3" in model_name:
203
+ img_conf["image_size"] = resolution
204
  # <--- AJOUT : Config Thinking
205
  thinking_conf = types.ThinkingConfig(include_thoughts=True)
206
  if grounding:
 
212
  config=types.GenerateContentConfig(
213
  response_modalities=['TEXT', 'IMAGE'],
214
  tools=tools,
215
+ thinking_config=thinking_conf,
216
+ image_config=types.ImageConfig(**img_conf) # <--- AJOUT Image Config dans Chat
217
  ),
218
  history=chat_history_data
219
  )
 
277
 
278
  new_ui_history = history + [user_message_obj] + bot_messages
279
 
280
+ return "", None, new_ui_history, new_gemini_history, f_imgs
281
 
282
  except Exception as e:
283
  err_msg = f"❌ Error: {str(e)}"
284
  bot_err_obj = {"role": "assistant", "content": err_msg}
285
+ return "", None, history + [user_message_obj, bot_err_obj], chat_history_data, []
286
 
287
  def clear_chat():
288
  return [], None, []
 
336
  t1_text = gr.Markdown(label="Generated Text")
337
  with gr.Accordion("🧠 Thought Process", open=False):
338
  t1_thought_imgs = gr.Gallery(label="Visual Drafts", columns=4, height=150)
339
+ # Utilisation de Markdown pour un meilleur rendu du flux de pensée
340
  t1_thought_txt = gr.Markdown(label="Thought Stream")
341
 
342
  t1_btn.click(
 
356
  with gr.Row():
357
  t2_ratio = gr.Dropdown(RATIOS, value="1:1", label="Aspect Ratio")
358
  t2_res = gr.Dropdown(RESOLUTIONS, value="1K", label="Output Resolution")
359
+ t2_grounding = gr.Checkbox(label="Google Search (Grounding)") # <--- AJOUT Grounding
360
  t2_btn = gr.Button("Run", variant="primary")
361
 
362
  with gr.Column(scale=2):
 
365
 
366
  t2_btn.click(
367
  generate_composition,
368
+ inputs=[t2_prompt, t2_files, t2_model, t2_ratio, t2_res, t2_grounding, user_api_key_state],
369
  outputs=[t2_gallery, t2_text]
370
  )
371
 
 
383
  clear_btn = gr.Button("🗑️ New Session")
384
  with gr.Accordion("Chat Options", open=False):
385
  c_model = gr.Dropdown(list(MODELS.keys()), value="🧠 Gemini 3 Pro Preview (Recommended)", label="Model")
386
+ with gr.Row():
387
+ c_ratio = gr.Dropdown(RATIOS, value="16:9", label="Aspect Ratio") # <--- AJOUT Ratio
388
+ c_res = gr.Dropdown(RESOLUTIONS, value="2K", label="Resolution (Pro only)") # <--- AJOUT Resolution
389
  c_grounding = gr.Checkbox(label="Grounding")
390
 
391
  with gr.Column(scale=1):
 
393
 
394
  chat_btn.click(
395
  chat_respond,
396
+ inputs=[chat_input, chat_history, chat_state, chat_img, c_model, c_grounding, c_ratio, c_res, user_api_key_state],
397
+ outputs=[chat_input, chat_img, chat_history, chat_state, chat_gallery_zoom]
398
  )
399
  clear_btn.click(
400
  clear_chat,