import gradio as gr from shared.utils.plugins import WAN2GPPlugin import json from shared.deepy.engine import get_or_create_assistant_session from shared.gradio import assistant_chat from shared.deepy.config import ( DEEPY_CONTEXT_TOKENS_DEFAULT, DEEPY_CONTEXT_TOKENS_KEY, DEEPY_CUSTOM_SYSTEM_PROMPT_KEY, DEEPY_ENABLED_KEY, DEEPY_VRAM_MODE_KEY, DEEPY_VRAM_MODE_ALWAYS_LOADED, DEEPY_VRAM_MODE_UNLOAD, DEEPY_VRAM_MODE_UNLOAD_ON_REQUEST, deepy_available, format_deepy_context_tokens_label, deepy_requirement_message, normalize_deepy_context_tokens, normalize_deepy_custom_system_prompt, normalize_deepy_enabled, normalize_deepy_vram_mode, set_deepy_runtime_config, ) class ConfigTabPlugin(WAN2GPPlugin): def __init__(self): super().__init__() self.name = "Configuration Tab" self.version = "1.1.0" self.description = "Lets you adjust all your performance and UI options for WAN2GP" def setup_ui(self): self.request_global("args") self.request_global("server_config") self.request_global("server_config_filename") self.request_global("attention_mode") self.request_global("compile") self.request_global("default_profile_video") self.request_global("default_profile_image") self.request_global("default_profile_audio") self.request_global("vae_config") self.request_global("boost") self.request_global("enable_int8_kernels") self.request_global("preload_model_policy") self.request_global("transformer_quantization") self.request_global("transformer_dtype_policy") self.request_global("transformer_types") self.request_global("text_encoder_quantization") self.request_global("attention_modes_installed") self.request_global("attention_modes_supported") self.request_global("displayed_model_types") self.request_global("memory_profile_choices") self.request_global("attention_modes_choices") self.request_global("save_path") self.request_global("image_save_path") self.request_global("audio_save_path") self.request_global("quit_application") self.request_global("release_model") self.request_global("get_sorted_dropdown") self.request_global("app") self.request_global("fl") self.request_global("is_generation_in_progress") self.request_global("generate_header") self.request_global("generate_dropdown_model_list") self.request_global("get_unique_id") self.request_global("reset_prompt_enhancer") self.request_global("reset_prompt_enhancer_if_requested") self.request_global("release_deepy_vram") self.request_global("any_GPU_process_running") self.request_global("apply_int8_kernel_setting") self.request_component("model_description") self.request_component("header") self.request_component("model_family") self.request_component("model_base_type_choice") self.request_component("model_choice") self.request_component("refresh_form_trigger") self.request_component("state") self.request_component("resolution") self.request_component("assistant_launcher_host") self.request_component("assistant_panel") self.add_tab( tab_id="configuration", label="Configuration", component_constructor=self.create_config_ui, ) def create_config_ui(self): set_deepy_runtime_config(self.server_config, self.server_config_filename) with gr.Column(): with gr.Tabs(): with gr.Tab("General"): _, _, dropdown_choices = self.get_sorted_dropdown(self.displayed_model_types, None, None, False) self.transformer_types_choices = gr.Dropdown( choices=dropdown_choices, value=self.transformer_types, label="Selectable Generative Models (leave empty for all)", multiselect=True ) self.model_hierarchy_type_choice = gr.Dropdown( choices=[ ("Two Levels: Model Family > Models & Finetunes", 0), ("Three Levels: Model Family > Models > Finetunes", 1), ], value=self.server_config.get("model_hierarchy_type", 1), label="Models Hierarchy In User Interface", interactive=not self.args.lock_config ) self.fit_canvas_choice = gr.Dropdown( choices=[ ("Dimensions are Pixel Budget (preserves aspect ratio, may exceed dimensions)", 0), ("Dimensions are Max Width/Height (preserves aspect ratio, fits within box)", 1), ("Dimensions are Exact Output (crops input to fit exact dimensions)", 2), ], value=self.server_config.get("fit_canvas", 0), label="Input Image/Video Sizing Behavior", interactive=not self.args.lock_config ) self.attention_choice = gr.Dropdown( choices=self.attention_modes_choices, value=self.attention_mode, label="Attention Type", interactive=not self.args.lock_config ) self.preload_model_policy_choice = gr.CheckboxGroup( [("Preload Model on App Launch","P"), ("Preload Model on Switch", "S"), ("Unload Model when Queue is Done", "U")], value=self.preload_model_policy, label="Model Loading/Unloading Policy" ) self.clear_file_list_choice = gr.Dropdown( choices=[("None", 0), ("Keep last video", 1), ("Keep last 5 videos", 5), ("Keep last 10", 10), ("Keep last 20", 20), ("Keep last 30", 30)], value=self.server_config.get("clear_file_list", 5), label="Keep Previous Generations in Gallery" ) self.display_stats_choice = gr.Dropdown( choices=[("Disabled", 0), ("Enabled", 1)], value=self.server_config.get("display_stats", 0), label="Display real-time RAM/VRAM stats (requires restart)" ) self.max_frames_multiplier_choice = gr.Dropdown( choices=[("Default", 1), ("x2", 2), ("x3", 3), ("x4", 4), ("x5", 5), ("x6", 6), ("x7", 7)], value=self.server_config.get("max_frames_multiplier", 1), label="Max Frames / Duration Multiplier (requires restart)" ) self.enable_4k_resolutions_choice = gr.Dropdown( choices=[("Off", 0), ("On", 1)], value=self.server_config.get("enable_4k_resolutions", 0), label="3K/4K Resolutions" ) default_paths = self.fl.default_checkpoints_paths checkpoints_paths_text = "\n".join(self.server_config.get("checkpoints_paths", default_paths)) self.checkpoints_paths_choice = gr.Textbox( label="Model Checkpoint Folders (One Path per Line. First is Default Download Path)", value=checkpoints_paths_text, lines=3, interactive=not self.args.lock_config ) self.loras_root_choice = gr.Textbox( label="Loras Root Folder", value=self.server_config.get("loras_root", "loras"), interactive=not self.args.lock_config ) self.save_queue_if_crash_choice = gr.Dropdown( choices=[("Disabled", 0), ("Overwrite Last Error Queue", 1), ("Create a New Error Queue File", 2)], value=self.server_config.get("save_queue_if_crash", 1), label="Save Queue if Crash during Generation", interactive=not self.args.lock_config ) self.UI_theme_choice = gr.Dropdown( choices=[("Blue Sky (Default)", "default"), ("Classic Gradio", "gradio")], value=self.server_config.get("UI_theme", "default"), label="UI Theme (requires restart)" ) self.queue_color_scheme_choice = gr.Dropdown( choices=[ ("Pastel (Unique color for each item)", "pastel"), ("Alternating Grey Shades", "alternating_grey"), ], value=self.server_config.get("queue_color_scheme", "pastel"), label="Queue Color Scheme" ) with gr.Tab("Performance"): self.quantization_choice = gr.Dropdown(choices=[("Scaled Int8 (recommended)", "int8"), ("Scaled Fp8", "fp8"), ("16-bit (no quantization)", "bf16")], value=self.transformer_quantization, label="Transformer Model Quantization (if available otherwise get the closest available)") self.transformer_dtype_policy_choice = gr.Dropdown(choices=[("Auto (Best for Hardware)", ""), ("FP16", "fp16"), ("BF16", "bf16")], value=self.transformer_dtype_policy, label="Transformer Data Type (if available)") self.mixed_precision_choice = gr.Dropdown(choices=[("16-bit only (less VRAM)", "0"), ("Mixed 16/32-bit (better quality)", "1")], value=self.server_config.get("mixed_precision", "0"), label="Transformer Engine Precision") self.text_encoder_quantization_choice = gr.Dropdown(choices=[("16-bit (more RAM, better quality)", "bf16"), ("8-bit (less RAM, slightly lower quality)", "int8")], value=self.text_encoder_quantization, label="Text Encoder Quantization") self.lm_decoder_engine_choice = gr.Dropdown( choices=[ ("Auto", ""), ("PyTorch: slow, compatible", "legacy"), ("Cuda Graph: up to x6 faster, whole LM will be loaded in VRAM", "cg"), ("vllm: up to x10 faster, whole LM will be loaded in VRAM, requires Triton & Flash Attention 2", "vllm"), ], value=self.server_config.get("lm_decoder_engine", ""), label="Language Models Decoder Engine (when available for a model)", ) self.VAE_precision_choice = gr.Dropdown(choices=[("16-bit (faster, less VRAM)", "16"), ("32-bit (slower, better for sliding window)", "32")], value=self.server_config.get("vae_precision", "16"), label="VAE Encoding/Decoding Precision") self.compile_choice = gr.Dropdown(choices=[("On (up to 20% faster, requires Triton)", "transformer"), ("Off", "")], value=self.compile, label="Compile Transformer Model (slight speed again, but first generation is slower and potential compatibility issues with some GPUs/Models)", interactive=not self.args.lock_config) self.depth_anything_v2_variant_choice = gr.Dropdown(choices=[("Large (more precise, slower)", "vitl"), ("Big (less precise, faster)", "vitb")], value=self.server_config.get("depth_anything_v2_variant", "vitl"), label="Depth Anything v2 VACE Preprocessor") vae_config_value = self.vae_config if self.vae_config in [0, 1, 2, 3] else 0 self.vae_config_choice = gr.Dropdown( choices=[ ("Auto", 0), ("Spatial / Temporal Tiling Preset for 16GB+", 1), ("Spatial / Temporal Tiling Preset for 8GB+", 2), ("Spatial / Temporal Tiling Preset for 6GB+", 3), ], value=vae_config_value, label="VAE Tiling (higher presets use less VRAM and may increase artifacts like banding)", ) self.boost_choice = gr.Dropdown(choices=[("ON", 1), ("OFF", 2)], value=self.boost, label="Boost (~10% speedup for ~1GB VRAM)") self.enable_int8_kernels_choice = gr.Dropdown(choices=[("Disabled", 0), ("Enabled if Triton available", 1)], value=self.server_config.get("enable_int8_kernels", 1), label="Int8 Kernels (Experimental, 10% faster with INT8 quantized checkpoints, requires Triton)") self.video_profile_choice = gr.Dropdown( choices=self.memory_profile_choices, value=self.default_profile_video, label="Default Memory Profile (Video)", ) self.image_profile_choice = gr.Dropdown( choices=self.memory_profile_choices, value=self.default_profile_image, label="Default Memory Profile (Image)", ) self.audio_profile_choice = gr.Dropdown( choices=self.memory_profile_choices, value=self.default_profile_audio, label="Default Memory Profile (Audio)", ) self.preload_in_VRAM_choice = gr.Slider(0, 40000, value=self.server_config.get("preload_in_VRAM", 0), step=100, label="VRAM (MB) for Preloaded Models (0=profile default)") self.max_reserved_loras_choice = gr.Slider( -1, 10000, value=self.server_config.get("max_reserved_loras", -1), step=1, label="Max Amount of Loras (in MB) to be Pinned To Reserved Memory (set it to 0-500MB if Out of Memory when starting Gen, -1= No limit)" ) self.release_RAM_btn = gr.Button("Force Unload Models from RAM") with gr.Tab("Extensions"): mmaudio_mode_default = self.server_config.get("mmaudio_mode", None) mmaudio_persistence_default = self.server_config.get("mmaudio_persistence", None) if mmaudio_mode_default is None: legacy_mmaudio = self.server_config.get("mmaudio_enabled", 0) mmaudio_mode_default = 0 if legacy_mmaudio == 0 else 1 if mmaudio_persistence_default is None: legacy_mmaudio = self.server_config.get("mmaudio_enabled", 0) mmaudio_persistence_default = 2 if legacy_mmaudio == 2 else 1 self.mmaudio_mode_choice = gr.Dropdown( choices=[("Off", 0), ("Standard", 1), ("NSFW", 2)], value=mmaudio_mode_default, label="MMAudio Soundtrack Generation (requires 10GB extra download)" ) self.mmaudio_persistence_choice = gr.Dropdown( choices=[("Unload after use", 1), ("Persistent in RAM", 2)], value=mmaudio_persistence_default, label="MMAudio Model Persistence" ) self.rife_version_choice = gr.Dropdown( choices=[("RIFE HDv3 (default)", "v3"), ("RIFE v4.26 (latest)", "v4")], value=self.server_config.get("rife_version", "v4"), label="RIFE Temporal Upsampling Model", interactive=not self.args.lock_config ) self.matanyone_version_choice = gr.Dropdown( choices=[("MatAnyone v1 (original, default)", "v1"), ("MatAnyone v2", "v2")], value=self.server_config.get("matanyone_version", "v1"), label="MatAnyone Video Mask Model", interactive=not self.args.lock_config ) with gr.Tab("Prompt Enhancer / Deepy"): with gr.Group(): self.enhancer_enabled_choice = gr.Dropdown(choices=[("Off", 0), ("Florence 2 (image captioning) + LLama 3.2 3B (text generation)", 1), ("Florence 2 (image captioning) + Llama Joy 8B (uncensored, richer)", 2), ("Qwen3.5VL Abliterated 4B (captioning + uncensored text enhancement, vllm accelerated if available)", 3), ("Qwen3.5VL Abliterated 9B (captioning + uncensored high end text enhancement, vllm accelerated if available)", 4)], value=self.server_config.get("enhancer_enabled", 0), label="Prompt Enhancer (requires extra model files)") self.enhancer_quantization_choice = gr.Dropdown( choices=[("Quanto Int8 (better quality)", "quanto_int8"), ("GGUF Q4 (less VRAM/RAM & faster if kernels are installed, but worse quality)", "gguf")], value=self.server_config.get("prompt_enhancer_quantization", "quanto_int8"), label="Qwen3.5 LLM Quantization", ) self.enhancer_mode_choice = gr.Dropdown(choices=[("On-Demand Button Only", 1),("Automatic on Generation", 0)], value=self.server_config.get("enhancer_mode", 1), label="Prompt Enhancer Usage") with gr.Row(): self.prompt_enhancer_temperature_choice = gr.Slider( 0.1, 1.5, value=self.server_config.get("prompt_enhancer_temperature", 0.6), step=0.01, label="Prompt Enhancer Temperature (High = More Creativity)", interactive=not self.args.lock_config, ) self.prompt_enhancer_top_p_choice = gr.Slider( 0.1, 1.0, value=self.server_config.get("prompt_enhancer_top_p", 0.9), step=0.01, label="Prompt Enhancer Top-p (High = More Variety)", interactive=not self.args.lock_config, ) self.prompt_enhancer_randomize_seed_choice = gr.Checkbox( value=self.server_config.get("prompt_enhancer_randomize_seed", True), label="Randomize Prompt Enhancer Seed", interactive=not self.args.lock_config, ) self.deepy_enabled_choice = gr.Dropdown( choices=[("Off", 0), ("On", 1)], value=normalize_deepy_enabled(self.server_config.get(DEEPY_ENABLED_KEY, 0)), label="Enable Deepy", ) self.deepy_vram_mode_choice = gr.Dropdown( choices=[ ("Unload from VRAM as soon as possible", DEEPY_VRAM_MODE_UNLOAD), ("Unload from VRAM if VRAM requested by another WanGP component", DEEPY_VRAM_MODE_UNLOAD_ON_REQUEST), ("Always loaded in VRAM", DEEPY_VRAM_MODE_ALWAYS_LOADED), ], value=normalize_deepy_vram_mode(self.server_config.get(DEEPY_VRAM_MODE_KEY, DEEPY_VRAM_MODE_UNLOAD)), label="Deepy VRAM Loading Mode (the longer Deepy stays in VRAM, the faster Deeper is )", ) deepy_context_tokens_default = normalize_deepy_context_tokens(self.server_config.get(DEEPY_CONTEXT_TOKENS_KEY, DEEPY_CONTEXT_TOKENS_DEFAULT)) self.deepy_context_tokens_choice = gr.Slider( minimum=4096, maximum=256000, value=deepy_context_tokens_default, step=512, label=format_deepy_context_tokens_label(self.server_config.get("enhancer_enabled", 0), deepy_context_tokens_default), ) self.deepy_custom_system_prompt_choice = gr.Textbox( value=normalize_deepy_custom_system_prompt(self.server_config.get(DEEPY_CUSTOM_SYSTEM_PROMPT_KEY, "")), lines=6, label="Custom System Prompt", info="Added after the built-in Deepy system prompt on the next user interaction.", ) self.deepy_requirement_md = gr.Markdown(value=deepy_requirement_message(self.server_config)) with gr.Tab("Outputs"): self.video_output_codec_choice = gr.Dropdown(choices=[("x265 CRF 28 (Balanced)", 'libx265_28'), ("x264 Level 8 (Balanced)", 'libx264_8'), ("x265 CRF 8 (High Quality)", 'libx265_8'), ("x264 Level 10 (High Quality)", 'libx264_10'), ("x264 Lossless", 'libx264_lossless')], value=self.server_config.get("video_output_codec", "libx264_8"), label="Video Codec") self.image_output_codec_choice = gr.Dropdown(choices=[("JPEG Q85", 'jpeg_85'), ("WEBP Q85", 'webp_85'), ("JPEG Q95", 'jpeg_95'), ("WEBP Q95", 'webp_95'), ("WEBP Lossless", 'webp_lossless'), ("PNG Lossless", 'png')], value=self.server_config.get("image_output_codec", "jpeg_95"), label="Image Codec") self.audio_output_codec_choice = gr.Dropdown( choices=[ ("AAC 128 kbps", "aac_128"), ("AAC 192 kbps", "aac_192"), ("AAC 256 kbps (High Quality, Recommended)", "aac_256"), ("AAC 320 kbps (Very High Quality)", "aac_320"), ("ALAC Lossless (preview/playback compatibility may be limited)", "alac"), ], value=self.server_config.get("audio_output_codec", "aac_128"), visible=True, label="Audio Codec to use for mp4 container", ) audio_standalone_default = self.server_config.get("audio_stand_alone_output_codec", "wav") if audio_standalone_default == "mp3": audio_standalone_default = "mp3_192" self.audio_stand_alone_output_codec_choice = gr.Dropdown( choices=[ ("WAV (Lossless)", "wav"), ("MP3 128 kbps", "mp3_128"), ("MP3 192 kbps", "mp3_192"), ("MP3 320 kbps", "mp3_320"), ], value=audio_standalone_default, visible=True, label="Audio Codec to use for standalone audio files", ) self.metadata_choice = gr.Dropdown( choices=[("Export JSON files", "json"), ("Embed metadata in file (Exif/tag)", "metadata"), ("None", "none")], value=self.server_config.get("metadata_type", "metadata"), label="Metadata Handling" ) self.keep_intermediate_sliding_windows_choice = gr.Dropdown( choices=[("Yes", 1), ("No", 0)], value=self.server_config.get("keep_intermediate_sliding_windows", 1), label="Keep Intermediate Sliding Windows" ) self.embed_source_images_choice = gr.Checkbox( value=self.server_config.get("embed_source_images", False), label="Embed Source Images", info="Saves i2v source images inside MP4 files" ) self.video_save_path_choice = gr.Textbox(label="Video Output Folder (requires restart)", value=self.save_path) self.image_save_path_choice = gr.Textbox(label="Image Output Folder (requires restart)", value=self.image_save_path) self.audio_save_path_choice = gr.Textbox(label="Audio Output Folder (requires restart)", value=self.audio_save_path) with gr.Tab("Notifications"): self.notification_sound_enabled_choice = gr.Dropdown(choices=[("On", 1), ("Off", 0)], value=self.server_config.get("notification_sound_enabled", 0), label="Notification Sound") self.notification_sound_volume_choice = gr.Slider(0, 100, value=self.server_config.get("notification_sound_volume", 50), step=5, label="Notification Volume") self.msg = gr.Markdown() with gr.Row(): self.apply_btn = gr.Button("Save Settings") def update_deepy_requirement(enhancer_enabled_choice): runtime_config = dict(self.server_config) runtime_config["enhancer_enabled"] = enhancer_enabled_choice return deepy_requirement_message(runtime_config) self.enhancer_enabled_choice.input(fn=update_deepy_requirement, inputs=[self.enhancer_enabled_choice], outputs=[self.deepy_requirement_md], show_progress="hidden") def update_deepy_context_label(enhancer_enabled_choice, deepy_context_tokens_choice): return gr.update(label=format_deepy_context_tokens_label(enhancer_enabled_choice, deepy_context_tokens_choice)) self.enhancer_enabled_choice.input(fn=update_deepy_context_label, inputs=[self.enhancer_enabled_choice, self.deepy_context_tokens_choice], outputs=[self.deepy_context_tokens_choice], show_progress="hidden") self.deepy_context_tokens_choice.input(fn=update_deepy_context_label, inputs=[self.enhancer_enabled_choice, self.deepy_context_tokens_choice], outputs=[self.deepy_context_tokens_choice], show_progress="hidden") inputs = [ self.state, self.transformer_types_choices, self.model_hierarchy_type_choice, self.fit_canvas_choice, self.attention_choice, self.preload_model_policy_choice, self.clear_file_list_choice, self.keep_intermediate_sliding_windows_choice, self.display_stats_choice, self.max_frames_multiplier_choice, self.enable_4k_resolutions_choice, self.checkpoints_paths_choice, self.loras_root_choice, self.save_queue_if_crash_choice, self.UI_theme_choice, self.queue_color_scheme_choice, self.quantization_choice, self.transformer_dtype_policy_choice, self.mixed_precision_choice, self.text_encoder_quantization_choice, self.lm_decoder_engine_choice, self.VAE_precision_choice, self.compile_choice, self.depth_anything_v2_variant_choice, self.vae_config_choice, self.boost_choice, self.enable_int8_kernels_choice, self.video_profile_choice, self.image_profile_choice, self.audio_profile_choice, self.preload_in_VRAM_choice, self.max_reserved_loras_choice, self.enhancer_enabled_choice, self.enhancer_quantization_choice, self.enhancer_mode_choice, self.prompt_enhancer_temperature_choice, self.prompt_enhancer_top_p_choice, self.prompt_enhancer_randomize_seed_choice, self.mmaudio_mode_choice, self.mmaudio_persistence_choice, self.rife_version_choice, self.matanyone_version_choice, self.deepy_enabled_choice, self.deepy_vram_mode_choice, self.deepy_context_tokens_choice, self.deepy_custom_system_prompt_choice, self.video_output_codec_choice, self.image_output_codec_choice, self.audio_output_codec_choice, self.audio_stand_alone_output_codec_choice, self.metadata_choice, self.embed_source_images_choice, self.video_save_path_choice, self.image_save_path_choice, self.audio_save_path_choice, self.notification_sound_enabled_choice, self.notification_sound_volume_choice, self.resolution ] self.apply_btn.click( fn=self._save_changes, inputs=inputs, outputs=[ self.msg, self.model_description, self.header, self.model_family, self.model_base_type_choice, self.model_choice, self.refresh_form_trigger, self.assistant_launcher_host, self.assistant_panel ] ) def _unload_targets_text(): targets = ["Models"] try: enhancer_enabled = int(self.server_config.get("enhancer_enabled", 0) or 0) > 0 except Exception: enhancer_enabled = False if enhancer_enabled: targets.append("Prompt Enhancer") if deepy_available(self.server_config): targets.append("Deepy") if len(targets) == 1: return targets[0] return ", ".join(targets[:-1]) + f", and {targets[-1]}" if len(targets) > 2 else " and ".join(targets) def release_ram_and_notify(state): unload_targets = _unload_targets_text() if self.any_GPU_process_running(state, "configuration"): gr.Info(f"Unable to unload {unload_targets} while GPU resources are allocated.") return if deepy_available(self.server_config): self.release_deepy_vram(state, clear_session_state=False, discard_runtime_snapshot=True) if "Prompt Enhancer" in unload_targets: self.reset_prompt_enhancer() self.reset_prompt_enhancer_if_requested() self.release_model() gr.Info(f"{unload_targets} unloaded from RAM.") self.release_RAM_btn.click(fn=release_ram_and_notify, inputs=[self.state]) return [self.release_RAM_btn] def _save_changes(self, state, *args): gen_in_progress = self.is_generation_in_progress() # return "