wubby

Running

App Files Files

lainlives commited on Dec 10, 2025

Commit

88d335a

verified ·

1 Parent(s): 8fabd14

Update app.py

Browse files

Files changed (1) hide show

app.py +1008 -64

app.py CHANGED Viewed

@@ -28,7 +28,6 @@ from ultimate_rvc.core.manage.models import (
     get_voice_model_names,
 )
 from ultimate_rvc.web.common import initialize_dropdowns
-from ultimate_rvc.web.config.main import TotalConfig
 from ultimate_rvc.web.tabs.generate.song_cover.multi_step_generation import (
     render as render_song_cover_multi_step_tab,
 )
@@ -46,12 +45,284 @@ from ultimate_rvc.web.tabs.manage.models import render as render_models_tab
 from ultimate_rvc.web.tabs.manage.settings import render as render_settings_tab
 import sys
-from ultimate_rvc.web.main import start_app
 from huggingface_hub import snapshot_download
-from ultimate_rvc.core.manage.config import load_config
-from ultimate_rvc.web.config.main import SettingsManagementConfig, TotalConfig
 from enum import StrEnum
 embedders_list = [
     ("embedders/contentvec/", ["pytorch_model.bin", "config.json"]),
     ("embedders/custom/Crusty/", ["model.safetensors", "config.json"]),
@@ -114,48 +385,8 @@ class SeparationModel2(StrEnum):
     UVR_DeEcho_DeReverb = "UVR-DeEcho-DeReverb.pth"
-class ModelController:
-    """Manages the active model and provides a consistent interface."""
-    def __init__(self, initial_model):
-        self._model = initial_model
-        self._lock = threading.RLock() # Use a lock for thread safety
-    def get_model(self):
-        """Atomically get the current model instance."""
-        with self._lock:
-            # Return a copy if the model is mutable, to prevent modification issues
-            return copy.copy(self._model)
-    def set_model(self, new_model):
-        """Atomically set a new model instance."""
-        with self._lock:
-            self._model = new_model
-            print(f"--- Model updated to {new_model.__class__.__name__} ---")
-def periodic_updater(controller, interval_seconds, new_model_class, stop_event):
-    """
-    A function to run in a separate thread that periodically updates the model.
-    """
-    while not stop_event.is_set():
-        time.sleep(interval_seconds)
-        if not stop_event.is_set():
-            # Create a new instance of the desired class and set it
-            new_model = new_model_class()
-            controller.set_model(new_model)
-controller = ModelController(SeparationModel)
-stop_event = threading.Event()
-# Start the updater thread
-update_thread = threading.Thread(
-    target=periodic_updater,
-    args=(controller, 5, SeparationModel2, stop_event), # Update every 5 seconds to Model2
-    daemon=True # Daemon threads exit when the main program exits
-)
-update_thread.start()
-load_config("default", TotalConfig)
 now_dir = os.getcwd()
@@ -177,11 +408,723 @@ snapshot_download(repo_id=repo_id, local_dir=dump_path, token=hf_token)
-config_name = os.environ.get("URVC_CONFIG")
 cookiefile = os.environ.get("YT_COOKIEFILE")
 total_config = load_config(config_name, TotalConfig) if config_name else TotalConfig()
 def render_app() -> gr.Blocks:
     """
     Render the Ultimate RVC web application.
@@ -204,12 +1147,11 @@ def render_app() -> gr.Blocks:
     cache_delete_cutoff = 86400  # and delete files older than 24 hours
     with gr.Blocks(
-        title="Ultimate RVC",
         theme=gr.Theme.load(str(Path(__file__).parent / "config/theme.json")),
         css=css,
         delete_cache=(cache_delete_frequency, cache_delete_cutoff),
     ) as app:
-        gr.HTML("<h1>Ultimate RVC 💙</h1>")
         for component_config in [
             total_config.song.one_click.voice_model,
             total_config.song.one_click.cached_song,
@@ -247,19 +1189,20 @@ def render_app() -> gr.Blocks:
         ]:
             component_config.instantiate()
         # main tab
-        with gr.Tab("Generate", elem_id="generate-tab"):
-            with gr.Tab("Song covers"):
-                render_song_cover_one_click_tab(total_config, cookiefile)
-                render_song_cover_multi_step_tab(total_config, cookiefile)
-            with gr.Tab("Speech"):
-                render_speech_one_click_tab(total_config)
-                render_speech_multi_step_tab(total_config)
-        with gr.Tab("Models", elem_id="manage-tab"):
-            render_models_tab(total_config)
-        with gr.Tab("Audio", elem_id="audio-tab"):
-            render_audio_tab(total_config)
-        with gr.Tab("Settings", elem_id="settings-tab"):
-            render_settings_tab(total_config)
         app.load(
             _init_dropdowns,
@@ -392,7 +1335,7 @@ def start_app(
             "-h",
             help="The hostname that the server will use.",
         ),
-    ] = None,
     listen_port: Annotated[
         int | None,
         typer.Option(
@@ -412,14 +1355,15 @@ def start_app(
     """Run the Ultimate RVC web application."""
     os.environ["GRADIO_TEMP_DIR"] = str(TEMP_DIR)
     gr.set_static_paths([MODELS_DIR, AUDIO_DIR])
-    app.queue()
     app.launch(
-        share=share,
-        server_name=(None if not listen else (listen_host or "0.0.0.0")),  # noqa: S104
         server_port=listen_port,
         ssr_mode=ssr_mode,
     )
 if __name__ == "__main__":
     app_wrapper()

     get_voice_model_names,
 )
 from ultimate_rvc.web.common import initialize_dropdowns
 from ultimate_rvc.web.tabs.generate.song_cover.multi_step_generation import (
     render as render_song_cover_multi_step_tab,
 )
 from ultimate_rvc.web.tabs.manage.settings import render as render_settings_tab
 import sys
 from huggingface_hub import snapshot_download
 from enum import StrEnum
+from typing import TYPE_CHECKING, Any
+from functools import cached_property
+from pydantic import BaseModel
+from ultimate_rvc.web.config.component import (
+    AnyComponentConfig,
+    AudioConfig,
+    CheckboxConfig,
+    ComponentConfig,
+    DropdownConfig,
+    RadioConfig,
+    SliderConfig,
+)
+from ultimate_rvc.web.config.tab import (
+    SongGenerationConfig,
+    SpeechGenerationConfig,
+    TrainingConfig,
+)
+from typing import Any, TypedDict
+from collections.abc import Callable, Sequence
+from enum import StrEnum, auto
+if TYPE_CHECKING:
+    import gradio as gr
+type StrPath = str | PathLike[str]
+type Json = Mapping[str, Json] | Sequence[Json] | str | int | float | bool | None
+class SegmentSize(IntEnum):
+    """
+    Enumeration of segment sizes for audio separation.
+    Members are integer-valued and cover the powers of two from 64
+    up to 4096.
+    """
+    SEG_64 = 64
+    SEG_128 = 128
+    SEG_256 = 256
+    SEG_512 = 512
+    SEG_1024 = 1024
+    SEG_2048 = 2048
+    SEG_4096 = 4096
+class F0Method(StrEnum):
+    """
+    Enumeration of pitch extraction methods.
+    Each member's value is the lowercase string identifier of the
+    method.
+    """
+    RMVPE = "rmvpe"
+    CREPE = "crepe"
+    CREPE_TINY = "crepe-tiny"
+    FCPE = "fcpe"
+class RVCContentType(StrEnum):
+    """
+    Enumeration of valid content to convert with RVC.
+    Each member's value is the lowercase form of its name.
+    """
+    VOCALS = "vocals"
+    VOICE = "voice"
+    SPEECH = "speech"
+    AUDIO = "audio"
+class SampleRate(IntEnum):
+    """
+    Enumeration of supported audio sample rates.
+    Members are integer-valued; each value equals the number in the
+    member name (presumably hertz, going by the HZ_ prefix).
+    """
+    HZ_16000 = 16000
+    HZ_44100 = 44100
+    HZ_48000 = 48000
+    HZ_96000 = 96000
+    HZ_192000 = 192000
+class AudioExt(StrEnum):
+    """
+    Enumeration of supported audio file formats.
+    Values are lowercase extensions without a leading dot.
+    """
+    MP3 = "mp3"
+    WAV = "wav"
+    FLAC = "flac"
+    OGG = "ogg"
+class DeviceType(StrEnum):
+    """
+    Enumeration of device types for training voice models.
+    Values are capitalized display strings rather than lowercase
+    identifiers.
+    """
+    AUTOMATIC = "Automatic"
+    CPU = "CPU"
+    GPU = "GPU"
+class TrainingSampleRate(StrEnum):
+    """
+    Enumeration of sample rates for training voice models.
+    Unlike SampleRate, the values here are strings of decimal digits,
+    not integers.
+    """
+    HZ_32K = "32000"
+    HZ_40K = "40000"
+    HZ_48K = "48000"
+class PretrainedSampleRate(StrEnum):
+    """
+    Enumeration of valid sample rates for pretrained models.
+    Values are abbreviated strings with a "k" suffix (e.g. "40k").
+    """
+    HZ_32K = "32k"
+    HZ_40K = "40k"
+    HZ_44K = "44k"
+    HZ_48K = "48k"
+class TrainingF0Method(StrEnum):
+    """
+    Enumeration of pitch extraction methods for training.
+    Has the same members and values as F0Method, except that FCPE is
+    not included.
+    """
+    RMVPE = "rmvpe"
+    CREPE = "crepe"
+    CREPE_TINY = "crepe-tiny"
+class AudioSplitMethod(StrEnum):
+    """
+    Enumeration of methods to use for splitting audio files during
+    dataset preprocessing.
+    Values are capitalized display strings.
+    """
+    SKIP = "Skip"
+    SIMPLE = "Simple"
+    AUTOMATIC = "Automatic"
+class Vocoder(StrEnum):
+    """
+    Enumeration of vocoders for training voice models.
+    Values are display names and may contain spaces and hyphens.
+    """
+    HIFI_GAN = "HiFi-GAN"
+    MRF_HIFI_GAN = "MRF HiFi-GAN"
+    REFINE_GAN = "RefineGAN"
+class IndexAlgorithm(StrEnum):
+    """
+    Enumeration of indexing algorithms for training voice models.
+    Values are mixed-case display names.
+    """
+    AUTO = "Auto"
+    FAISS = "Faiss"
+    KMEANS = "KMeans"
+class PretrainedType(StrEnum):
+    """
+    Enumeration of the possible types of pretrained models to finetune
+    voice models on.
+    Note that NONE has the string value "None", not the None object.
+    """
+    NONE = "None"
+    DEFAULT = "Default"
+    CUSTOM = "Custom"
+class ConcurrencyId(StrEnum):
+    """Enumeration of possible concurrency identifiers."""
+    # For a StrEnum, auto() yields the lower-cased member name, so the
+    # value of this member is "gpu".
+    GPU = auto()
+class SongSourceType(StrEnum):
+    """
+    The type of source providing the song to generate a cover of.
+    Values are human-readable labels.
+    """
+    LOCAL_FILE = "Local file"
+    CACHED_SONG = "Cached song"
+class SpeechSourceType(StrEnum):
+    """
+    The type of source providing the text to generate speech from.
+    Values are human-readable labels.
+    """
+    TEXT = "Text"
+    LOCAL_FILE = "Local file"
+class SongTransferOption(StrEnum):
+    """
+    Enumeration of possible song transfer options.
+    Each value is a label of the form "Step N: <target>". Steps 4 and
+    5 each have several members, one per target track.
+    """
+    STEP_1_AUDIO = "Step 1: stem splitting"
+    STEP_2_VOCALS = "Step 2: vocal conversion"
+    STEP_3_VOCALS = "Step 3: vocal effect"
+    STEP_4_INSTRUMENTALS = "Step 4: instrumentals"
+    STEP_4_BACKUP_VOCALS = "Step 4: backup vocals"
+    STEP_5_MAIN_VOCALS = "Step 5: main vocals"
+    STEP_5_INSTRUMENTALS = "Step 5: instrumentals"
+    STEP_5_BACKUP_VOCALS = "Step 5: backup vocals"
+class SpeechTransferOption(StrEnum):
+    """
+    Enumeration of possible speech transfer options.
+    Each value is a label of the form "Step N: <target>".
+    """
+    # NOTE(review): both labels say "vocal" although the members are
+    # named *_SPEECH; they match the step 2/3 labels of
+    # SongTransferOption verbatim -- confirm this wording is intended.
+    STEP_2_SPEECH = "Step 2: vocal conversion"
+    STEP_3_SPEECH = "Step 3: vocal effect"
+class ComponentVisibilityKwArgs(TypedDict, total=False):
+    """
+    Keyword arguments for setting component visibility.
+    Declared with total=False, so every key is optional.
+    Attributes
+    ----------
+    visible : bool
+        Whether the component should be visible.
+    value : Any
+        The value of the component.
+    """
+    visible: bool
+    value: Any
+class UpdateDropdownKwArgs(TypedDict, total=False):
+    """
+    Keyword arguments for updating a dropdown component.
+    Declared with total=False, so every key is optional.
+    Attributes
+    ----------
+    choices : DropdownChoices
+        The updated choices for the dropdown component.
+    value : DropdownValue
+        The updated value for the dropdown component.
+    """
+    # NOTE(review): DropdownChoices and DropdownValue are not defined
+    # in the visible part of this file -- confirm they are in scope.
+    choices: DropdownChoices
+    value: DropdownValue
+class TextBoxKwArgs(TypedDict, total=False):
+    """
+    Keyword arguments for updating a textbox component.
+    Declared with total=False, so every key is optional.
+    Attributes
+    ----------
+    value : str | None
+        The updated value for the textbox component.
+    placeholder : str | None
+        The updated placeholder for the textbox component.
+    """
+    value: str | None
+    placeholder: str | None
+class UpdateAudioKwArgs(TypedDict, total=False):
+    """
+    Keyword arguments for updating an audio component.
+    Declared with total=False, so the single key is optional.
+    Attributes
+    ----------
+    value : str | None
+        The updated value for the audio component.
+    """
+    value: str | None
+class DatasetType(StrEnum):
+    """
+    The type of dataset to train a voice model.
+    Values are human-readable labels.
+    """
+    NEW_DATASET = "New dataset"
+    EXISTING_DATASET = "Existing dataset"
 embedders_list = [
     ("embedders/contentvec/", ["pytorch_model.bin", "config.json"]),
     ("embedders/custom/Crusty/", ["model.safetensors", "config.json"]),
     UVR_DeEcho_DeReverb = "UVR-DeEcho-DeReverb.pth"
 now_dir = os.getcwd()
+config_name = "default" #os.environ.get("URVC_CONFIG")
 cookiefile = os.environ.get("YT_COOKIEFILE")
 total_config = load_config(config_name, TotalConfig) if config_name else TotalConfig()
+"""
+Module defining models for representing configuration settings for
+UI tabs.
+"""
+# NOTE(review): a `from __future__` import is only legal at the very top
+# of a module (after the module docstring and comments). Here it follows
+# executable statements, which Python rejects with a SyntaxError; it
+# needs to move to the first lines of app.py. The annotations below
+# (e.g. `list[gr.Audio]`, with `gr` imported under TYPE_CHECKING only)
+# rely on it, so it must be relocated rather than removed.
+from __future__ import annotations
+class SongIntermediateAudioConfig(BaseModel):
+    """
+    Configuration settings for intermediate audio components in the
+    one-click song generation tab.
+    Attributes
+    ----------
+    song : AudioConfig
+        Configuration settings for the input song audio component.
+    vocals : AudioConfig
+        Configuration settings for the vocals audio component.
+    instrumentals : AudioConfig
+        Configuration settings for the instrumentals audio component.
+    main_vocals : AudioConfig
+        Configuration settings for the main vocals audio component.
+    backup_vocals : AudioConfig
+        Configuration settings for the backup vocals audio component.
+    main_vocals_dereverbed : AudioConfig
+        Configuration settings for the main vocals de-reverbed audio
+        component.
+    main_vocals_reverb : AudioConfig
+        Configuration settings for the main vocals reverb audio
+        component.
+    converted_vocals : AudioConfig
+        Configuration settings for the converted vocals audio
+        component.
+    postprocessed_vocals : AudioConfig
+        Configuration settings for the postprocessed vocals audio
+        component.
+    instrumentals_shifted : AudioConfig
+        Configuration settings for the shifted instrumentals audio
+        component.
+    backup_vocals_shifted : AudioConfig
+        Configuration settings for the shifted backup vocals audio
+        component.
+    all : list[gr.Audio]
+        List of instances of all intermediate audio components.
+    """
+    song: AudioConfig = AudioConfig.intermediate(label="Song")
+    vocals: AudioConfig = AudioConfig.intermediate(label="Vocals")
+    instrumentals: AudioConfig = AudioConfig.intermediate(
+        label="Instrumentals",
+    )
+    main_vocals: AudioConfig = AudioConfig.intermediate(
+        label="Main vocals",
+    )
+    backup_vocals: AudioConfig = AudioConfig.intermediate(
+        label="Backup vocals",
+    )
+    main_vocals_dereverbed: AudioConfig = AudioConfig.intermediate(
+        label="De-reverbed main vocals",
+    )
+    main_vocals_reverb: AudioConfig = AudioConfig.intermediate(
+        label="Main vocals with reverb",
+    )
+    converted_vocals: AudioConfig = AudioConfig.intermediate(
+        label="Converted vocals",
+    )
+    postprocessed_vocals: AudioConfig = AudioConfig.intermediate(
+        label="Postprocessed vocals",
+    )
+    instrumentals_shifted: AudioConfig = AudioConfig.intermediate(
+        label="Pitch-shifted instrumentals",
+    )
+    backup_vocals_shifted: AudioConfig = AudioConfig.intermediate(
+        label="Pitch-shifted backup vocals",
+    )
+    @property
+    def all(self) -> list[gr.Audio]:
+        """
+        Retrieve instances of all intermediate audio components
+        in the one-click song generation tab.
+        Returns
+        -------
+        list[gr.Audio]
+            List of instances of all intermediate audio components in
+            the one-click song generation tab.
+        """
+        # NOTE we are using self.__annotations__ to get the fields in
+        # the order they are defined in the class
+        return [getattr(self, field).instance for field in self.__annotations__]
+class OneClickSongGenerationConfig(SongGenerationConfig):
+    """
+    Configuration settings for the one-click song generation tab.
+    Extends SongGenerationConfig with two pitch-shift sliders, a
+    checkbox and a nested group of intermediate audio settings.
+    Attributes
+    ----------
+    n_octaves : SliderConfig
+        Configuration settings for an octave pitch shift slider
+        component.
+    n_semitones : SliderConfig
+        Configuration settings for a semitone pitch shift slider
+        component.
+    show_intermediate_audio : CheckboxConfig
+        Configuration settings for a show intermediate audio checkbox
+        component.
+    intermediate_audio : SongIntermediateAudioConfig
+        Configuration settings for intermediate audio components.
+    See Also
+    --------
+    SongGenerationConfig
+        Parent model defining common component configuration settings
+        for song generation tabs.
+    """
+    n_octaves: SliderConfig = SliderConfig.octave_shift(
+        label="Vocal pitch shift",
+        info=(
+            "The number of octaves to shift the pitch of the converted vocals by. Use 1"
+            " for male-to-female and -1 for vice-versa."
+        ),
+    )
+    n_semitones: SliderConfig = SliderConfig.semitone_shift(
+        label="Overall pitch shift",
+        info=(
+            "The number of semi-tones to shift the pitch of the converted vocals,"
+            " instrumentals and backup vocals by."
+        ),
+    )
+    # Unchecked by default.
+    # NOTE(review): exclude_value=True presumably keeps this value out
+    # of saved configurations -- confirm against CheckboxConfig.
+    show_intermediate_audio: CheckboxConfig = CheckboxConfig(
+        label="Show intermediate audio",
+        info="Show intermediate audio tracks produced during song cover generation.",
+        value=False,
+        exclude_value=True,
+    )
+    intermediate_audio: SongIntermediateAudioConfig = SongIntermediateAudioConfig()
+class SongInputAudioConfig(BaseModel):
+    """
+    Configuration settings for input audio components in the multi-step
+    song generation tab.
+    Attributes
+    ----------
+    audio : AudioConfig
+        Configuration settings for the input audio component.
+    vocals : AudioConfig
+        Configuration settings for the vocals audio component.
+    converted_vocals : AudioConfig
+        Configuration settings for the converted vocals audio
+        component.
+    instrumentals : AudioConfig
+        Configuration settings for the instrumentals audio
+        component.
+    backup_vocals : AudioConfig
+        Configuration settings for the backup vocals audio
+        component.
+    main_vocals : AudioConfig
+        Configuration settings for the main vocals audio
+        component.
+    shifted_instrumentals : AudioConfig
+        Configuration settings for the shifted instrumentals audio
+        component.
+    shifted_backup_vocals : AudioConfig
+        Configuration settings for the shifted backup vocals audio
+        component.
+    all : list[AudioConfig]
+        List of configuration settings for all input audio
+        components in the multi-step song generation tab.
+    """
+    audio: AudioConfig = AudioConfig.input(label="Audio")
+    vocals: AudioConfig = AudioConfig.input(label="Vocals")
+    converted_vocals: AudioConfig = AudioConfig.input(label="Vocals")
+    instrumentals: AudioConfig = AudioConfig.input(label="Instrumentals")
+    backup_vocals: AudioConfig = AudioConfig.input(label="Backup vocals")
+    main_vocals: AudioConfig = AudioConfig.input(label="Main vocals")
+    shifted_instrumentals: AudioConfig = AudioConfig.input(label="Instrumentals")
+    shifted_backup_vocals: AudioConfig = AudioConfig.input(label="Backup vocals")
+    @property
+    def all(self) -> list[AudioConfig]:
+        """
+        Retrieve configuration settings for all input audio components
+        in the multi-step song generation tab.
+        Returns
+        -------
+        list[AudioConfig]
+            List of configuration settings for all input audio
+            components in the multi-step song generation tab.
+        """
+        return [getattr(self, field) for field in self.__annotations__]
+class SongDirsConfig(BaseModel):
+    """
+    Configuration settings for song directory components in the
+    multi-step song generation tab.
+    Attributes
+    ----------
+    separate_audio : DropdownConfig
+        Configuration settings for the song directory component
+        for separating audio.
+    convert_vocals : DropdownConfig
+        Configuration settings for the song directory component
+        for converting vocals.
+    postprocess_vocals : DropdownConfig
+        Configuration settings for the song directory component
+        for postprocessing vocals.
+    pitch_shift_background : DropdownConfig
+        Configuration settings for the song directory component
+        for pitch-shifting background audio.
+    mix : DropdownConfig
+        Configuration settings for the song directory component
+        for mixing audio.
+    all : list[gr.Dropdown]
+        List of instances of all song directory components in the
+        multi-step song generation tab.
+    """
+    separate_audio: DropdownConfig = DropdownConfig.song_dir()
+    convert_vocals: DropdownConfig = DropdownConfig.song_dir()
+    postprocess_vocals: DropdownConfig = DropdownConfig.song_dir()
+    pitch_shift_background: DropdownConfig = DropdownConfig.song_dir()
+    mix: DropdownConfig = DropdownConfig.song_dir()
+    @property
+    def all(self) -> list[gr.Dropdown]:
+        """
+        Retrieve instances of all song directory components in the
+        multi-step song generation tab.
+        Returns
+        -------
+        list[gr.Dropdown]
+            List of instances of all song directory components in
+            the multi-step song generation tab.
+        """
+        return [getattr(self, field).instance for field in self.__annotations__]
+class MultiStepSongGenerationConfig(SongGenerationConfig):
+    """
+    Configuration settings for multi-step song generation tab.
+    Attributes
+    ----------
+    separation_model : DropdownConfig
+        Configuration settings for a separation model dropdown
+        component.
+    segment_size : RadioConfig
+        Configuration settings for a segment size radio component.
+    n_octaves : SliderConfig
+        Configuration settings for an octave pitch shift slider
+        component.
+    n_semitones : SliderConfig
+        Configuration settings for a semitone pitch shift slider
+        component.
+    n_semitones_instrumentals : SliderConfig
+        Configuration settings for an instrumentals pitch shift slider
+        component.
+    n_semitones_backup_vocals : SliderConfig
+        Configuration settings for a backup vocals pitch shift slider
+        component.
+    input_audio : SongInputAudioConfig
+        Configuration settings for input audio components.
+    song_dirs : SongDirsConfig
+        Configuration settings for song directory components.
+    See Also
+    --------
+    SongGenerationConfig
+        Parent model defining common component configuration settings
+        for song generation tabs.
+    """
+    # NOTE(review): the default value is taken from SeparationModel
+    # while the choices are listed from SeparationModel2 -- confirm
+    # that the default is one of the offered choices.
+    separation_model: DropdownConfig = DropdownConfig(
+        label="Separation model",
+        info="The model to use for audio separation.",
+        value=SeparationModel.UVR_MDX_NET_VOC_FT,
+        choices=list(SeparationModel2),
+    )
+    # Offers every SegmentSize member, defaulting to SEG_2048.
+    segment_size: RadioConfig = RadioConfig(
+        label="Segment size",
+        info=(
+            "The size of the segments into which the audio is split. Using a larger"
+            " size consumes more resources, but may give better results."
+        ),
+        value=SegmentSize.SEG_2048,
+        choices=list(SegmentSize),
+    )
+    n_octaves: SliderConfig = SliderConfig.octave_shift(
+        label="Pitch shift (octaves)",
+        info=(
+            "The number of octaves to pitch-shift the converted voice by. Use 1 for"
+            " male-to-female and -1 for vice-versa."
+        ),
+    )
+    n_semitones: SliderConfig = SliderConfig.semitone_shift(
+        label="Pitch shift (semi-tones)",
+        info=(
+            "The number of semi-tones to pitch-shift the converted vocals by. Altering"
+            " this slightly reduces sound quality."
+        ),
+    )
+    n_semitones_instrumentals: SliderConfig = SliderConfig.semitone_shift(
+        label="Instrumental pitch shift",
+        info="The number of semi-tones to pitch-shift the instrumentals by.",
+    )
+    n_semitones_backup_vocals: SliderConfig = SliderConfig.semitone_shift(
+        label="Backup vocal pitch shift",
+        info="The number of semi-tones to pitch-shift the backup vocals by.",
+    )
+    input_audio: SongInputAudioConfig = SongInputAudioConfig()
+    song_dirs: SongDirsConfig = SongDirsConfig()
+class SpeechIntermediateAudioConfig(BaseModel):
+    """
+    Configuration settings for intermediate audio components in the
+    one-click speech generation tab.
+    Attributes
+    ----------
+    speech : AudioConfig
+        Configuration settings for the input speech audio component.
+    converted_speech : AudioConfig
+        Configuration settings for the converted speech audio component.
+    all : list[gr.Audio]
+        List of instances of all intermediate audio components in the
+        speech generation tab.
+    """
+    speech: AudioConfig = AudioConfig.intermediate(label="Speech")
+    converted_speech: AudioConfig = AudioConfig.intermediate(label="Converted speech")
+    @property
+    def all(self) -> list[gr.Audio]:
+        """
+        Retrieve instances of all intermediate audio components in the
+        speech generation tab.
+        Returns
+        -------
+        list[gr.Audio]
+            List of instances of all intermediate audio components in
+            the speech generation tab.
+        """
+        return [getattr(self, field).instance for field in self.__annotations__]
+class OneClickSpeechGenerationConfig(SpeechGenerationConfig):
+    """
+    Configuration settings for one-click speech generation tab.
+    Extends SpeechGenerationConfig with a nested group of intermediate
+    audio settings and a checkbox.
+    Attributes
+    ----------
+    intermediate_audio : SpeechIntermediateAudioConfig
+        Configuration settings for intermediate audio components.
+    show_intermediate_audio : CheckboxConfig
+        Configuration settings for a show intermediate audio checkbox
+        component.
+    See Also
+    --------
+    SpeechGenerationConfig
+        Parent model defining common component configuration settings
+        for speech generation tabs.
+    """
+    intermediate_audio: SpeechIntermediateAudioConfig = SpeechIntermediateAudioConfig()
+    # Unchecked by default.
+    # NOTE(review): exclude_value=True presumably keeps this value out
+    # of saved configurations -- confirm against CheckboxConfig.
+    show_intermediate_audio: CheckboxConfig = CheckboxConfig(
+        label="Show intermediate audio",
+        info="Show intermediate audio tracks produced during speech generation.",
+        value=False,
+        exclude_value=True,
+    )
+class SpeechInputAudioConfig(BaseModel):
+    """
+    Configuration settings for input audio components in the multi-step
+    speech generation tab.
+    Attributes
+    ----------
+    speech : AudioConfig
+        Configuration settings for the input speech audio component.
+    converted_speech : AudioConfig
+        Configuration settings for the converted speech audio component.
+    all : list[AudioConfig]
+        List of configuration settings for all input audio components in
+        the multi-step speech generation tab.
+    """
+    speech: AudioConfig = AudioConfig.input("Speech")
+    converted_speech: AudioConfig = AudioConfig.input("Converted speech")
+    @property
+    def all(self) -> list[AudioConfig]:
+        """
+        Retrieve configuration settings for all input audio components
+        in the multi-step speech generation tab.
+        Returns
+        -------
+        list[AudioConfig]
+            List of configuration settings for all input audio
+            components in the multi-step speech generation tab.
+        """
+        return [getattr(self, field) for field in self.__annotations__]
+class MultiStepSpeechGenerationConfig(SpeechGenerationConfig):
+    """
+    Configuration settings for the multi-step speech generation tab.
+    Adds a single nested field on top of SpeechGenerationConfig.
+    Attributes
+    ----------
+    input_audio : SpeechInputAudioConfig
+        Configuration settings for input audio components.
+    See Also
+    --------
+    SpeechGenerationConfig
+        Parent model defining common component configuration settings
+        for speech generation tabs.
+    """
+    input_audio: SpeechInputAudioConfig = SpeechInputAudioConfig()
+class MultiStepTrainingConfig(TrainingConfig):
+    """
+    Configuration settings for multi-step training tab.
+    Declares no fields of its own; everything is inherited from
+    TrainingConfig.
+    """
+class ModelManagementConfig(BaseModel):
+    """
+    Configuration settings for model management tab.
+    Attributes
+    ----------
+    voices : DropdownConfig
+        Configuration settings for delete voice models dropdown
+        component.
+    embedders : DropdownConfig
+        Configuration settings for delete embedder models dropdown
+        component.
+    pretraineds : DropdownConfig
+        Configuration settings for delete pretrained models dropdown
+        component.
+    traineds : DropdownConfig
+        Configuration settings for delete training models dropdown
+        component.
+    dummy_checkbox : CheckboxConfig
+        Configuration settings for a dummy checkbox component.
+    """
+    voices: DropdownConfig = DropdownConfig.multi_delete(
+        label="Voice models",
+        info="Select one or more voice models to delete.",
+    )
+    embedders: DropdownConfig = DropdownConfig.multi_delete(
+        label="Custom embedder models",
+        info="Select one or more embedder models to delete.",
+    )
+    pretraineds: DropdownConfig = DropdownConfig.multi_delete(
+        label="Custom pretrained models",
+        info="Select one or more pretrained models to delete.",
+    )
+    traineds: DropdownConfig = DropdownConfig.multi_delete(
+        label="Training models",
+        info="Select one or more training models to delete.",
+    )
+    # Hidden (visible=False) and unchecked; it has no label or info.
+    dummy_checkbox: CheckboxConfig = CheckboxConfig(
+        value=False,
+        visible=False,
+        exclude_value=True,
+    )
+class AudioManagementConfig(BaseModel):
+    """
+    Configuration settings for audio management tab.
+    Attributes
+    ----------
+    intermediate : DropdownConfig
+        Configuration settings for delete intermediate audio files
+        dropdown component.
+    speech : DropdownConfig
+        Configuration settings for delete speech audio files dropdown
+        component.
+    output : DropdownConfig
+        Configuration settings for delete output audio files dropdown
+        component.
+    dataset : DropdownConfig
+        Configuration settings for delete dataset audio files dropdown
+        component.
+    dummy_checkbox : CheckboxConfig
+        Configuration settings for a dummy checkbox component.
+    """
+    intermediate: DropdownConfig = DropdownConfig.multi_delete(
+        label="Song directories",
+        info=(
+            "Select one or more song directories containing intermediate audio files to"
+            " delete."
+        ),
+    )
+    speech: DropdownConfig = DropdownConfig.multi_delete(
+        label="Speech audio files",
+        info="Select one or more speech audio files to delete.",
+    )
+    output: DropdownConfig = DropdownConfig.multi_delete(
+        label="Output audio files",
+        info="Select one or more output audio files to delete.",
+    )
+    dataset: DropdownConfig = DropdownConfig.multi_delete(
+        label="Dataset audio files",
+        info="Select one or more datasets containing audio files to delete.",
+    )
+    # Hidden (visible=False) and unchecked; it has no label or info.
+    dummy_checkbox: CheckboxConfig = CheckboxConfig(
+        value=False,
+        visible=False,
+        exclude_value=True,
+    )
+class SettingsManagementConfig(BaseModel):
+    """
+    Configuration settings for settings management tab.
+    Attributes
+    ----------
+    load_config_name : DropdownConfig
+        Configuration settings for a dropdown component for choosing
+        the name of a configuration to load UI settings from.
+    delete_config_names : DropdownConfig
+        Configuration settings for delete configurations dropdown
+        component.
+    dummy_checkbox : CheckboxConfig
+        Configuration settings for a dummy checkbox component.
+    """
+    # Starts with no selection (value=None) and is created with
+    # render=False.
+    load_config_name: DropdownConfig = DropdownConfig(
+        label="Configuration name",
+        info="The name of a configuration to load UI settings from",
+        value=None,
+        render=False,
+        exclude_value=True,
+    )
+    delete_config_names: DropdownConfig = DropdownConfig.multi_delete(
+        label="Configuration names",
+        info="Select the name of one or more configurations to delete",
+    )
+    # Hidden (visible=False) and unchecked; it has no label or info.
+    dummy_checkbox: CheckboxConfig = CheckboxConfig(
+        value=False,
+        visible=False,
+        exclude_value=True,
+    )
+class TotalSongGenerationConfig(BaseModel):
+    """
+    All configuration settings for song generation tabs.
+    Groups the one-click and multi-step song generation settings under
+    one model.
+    Attributes
+    ----------
+    one_click : OneClickSongGenerationConfig
+        Configuration settings for the one-click song generation tab.
+    multi_step : MultiStepSongGenerationConfig
+        Configuration settings for the multi-step song generation tab.
+    """
+    one_click: OneClickSongGenerationConfig = OneClickSongGenerationConfig()
+    multi_step: MultiStepSongGenerationConfig = MultiStepSongGenerationConfig()
+class TotalSpeechGenerationConfig(BaseModel):
+    """
+    All configuration settings for speech generation tabs.
+    Each attribute defaults to an instance of its configuration class
+    constructed without arguments.
+    Attributes
+    ----------
+    one_click : OneClickSpeechGenerationConfig
+        Configuration settings for the one-click speech generation tab.
+    multi_step : MultiStepSpeechGenerationConfig
+        Configuration settings for the multi-step speech generation tab.
+    """
+    one_click: OneClickSpeechGenerationConfig = OneClickSpeechGenerationConfig()
+    multi_step: MultiStepSpeechGenerationConfig = MultiStepSpeechGenerationConfig()
+class TotalTrainingConfig(BaseModel):
+    """
+    All configuration settings for training tabs.
+    Attributes
+    ----------
+    multi_step : MultiStepTrainingConfig
+        Configuration settings for the multi-step training tab.
+        Defaults to ``MultiStepTrainingConfig()``.
+    """
+    multi_step: MultiStepTrainingConfig = MultiStepTrainingConfig()
+class TotalManagementConfig(BaseModel):
+    """
+    All configuration settings for management tabs.
+    Each attribute defaults to an instance of its configuration class
+    constructed without arguments.
+    Attributes
+    ----------
+    model : ModelManagementConfig
+        Configuration settings for the model management tab.
+    audio : AudioManagementConfig
+        Configuration settings for the audio management tab.
+    settings : SettingsManagementConfig
+        Configuration settings for the settings management tab.
+    """
+    model: ModelManagementConfig = ModelManagementConfig()
+    audio: AudioManagementConfig = AudioManagementConfig()
+    settings: SettingsManagementConfig = SettingsManagementConfig()
+class TotalConfig(BaseModel):
+    """
+    All configuration settings for the Ultimate RVC app.
+    Attributes
+    ----------
+    song : TotalSongGenerationConfig
+        Configuration settings for song generation tabs.
+    speech : TotalSpeechGenerationConfig
+        Configuration settings for speech generation tabs.
+    training : TotalTrainingConfig
+        Configuration settings for training tabs.
+    management : TotalManagementConfig
+        Configuration settings for management tabs.
+    all : list[AnyComponentConfig]
+        Cached property listing every nested component configuration
+        whose value is not excluded.
+    """
+    song: TotalSongGenerationConfig = TotalSongGenerationConfig()
+    speech: TotalSpeechGenerationConfig = TotalSpeechGenerationConfig()
+    training: TotalTrainingConfig = TotalTrainingConfig()
+    management: TotalManagementConfig = TotalManagementConfig()
+    @cached_property
+    def all(self) -> list[AnyComponentConfig]:
+        """
+        Recursively collect those component configuration models nested
+        within the current model instance, which have values that are
+        not excluded.
+        The property is decorated with ``cached_property``; presumably
+        this is ``functools.cached_property``, in which case the list is
+        built on first access and reused afterwards (TODO confirm the
+        import).
+        Returns
+        -------
+        list[AnyComponentConfig]
+            A list of component configuration models found within the
+            current model instance, which have values that are not
+            excluded. Components appear in the order in which the
+            fields are iterated, depth first.
+        """
+        def _collect(model: BaseModel) -> list[AnyComponentConfig]:
+            component_configs: list[Any] = []
+            for _, value in model:  # each item unpacks to a pair; only the value is used
+                if isinstance(value, ComponentConfig):  # tested first so components are never recursed into
+                    if not value.exclude_value:
+                        component_configs.append(value)
+                elif isinstance(value, BaseModel):  # nested config section: descend into it
+                    component_configs.extend(_collect(value))
+            return component_configs
+        return _collect(self)
 def render_app() -> gr.Blocks:
     """
     Render the Ultimate RVC web application.
     cache_delete_cutoff = 86400  # and delete files older than 24 hours
     with gr.Blocks(
+        title="Redzone-6 Audio Playground",
         theme=gr.Theme.load(str(Path(__file__).parent / "config/theme.json")),
         css=css,
         delete_cache=(cache_delete_frequency, cache_delete_cutoff),
     ) as app:
         for component_config in [
             total_config.song.one_click.voice_model,
             total_config.song.one_click.cached_song,
         ]:
             component_config.instantiate()
         # main tab
+        # with gr.Tab("Generate", elem_id="generate-tab"):
+        with gr.Tab("RCV Suite" elem_id="generate-tab"):
+            render_song_cover_one_click_tab(total_config, cookiefile)
+            render_song_cover_multi_step_tab(total_config, cookiefile)
+        with gr.Tab("Speech" elem_id="generate-tab"):
+            render_speech_one_click_tab(total_config)
+            render_speech_multi_step_tab(total_config)
+        with gr.Tab("Configuration", elem_id="settings-tab"):
+            with gr.Tab("Models", elem_id="manage-tab"):
+                render_models_tab(total_config)
+            with gr.Tab("Settings", elem_id="settings-tab"):
+                render_settings_tab(total_config)
+#            with gr.Tab("Audio", elem_id="audio-tab"):
+                render_audio_tab(total_config)
         app.load(
             _init_dropdowns,
             "-h",
             help="The hostname that the server will use.",
         ),
+    ] = "0.0.0.0",
     listen_port: Annotated[
         int | None,
         typer.Option(
     """Run the Ultimate RVC web application."""
     os.environ["GRADIO_TEMP_DIR"] = str(TEMP_DIR)
     gr.set_static_paths([MODELS_DIR, AUDIO_DIR])
+#    app.queue()
     app.launch(
+        server_name=listen_host,
         server_port=listen_port,
         ssr_mode=ssr_mode,
     )
+load_config("default", TotalConfig)  # module level: runs on import; the return value is discarded. NOTE(review): HEAD shows the `load_config` import from ultimate_rvc.core.manage.config being removed - confirm the name is still defined.
+load_config("theme", TotalConfig)  # NOTE(review): loads a configuration named "theme" with the same TotalConfig model and also discards the result - confirm this is intended.
 if __name__ == "__main__":
     app_wrapper()