notmax123 committed on
Commit
8960a88
·
1 Parent(s): c329763

Tuning: CFG 4.0; tighten steps (5-16) and speed (0.8-1.2) slider ranges

Browse files
Files changed (1) hide show
  1. app.py +4 -4
app.py CHANGED
@@ -592,7 +592,7 @@ class BlueTTS:
592
  style: Style,
593
  total_step: int = 8,
594
  speed: float = 0.95,
595
- cfg_scale: float = 3.5,
596
  silence_duration: float = 0.15,
597
  seed: int = 42,
598
  phonemize: bool = True,
@@ -861,7 +861,7 @@ def synthesize_text(text: str, voice: str, lang: str, steps: int, speed: float,
861
  style = VOICE_STYLES[voice]
862
  wav, sr = TTS.synthesize(
863
  expand_numbers(normalize_common_text(text), lang=lang), lang=lang, style=style,
864
- total_step=int(steps), speed=float(speed), cfg_scale=3.5,
865
  pace_blend=0.0,
866
  )
867
  wav = normalize_generated_audio(np.asarray(wav).squeeze())
@@ -1033,8 +1033,8 @@ with gr.Blocks(title="BlueTTS V2 — Multilingual TTS") as demo:
1033
  label="Voice", elem_classes="ctrl-voice",
1034
  )
1035
  with gr.Row(elem_classes="ctrl-row2"):
1036
- steps_input = gr.Slider(2, 32, 8, step=1, label="Quality (steps)", elem_classes="ctrl-steps")
1037
- speed_input = gr.Slider(0.5, 2.0, 0.95, step=0.05, label="Speed", elem_classes="ctrl-speed")
1038
 
1039
  with gr.Column(elem_classes="ref-panel"):
1040
  gr.HTML(
 
592
  style: Style,
593
  total_step: int = 8,
594
  speed: float = 0.95,
595
+ cfg_scale: float = 4.0,
596
  silence_duration: float = 0.15,
597
  seed: int = 42,
598
  phonemize: bool = True,
 
861
  style = VOICE_STYLES[voice]
862
  wav, sr = TTS.synthesize(
863
  expand_numbers(normalize_common_text(text), lang=lang), lang=lang, style=style,
864
+ total_step=int(steps), speed=float(speed), cfg_scale=4.0,
865
  pace_blend=0.0,
866
  )
867
  wav = normalize_generated_audio(np.asarray(wav).squeeze())
 
1033
  label="Voice", elem_classes="ctrl-voice",
1034
  )
1035
  with gr.Row(elem_classes="ctrl-row2"):
1036
+ steps_input = gr.Slider(5, 16, 8, step=1, label="Quality (steps)", elem_classes="ctrl-steps")
1037
+ speed_input = gr.Slider(0.8, 1.2, 0.95, step=0.05, label="Speed", elem_classes="ctrl-speed")
1038
 
1039
  with gr.Column(elem_classes="ref-panel"):
1040
  gr.HTML(