Spaces:

dkounadis
/

audiogen2

Sleeping

Dionyssos committed on Sep 27, 2025

Commit

1ad4a8a

1 Parent(s): f653575

don't run all tokens for short durations

Files changed (1) hide show

app.py CHANGED Viewed

@@ -17,13 +17,13 @@ def audionar_tts(text='frogs',
     if text and text.strip():
-        dur_seconds = max(duration + 0.74, 2.0)
-        # Sink Attn
         background_audio = audiogen.generate(
-            text[:64],  # soundscape text - discard if too long cross attention T5
-            duration=dur_seconds,
-            max_tokens=max(7, int(max_tokens)),  # kv cache lowest n_preserve
-            cache_lim=max(6, int(cache_lim)),
          ).numpy()
     else:
@@ -48,14 +48,14 @@ with gr.Blocks() as demo:
         )
         duration = gr.Number(
             label="Duration (s)",
-            value=7.1,
         )
         n_tokens = gr.Number(
             label="Tokens",
             value=24,
         )
         cache_lim = gr.Number(
-            label="kv Cache Flush:",
             value=71,
         )
         generate_button = gr.Button("Generate Audio",

     if text and text.strip():
+        duration = max(duration + 0.74, 2.0)
         background_audio = audiogen.generate(
+            text[:64],         # soundscape text - discard if too long cross attention
+            duration=duration, # don't use all A/R tokens if the duration is shorter than the token budget
+            max_tokens=min(max(7, int(max_tokens)), int(duration * 50)),  # kv cache lowest n_preserve
+            cache_lim=max(6, int(cache_lim)),         # Sink Attn
          ).numpy()
     else:
         )
         duration = gr.Number(
             label="Duration (s)",
+            value=7.24,
         )
         n_tokens = gr.Number(
             label="Tokens",
             value=24,
         )
         cache_lim = gr.Number(
+            label="kv Flush",
             value=71,
         )
         generate_button = gr.Button("Generate Audio",