Spaces:

LT4Ryan
/

AudioDog

Sleeping

App Files Community

LT4Ryan committed on Aug 7, 2025

Commit

77fe306

verified ·

1 Parent(s): 150ffdc

Update app.py

Browse files

Files changed (1) hide show

app.py +12 -11

app.py CHANGED Viewed

@@ -123,8 +123,8 @@ def get_transcripts_and_raw_times(audio_path):
     model.cpu()
     gc.collect()
-    #if device == "cuda":
-     #   torch.cuda.empty_cache()
     # Generate CSV
     button_update = gr.DownloadButton(visible=False)
@@ -189,17 +189,18 @@ def play_segment(evt: gr.SelectData, raw_ts_list, current_audio_path):
         return gr.Audio(value=None, label="Selected Segment")
 article = (
-    "<p style='font-size: 1.1em;'>"
-    "AudioDog uses <code><a href='https://huggingface.co/nvidia/parakeet-tdt-0.6b-v2'>parakeet-tdt-0.6b-v2</a></code>, a 600-million-parameter model designed for high-quality English speech recognition."
-    "</p>"
     "<p><strong style='color: red; font-size: 1.2em;'>Key Features:</strong></p>"
-    "<ul style='font-size: 1.1em;'>"
-    "    <li>Automatic punctuation and capitalization</li>"
-    "    <li>Accurate word-level timestamps (click on a segment in the table below to play it!)</li>"
-    "    <li>Efficiently transcribes long audio segments by chunking them into smaller segments and stitching them together when done.</li>"
-    "    <li>MP3 support for audio input and output, works well on downloaded YouTube videos.</li>"
     "</ul>"
 )
 examples = [
     ["data/example-yt_saTD1u8PorI.mp3"],
 ]
@@ -208,7 +209,7 @@ examples = [
 # Define an NVIDIA-inspired theme
 nvidia_theme = gr_themes.Default(
     primary_hue=gr_themes.Color(
-        c50="#E6F1D9", # Lightest green
         c100="#CEE3B3",
         c200="#B5D58C",
         c300="#9CC766",

     model.cpu()
     gc.collect()
+    if device == "cuda":
+        torch.cuda.empty_cache()
     # Generate CSV
     button_update = gr.DownloadButton(visible=False)
         return gr.Audio(value=None, label="Selected Segment")
 article = (
+    "<div style='font-size: 1.1em;'>"
+    "<p>AudioDog uses <code><a href='https://huggingface.co/nvidia/parakeet-tdt-0.6b-v2'>parakeet-tdt-0.6b-v2</a></code>, a 600-million-parameter model designed for high-quality English speech recognition.</p>"
     "<p><strong style='color: red; font-size: 1.2em;'>Key Features:</strong></p>"
+    "<ul>"
+    "<li>Automatic punctuation and capitalization</li>"
+    "<li>Accurate word-level timestamps (click on a segment in the table below to play it!)</li>"
+    "<li>Efficiently transcribes long audio segments by chunking them into smaller segments and stitching them together when done.</li>"
+    "<li>MP3 support for audio input and output, works well on downloaded YouTube videos.</li>"
     "</ul>"
+    "</div>"
 )
 examples = [
     ["data/example-yt_saTD1u8PorI.mp3"],
 ]
 # Define an NVIDIA-inspired theme
 nvidia_theme = gr_themes.Default(
     primary_hue=gr_themes.Color(
+        c50="#E5F1D9", # Lightest green
         c100="#CEE3B3",
         c200="#B5D58C",
         c300="#9CC766",