Spaces:

Offex
/

Jdjd

Sleeping

App Files Files Community

Offex committed on Feb 16

Commit

de8428e

verified ·

1 Parent(s): 5f3a8eb

Update app.py

Browse files

Files changed (1) hide show

app.py +15 -9

app.py CHANGED Viewed

@@ -15,7 +15,16 @@ def remove_silence(audio_path):
         return None
     wav = read_audio(audio_path, sampling_rate=16000)
-    speech_timestamps = get_speech_timestamps(wav, model, sampling_rate=16000)
     if not speech_timestamps:
         return audio_path
@@ -36,25 +45,24 @@ css = """
     text-align: center;
     font-size: 28px;
     font-weight: bold;
-    font-family: 'Comic Sans MS', 'Trebuchet MS', sans-serif; /* MS Font lagaya gaya hai */
     animation: rgb-glow 2.5s linear infinite;
     padding: 12px;
     letter-spacing: 2px;
     margin: 15px 0;
-    border: 2px dashed #ddd; /* Thoda stylish border */
     border-radius: 10px;
-    background-color: rgba(0, 0, 0, 0.02); /* Halka sa background */
 }
 """
 # ---- Gradio Blocks (Advanced UI) ----
 with gr.Blocks(css=css, title="AI Silence Remover") as iface:
-    # 1. TOP WALA ANIMATED TAG
     gr.HTML('<div class="deepu-brand">✨ Made by Deepu ✨</div>')
-    gr.Markdown("<h1 style='text-align: center;'>🎙️ AI Silence Remover (Silero VAD)</h1>")
-    gr.Markdown("<p style='text-align: center;'>Apni audio upload karein aur AI automatically non-speech parts ko cut kar dega.</p>")
     with gr.Row():
         audio_in = gr.Audio(type="filepath", label="Raw Audio Upload Karein")
@@ -64,10 +72,8 @@ with gr.Blocks(css=css, title="AI Silence Remover") as iface:
     with gr.Row():
         audio_out = gr.Audio(type="filepath", label="Processed Audio (Without Silence)")
-    # 2. BOTTOM WALA ANIMATED TAG
     gr.HTML('<div class="deepu-brand">✨ Made by Deepu ✨</div>')
-    # Button ko function ke sath jodna
     submit_btn.click(fn=remove_silence, inputs=audio_in, outputs=audio_out)
 if __name__ == "__main__":

         return None
     wav = read_audio(audio_path, sampling_rate=16000)
+    # 🔴 YAHAN MAGIC HUA HAI: AI ko aur strict banaya gaya hai 🔴
+    speech_timestamps = get_speech_timestamps(
+        wav,
+        model,
+        sampling_rate=16000,
+        threshold=0.5,                # Aawaz pehchanne ki limit
+        min_silence_duration_ms=50,   # Agar 50 millisecond ka bhi gap ho, toh use cut kar do (Pehle ye zyada tha)
+        speech_pad_ms=10              # Aawaz ke aage-peeche ka gap sirf 10ms rakha hai (Pehle AI zyada gap chhod raha tha)
+    )
     if not speech_timestamps:
         return audio_path
     text-align: center;
     font-size: 28px;
     font-weight: bold;
+    font-family: 'Comic Sans MS', 'Trebuchet MS', sans-serif;
     animation: rgb-glow 2.5s linear infinite;
     padding: 12px;
     letter-spacing: 2px;
     margin: 15px 0;
+    border: 2px dashed #ddd;
     border-radius: 10px;
+    background-color: rgba(0, 0, 0, 0.02);
 }
 """
 # ---- Gradio Blocks (Advanced UI) ----
 with gr.Blocks(css=css, title="AI Silence Remover") as iface:
     gr.HTML('<div class="deepu-brand">✨ Made by Deepu ✨</div>')
+    gr.Markdown("<h1 style='text-align: center;'>🎙️ AI Silence Remover (Aggressive Mode)</h1>")
+    gr.Markdown("<p style='text-align: center;'>Apni audio upload karein. Yeh version chote se chote gap ko bhi cut karega!</p>")
     with gr.Row():
         audio_in = gr.Audio(type="filepath", label="Raw Audio Upload Karein")
     with gr.Row():
         audio_out = gr.Audio(type="filepath", label="Processed Audio (Without Silence)")
     gr.HTML('<div class="deepu-brand">✨ Made by Deepu ✨</div>')
     submit_btn.click(fn=remove_silence, inputs=audio_in, outputs=audio_out)
 if __name__ == "__main__":