sbapan41 committed on
Commit
60afedf
·
verified ·
1 Parent(s): 466ae5e

Update app.py

Browse files
Files changed (1) hide show
  1. app.py +3 -10
app.py CHANGED
@@ -13,7 +13,7 @@ import csv
13
  import datetime
14
 
15
  device = "cuda" if torch.cuda.is_available() else "cpu"
16
- MODEL_NAME="nvidia/parakeet-tdt-0.6b-v2"
17
 
18
  model = ASRModel.from_pretrained(model_name=MODEL_NAME)
19
  model.eval()
@@ -313,24 +313,17 @@ def play_segment(evt: gr.SelectData, raw_ts_list, current_audio_path):
313
 
314
  article = (
315
  "<p style='font-size: 1.1em;'>"
316
- "This demo showcases <code><a href='https://huggingface.co/nvidia/parakeet-tdt-0.6b-v2'>parakeet-tdt-0.6b-v2</a></code>, a 600-million-parameter model designed for high-quality English speech recognition."
317
  "</p>"
318
  "<p><strong style='color: red; font-size: 1.2em;'>Key Features:</strong></p>"
319
  "<ul style='font-size: 1.1em;'>"
320
  " <li>Automatic punctuation and capitalization</li>"
321
  " <li>Accurate word-level timestamps (click on a segment in the table below to play it!)</li>"
322
- " <li>Efficiently transcribes long audio segments (<strong>updated to support upto 3 hours</strong>) <small>(For even longer audios, see <a href='https://github.com/NVIDIA/NeMo/blob/main/examples/asr/asr_chunked_inference/rnnt/speech_to_text_buffered_infer_rnnt.py' target='_blank'>this script</a>)</small></li>"
323
  " <li>Robust performance on spoken numbers, and song lyrics transcription </li>"
324
  "</ul>"
325
  "<p style='font-size: 1.1em;'>"
326
  "This model is <strong>available for commercial and non-commercial use</strong>."
327
- "</p>"
328
- "<p style='text-align: center;'>"
329
- "<a href='https://huggingface.co/nvidia/parakeet-tdt-0.6b-v2' target='_blank'>🎙️ Learn more about the Model</a> | "
330
- "<a href='https://arxiv.org/abs/2305.05084' target='_blank'>📄 Fast Conformer paper</a> | "
331
- "<a href='https://arxiv.org/abs/2304.06795' target='_blank'>📚 TDT paper</a> | "
332
- "<a href='https://github.com/NVIDIA/NeMo' target='_blank'>🧑‍💻 NeMo Repository</a>"
333
- "</p>"
334
  )
335
 
336
  examples = [
 
13
  import datetime
14
 
15
  device = "cuda" if torch.cuda.is_available() else "cpu"
16
+ MODEL_NAME="Quantumhash/Quantum_STT_V2.0"
17
 
18
  model = ASRModel.from_pretrained(model_name=MODEL_NAME)
19
  model.eval()
 
313
 
314
  article = (
315
  "<p style='font-size: 1.1em;'>"
316
+ "This demo showcases <code><a href='https://huggingface.co/Quantumhash/Quantum_STT_V2.0'>Quantum_STT_V2.0</a></code>, a 600-million-parameter model designed for high-quality English speech recognition."
317
  "</p>"
318
  "<p><strong style='color: red; font-size: 1.2em;'>Key Features:</strong></p>"
319
  "<ul style='font-size: 1.1em;'>"
320
  " <li>Automatic punctuation and capitalization</li>"
321
  " <li>Accurate word-level timestamps (click on a segment in the table below to play it!)</li>"
322
+ " <li>Efficiently transcribes long audio segments (<strong>updated to support up to 3 hours</strong>)</li>"
323
  " <li>Robust performance on spoken numbers, and song lyrics transcription </li>"
324
  "</ul>"
325
  "<p style='font-size: 1.1em;'>"
326
  "This model is <strong>available for commercial and non-commercial use</strong>."
 
 
 
 
 
 
 
327
  )
328
 
329
  examples = [