Update app.py
Browse files
app.py
CHANGED
|
@@ -13,7 +13,7 @@ import csv
|
|
| 13 |
import datetime
|
| 14 |
|
| 15 |
device = "cuda" if torch.cuda.is_available() else "cpu"
|
| 16 |
-
MODEL_NAME="
|
| 17 |
|
| 18 |
model = ASRModel.from_pretrained(model_name=MODEL_NAME)
|
| 19 |
model.eval()
|
|
@@ -313,24 +313,17 @@ def play_segment(evt: gr.SelectData, raw_ts_list, current_audio_path):
|
|
| 313 |
|
| 314 |
article = (
|
| 315 |
"<p style='font-size: 1.1em;'>"
|
| 316 |
-
"This demo showcases <code><a href='https://huggingface.co/
|
| 317 |
"</p>"
|
| 318 |
"<p><strong style='color: red; font-size: 1.2em;'>Key Features:</strong></p>"
|
| 319 |
"<ul style='font-size: 1.1em;'>"
|
| 320 |
" <li>Automatic punctuation and capitalization</li>"
|
| 321 |
" <li>Accurate word-level timestamps (click on a segment in the table below to play it!)</li>"
|
| 322 |
-
" <li>Efficiently transcribes long audio segments (<strong>updated to support upto 3 hours</strong>)
|
| 323 |
" <li>Robust performance on spoken numbers, and song lyrics transcription </li>"
|
| 324 |
"</ul>"
|
| 325 |
"<p style='font-size: 1.1em;'>"
|
| 326 |
"This model is <strong>available for commercial and non-commercial use</strong>."
|
| 327 |
-
"</p>"
|
| 328 |
-
"<p style='text-align: center;'>"
|
| 329 |
-
"<a href='https://huggingface.co/nvidia/parakeet-tdt-0.6b-v2' target='_blank'>🎙️ Learn more about the Model</a> | "
|
| 330 |
-
"<a href='https://arxiv.org/abs/2305.05084' target='_blank'>📄 Fast Conformer paper</a> | "
|
| 331 |
-
"<a href='https://arxiv.org/abs/2304.06795' target='_blank'>📚 TDT paper</a> | "
|
| 332 |
-
"<a href='https://github.com/NVIDIA/NeMo' target='_blank'>🧑‍💻 NeMo Repository</a>"
|
| 333 |
-
"</p>"
|
| 334 |
)
|
| 335 |
|
| 336 |
examples = [
|
|
|
|
| 13 |
import datetime
|
| 14 |
|
| 15 |
device = "cuda" if torch.cuda.is_available() else "cpu"
|
| 16 |
+
MODEL_NAME="Quantumhash/Quantum_STT_V2.0"
|
| 17 |
|
| 18 |
model = ASRModel.from_pretrained(model_name=MODEL_NAME)
|
| 19 |
model.eval()
|
|
|
|
| 313 |
|
| 314 |
article = (
|
| 315 |
"<p style='font-size: 1.1em;'>"
|
| 316 |
+
"This demo showcases <code><a href='https://huggingface.co/Quantumhash/Quantum_STT_V2.0' target='_blank'>Quantum_STT_V2.0</a></code>, a 600-million-parameter model designed for high-quality English speech recognition."
|
| 317 |
"</p>"
|
| 318 |
"<p><strong style='color: red; font-size: 1.2em;'>Key Features:</strong></p>"
|
| 319 |
"<ul style='font-size: 1.1em;'>"
|
| 320 |
" <li>Automatic punctuation and capitalization</li>"
|
| 321 |
" <li>Accurate word-level timestamps (click on a segment in the table below to play it!)</li>"
|
| 322 |
+
" <li>Efficiently transcribes long audio segments (<strong>updated to support upto 3 hours</strong>)</li>"
|
| 323 |
" <li>Robust performance on spoken numbers, and song lyrics transcription </li>"
|
| 324 |
"</ul>"
|
| 325 |
"<p style='font-size: 1.1em;'>"
|
| 326 |
"This model is <strong>available for commercial and non-commercial use</strong>."
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 327 |
)
|
| 328 |
|
| 329 |
examples = [
|