End of training
Browse files- e5_interleaving-cl.ipynb +137 -253
- e5_interleaving-resume.ipynb +0 -0
- pytorch_model.bin +1 -1
- runs/Dec13_21-29-08_129-146-102-49/1670966960.518305/events.out.tfevents.1670966960.129-146-102-49.882304.1 +3 -0
- runs/Dec13_21-29-08_129-146-102-49/events.out.tfevents.1670966960.129-146-102-49.882304.0 +3 -0
- runs/Dec13_21-57-38_129-146-102-49/1670968669.9597044/events.out.tfevents.1670968669.129-146-102-49.882304.3 +3 -0
- runs/Dec13_21-57-38_129-146-102-49/events.out.tfevents.1670968669.129-146-102-49.882304.2 +3 -0
- runs/Dec13_22-18-00_129-146-102-49/1670969892.775061/events.out.tfevents.1670969892.129-146-102-49.1014402.1 +3 -0
- runs/Dec13_22-18-00_129-146-102-49/1670995449.379962/events.out.tfevents.1670995449.129-146-102-49.1014402.2 +3 -0
- runs/Dec13_22-18-00_129-146-102-49/events.out.tfevents.1670969892.129-146-102-49.1014402.0 +3 -0
- runs/Dec14_05-46-08_129-146-102-49/1670996781.2697837/events.out.tfevents.1670996781.129-146-102-49.1113148.1 +3 -0
- runs/Dec14_05-46-08_129-146-102-49/events.out.tfevents.1670996781.129-146-102-49.1113148.0 +3 -0
- runs/Dec14_09-33-49_129-146-102-49/1671010439.939292/events.out.tfevents.1671010439.129-146-102-49.1212260.1 +3 -0
- runs/Dec14_09-33-49_129-146-102-49/events.out.tfevents.1671010439.129-146-102-49.1212260.0 +3 -0
- runs/Dec14_10-24-09_129-146-102-49/1671013461.8981154/events.out.tfevents.1671013461.129-146-102-49.1508853.1 +3 -0
- runs/Dec14_10-24-09_129-146-102-49/events.out.tfevents.1671013461.129-146-102-49.1508853.0 +3 -0
- training_args.bin +1 -1
e5_interleaving-cl.ipynb
CHANGED
|
@@ -125,20 +125,20 @@
|
|
| 125 |
"Requirement already satisfied: torch in ./.local/lib/python3.8/site-packages (1.13.0)\n",
|
| 126 |
"Requirement already satisfied: torchaudio in ./.local/lib/python3.8/site-packages (0.13.0)\n",
|
| 127 |
"Requirement already satisfied: torchvision in ./.local/lib/python3.8/site-packages (0.14.0)\n",
|
|
|
|
|
|
|
| 128 |
"Requirement already satisfied: nvidia-cublas-cu11==11.10.3.66 in ./.local/lib/python3.8/site-packages (from torch) (11.10.3.66)\n",
|
| 129 |
-
"Requirement already satisfied: nvidia-cuda-nvrtc-cu11==11.7.99 in ./.local/lib/python3.8/site-packages (from torch) (11.7.99)\n",
|
| 130 |
"Requirement already satisfied: typing-extensions in ./.local/lib/python3.8/site-packages (from torch) (4.4.0)\n",
|
| 131 |
-
"Requirement already satisfied: nvidia-
|
| 132 |
-
"Requirement already satisfied: nvidia-cuda-runtime-cu11==11.7.99 in ./.local/lib/python3.8/site-packages (from torch) (11.7.99)\n",
|
| 133 |
-
"Requirement already satisfied: setuptools in /usr/lib/python3/dist-packages (from nvidia-cublas-cu11==11.10.3.66->torch) (45.2.0)\n",
|
| 134 |
"Requirement already satisfied: wheel in /usr/lib/python3/dist-packages (from nvidia-cublas-cu11==11.10.3.66->torch) (0.34.2)\n",
|
| 135 |
-
"Requirement already satisfied:
|
| 136 |
"Requirement already satisfied: pillow!=8.3.*,>=5.3.0 in /usr/lib/python3/dist-packages (from torchvision) (7.0.0)\n",
|
|
|
|
| 137 |
"Requirement already satisfied: numpy in ./.local/lib/python3.8/site-packages (from torchvision) (1.23.5)\n",
|
| 138 |
-
"Requirement already satisfied: urllib3<1.27,>=1.21.1 in ./.local/lib/python3.8/site-packages (from requests->torchvision) (1.26.13)\n",
|
| 139 |
"Requirement already satisfied: certifi>=2017.4.17 in /usr/lib/python3/dist-packages (from requests->torchvision) (2019.11.28)\n",
|
| 140 |
-
"Requirement already satisfied:
|
| 141 |
-
"Requirement already satisfied:
|
|
|
|
| 142 |
]
|
| 143 |
}
|
| 144 |
],
|
|
@@ -200,7 +200,7 @@
|
|
| 200 |
"name": "stdout",
|
| 201 |
"output_type": "stream",
|
| 202 |
"text": [
|
| 203 |
-
"Tue Dec 13
|
| 204 |
"+-----------------------------------------------------------------------------+\n",
|
| 205 |
"| NVIDIA-SMI 515.65.01 Driver Version: 515.65.01 CUDA Version: 11.7 |\n",
|
| 206 |
"|-------------------------------+----------------------+----------------------+\n",
|
|
@@ -209,7 +209,7 @@
|
|
| 209 |
"| | | MIG M. |\n",
|
| 210 |
"|===============================+======================+======================|\n",
|
| 211 |
"| 0 NVIDIA A100-SXM... On | 00000000:06:00.0 Off | 0 |\n",
|
| 212 |
-
"| N/A
|
| 213 |
"| | | Disabled |\n",
|
| 214 |
"+-------------------------------+----------------------+----------------------+\n",
|
| 215 |
" \n",
|
|
@@ -260,42 +260,43 @@
|
|
| 260 |
"name": "stdout",
|
| 261 |
"output_type": "stream",
|
| 262 |
"text": [
|
| 263 |
-
"
|
| 264 |
-
"
|
| 265 |
-
"
|
| 266 |
-
"
|
| 267 |
-
"Hit:5
|
| 268 |
-
"
|
| 269 |
-
"Hit:7
|
| 270 |
-
"Get:8
|
| 271 |
"Ign:9 http://ppa.launchpad.net/jonathonf/ffmpeg-4/ubuntu focal InRelease \n",
|
| 272 |
-
"
|
| 273 |
"Hit:11 https://pkg.cloudflare.com/cloudflared focal InRelease \n",
|
| 274 |
-
"
|
| 275 |
-
"Err:13 http://ppa.launchpad.net/jonathonf/ffmpeg-4/ubuntu focal Release \n",
|
| 276 |
" 404 Not Found [IP: 185.125.190.52 80]\n",
|
| 277 |
-
"Hit:
|
| 278 |
-
"Get:
|
| 279 |
-
"
|
|
|
|
|
|
|
| 280 |
"E: The repository 'http://ppa.launchpad.net/jonathonf/ffmpeg-4/ubuntu focal Release' does not have a Release file.\n",
|
| 281 |
"N: Updating from such a repository can't be done securely, and is therefore disabled by default.\n",
|
| 282 |
"N: See apt-secure(8) manpage for repository creation and user configuration details.\n",
|
| 283 |
-
"
|
| 284 |
-
"
|
| 285 |
-
"Hit:3 https://
|
| 286 |
"Hit:4 http://archive.lambdalabs.com/ubuntu focal InRelease \u001b[0m\n",
|
| 287 |
-
"
|
| 288 |
-
"
|
| 289 |
-
"Hit:7
|
| 290 |
-
"
|
| 291 |
-
"Hit:9 http://
|
| 292 |
-
"Hit:10 https://pkg.cloudflare.com/cloudflared focal InRelease \u001b[0m\u001b[33m\n",
|
| 293 |
-
"
|
| 294 |
-
"
|
|
|
|
| 295 |
" 404 Not Found [IP: 185.125.190.52 80]\n",
|
| 296 |
-
"Hit:
|
| 297 |
-
"
|
| 298 |
-
"Reading package lists... Done \u001b[0m33m\u001b[33m\u001b[33m\n",
|
| 299 |
"\u001b[1;31mE: \u001b[0mThe repository 'http://ppa.launchpad.net/jonathonf/ffmpeg-4/ubuntu focal Release' does not have a Release file.\u001b[0m\n",
|
| 300 |
"\u001b[33mN: \u001b[0mUpdating from such a repository can't be done securely, and is therefore disabled by default.\u001b[0m\n",
|
| 301 |
"\u001b[33mN: \u001b[0mSee apt-secure(8) manpage for repository creation and user configuration details.\u001b[0m\n",
|
|
@@ -346,33 +347,33 @@
|
|
| 346 |
"text": [
|
| 347 |
"Defaulting to user installation because normal site-packages is not writeable\n",
|
| 348 |
"Collecting git+https://github.com/huggingface/datasets\n",
|
| 349 |
-
" Cloning https://github.com/huggingface/datasets to /tmp/pip-req-build-
|
| 350 |
-
" Running command git clone --filter=blob:none --quiet https://github.com/huggingface/datasets /tmp/pip-req-build-
|
| 351 |
" Resolved https://github.com/huggingface/datasets to commit c902456677116a081f762fa2b4aad13a0aa04d6e\n",
|
| 352 |
" Installing build dependencies ... \u001b[?25ldone\n",
|
| 353 |
"\u001b[?25h Getting requirements to build wheel ... \u001b[?25ldone\n",
|
| 354 |
"\u001b[?25h Preparing metadata (pyproject.toml) ... \u001b[?25ldone\n",
|
| 355 |
"\u001b[?25hRequirement already satisfied: dill<0.3.7 in ./.local/lib/python3.8/site-packages (from datasets==2.7.1.dev0) (0.3.6)\n",
|
|
|
|
|
|
|
|
|
|
| 356 |
"Requirement already satisfied: packaging in ./.local/lib/python3.8/site-packages (from datasets==2.7.1.dev0) (22.0)\n",
|
| 357 |
"Requirement already satisfied: xxhash in ./.local/lib/python3.8/site-packages (from datasets==2.7.1.dev0) (3.1.0)\n",
|
| 358 |
-
"Requirement already satisfied:
|
| 359 |
-
"Requirement already satisfied: numpy>=1.17 in ./.local/lib/python3.8/site-packages (from datasets==2.7.1.dev0) (1.23.5)\n",
|
| 360 |
-
"Requirement already satisfied: pandas in ./.local/lib/python3.8/site-packages (from datasets==2.7.1.dev0) (1.5.1)\n",
|
| 361 |
-
"Requirement already satisfied: fsspec[http]>=2021.11.1 in ./.local/lib/python3.8/site-packages (from datasets==2.7.1.dev0) (2022.11.0)\n",
|
| 362 |
-
"Requirement already satisfied: pyyaml>=5.1 in /usr/lib/python3/dist-packages (from datasets==2.7.1.dev0) (5.3.1)\n",
|
| 363 |
"Requirement already satisfied: responses<0.19 in ./.local/lib/python3.8/site-packages (from datasets==2.7.1.dev0) (0.18.0)\n",
|
|
|
|
|
|
|
|
|
|
| 364 |
"Requirement already satisfied: tqdm>=4.62.1 in ./.local/lib/python3.8/site-packages (from datasets==2.7.1.dev0) (4.64.1)\n",
|
| 365 |
-
"Requirement already satisfied:
|
| 366 |
-
"Requirement already satisfied: requests>=2.19.0 in ./.local/lib/python3.8/site-packages (from datasets==2.7.1.dev0) (2.28.1)\n",
|
| 367 |
"Requirement already satisfied: huggingface-hub<1.0.0,>=0.2.0 in ./.local/lib/python3.8/site-packages (from datasets==2.7.1.dev0) (0.11.1)\n",
|
| 368 |
-
"Requirement already satisfied: multiprocess in ./.local/lib/python3.8/site-packages (from datasets==2.7.1.dev0) (0.70.14)\n",
|
| 369 |
-
"Requirement already satisfied: charset-normalizer<3.0,>=2.0 in ./.local/lib/python3.8/site-packages (from aiohttp->datasets==2.7.1.dev0) (2.1.1)\n",
|
| 370 |
-
"Requirement already satisfied: multidict<7.0,>=4.5 in ./.local/lib/python3.8/site-packages (from aiohttp->datasets==2.7.1.dev0) (6.0.3)\n",
|
| 371 |
-
"Requirement already satisfied: frozenlist>=1.1.1 in ./.local/lib/python3.8/site-packages (from aiohttp->datasets==2.7.1.dev0) (1.3.3)\n",
|
| 372 |
-
"Requirement already satisfied: aiosignal>=1.1.2 in ./.local/lib/python3.8/site-packages (from aiohttp->datasets==2.7.1.dev0) (1.3.1)\n",
|
| 373 |
"Requirement already satisfied: yarl<2.0,>=1.0 in ./.local/lib/python3.8/site-packages (from aiohttp->datasets==2.7.1.dev0) (1.8.2)\n",
|
| 374 |
-
"Requirement already satisfied:
|
|
|
|
| 375 |
"Requirement already satisfied: attrs>=17.3.0 in /usr/lib/python3/dist-packages (from aiohttp->datasets==2.7.1.dev0) (19.3.0)\n",
|
|
|
|
|
|
|
|
|
|
| 376 |
"Requirement already satisfied: filelock in /usr/lib/python3/dist-packages (from huggingface-hub<1.0.0,>=0.2.0->datasets==2.7.1.dev0) (3.0.12)\n",
|
| 377 |
"Requirement already satisfied: typing-extensions>=3.7.4.3 in ./.local/lib/python3.8/site-packages (from huggingface-hub<1.0.0,>=0.2.0->datasets==2.7.1.dev0) (4.4.0)\n",
|
| 378 |
"Requirement already satisfied: certifi>=2017.4.17 in /usr/lib/python3/dist-packages (from requests>=2.19.0->datasets==2.7.1.dev0) (2019.11.28)\n",
|
|
@@ -383,49 +384,49 @@
|
|
| 383 |
"Requirement already satisfied: six>=1.5 in /usr/lib/python3/dist-packages (from python-dateutil>=2.8.1->pandas->datasets==2.7.1.dev0) (1.14.0)\n",
|
| 384 |
"Defaulting to user installation because normal site-packages is not writeable\n",
|
| 385 |
"Collecting git+https://github.com/huggingface/transformers\n",
|
| 386 |
-
" Cloning https://github.com/huggingface/transformers to /tmp/pip-req-build-
|
| 387 |
-
" Running command git clone --filter=blob:none --quiet https://github.com/huggingface/transformers /tmp/pip-req-build-
|
| 388 |
-
" Resolved https://github.com/huggingface/transformers to commit
|
| 389 |
" Installing build dependencies ... \u001b[?25ldone\n",
|
| 390 |
"\u001b[?25h Getting requirements to build wheel ... \u001b[?25ldone\n",
|
| 391 |
"\u001b[?25h Preparing metadata (pyproject.toml) ... \u001b[?25ldone\n",
|
| 392 |
-
"\u001b[?25hRequirement already satisfied:
|
| 393 |
-
"Requirement already satisfied:
|
| 394 |
-
"Requirement already satisfied:
|
| 395 |
"Requirement already satisfied: numpy>=1.17 in ./.local/lib/python3.8/site-packages (from transformers==4.26.0.dev0) (1.23.5)\n",
|
|
|
|
| 396 |
"Requirement already satisfied: pyyaml>=5.1 in /usr/lib/python3/dist-packages (from transformers==4.26.0.dev0) (5.3.1)\n",
|
| 397 |
"Requirement already satisfied: requests in ./.local/lib/python3.8/site-packages (from transformers==4.26.0.dev0) (2.28.1)\n",
|
| 398 |
-
"Requirement already satisfied:
|
| 399 |
"Requirement already satisfied: tqdm>=4.27 in ./.local/lib/python3.8/site-packages (from transformers==4.26.0.dev0) (4.64.1)\n",
|
| 400 |
-
"Requirement already satisfied: filelock in /usr/lib/python3/dist-packages (from transformers==4.26.0.dev0) (3.0.12)\n",
|
| 401 |
"Requirement already satisfied: typing-extensions>=3.7.4.3 in ./.local/lib/python3.8/site-packages (from huggingface-hub<1.0,>=0.10.0->transformers==4.26.0.dev0) (4.4.0)\n",
|
| 402 |
-
"Requirement already satisfied: urllib3<1.27,>=1.21.1 in ./.local/lib/python3.8/site-packages (from requests->transformers==4.26.0.dev0) (1.26.13)\n",
|
| 403 |
-
"Requirement already satisfied: certifi>=2017.4.17 in /usr/lib/python3/dist-packages (from requests->transformers==4.26.0.dev0) (2019.11.28)\n",
|
| 404 |
-
"Requirement already satisfied: idna<4,>=2.5 in /usr/lib/python3/dist-packages (from requests->transformers==4.26.0.dev0) (2.8)\n",
|
| 405 |
"Requirement already satisfied: charset-normalizer<3,>=2 in ./.local/lib/python3.8/site-packages (from requests->transformers==4.26.0.dev0) (2.1.1)\n",
|
|
|
|
|
|
|
|
|
|
| 406 |
"Defaulting to user installation because normal site-packages is not writeable\n",
|
| 407 |
"Requirement already satisfied: librosa in ./.local/lib/python3.8/site-packages (0.9.2)\n",
|
|
|
|
| 408 |
"Requirement already satisfied: joblib>=0.14 in ./.local/lib/python3.8/site-packages (from librosa) (1.2.0)\n",
|
|
|
|
|
|
|
|
|
|
| 409 |
"Requirement already satisfied: decorator>=4.0.10 in /usr/lib/python3/dist-packages (from librosa) (4.4.2)\n",
|
| 410 |
-
"Requirement already satisfied: scipy>=1.2.0 in ./.local/lib/python3.8/site-packages (from librosa) (1.9.3)\n",
|
| 411 |
-
"Requirement already satisfied: numba>=0.45.1 in ./.local/lib/python3.8/site-packages (from librosa) (0.56.4)\n",
|
| 412 |
"Requirement already satisfied: audioread>=2.1.9 in ./.local/lib/python3.8/site-packages (from librosa) (3.0.0)\n",
|
| 413 |
-
"Requirement already satisfied:
|
|
|
|
| 414 |
"Requirement already satisfied: packaging>=20.0 in ./.local/lib/python3.8/site-packages (from librosa) (22.0)\n",
|
| 415 |
-
"Requirement already satisfied: numpy>=1.17.0 in ./.local/lib/python3.8/site-packages (from librosa) (1.23.5)\n",
|
| 416 |
-
"Requirement already satisfied: scikit-learn>=0.19.1 in /usr/lib/python3/dist-packages (from librosa) (0.22.2.post1)\n",
|
| 417 |
"Requirement already satisfied: resampy>=0.2.2 in ./.local/lib/python3.8/site-packages (from librosa) (0.4.2)\n",
|
| 418 |
-
"Requirement already satisfied: soundfile>=0.10.2 in ./.local/lib/python3.8/site-packages (from librosa) (0.11.0)\n",
|
| 419 |
"Requirement already satisfied: setuptools in /usr/lib/python3/dist-packages (from numba>=0.45.1->librosa) (45.2.0)\n",
|
| 420 |
-
"Requirement already satisfied: importlib-metadata in ./.local/lib/python3.8/site-packages (from numba>=0.45.1->librosa) (5.0.0)\n",
|
| 421 |
"Requirement already satisfied: llvmlite<0.40,>=0.39.0dev0 in ./.local/lib/python3.8/site-packages (from numba>=0.45.1->librosa) (0.39.1)\n",
|
| 422 |
-
"Requirement already satisfied:
|
| 423 |
"Requirement already satisfied: requests>=2.19.0 in ./.local/lib/python3.8/site-packages (from pooch>=1.0->librosa) (2.28.1)\n",
|
|
|
|
| 424 |
"Requirement already satisfied: cffi>=1.0 in /usr/lib/python3/dist-packages (from soundfile>=0.10.2->librosa) (1.14.0)\n",
|
| 425 |
-
"Requirement already satisfied: urllib3<1.27,>=1.21.1 in ./.local/lib/python3.8/site-packages (from requests>=2.19.0->pooch>=1.0->librosa) (1.26.13)\n",
|
| 426 |
"Requirement already satisfied: certifi>=2017.4.17 in /usr/lib/python3/dist-packages (from requests>=2.19.0->pooch>=1.0->librosa) (2019.11.28)\n",
|
| 427 |
-
"Requirement already satisfied: charset-normalizer<3,>=2 in ./.local/lib/python3.8/site-packages (from requests>=2.19.0->pooch>=1.0->librosa) (2.1.1)\n",
|
| 428 |
"Requirement already satisfied: idna<4,>=2.5 in /usr/lib/python3/dist-packages (from requests>=2.19.0->pooch>=1.0->librosa) (2.8)\n",
|
|
|
|
|
|
|
| 429 |
"Requirement already satisfied: zipp>=0.5 in /usr/lib/python3/dist-packages (from importlib-metadata->numba>=0.45.1->librosa) (1.0.0)\n",
|
| 430 |
"Defaulting to user installation because normal site-packages is not writeable\n",
|
| 431 |
"Requirement already satisfied: jiwer in ./.local/lib/python3.8/site-packages (2.5.1)\n",
|
|
@@ -433,59 +434,59 @@
|
|
| 433 |
"Requirement already satisfied: rapidfuzz<3.0.0,>=2.3.0 in ./.local/lib/python3.8/site-packages (from levenshtein==0.20.2->jiwer) (2.13.6)\n",
|
| 434 |
"Defaulting to user installation because normal site-packages is not writeable\n",
|
| 435 |
"Requirement already satisfied: gradio in ./.local/lib/python3.8/site-packages (3.13.0)\n",
|
| 436 |
-
"Requirement already satisfied:
|
| 437 |
-
"Requirement already satisfied: uvicorn in ./.local/lib/python3.8/site-packages (from gradio) (0.20.0)\n",
|
| 438 |
-
"Requirement already satisfied: markdown-it-py[linkify,plugins] in ./.local/lib/python3.8/site-packages (from gradio) (2.1.0)\n",
|
| 439 |
-
"Requirement already satisfied: pillow in /usr/lib/python3/dist-packages (from gradio) (7.0.0)\n",
|
| 440 |
-
"Requirement already satisfied: paramiko in ./.local/lib/python3.8/site-packages (from gradio) (2.12.0)\n",
|
| 441 |
"Requirement already satisfied: aiohttp in ./.local/lib/python3.8/site-packages (from gradio) (3.8.3)\n",
|
| 442 |
-
"Requirement already satisfied: matplotlib in ./.local/lib/python3.8/site-packages (from gradio) (3.5.3)\n",
|
| 443 |
-
"Requirement already satisfied: fsspec in ./.local/lib/python3.8/site-packages (from gradio) (2022.11.0)\n",
|
| 444 |
-
"Requirement already satisfied: websockets>=10.0 in ./.local/lib/python3.8/site-packages (from gradio) (10.4)\n",
|
| 445 |
"Requirement already satisfied: pandas in ./.local/lib/python3.8/site-packages (from gradio) (1.5.1)\n",
|
| 446 |
-
"Requirement already satisfied: httpx in ./.local/lib/python3.8/site-packages (from gradio) (0.23.1)\n",
|
| 447 |
-
"Requirement already satisfied: python-multipart in ./.local/lib/python3.8/site-packages (from gradio) (0.0.5)\n",
|
| 448 |
-
"Requirement already satisfied: jinja2 in ./.local/lib/python3.8/site-packages (from gradio) (3.1.2)\n",
|
| 449 |
-
"Requirement already satisfied: orjson in ./.local/lib/python3.8/site-packages (from gradio) (3.8.3)\n",
|
| 450 |
-
"Requirement already satisfied: ffmpy in ./.local/lib/python3.8/site-packages (from gradio) (0.3.0)\n",
|
| 451 |
-
"Requirement already satisfied: pydantic in ./.local/lib/python3.8/site-packages (from gradio) (1.10.2)\n",
|
| 452 |
"Requirement already satisfied: pydub in ./.local/lib/python3.8/site-packages (from gradio) (0.25.1)\n",
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 453 |
"Requirement already satisfied: h11<0.13,>=0.11 in ./.local/lib/python3.8/site-packages (from gradio) (0.12.0)\n",
|
| 454 |
-
"Requirement already satisfied: pyyaml in /usr/lib/python3/dist-packages (from gradio) (5.3.1)\n",
|
| 455 |
"Requirement already satisfied: requests in ./.local/lib/python3.8/site-packages (from gradio) (2.28.1)\n",
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 456 |
"Requirement already satisfied: pycryptodome in ./.local/lib/python3.8/site-packages (from gradio) (3.16.0)\n",
|
| 457 |
-
"Requirement already satisfied:
|
| 458 |
-
"Requirement already satisfied:
|
| 459 |
-
"Requirement already satisfied: async-timeout<5.0,>=4.0.0a3 in ./.local/lib/python3.8/site-packages (from aiohttp->gradio) (4.0.2)\n",
|
| 460 |
"Requirement already satisfied: frozenlist>=1.1.1 in ./.local/lib/python3.8/site-packages (from aiohttp->gradio) (1.3.3)\n",
|
| 461 |
"Requirement already satisfied: attrs>=17.3.0 in /usr/lib/python3/dist-packages (from aiohttp->gradio) (19.3.0)\n",
|
| 462 |
-
"Requirement already satisfied:
|
|
|
|
| 463 |
"Requirement already satisfied: yarl<2.0,>=1.0 in ./.local/lib/python3.8/site-packages (from aiohttp->gradio) (1.8.2)\n",
|
| 464 |
-
"Requirement already satisfied: aiosignal>=1.1.2 in ./.local/lib/python3.8/site-packages (from aiohttp->gradio) (1.3.1)\n",
|
| 465 |
"Requirement already satisfied: starlette==0.22.0 in ./.local/lib/python3.8/site-packages (from fastapi->gradio) (0.22.0)\n",
|
| 466 |
"Requirement already satisfied: typing-extensions>=3.10.0 in ./.local/lib/python3.8/site-packages (from starlette==0.22.0->fastapi->gradio) (4.4.0)\n",
|
| 467 |
"Requirement already satisfied: anyio<5,>=3.4.0 in ./.local/lib/python3.8/site-packages (from starlette==0.22.0->fastapi->gradio) (3.6.2)\n",
|
| 468 |
-
"Requirement already satisfied: httpcore<0.17.0,>=0.15.0 in ./.local/lib/python3.8/site-packages (from httpx->gradio) (0.15.0)\n",
|
| 469 |
-
"Requirement already satisfied: certifi in /usr/lib/python3/dist-packages (from httpx->gradio) (2019.11.28)\n",
|
| 470 |
"Requirement already satisfied: rfc3986[idna2008]<2,>=1.3 in ./.local/lib/python3.8/site-packages (from httpx->gradio) (1.5.0)\n",
|
| 471 |
"Requirement already satisfied: sniffio in ./.local/lib/python3.8/site-packages (from httpx->gradio) (1.3.0)\n",
|
|
|
|
|
|
|
| 472 |
"Requirement already satisfied: MarkupSafe>=2.0 in ./.local/lib/python3.8/site-packages (from jinja2->gradio) (2.1.1)\n",
|
| 473 |
"Requirement already satisfied: mdurl~=0.1 in ./.local/lib/python3.8/site-packages (from markdown-it-py[linkify,plugins]->gradio) (0.1.2)\n",
|
| 474 |
-
"Requirement already satisfied: mdit-py-plugins in ./.local/lib/python3.8/site-packages (from markdown-it-py[linkify,plugins]->gradio) (0.3.3)\n",
|
| 475 |
"Requirement already satisfied: linkify-it-py~=1.0 in ./.local/lib/python3.8/site-packages (from markdown-it-py[linkify,plugins]->gradio) (1.0.3)\n",
|
| 476 |
-
"Requirement already satisfied:
|
|
|
|
| 477 |
"Requirement already satisfied: kiwisolver>=1.0.1 in /usr/lib/python3/dist-packages (from matplotlib->gradio) (1.0.1)\n",
|
| 478 |
-
"Requirement already satisfied: pyparsing>=2.2.1 in /usr/lib/python3/dist-packages (from matplotlib->gradio) (2.4.6)\n",
|
| 479 |
"Requirement already satisfied: packaging>=20.0 in ./.local/lib/python3.8/site-packages (from matplotlib->gradio) (22.0)\n",
|
| 480 |
-
"Requirement already satisfied: python-dateutil>=2.7 in ./.local/lib/python3.8/site-packages (from matplotlib->gradio) (2.8.2)\n",
|
| 481 |
"Requirement already satisfied: cycler>=0.10 in /usr/lib/python3/dist-packages (from matplotlib->gradio) (0.10.0)\n",
|
|
|
|
|
|
|
| 482 |
"Requirement already satisfied: pytz>=2020.1 in ./.local/lib/python3.8/site-packages (from pandas->gradio) (2022.5)\n",
|
|
|
|
| 483 |
"Requirement already satisfied: six in /usr/lib/python3/dist-packages (from paramiko->gradio) (1.14.0)\n",
|
| 484 |
"Requirement already satisfied: pynacl>=1.0.1 in /usr/lib/python3/dist-packages (from paramiko->gradio) (1.3.0)\n",
|
| 485 |
-
"Requirement already satisfied: bcrypt>=3.1.3 in ./.local/lib/python3.8/site-packages (from paramiko->gradio) (4.0.1)\n",
|
| 486 |
"Requirement already satisfied: cryptography>=2.5 in /usr/lib/python3/dist-packages (from paramiko->gradio) (2.8)\n",
|
| 487 |
-
"Requirement already satisfied: idna<4,>=2.5 in /usr/lib/python3/dist-packages (from requests->gradio) (2.8)\n",
|
| 488 |
"Requirement already satisfied: urllib3<1.27,>=1.21.1 in ./.local/lib/python3.8/site-packages (from requests->gradio) (1.26.13)\n",
|
|
|
|
| 489 |
"Requirement already satisfied: click>=7.0 in /usr/lib/python3/dist-packages (from uvicorn->gradio) (7.0)\n",
|
| 490 |
"Requirement already satisfied: uc-micro-py in ./.local/lib/python3.8/site-packages (from linkify-it-py~=1.0->markdown-it-py[linkify,plugins]->gradio) (1.0.1)\n",
|
| 491 |
"Defaulting to user installation because normal site-packages is not writeable\n",
|
|
@@ -554,7 +555,7 @@
|
|
| 554 |
{
|
| 555 |
"data": {
|
| 556 |
"application/vnd.jupyter.widget-view+json": {
|
| 557 |
-
"model_id": "
|
| 558 |
"version_major": 2,
|
| 559 |
"version_minor": 0
|
| 560 |
},
|
|
@@ -713,7 +714,7 @@
|
|
| 713 |
" all_datasets = []\n",
|
| 714 |
" # iterate over the datasets we want to interleave\n",
|
| 715 |
" for i, dataset_name in enumerate(dataset_names):\n",
|
| 716 |
-
" dataset = load_dataset(dataset_name, dataset_config_names[i], split=splits[i], streaming=
|
| 717 |
" # resample to specified sampling rate\n",
|
| 718 |
" dataset = dataset.cast_column(\"audio\", Audio(sampling_rate))\n",
|
| 719 |
" # normalise columns to [\"audio\", \"sentence\"]\n",
|
|
@@ -738,16 +739,7 @@
|
|
| 738 |
"id": "qOwlctMhNmCG",
|
| 739 |
"tags": []
|
| 740 |
},
|
| 741 |
-
"outputs": [
|
| 742 |
-
{
|
| 743 |
-
"name": "stderr",
|
| 744 |
-
"output_type": "stream",
|
| 745 |
-
"text": [
|
| 746 |
-
"Found cached dataset common_voice_11_0 (/home/ubuntu/.cache/huggingface/datasets/mozilla-foundation___common_voice_11_0/el/11.0.0/f8e47235d9b4e68fa24ed71d63266a02018ccf7194b2a8c9c598a5f3ab304d9f)\n",
|
| 747 |
-
"Found cached dataset fleurs (/home/ubuntu/.cache/huggingface/datasets/google___fleurs/el_gr/2.0.0/aabb39fb29739c495517ac904e2886819b6e344702f0a5b5283cb178b087c94a)\n"
|
| 748 |
-
]
|
| 749 |
-
}
|
| 750 |
-
],
|
| 751 |
"source": [
|
| 752 |
"ds = load_multiple_streaming_datasets(dataset_names, dataset_config_names=dataset_config_names, text_column_names=text_column_names, use_auth_token=True)\n",
|
| 753 |
"\n"
|
|
@@ -770,23 +762,13 @@
|
|
| 770 |
"metadata": {
|
| 771 |
"id": "imRHJOpm4V_j"
|
| 772 |
},
|
| 773 |
-
"outputs": [
|
| 774 |
-
{
|
| 775 |
-
"name": "stderr",
|
| 776 |
-
"output_type": "stream",
|
| 777 |
-
"text": [
|
| 778 |
-
"Found cached dataset common_voice_11_0 (/home/ubuntu/.cache/huggingface/datasets/mozilla-foundation___common_voice_11_0/el/11.0.0/f8e47235d9b4e68fa24ed71d63266a02018ccf7194b2a8c9c598a5f3ab304d9f)\n",
|
| 779 |
-
"Found cached dataset fleurs (/home/ubuntu/.cache/huggingface/datasets/google___fleurs/el_gr/2.0.0/aabb39fb29739c495517ac904e2886819b6e344702f0a5b5283cb178b087c94a)\n",
|
| 780 |
-
"Found cached dataset common_voice_11_0 (/home/ubuntu/.cache/huggingface/datasets/mozilla-foundation___common_voice_11_0/el/11.0.0/f8e47235d9b4e68fa24ed71d63266a02018ccf7194b2a8c9c598a5f3ab304d9f)\n"
|
| 781 |
-
]
|
| 782 |
-
}
|
| 783 |
-
],
|
| 784 |
"source": [
|
| 785 |
"from datasets import IterableDatasetDict\n",
|
| 786 |
"raw_datasets = IterableDatasetDict()\n",
|
| 787 |
"\n",
|
| 788 |
"raw_datasets[\"train\"] = load_multiple_streaming_datasets(dataset_names, dataset_config_names=dataset_config_names, text_column_names=text_column_names, use_auth_token=True)\n",
|
| 789 |
-
"raw_datasets[\"test\"] = load_dataset(\"mozilla-foundation/common_voice_11_0\", \"el\", split=\"test\", streaming=
|
| 790 |
"\n",
|
| 791 |
"\n",
|
| 792 |
"#raw_datasets = raw_datasets.remove_columns([\"accent\", \"age\", \"client_id\", \"down_votes\", \"gender\", \"locale\", \"path\", \"segment\", \"up_votes\"])\n",
|
|
@@ -1013,29 +995,7 @@
|
|
| 1013 |
"metadata": {
|
| 1014 |
"id": "a37a7cdb-9013-427f-8de9-6a8d0e9dc684"
|
| 1015 |
},
|
| 1016 |
-
"outputs": [
|
| 1017 |
-
{
|
| 1018 |
-
"data": {
|
| 1019 |
-
"application/vnd.jupyter.widget-view+json": {
|
| 1020 |
-
"model_id": "5eb200f925f84e14bc08341ee8620fd9",
|
| 1021 |
-
"version_major": 2,
|
| 1022 |
-
"version_minor": 0
|
| 1023 |
-
},
|
| 1024 |
-
"text/plain": [
|
| 1025 |
-
" 0%| | 0/6430 [00:00<?, ?ex/s]"
|
| 1026 |
-
]
|
| 1027 |
-
},
|
| 1028 |
-
"metadata": {},
|
| 1029 |
-
"output_type": "display_data"
|
| 1030 |
-
},
|
| 1031 |
-
{
|
| 1032 |
-
"name": "stderr",
|
| 1033 |
-
"output_type": "stream",
|
| 1034 |
-
"text": [
|
| 1035 |
-
"Loading cached processed dataset at /home/ubuntu/.cache/huggingface/datasets/mozilla-foundation___common_voice_11_0/el/11.0.0/f8e47235d9b4e68fa24ed71d63266a02018ccf7194b2a8c9c598a5f3ab304d9f/cache-52a8b70c074fdab6.arrow\n"
|
| 1036 |
-
]
|
| 1037 |
-
}
|
| 1038 |
-
],
|
| 1039 |
"source": [
|
| 1040 |
"vectorized_datasets = raw_datasets.map(prepare_dataset, remove_columns=list(next(iter(raw_datasets.values())).features)).with_format(\"torch\")"
|
| 1041 |
]
|
|
@@ -1052,32 +1012,12 @@
|
|
| 1052 |
},
|
| 1053 |
{
|
| 1054 |
"cell_type": "code",
|
| 1055 |
-
"execution_count":
|
| 1056 |
"id": "1b145699-acfc-4b1d-93a2-a2ad3d62674c",
|
| 1057 |
"metadata": {
|
| 1058 |
"id": "1b145699-acfc-4b1d-93a2-a2ad3d62674c"
|
| 1059 |
},
|
| 1060 |
-
"outputs": [
|
| 1061 |
-
{
|
| 1062 |
-
"name": "stdout",
|
| 1063 |
-
"output_type": "stream",
|
| 1064 |
-
"text": [
|
| 1065 |
-
"{'input_features': tensor([[-0.8154, -0.8154, -0.8154, ..., -0.8154, -0.8154, -0.8154],\n",
|
| 1066 |
-
" [-0.8154, -0.8154, -0.8154, ..., -0.8154, -0.8154, -0.8154],\n",
|
| 1067 |
-
" [-0.8154, -0.8154, -0.8154, ..., -0.8154, -0.8154, -0.8154],\n",
|
| 1068 |
-
" ...,\n",
|
| 1069 |
-
" [-0.8154, -0.8154, -0.8154, ..., -0.8154, -0.8154, -0.8154],\n",
|
| 1070 |
-
" [-0.8154, -0.8154, -0.8154, ..., -0.8154, -0.8154, -0.8154],\n",
|
| 1071 |
-
" [-0.8154, -0.8154, -0.8154, ..., -0.8154, -0.8154, -0.8154]]), 'input_length': tensor(6.6000), 'labels': tensor([50258, 50281, 50359, 50363, 7068, 26263, 11383, 3596, 2080, 3659,\n",
|
| 1072 |
-
" 10073, 30599, 5691, 6744, 8828, 11658, 3371, 17321, 30320, 11383,\n",
|
| 1073 |
-
" 3659, 5337, 4339, 20511, 4915, 3371, 33908, 44035, 3721, 19264,\n",
|
| 1074 |
-
" 25090, 7597, 17928, 24841, 8385, 3835, 4903, 2080, 2805, 8385,\n",
|
| 1075 |
-
" 3721, 39320, 8335, 3596, 21457, 4339, 5074, 1800, 8715, 6956,\n",
|
| 1076 |
-
" 1800, 5958, 14836, 8385, 1800, 34079, 8385, 16946, 8066, 5733,\n",
|
| 1077 |
-
" 24296, 9137, 9903, 50257])}\n"
|
| 1078 |
-
]
|
| 1079 |
-
}
|
| 1080 |
-
],
|
| 1081 |
"source": [
|
| 1082 |
"vectorized_datasets[\"train\"] = vectorized_datasets[\"train\"].shuffle(\n",
|
| 1083 |
" #buffer_size=500,\n",
|
|
@@ -1100,7 +1040,7 @@
|
|
| 1100 |
},
|
| 1101 |
{
|
| 1102 |
"cell_type": "code",
|
| 1103 |
-
"execution_count":
|
| 1104 |
"id": "01cb25ef-4bb0-4325-9461-f59198acadf6",
|
| 1105 |
"metadata": {
|
| 1106 |
"id": "01cb25ef-4bb0-4325-9461-f59198acadf6"
|
|
@@ -1125,27 +1065,12 @@
|
|
| 1125 |
},
|
| 1126 |
{
|
| 1127 |
"cell_type": "code",
|
| 1128 |
-
"execution_count":
|
| 1129 |
"id": "333f7f6e-6053-4d3b-8924-c733c79b82ac",
|
| 1130 |
"metadata": {
|
| 1131 |
"id": "333f7f6e-6053-4d3b-8924-c733c79b82ac"
|
| 1132 |
},
|
| 1133 |
-
"outputs": [
|
| 1134 |
-
{
|
| 1135 |
-
"data": {
|
| 1136 |
-
"application/vnd.jupyter.widget-view+json": {
|
| 1137 |
-
"model_id": "aefbdf517ed24020b4fd372739f37e5f",
|
| 1138 |
-
"version_major": 2,
|
| 1139 |
-
"version_minor": 0
|
| 1140 |
-
},
|
| 1141 |
-
"text/plain": [
|
| 1142 |
-
" 0%| | 0/7 [00:00<?, ?ba/s]"
|
| 1143 |
-
]
|
| 1144 |
-
},
|
| 1145 |
-
"metadata": {},
|
| 1146 |
-
"output_type": "display_data"
|
| 1147 |
-
}
|
| 1148 |
-
],
|
| 1149 |
"source": [
|
| 1150 |
"vectorized_datasets[\"train\"] = vectorized_datasets[\"train\"].filter(\n",
|
| 1151 |
" is_audio_in_length_range,\n",
|
|
@@ -1220,7 +1145,7 @@
|
|
| 1220 |
},
|
| 1221 |
{
|
| 1222 |
"cell_type": "code",
|
| 1223 |
-
"execution_count":
|
| 1224 |
"id": "8326221e-ec13-4731-bb4e-51e5fc1486c5",
|
| 1225 |
"metadata": {
|
| 1226 |
"id": "8326221e-ec13-4731-bb4e-51e5fc1486c5"
|
|
@@ -1272,7 +1197,7 @@
|
|
| 1272 |
},
|
| 1273 |
{
|
| 1274 |
"cell_type": "code",
|
| 1275 |
-
"execution_count":
|
| 1276 |
"id": "fc834702-c0d3-4a96-b101-7b87be32bf42",
|
| 1277 |
"metadata": {
|
| 1278 |
"id": "fc834702-c0d3-4a96-b101-7b87be32bf42"
|
|
@@ -1305,7 +1230,7 @@
|
|
| 1305 |
},
|
| 1306 |
{
|
| 1307 |
"cell_type": "code",
|
| 1308 |
-
"execution_count":
|
| 1309 |
"id": "b22b4011-f31f-4b57-b684-c52332f92890",
|
| 1310 |
"metadata": {
|
| 1311 |
"colab": {
|
|
@@ -1356,7 +1281,7 @@
|
|
| 1356 |
},
|
| 1357 |
{
|
| 1358 |
"cell_type": "code",
|
| 1359 |
-
"execution_count":
|
| 1360 |
"id": "a11d1bfc-9e28-460f-a287-72d8f7bc1acb",
|
| 1361 |
"metadata": {
|
| 1362 |
"id": "a11d1bfc-9e28-460f-a287-72d8f7bc1acb"
|
|
@@ -1405,7 +1330,7 @@
|
|
| 1405 |
},
|
| 1406 |
{
|
| 1407 |
"cell_type": "code",
|
| 1408 |
-
"execution_count":
|
| 1409 |
"id": "5a10cc4b-07ec-4ebd-ac1d-7c601023594f",
|
| 1410 |
"metadata": {
|
| 1411 |
"colab": {
|
|
@@ -1443,21 +1368,7 @@
|
|
| 1443 |
{
|
| 1444 |
"data": {
|
| 1445 |
"application/vnd.jupyter.widget-view+json": {
|
| 1446 |
-
"model_id": "
|
| 1447 |
-
"version_major": 2,
|
| 1448 |
-
"version_minor": 0
|
| 1449 |
-
},
|
| 1450 |
-
"text/plain": [
|
| 1451 |
-
"Downloading: 0%| | 0.00/1.04k [00:00<?, ?B/s]"
|
| 1452 |
-
]
|
| 1453 |
-
},
|
| 1454 |
-
"metadata": {},
|
| 1455 |
-
"output_type": "display_data"
|
| 1456 |
-
},
|
| 1457 |
-
{
|
| 1458 |
-
"data": {
|
| 1459 |
-
"application/vnd.jupyter.widget-view+json": {
|
| 1460 |
-
"model_id": "f8c10225aa194c909eeb19170ac75d1f",
|
| 1461 |
"version_major": 2,
|
| 1462 |
"version_minor": 0
|
| 1463 |
},
|
|
@@ -1490,7 +1401,7 @@
|
|
| 1490 |
},
|
| 1491 |
{
|
| 1492 |
"cell_type": "code",
|
| 1493 |
-
"execution_count":
|
| 1494 |
"id": "62038ba3-88ed-4fce-84db-338f50dcd04f",
|
| 1495 |
"metadata": {
|
| 1496 |
"id": "62038ba3-88ed-4fce-84db-338f50dcd04f"
|
|
@@ -1527,7 +1438,7 @@
|
|
| 1527 |
},
|
| 1528 |
{
|
| 1529 |
"cell_type": "code",
|
| 1530 |
-
"execution_count":
|
| 1531 |
"id": "0ae3e9af-97b7-4aa0-ae85-20b23b5bcb3a",
|
| 1532 |
"metadata": {
|
| 1533 |
"colab": {
|
|
@@ -1570,7 +1481,7 @@
|
|
| 1570 |
},
|
| 1571 |
{
|
| 1572 |
"cell_type": "code",
|
| 1573 |
-
"execution_count":
|
| 1574 |
"id": "o72eOpGzD_sK",
|
| 1575 |
"metadata": {
|
| 1576 |
"colab": {
|
|
@@ -1584,7 +1495,7 @@
|
|
| 1584 |
"name": "stdout",
|
| 1585 |
"output_type": "stream",
|
| 1586 |
"text": [
|
| 1587 |
-
"Tue Dec 13
|
| 1588 |
"+-----------------------------------------------------------------------------+\n",
|
| 1589 |
"| NVIDIA-SMI 515.65.01 Driver Version: 515.65.01 CUDA Version: 11.7 |\n",
|
| 1590 |
"|-------------------------------+----------------------+----------------------+\n",
|
|
@@ -1593,7 +1504,7 @@
|
|
| 1593 |
"| | | MIG M. |\n",
|
| 1594 |
"|===============================+======================+======================|\n",
|
| 1595 |
"| 0 NVIDIA A100-SXM... On | 00000000:06:00.0 Off | 0 |\n",
|
| 1596 |
-
"| N/A
|
| 1597 |
"| | | Disabled |\n",
|
| 1598 |
"+-------------------------------+----------------------+----------------------+\n",
|
| 1599 |
" \n",
|
|
@@ -1634,7 +1545,7 @@
|
|
| 1634 |
},
|
| 1635 |
{
|
| 1636 |
"cell_type": "code",
|
| 1637 |
-
"execution_count":
|
| 1638 |
"id": "3ac16b62-b3c0-4c68-8f3d-9ecf471534b2",
|
| 1639 |
"metadata": {
|
| 1640 |
"id": "3ac16b62-b3c0-4c68-8f3d-9ecf471534b2"
|
|
@@ -1667,7 +1578,7 @@
|
|
| 1667 |
},
|
| 1668 |
{
|
| 1669 |
"cell_type": "code",
|
| 1670 |
-
"execution_count":
|
| 1671 |
"id": "d546d7fe-0543-479a-b708-2ebabec19493",
|
| 1672 |
"metadata": {
|
| 1673 |
"colab": {
|
|
@@ -2281,7 +2192,7 @@
|
|
| 2281 |
},
|
| 2282 |
{
|
| 2283 |
"cell_type": "code",
|
| 2284 |
-
"execution_count":
|
| 2285 |
"id": "a1ccb9ed-cbc8-4419-91c0-651e9424b672",
|
| 2286 |
"metadata": {
|
| 2287 |
"id": "a1ccb9ed-cbc8-4419-91c0-651e9424b672"
|
|
@@ -2374,21 +2285,22 @@
|
|
| 2374 |
"name": "stderr",
|
| 2375 |
"output_type": "stream",
|
| 2376 |
"text": [
|
| 2377 |
-
"Loading model from ./whisper-medium-el/checkpoint-
|
| 2378 |
-
"The following columns in the training set don't have a corresponding argument in `WhisperForConditionalGeneration.forward` and have been ignored: input_length. If input_length are not expected by `WhisperForConditionalGeneration.forward`, you can safely ignore this message.\n",
|
| 2379 |
"/home/ubuntu/.local/lib/python3.8/site-packages/transformers/optimization.py:306: FutureWarning: This implementation of AdamW is deprecated and will be removed in a future version. Use the PyTorch implementation torch.optim.AdamW instead, or set `no_deprecation_warning=True` to disable this warning\n",
|
| 2380 |
" warnings.warn(\n",
|
| 2381 |
"***** Running training *****\n",
|
| 2382 |
-
" Num examples =
|
| 2383 |
-
" Num Epochs =
|
| 2384 |
" Instantaneous batch size per device = 32\n",
|
| 2385 |
" Total train batch size (w. parallel, distributed & accumulation) = 32\n",
|
| 2386 |
" Gradient Accumulation steps = 1\n",
|
| 2387 |
" Total optimization steps = 5000\n",
|
| 2388 |
" Number of trainable parameters = 763857920\n",
|
| 2389 |
" Continuing training from checkpoint, will skip to saved global_step\n",
|
| 2390 |
-
" Continuing training from epoch
|
| 2391 |
-
" Continuing training from global step
|
|
|
|
|
|
|
| 2392 |
]
|
| 2393 |
},
|
| 2394 |
{
|
|
@@ -2397,8 +2309,8 @@
|
|
| 2397 |
"\n",
|
| 2398 |
" <div>\n",
|
| 2399 |
" \n",
|
| 2400 |
-
" <progress value='
|
| 2401 |
-
" [
|
| 2402 |
" </div>\n",
|
| 2403 |
" <table border=\"1\" class=\"dataframe\">\n",
|
| 2404 |
" <thead>\n",
|
|
@@ -2406,16 +2318,9 @@
|
|
| 2406 |
" <th>Step</th>\n",
|
| 2407 |
" <th>Training Loss</th>\n",
|
| 2408 |
" <th>Validation Loss</th>\n",
|
| 2409 |
-
" <th>Wer</th>\n",
|
| 2410 |
" </tr>\n",
|
| 2411 |
" </thead>\n",
|
| 2412 |
" <tbody>\n",
|
| 2413 |
-
" <tr>\n",
|
| 2414 |
-
" <td>4000</td>\n",
|
| 2415 |
-
" <td>0.000300</td>\n",
|
| 2416 |
-
" <td>0.367278</td>\n",
|
| 2417 |
-
" <td>11.534175</td>\n",
|
| 2418 |
-
" </tr>\n",
|
| 2419 |
" </tbody>\n",
|
| 2420 |
"</table><p>"
|
| 2421 |
],
|
|
@@ -2425,27 +2330,6 @@
|
|
| 2425 |
},
|
| 2426 |
"metadata": {},
|
| 2427 |
"output_type": "display_data"
|
| 2428 |
-
},
|
| 2429 |
-
{
|
| 2430 |
-
"name": "stderr",
|
| 2431 |
-
"output_type": "stream",
|
| 2432 |
-
"text": [
|
| 2433 |
-
"The following columns in the evaluation set don't have a corresponding argument in `WhisperForConditionalGeneration.forward` and have been ignored: path, input_length, gender, accent, up_votes, client_id, locale, age, segment, down_votes. If path, input_length, gender, accent, up_votes, client_id, locale, age, segment, down_votes are not expected by `WhisperForConditionalGeneration.forward`, you can safely ignore this message.\n",
|
| 2434 |
-
"***** Running Evaluation *****\n",
|
| 2435 |
-
" Num examples = 1696\n",
|
| 2436 |
-
" Batch size = 16\n",
|
| 2437 |
-
"Saving model checkpoint to ./whisper-medium-el/checkpoint-4000\n",
|
| 2438 |
-
"Configuration saved in ./whisper-medium-el/checkpoint-4000/config.json\n",
|
| 2439 |
-
"Model weights saved in ./whisper-medium-el/checkpoint-4000/pytorch_model.bin\n",
|
| 2440 |
-
"Feature extractor saved in ./whisper-medium-el/checkpoint-4000/preprocessor_config.json\n",
|
| 2441 |
-
"tokenizer config file saved in ./whisper-medium-el/checkpoint-4000/tokenizer_config.json\n",
|
| 2442 |
-
"Special tokens file saved in ./whisper-medium-el/checkpoint-4000/special_tokens_map.json\n",
|
| 2443 |
-
"added tokens file saved in ./whisper-medium-el/checkpoint-4000/added_tokens.json\n",
|
| 2444 |
-
"Feature extractor saved in ./whisper-medium-el/preprocessor_config.json\n",
|
| 2445 |
-
"tokenizer config file saved in ./whisper-medium-el/tokenizer_config.json\n",
|
| 2446 |
-
"Special tokens file saved in ./whisper-medium-el/special_tokens_map.json\n",
|
| 2447 |
-
"added tokens file saved in ./whisper-medium-el/added_tokens.json\n"
|
| 2448 |
-
]
|
| 2449 |
}
|
| 2450 |
],
|
| 2451 |
"source": [
|
|
|
|
| 125 |
"Requirement already satisfied: torch in ./.local/lib/python3.8/site-packages (1.13.0)\n",
|
| 126 |
"Requirement already satisfied: torchaudio in ./.local/lib/python3.8/site-packages (0.13.0)\n",
|
| 127 |
"Requirement already satisfied: torchvision in ./.local/lib/python3.8/site-packages (0.14.0)\n",
|
| 128 |
+
"Requirement already satisfied: nvidia-cuda-runtime-cu11==11.7.99 in ./.local/lib/python3.8/site-packages (from torch) (11.7.99)\n",
|
| 129 |
+
"Requirement already satisfied: nvidia-cudnn-cu11==8.5.0.96 in ./.local/lib/python3.8/site-packages (from torch) (8.5.0.96)\n",
|
| 130 |
"Requirement already satisfied: nvidia-cublas-cu11==11.10.3.66 in ./.local/lib/python3.8/site-packages (from torch) (11.10.3.66)\n",
|
|
|
|
| 131 |
"Requirement already satisfied: typing-extensions in ./.local/lib/python3.8/site-packages (from torch) (4.4.0)\n",
|
| 132 |
+
"Requirement already satisfied: nvidia-cuda-nvrtc-cu11==11.7.99 in ./.local/lib/python3.8/site-packages (from torch) (11.7.99)\n",
|
|
|
|
|
|
|
| 133 |
"Requirement already satisfied: wheel in /usr/lib/python3/dist-packages (from nvidia-cublas-cu11==11.10.3.66->torch) (0.34.2)\n",
|
| 134 |
+
"Requirement already satisfied: setuptools in /usr/lib/python3/dist-packages (from nvidia-cublas-cu11==11.10.3.66->torch) (45.2.0)\n",
|
| 135 |
"Requirement already satisfied: pillow!=8.3.*,>=5.3.0 in /usr/lib/python3/dist-packages (from torchvision) (7.0.0)\n",
|
| 136 |
+
"Requirement already satisfied: requests in ./.local/lib/python3.8/site-packages (from torchvision) (2.28.1)\n",
|
| 137 |
"Requirement already satisfied: numpy in ./.local/lib/python3.8/site-packages (from torchvision) (1.23.5)\n",
|
|
|
|
| 138 |
"Requirement already satisfied: certifi>=2017.4.17 in /usr/lib/python3/dist-packages (from requests->torchvision) (2019.11.28)\n",
|
| 139 |
+
"Requirement already satisfied: charset-normalizer<3,>=2 in ./.local/lib/python3.8/site-packages (from requests->torchvision) (2.1.1)\n",
|
| 140 |
+
"Requirement already satisfied: urllib3<1.27,>=1.21.1 in ./.local/lib/python3.8/site-packages (from requests->torchvision) (1.26.13)\n",
|
| 141 |
+
"Requirement already satisfied: idna<4,>=2.5 in /usr/lib/python3/dist-packages (from requests->torchvision) (2.8)\n"
|
| 142 |
]
|
| 143 |
}
|
| 144 |
],
|
|
|
|
| 200 |
"name": "stdout",
|
| 201 |
"output_type": "stream",
|
| 202 |
"text": [
|
| 203 |
+
"Tue Dec 13 21:26:01 2022 \n",
|
| 204 |
"+-----------------------------------------------------------------------------+\n",
|
| 205 |
"| NVIDIA-SMI 515.65.01 Driver Version: 515.65.01 CUDA Version: 11.7 |\n",
|
| 206 |
"|-------------------------------+----------------------+----------------------+\n",
|
|
|
|
| 209 |
"| | | MIG M. |\n",
|
| 210 |
"|===============================+======================+======================|\n",
|
| 211 |
"| 0 NVIDIA A100-SXM... On | 00000000:06:00.0 Off | 0 |\n",
|
| 212 |
+
"| N/A 41C P0 50W / 400W | 0MiB / 40960MiB | 0% Default |\n",
|
| 213 |
"| | | Disabled |\n",
|
| 214 |
"+-------------------------------+----------------------+----------------------+\n",
|
| 215 |
" \n",
|
|
|
|
| 260 |
"name": "stdout",
|
| 261 |
"output_type": "stream",
|
| 262 |
"text": [
|
| 263 |
+
"Get:1 https://nvidia.github.io/libnvidia-container/stable/ubuntu18.04/amd64 InRelease [1484 B]\n",
|
| 264 |
+
"Hit:2 https://nvidia.github.io/nvidia-container-runtime/stable/ubuntu18.04/amd64 InRelease\n",
|
| 265 |
+
"Get:3 https://packages.cloud.google.com/apt cloud-sdk InRelease [6751 B] \n",
|
| 266 |
+
"Hit:4 http://archive.lambdalabs.com/ubuntu focal InRelease \n",
|
| 267 |
+
"Hit:5 https://download.docker.com/linux/ubuntu focal InRelease \n",
|
| 268 |
+
"Hit:6 https://packages.microsoft.com/repos/azure-cli focal InRelease \n",
|
| 269 |
+
"Hit:7 http://archive.ubuntu.com/ubuntu focal InRelease \n",
|
| 270 |
+
"Get:8 http://security.ubuntu.com/ubuntu focal-security InRelease [114 kB] \n",
|
| 271 |
"Ign:9 http://ppa.launchpad.net/jonathonf/ffmpeg-4/ubuntu focal InRelease \n",
|
| 272 |
+
"Get:10 http://archive.ubuntu.com/ubuntu focal-updates InRelease [114 kB] \n",
|
| 273 |
"Hit:11 https://pkg.cloudflare.com/cloudflared focal InRelease \n",
|
| 274 |
+
"Err:12 http://ppa.launchpad.net/jonathonf/ffmpeg-4/ubuntu focal Release \n",
|
|
|
|
| 275 |
" 404 Not Found [IP: 185.125.190.52 80]\n",
|
| 276 |
+
"Hit:13 https://ppa.launchpadcontent.net/deadsnakes/ppa/ubuntu focal InRelease \n",
|
| 277 |
+
"Get:14 http://archive.ubuntu.com/ubuntu focal-backports InRelease [108 kB] \n",
|
| 278 |
+
"Get:15 http://archive.ubuntu.com/ubuntu focal-updates/main amd64 Packages [2269 kB]\n",
|
| 279 |
+
"Get:16 http://archive.ubuntu.com/ubuntu focal-updates/universe amd64 Packages [1009 kB]\n",
|
| 280 |
+
"Reading package lists... Done \n",
|
| 281 |
"E: The repository 'http://ppa.launchpad.net/jonathonf/ffmpeg-4/ubuntu focal Release' does not have a Release file.\n",
|
| 282 |
"N: Updating from such a repository can't be done securely, and is therefore disabled by default.\n",
|
| 283 |
"N: See apt-secure(8) manpage for repository creation and user configuration details.\n",
|
| 284 |
+
"Get:1 https://nvidia.github.io/libnvidia-container/stable/ubuntu18.04/amd64 InRelease [1484 B]\n",
|
| 285 |
+
"Hit:2 https://nvidia.github.io/nvidia-container-runtime/stable/ubuntu18.04/amd64 InRelease\n",
|
| 286 |
+
"Hit:3 https://packages.cloud.google.com/apt cloud-sdk InRelease \u001b[0m\u001b[33m\n",
|
| 287 |
"Hit:4 http://archive.lambdalabs.com/ubuntu focal InRelease \u001b[0m\n",
|
| 288 |
+
"Hit:5 https://download.docker.com/linux/ubuntu focal InRelease \u001b[0m\n",
|
| 289 |
+
"Ign:6 http://ppa.launchpad.net/jonathonf/ffmpeg-4/ubuntu focal InRelease \u001b[0m\u001b[33m\u001b[33m\u001b[33m\n",
|
| 290 |
+
"Hit:7 http://archive.ubuntu.com/ubuntu focal InRelease \u001b[0m\n",
|
| 291 |
+
"Hit:8 https://packages.microsoft.com/repos/azure-cli focal InRelease \u001b[0m\n",
|
| 292 |
+
"Hit:9 http://security.ubuntu.com/ubuntu focal-security InRelease \u001b[0m\n",
|
| 293 |
+
"Hit:10 https://pkg.cloudflare.com/cloudflared focal InRelease \u001b[0m\u001b[33m\u001b[33m\n",
|
| 294 |
+
"Hit:11 http://archive.ubuntu.com/ubuntu focal-updates InRelease \u001b[0m\n",
|
| 295 |
+
"Hit:12 http://archive.ubuntu.com/ubuntu focal-backports InRelease \u001b[0m \u001b[0m\u001b[33m\u001b[33m\u001b[33m\n",
|
| 296 |
+
"Err:13 http://ppa.launchpad.net/jonathonf/ffmpeg-4/ubuntu focal Release\n",
|
| 297 |
" 404 Not Found [IP: 185.125.190.52 80]\n",
|
| 298 |
+
"Hit:14 https://ppa.launchpadcontent.net/deadsnakes/ppa/ubuntu focal InRelease\n",
|
| 299 |
+
"Reading package lists... Done\u001b[33m\u001b[33m\n",
|
|
|
|
| 300 |
"\u001b[1;31mE: \u001b[0mThe repository 'http://ppa.launchpad.net/jonathonf/ffmpeg-4/ubuntu focal Release' does not have a Release file.\u001b[0m\n",
|
| 301 |
"\u001b[33mN: \u001b[0mUpdating from such a repository can't be done securely, and is therefore disabled by default.\u001b[0m\n",
|
| 302 |
"\u001b[33mN: \u001b[0mSee apt-secure(8) manpage for repository creation and user configuration details.\u001b[0m\n",
|
|
|
|
| 347 |
"text": [
|
| 348 |
"Defaulting to user installation because normal site-packages is not writeable\n",
|
| 349 |
"Collecting git+https://github.com/huggingface/datasets\n",
|
| 350 |
+
" Cloning https://github.com/huggingface/datasets to /tmp/pip-req-build-ju8bkpld\n",
|
| 351 |
+
" Running command git clone --filter=blob:none --quiet https://github.com/huggingface/datasets /tmp/pip-req-build-ju8bkpld\n",
|
| 352 |
" Resolved https://github.com/huggingface/datasets to commit c902456677116a081f762fa2b4aad13a0aa04d6e\n",
|
| 353 |
" Installing build dependencies ... \u001b[?25ldone\n",
|
| 354 |
"\u001b[?25h Getting requirements to build wheel ... \u001b[?25ldone\n",
|
| 355 |
"\u001b[?25h Preparing metadata (pyproject.toml) ... \u001b[?25ldone\n",
|
| 356 |
"\u001b[?25hRequirement already satisfied: dill<0.3.7 in ./.local/lib/python3.8/site-packages (from datasets==2.7.1.dev0) (0.3.6)\n",
|
| 357 |
+
"Requirement already satisfied: requests>=2.19.0 in ./.local/lib/python3.8/site-packages (from datasets==2.7.1.dev0) (2.28.1)\n",
|
| 358 |
+
"Requirement already satisfied: numpy>=1.17 in ./.local/lib/python3.8/site-packages (from datasets==2.7.1.dev0) (1.23.5)\n",
|
| 359 |
+
"Requirement already satisfied: aiohttp in ./.local/lib/python3.8/site-packages (from datasets==2.7.1.dev0) (3.8.3)\n",
|
| 360 |
"Requirement already satisfied: packaging in ./.local/lib/python3.8/site-packages (from datasets==2.7.1.dev0) (22.0)\n",
|
| 361 |
"Requirement already satisfied: xxhash in ./.local/lib/python3.8/site-packages (from datasets==2.7.1.dev0) (3.1.0)\n",
|
| 362 |
+
"Requirement already satisfied: pyarrow>=6.0.0 in ./.local/lib/python3.8/site-packages (from datasets==2.7.1.dev0) (10.0.1)\n",
|
|
|
|
|
|
|
|
|
|
|
|
|
| 363 |
"Requirement already satisfied: responses<0.19 in ./.local/lib/python3.8/site-packages (from datasets==2.7.1.dev0) (0.18.0)\n",
|
| 364 |
+
"Requirement already satisfied: multiprocess in ./.local/lib/python3.8/site-packages (from datasets==2.7.1.dev0) (0.70.14)\n",
|
| 365 |
+
"Requirement already satisfied: fsspec[http]>=2021.11.1 in ./.local/lib/python3.8/site-packages (from datasets==2.7.1.dev0) (2022.11.0)\n",
|
| 366 |
+
"Requirement already satisfied: pandas in ./.local/lib/python3.8/site-packages (from datasets==2.7.1.dev0) (1.5.1)\n",
|
| 367 |
"Requirement already satisfied: tqdm>=4.62.1 in ./.local/lib/python3.8/site-packages (from datasets==2.7.1.dev0) (4.64.1)\n",
|
| 368 |
+
"Requirement already satisfied: pyyaml>=5.1 in /usr/lib/python3/dist-packages (from datasets==2.7.1.dev0) (5.3.1)\n",
|
|
|
|
| 369 |
"Requirement already satisfied: huggingface-hub<1.0.0,>=0.2.0 in ./.local/lib/python3.8/site-packages (from datasets==2.7.1.dev0) (0.11.1)\n",
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 370 |
"Requirement already satisfied: yarl<2.0,>=1.0 in ./.local/lib/python3.8/site-packages (from aiohttp->datasets==2.7.1.dev0) (1.8.2)\n",
|
| 371 |
+
"Requirement already satisfied: aiosignal>=1.1.2 in ./.local/lib/python3.8/site-packages (from aiohttp->datasets==2.7.1.dev0) (1.3.1)\n",
|
| 372 |
+
"Requirement already satisfied: multidict<7.0,>=4.5 in ./.local/lib/python3.8/site-packages (from aiohttp->datasets==2.7.1.dev0) (6.0.3)\n",
|
| 373 |
"Requirement already satisfied: attrs>=17.3.0 in /usr/lib/python3/dist-packages (from aiohttp->datasets==2.7.1.dev0) (19.3.0)\n",
|
| 374 |
+
"Requirement already satisfied: async-timeout<5.0,>=4.0.0a3 in ./.local/lib/python3.8/site-packages (from aiohttp->datasets==2.7.1.dev0) (4.0.2)\n",
|
| 375 |
+
"Requirement already satisfied: charset-normalizer<3.0,>=2.0 in ./.local/lib/python3.8/site-packages (from aiohttp->datasets==2.7.1.dev0) (2.1.1)\n",
|
| 376 |
+
"Requirement already satisfied: frozenlist>=1.1.1 in ./.local/lib/python3.8/site-packages (from aiohttp->datasets==2.7.1.dev0) (1.3.3)\n",
|
| 377 |
"Requirement already satisfied: filelock in /usr/lib/python3/dist-packages (from huggingface-hub<1.0.0,>=0.2.0->datasets==2.7.1.dev0) (3.0.12)\n",
|
| 378 |
"Requirement already satisfied: typing-extensions>=3.7.4.3 in ./.local/lib/python3.8/site-packages (from huggingface-hub<1.0.0,>=0.2.0->datasets==2.7.1.dev0) (4.4.0)\n",
|
| 379 |
"Requirement already satisfied: certifi>=2017.4.17 in /usr/lib/python3/dist-packages (from requests>=2.19.0->datasets==2.7.1.dev0) (2019.11.28)\n",
|
|
|
|
| 384 |
"Requirement already satisfied: six>=1.5 in /usr/lib/python3/dist-packages (from python-dateutil>=2.8.1->pandas->datasets==2.7.1.dev0) (1.14.0)\n",
|
| 385 |
"Defaulting to user installation because normal site-packages is not writeable\n",
|
| 386 |
"Collecting git+https://github.com/huggingface/transformers\n",
|
| 387 |
+
" Cloning https://github.com/huggingface/transformers to /tmp/pip-req-build-9scgt3ru\n",
|
| 388 |
+
" Running command git clone --filter=blob:none --quiet https://github.com/huggingface/transformers /tmp/pip-req-build-9scgt3ru\n",
|
| 389 |
+
" Resolved https://github.com/huggingface/transformers to commit d994473b05a83ea398d9f10ca458855df095e22d\n",
|
| 390 |
" Installing build dependencies ... \u001b[?25ldone\n",
|
| 391 |
"\u001b[?25h Getting requirements to build wheel ... \u001b[?25ldone\n",
|
| 392 |
"\u001b[?25h Preparing metadata (pyproject.toml) ... \u001b[?25ldone\n",
|
| 393 |
+
"\u001b[?25hRequirement already satisfied: tokenizers!=0.11.3,<0.14,>=0.11.1 in ./.local/lib/python3.8/site-packages (from transformers==4.26.0.dev0) (0.13.2)\n",
|
| 394 |
+
"Requirement already satisfied: huggingface-hub<1.0,>=0.10.0 in ./.local/lib/python3.8/site-packages (from transformers==4.26.0.dev0) (0.11.1)\n",
|
| 395 |
+
"Requirement already satisfied: packaging>=20.0 in ./.local/lib/python3.8/site-packages (from transformers==4.26.0.dev0) (22.0)\n",
|
| 396 |
"Requirement already satisfied: numpy>=1.17 in ./.local/lib/python3.8/site-packages (from transformers==4.26.0.dev0) (1.23.5)\n",
|
| 397 |
+
"Requirement already satisfied: filelock in /usr/lib/python3/dist-packages (from transformers==4.26.0.dev0) (3.0.12)\n",
|
| 398 |
"Requirement already satisfied: pyyaml>=5.1 in /usr/lib/python3/dist-packages (from transformers==4.26.0.dev0) (5.3.1)\n",
|
| 399 |
"Requirement already satisfied: requests in ./.local/lib/python3.8/site-packages (from transformers==4.26.0.dev0) (2.28.1)\n",
|
| 400 |
+
"Requirement already satisfied: regex!=2019.12.17 in ./.local/lib/python3.8/site-packages (from transformers==4.26.0.dev0) (2022.10.31)\n",
|
| 401 |
"Requirement already satisfied: tqdm>=4.27 in ./.local/lib/python3.8/site-packages (from transformers==4.26.0.dev0) (4.64.1)\n",
|
|
|
|
| 402 |
"Requirement already satisfied: typing-extensions>=3.7.4.3 in ./.local/lib/python3.8/site-packages (from huggingface-hub<1.0,>=0.10.0->transformers==4.26.0.dev0) (4.4.0)\n",
|
|
|
|
|
|
|
|
|
|
| 403 |
"Requirement already satisfied: charset-normalizer<3,>=2 in ./.local/lib/python3.8/site-packages (from requests->transformers==4.26.0.dev0) (2.1.1)\n",
|
| 404 |
+
"Requirement already satisfied: idna<4,>=2.5 in /usr/lib/python3/dist-packages (from requests->transformers==4.26.0.dev0) (2.8)\n",
|
| 405 |
+
"Requirement already satisfied: certifi>=2017.4.17 in /usr/lib/python3/dist-packages (from requests->transformers==4.26.0.dev0) (2019.11.28)\n",
|
| 406 |
+
"Requirement already satisfied: urllib3<1.27,>=1.21.1 in ./.local/lib/python3.8/site-packages (from requests->transformers==4.26.0.dev0) (1.26.13)\n",
|
| 407 |
"Defaulting to user installation because normal site-packages is not writeable\n",
|
| 408 |
"Requirement already satisfied: librosa in ./.local/lib/python3.8/site-packages (0.9.2)\n",
|
| 409 |
+
"Requirement already satisfied: scikit-learn>=0.19.1 in /usr/lib/python3/dist-packages (from librosa) (0.22.2.post1)\n",
|
| 410 |
"Requirement already satisfied: joblib>=0.14 in ./.local/lib/python3.8/site-packages (from librosa) (1.2.0)\n",
|
| 411 |
+
"Requirement already satisfied: soundfile>=0.10.2 in ./.local/lib/python3.8/site-packages (from librosa) (0.11.0)\n",
|
| 412 |
+
"Requirement already satisfied: numpy>=1.17.0 in ./.local/lib/python3.8/site-packages (from librosa) (1.23.5)\n",
|
| 413 |
+
"Requirement already satisfied: pooch>=1.0 in ./.local/lib/python3.8/site-packages (from librosa) (1.6.0)\n",
|
| 414 |
"Requirement already satisfied: decorator>=4.0.10 in /usr/lib/python3/dist-packages (from librosa) (4.4.2)\n",
|
|
|
|
|
|
|
| 415 |
"Requirement already satisfied: audioread>=2.1.9 in ./.local/lib/python3.8/site-packages (from librosa) (3.0.0)\n",
|
| 416 |
+
"Requirement already satisfied: numba>=0.45.1 in ./.local/lib/python3.8/site-packages (from librosa) (0.56.4)\n",
|
| 417 |
+
"Requirement already satisfied: scipy>=1.2.0 in ./.local/lib/python3.8/site-packages (from librosa) (1.9.3)\n",
|
| 418 |
"Requirement already satisfied: packaging>=20.0 in ./.local/lib/python3.8/site-packages (from librosa) (22.0)\n",
|
|
|
|
|
|
|
| 419 |
"Requirement already satisfied: resampy>=0.2.2 in ./.local/lib/python3.8/site-packages (from librosa) (0.4.2)\n",
|
|
|
|
| 420 |
"Requirement already satisfied: setuptools in /usr/lib/python3/dist-packages (from numba>=0.45.1->librosa) (45.2.0)\n",
|
|
|
|
| 421 |
"Requirement already satisfied: llvmlite<0.40,>=0.39.0dev0 in ./.local/lib/python3.8/site-packages (from numba>=0.45.1->librosa) (0.39.1)\n",
|
| 422 |
+
"Requirement already satisfied: importlib-metadata in ./.local/lib/python3.8/site-packages (from numba>=0.45.1->librosa) (5.0.0)\n",
|
| 423 |
"Requirement already satisfied: requests>=2.19.0 in ./.local/lib/python3.8/site-packages (from pooch>=1.0->librosa) (2.28.1)\n",
|
| 424 |
+
"Requirement already satisfied: appdirs>=1.3.0 in /usr/lib/python3/dist-packages (from pooch>=1.0->librosa) (1.4.3)\n",
|
| 425 |
"Requirement already satisfied: cffi>=1.0 in /usr/lib/python3/dist-packages (from soundfile>=0.10.2->librosa) (1.14.0)\n",
|
|
|
|
| 426 |
"Requirement already satisfied: certifi>=2017.4.17 in /usr/lib/python3/dist-packages (from requests>=2.19.0->pooch>=1.0->librosa) (2019.11.28)\n",
|
|
|
|
| 427 |
"Requirement already satisfied: idna<4,>=2.5 in /usr/lib/python3/dist-packages (from requests>=2.19.0->pooch>=1.0->librosa) (2.8)\n",
|
| 428 |
+
"Requirement already satisfied: charset-normalizer<3,>=2 in ./.local/lib/python3.8/site-packages (from requests>=2.19.0->pooch>=1.0->librosa) (2.1.1)\n",
|
| 429 |
+
"Requirement already satisfied: urllib3<1.27,>=1.21.1 in ./.local/lib/python3.8/site-packages (from requests>=2.19.0->pooch>=1.0->librosa) (1.26.13)\n",
|
| 430 |
"Requirement already satisfied: zipp>=0.5 in /usr/lib/python3/dist-packages (from importlib-metadata->numba>=0.45.1->librosa) (1.0.0)\n",
|
| 431 |
"Defaulting to user installation because normal site-packages is not writeable\n",
|
| 432 |
"Requirement already satisfied: jiwer in ./.local/lib/python3.8/site-packages (2.5.1)\n",
|
|
|
|
| 434 |
"Requirement already satisfied: rapidfuzz<3.0.0,>=2.3.0 in ./.local/lib/python3.8/site-packages (from levenshtein==0.20.2->jiwer) (2.13.6)\n",
|
| 435 |
"Defaulting to user installation because normal site-packages is not writeable\n",
|
| 436 |
"Requirement already satisfied: gradio in ./.local/lib/python3.8/site-packages (3.13.0)\n",
|
| 437 |
+
"Requirement already satisfied: pyyaml in /usr/lib/python3/dist-packages (from gradio) (5.3.1)\n",
|
|
|
|
|
|
|
|
|
|
|
|
|
| 438 |
"Requirement already satisfied: aiohttp in ./.local/lib/python3.8/site-packages (from gradio) (3.8.3)\n",
|
|
|
|
|
|
|
|
|
|
| 439 |
"Requirement already satisfied: pandas in ./.local/lib/python3.8/site-packages (from gradio) (1.5.1)\n",
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 440 |
"Requirement already satisfied: pydub in ./.local/lib/python3.8/site-packages (from gradio) (0.25.1)\n",
|
| 441 |
+
"Requirement already satisfied: websockets>=10.0 in ./.local/lib/python3.8/site-packages (from gradio) (10.4)\n",
|
| 442 |
+
"Requirement already satisfied: httpx in ./.local/lib/python3.8/site-packages (from gradio) (0.23.1)\n",
|
| 443 |
+
"Requirement already satisfied: pillow in /usr/lib/python3/dist-packages (from gradio) (7.0.0)\n",
|
| 444 |
+
"Requirement already satisfied: uvicorn in ./.local/lib/python3.8/site-packages (from gradio) (0.20.0)\n",
|
| 445 |
+
"Requirement already satisfied: paramiko in ./.local/lib/python3.8/site-packages (from gradio) (2.12.0)\n",
|
| 446 |
+
"Requirement already satisfied: numpy in ./.local/lib/python3.8/site-packages (from gradio) (1.23.5)\n",
|
| 447 |
"Requirement already satisfied: h11<0.13,>=0.11 in ./.local/lib/python3.8/site-packages (from gradio) (0.12.0)\n",
|
|
|
|
| 448 |
"Requirement already satisfied: requests in ./.local/lib/python3.8/site-packages (from gradio) (2.28.1)\n",
|
| 449 |
+
"Requirement already satisfied: fsspec in ./.local/lib/python3.8/site-packages (from gradio) (2022.11.0)\n",
|
| 450 |
+
"Requirement already satisfied: orjson in ./.local/lib/python3.8/site-packages (from gradio) (3.8.3)\n",
|
| 451 |
+
"Requirement already satisfied: python-multipart in ./.local/lib/python3.8/site-packages (from gradio) (0.0.5)\n",
|
| 452 |
+
"Requirement already satisfied: pydantic in ./.local/lib/python3.8/site-packages (from gradio) (1.10.2)\n",
|
| 453 |
+
"Requirement already satisfied: markdown-it-py[linkify,plugins] in ./.local/lib/python3.8/site-packages (from gradio) (2.1.0)\n",
|
| 454 |
+
"Requirement already satisfied: ffmpy in ./.local/lib/python3.8/site-packages (from gradio) (0.3.0)\n",
|
| 455 |
+
"Requirement already satisfied: fastapi in ./.local/lib/python3.8/site-packages (from gradio) (0.88.0)\n",
|
| 456 |
+
"Requirement already satisfied: jinja2 in ./.local/lib/python3.8/site-packages (from gradio) (3.1.2)\n",
|
| 457 |
+
"Requirement already satisfied: matplotlib in ./.local/lib/python3.8/site-packages (from gradio) (3.5.3)\n",
|
| 458 |
"Requirement already satisfied: pycryptodome in ./.local/lib/python3.8/site-packages (from gradio) (3.16.0)\n",
|
| 459 |
+
"Requirement already satisfied: aiosignal>=1.1.2 in ./.local/lib/python3.8/site-packages (from aiohttp->gradio) (1.3.1)\n",
|
| 460 |
+
"Requirement already satisfied: multidict<7.0,>=4.5 in ./.local/lib/python3.8/site-packages (from aiohttp->gradio) (6.0.3)\n",
|
|
|
|
| 461 |
"Requirement already satisfied: frozenlist>=1.1.1 in ./.local/lib/python3.8/site-packages (from aiohttp->gradio) (1.3.3)\n",
|
| 462 |
"Requirement already satisfied: attrs>=17.3.0 in /usr/lib/python3/dist-packages (from aiohttp->gradio) (19.3.0)\n",
|
| 463 |
+
"Requirement already satisfied: async-timeout<5.0,>=4.0.0a3 in ./.local/lib/python3.8/site-packages (from aiohttp->gradio) (4.0.2)\n",
|
| 464 |
+
"Requirement already satisfied: charset-normalizer<3.0,>=2.0 in ./.local/lib/python3.8/site-packages (from aiohttp->gradio) (2.1.1)\n",
|
| 465 |
"Requirement already satisfied: yarl<2.0,>=1.0 in ./.local/lib/python3.8/site-packages (from aiohttp->gradio) (1.8.2)\n",
|
|
|
|
| 466 |
"Requirement already satisfied: starlette==0.22.0 in ./.local/lib/python3.8/site-packages (from fastapi->gradio) (0.22.0)\n",
|
| 467 |
"Requirement already satisfied: typing-extensions>=3.10.0 in ./.local/lib/python3.8/site-packages (from starlette==0.22.0->fastapi->gradio) (4.4.0)\n",
|
| 468 |
"Requirement already satisfied: anyio<5,>=3.4.0 in ./.local/lib/python3.8/site-packages (from starlette==0.22.0->fastapi->gradio) (3.6.2)\n",
|
|
|
|
|
|
|
| 469 |
"Requirement already satisfied: rfc3986[idna2008]<2,>=1.3 in ./.local/lib/python3.8/site-packages (from httpx->gradio) (1.5.0)\n",
|
| 470 |
"Requirement already satisfied: sniffio in ./.local/lib/python3.8/site-packages (from httpx->gradio) (1.3.0)\n",
|
| 471 |
+
"Requirement already satisfied: certifi in /usr/lib/python3/dist-packages (from httpx->gradio) (2019.11.28)\n",
|
| 472 |
+
"Requirement already satisfied: httpcore<0.17.0,>=0.15.0 in ./.local/lib/python3.8/site-packages (from httpx->gradio) (0.15.0)\n",
|
| 473 |
"Requirement already satisfied: MarkupSafe>=2.0 in ./.local/lib/python3.8/site-packages (from jinja2->gradio) (2.1.1)\n",
|
| 474 |
"Requirement already satisfied: mdurl~=0.1 in ./.local/lib/python3.8/site-packages (from markdown-it-py[linkify,plugins]->gradio) (0.1.2)\n",
|
|
|
|
| 475 |
"Requirement already satisfied: linkify-it-py~=1.0 in ./.local/lib/python3.8/site-packages (from markdown-it-py[linkify,plugins]->gradio) (1.0.3)\n",
|
| 476 |
+
"Requirement already satisfied: mdit-py-plugins in ./.local/lib/python3.8/site-packages (from markdown-it-py[linkify,plugins]->gradio) (0.3.3)\n",
|
| 477 |
+
"Requirement already satisfied: python-dateutil>=2.7 in ./.local/lib/python3.8/site-packages (from matplotlib->gradio) (2.8.2)\n",
|
| 478 |
"Requirement already satisfied: kiwisolver>=1.0.1 in /usr/lib/python3/dist-packages (from matplotlib->gradio) (1.0.1)\n",
|
|
|
|
| 479 |
"Requirement already satisfied: packaging>=20.0 in ./.local/lib/python3.8/site-packages (from matplotlib->gradio) (22.0)\n",
|
|
|
|
| 480 |
"Requirement already satisfied: cycler>=0.10 in /usr/lib/python3/dist-packages (from matplotlib->gradio) (0.10.0)\n",
|
| 481 |
+
"Requirement already satisfied: pyparsing>=2.2.1 in /usr/lib/python3/dist-packages (from matplotlib->gradio) (2.4.6)\n",
|
| 482 |
+
"Requirement already satisfied: fonttools>=4.22.0 in ./.local/lib/python3.8/site-packages (from matplotlib->gradio) (4.38.0)\n",
|
| 483 |
"Requirement already satisfied: pytz>=2020.1 in ./.local/lib/python3.8/site-packages (from pandas->gradio) (2022.5)\n",
|
| 484 |
+
"Requirement already satisfied: bcrypt>=3.1.3 in ./.local/lib/python3.8/site-packages (from paramiko->gradio) (4.0.1)\n",
|
| 485 |
"Requirement already satisfied: six in /usr/lib/python3/dist-packages (from paramiko->gradio) (1.14.0)\n",
|
| 486 |
"Requirement already satisfied: pynacl>=1.0.1 in /usr/lib/python3/dist-packages (from paramiko->gradio) (1.3.0)\n",
|
|
|
|
| 487 |
"Requirement already satisfied: cryptography>=2.5 in /usr/lib/python3/dist-packages (from paramiko->gradio) (2.8)\n",
|
|
|
|
| 488 |
"Requirement already satisfied: urllib3<1.27,>=1.21.1 in ./.local/lib/python3.8/site-packages (from requests->gradio) (1.26.13)\n",
|
| 489 |
+
"Requirement already satisfied: idna<4,>=2.5 in /usr/lib/python3/dist-packages (from requests->gradio) (2.8)\n",
|
| 490 |
"Requirement already satisfied: click>=7.0 in /usr/lib/python3/dist-packages (from uvicorn->gradio) (7.0)\n",
|
| 491 |
"Requirement already satisfied: uc-micro-py in ./.local/lib/python3.8/site-packages (from linkify-it-py~=1.0->markdown-it-py[linkify,plugins]->gradio) (1.0.1)\n",
|
| 492 |
"Defaulting to user installation because normal site-packages is not writeable\n",
|
|
|
|
| 555 |
{
|
| 556 |
"data": {
|
| 557 |
"application/vnd.jupyter.widget-view+json": {
|
| 558 |
+
"model_id": "ad867c59abb44253a78ca06b8853a84d",
|
| 559 |
"version_major": 2,
|
| 560 |
"version_minor": 0
|
| 561 |
},
|
|
|
|
| 714 |
" all_datasets = []\n",
|
| 715 |
" # iterate over the datasets we want to interleave\n",
|
| 716 |
" for i, dataset_name in enumerate(dataset_names):\n",
|
| 717 |
+
" dataset = load_dataset(dataset_name, dataset_config_names[i], split=splits[i], streaming=False, **kwargs)\n",
|
| 718 |
" # resample to specified sampling rate\n",
|
| 719 |
" dataset = dataset.cast_column(\"audio\", Audio(sampling_rate))\n",
|
| 720 |
" # normalise columns to [\"audio\", \"sentence\"]\n",
|
|
|
|
| 739 |
"id": "qOwlctMhNmCG",
|
| 740 |
"tags": []
|
| 741 |
},
|
| 742 |
+
"outputs": [],
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 743 |
"source": [
|
| 744 |
"ds = load_multiple_streaming_datasets(dataset_names, dataset_config_names=dataset_config_names, text_column_names=text_column_names, use_auth_token=True)\n",
|
| 745 |
"\n"
|
|
|
|
| 762 |
"metadata": {
|
| 763 |
"id": "imRHJOpm4V_j"
|
| 764 |
},
|
| 765 |
+
"outputs": [],
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 766 |
"source": [
|
| 767 |
"from datasets import IterableDatasetDict\n",
|
| 768 |
"raw_datasets = IterableDatasetDict()\n",
|
| 769 |
"\n",
|
| 770 |
"raw_datasets[\"train\"] = load_multiple_streaming_datasets(dataset_names, dataset_config_names=dataset_config_names, text_column_names=text_column_names, use_auth_token=True)\n",
|
| 771 |
+
"raw_datasets[\"test\"] = load_dataset(\"mozilla-foundation/common_voice_11_0\", \"el\", split=\"test\", streaming=False, use_auth_token=True)\n",
|
| 772 |
"\n",
|
| 773 |
"\n",
|
| 774 |
"#raw_datasets = raw_datasets.remove_columns([\"accent\", \"age\", \"client_id\", \"down_votes\", \"gender\", \"locale\", \"path\", \"segment\", \"up_votes\"])\n",
|
|
|
|
| 995 |
"metadata": {
|
| 996 |
"id": "a37a7cdb-9013-427f-8de9-6a8d0e9dc684"
|
| 997 |
},
|
| 998 |
+
"outputs": [],
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 999 |
"source": [
|
| 1000 |
"vectorized_datasets = raw_datasets.map(prepare_dataset, remove_columns=list(next(iter(raw_datasets.values())).features)).with_format(\"torch\")"
|
| 1001 |
]
|
|
|
|
| 1012 |
},
|
| 1013 |
{
|
| 1014 |
"cell_type": "code",
|
| 1015 |
+
"execution_count": 17,
|
| 1016 |
"id": "1b145699-acfc-4b1d-93a2-a2ad3d62674c",
|
| 1017 |
"metadata": {
|
| 1018 |
"id": "1b145699-acfc-4b1d-93a2-a2ad3d62674c"
|
| 1019 |
},
|
| 1020 |
+
"outputs": [],
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1021 |
"source": [
|
| 1022 |
"vectorized_datasets[\"train\"] = vectorized_datasets[\"train\"].shuffle(\n",
|
| 1023 |
" #buffer_size=500,\n",
|
|
|
|
| 1040 |
},
|
| 1041 |
{
|
| 1042 |
"cell_type": "code",
|
| 1043 |
+
"execution_count": 18,
|
| 1044 |
"id": "01cb25ef-4bb0-4325-9461-f59198acadf6",
|
| 1045 |
"metadata": {
|
| 1046 |
"id": "01cb25ef-4bb0-4325-9461-f59198acadf6"
|
|
|
|
| 1065 |
},
|
| 1066 |
{
|
| 1067 |
"cell_type": "code",
|
| 1068 |
+
"execution_count": 19,
|
| 1069 |
"id": "333f7f6e-6053-4d3b-8924-c733c79b82ac",
|
| 1070 |
"metadata": {
|
| 1071 |
"id": "333f7f6e-6053-4d3b-8924-c733c79b82ac"
|
| 1072 |
},
|
| 1073 |
+
"outputs": [],
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1074 |
"source": [
|
| 1075 |
"vectorized_datasets[\"train\"] = vectorized_datasets[\"train\"].filter(\n",
|
| 1076 |
" is_audio_in_length_range,\n",
|
|
|
|
| 1145 |
},
|
| 1146 |
{
|
| 1147 |
"cell_type": "code",
|
| 1148 |
+
"execution_count": 20,
|
| 1149 |
"id": "8326221e-ec13-4731-bb4e-51e5fc1486c5",
|
| 1150 |
"metadata": {
|
| 1151 |
"id": "8326221e-ec13-4731-bb4e-51e5fc1486c5"
|
|
|
|
| 1197 |
},
|
| 1198 |
{
|
| 1199 |
"cell_type": "code",
|
| 1200 |
+
"execution_count": 21,
|
| 1201 |
"id": "fc834702-c0d3-4a96-b101-7b87be32bf42",
|
| 1202 |
"metadata": {
|
| 1203 |
"id": "fc834702-c0d3-4a96-b101-7b87be32bf42"
|
|
|
|
| 1230 |
},
|
| 1231 |
{
|
| 1232 |
"cell_type": "code",
|
| 1233 |
+
"execution_count": 22,
|
| 1234 |
"id": "b22b4011-f31f-4b57-b684-c52332f92890",
|
| 1235 |
"metadata": {
|
| 1236 |
"colab": {
|
|
|
|
| 1281 |
},
|
| 1282 |
{
|
| 1283 |
"cell_type": "code",
|
| 1284 |
+
"execution_count": 23,
|
| 1285 |
"id": "a11d1bfc-9e28-460f-a287-72d8f7bc1acb",
|
| 1286 |
"metadata": {
|
| 1287 |
"id": "a11d1bfc-9e28-460f-a287-72d8f7bc1acb"
|
|
|
|
| 1330 |
},
|
| 1331 |
{
|
| 1332 |
"cell_type": "code",
|
| 1333 |
+
"execution_count": 24,
|
| 1334 |
"id": "5a10cc4b-07ec-4ebd-ac1d-7c601023594f",
|
| 1335 |
"metadata": {
|
| 1336 |
"colab": {
|
|
|
|
| 1368 |
{
|
| 1369 |
"data": {
|
| 1370 |
"application/vnd.jupyter.widget-view+json": {
|
| 1371 |
+
"model_id": "18e0d00451ec4e10b1cea9b9d3748384",
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1372 |
"version_major": 2,
|
| 1373 |
"version_minor": 0
|
| 1374 |
},
|
|
|
|
| 1401 |
},
|
| 1402 |
{
|
| 1403 |
"cell_type": "code",
|
| 1404 |
+
"execution_count": 25,
|
| 1405 |
"id": "62038ba3-88ed-4fce-84db-338f50dcd04f",
|
| 1406 |
"metadata": {
|
| 1407 |
"id": "62038ba3-88ed-4fce-84db-338f50dcd04f"
|
|
|
|
| 1438 |
},
|
| 1439 |
{
|
| 1440 |
"cell_type": "code",
|
| 1441 |
+
"execution_count": 26,
|
| 1442 |
"id": "0ae3e9af-97b7-4aa0-ae85-20b23b5bcb3a",
|
| 1443 |
"metadata": {
|
| 1444 |
"colab": {
|
|
|
|
| 1481 |
},
|
| 1482 |
{
|
| 1483 |
"cell_type": "code",
|
| 1484 |
+
"execution_count": 27,
|
| 1485 |
"id": "o72eOpGzD_sK",
|
| 1486 |
"metadata": {
|
| 1487 |
"colab": {
|
|
|
|
| 1495 |
"name": "stdout",
|
| 1496 |
"output_type": "stream",
|
| 1497 |
"text": [
|
| 1498 |
+
"Tue Dec 13 21:29:08 2022 \n",
|
| 1499 |
"+-----------------------------------------------------------------------------+\n",
|
| 1500 |
"| NVIDIA-SMI 515.65.01 Driver Version: 515.65.01 CUDA Version: 11.7 |\n",
|
| 1501 |
"|-------------------------------+----------------------+----------------------+\n",
|
|
|
|
| 1504 |
"| | | MIG M. |\n",
|
| 1505 |
"|===============================+======================+======================|\n",
|
| 1506 |
"| 0 NVIDIA A100-SXM... On | 00000000:06:00.0 Off | 0 |\n",
|
| 1507 |
+
"| N/A 32C P0 47W / 400W | 2MiB / 40960MiB | 0% Default |\n",
|
| 1508 |
"| | | Disabled |\n",
|
| 1509 |
"+-------------------------------+----------------------+----------------------+\n",
|
| 1510 |
" \n",
|
|
|
|
| 1545 |
},
|
| 1546 |
{
|
| 1547 |
"cell_type": "code",
|
| 1548 |
+
"execution_count": 28,
|
| 1549 |
"id": "3ac16b62-b3c0-4c68-8f3d-9ecf471534b2",
|
| 1550 |
"metadata": {
|
| 1551 |
"id": "3ac16b62-b3c0-4c68-8f3d-9ecf471534b2"
|
|
|
|
| 1578 |
},
|
| 1579 |
{
|
| 1580 |
"cell_type": "code",
|
| 1581 |
+
"execution_count": 29,
|
| 1582 |
"id": "d546d7fe-0543-479a-b708-2ebabec19493",
|
| 1583 |
"metadata": {
|
| 1584 |
"colab": {
|
|
|
|
| 2192 |
},
|
| 2193 |
{
|
| 2194 |
"cell_type": "code",
|
| 2195 |
+
"execution_count": 30,
|
| 2196 |
"id": "a1ccb9ed-cbc8-4419-91c0-651e9424b672",
|
| 2197 |
"metadata": {
|
| 2198 |
"id": "a1ccb9ed-cbc8-4419-91c0-651e9424b672"
|
|
|
|
| 2285 |
"name": "stderr",
|
| 2286 |
"output_type": "stream",
|
| 2287 |
"text": [
|
| 2288 |
+
"Loading model from ./whisper-medium-el/checkpoint-4000.\n",
|
|
|
|
| 2289 |
"/home/ubuntu/.local/lib/python3.8/site-packages/transformers/optimization.py:306: FutureWarning: This implementation of AdamW is deprecated and will be removed in a future version. Use the PyTorch implementation torch.optim.AdamW instead, or set `no_deprecation_warning=True` to disable this warning\n",
|
| 2290 |
" warnings.warn(\n",
|
| 2291 |
"***** Running training *****\n",
|
| 2292 |
+
" Num examples = 160000\n",
|
| 2293 |
+
" Num Epochs = 9223372036854775807\n",
|
| 2294 |
" Instantaneous batch size per device = 32\n",
|
| 2295 |
" Total train batch size (w. parallel, distributed & accumulation) = 32\n",
|
| 2296 |
" Gradient Accumulation steps = 1\n",
|
| 2297 |
" Total optimization steps = 5000\n",
|
| 2298 |
" Number of trainable parameters = 763857920\n",
|
| 2299 |
" Continuing training from checkpoint, will skip to saved global_step\n",
|
| 2300 |
+
" Continuing training from epoch 0\n",
|
| 2301 |
+
" Continuing training from global step 4000\n",
|
| 2302 |
+
"Reading metadata...: 1914it [00:00, 4074.06it/s]\n",
|
| 2303 |
+
"The following columns in the training set don't have a corresponding argument in `WhisperForConditionalGeneration.forward` and have been ignored: input_length. If input_length are not expected by `WhisperForConditionalGeneration.forward`, you can safely ignore this message.\n"
|
| 2304 |
]
|
| 2305 |
},
|
| 2306 |
{
|
|
|
|
| 2309 |
"\n",
|
| 2310 |
" <div>\n",
|
| 2311 |
" \n",
|
| 2312 |
+
" <progress value='4012' max='5000' style='width:300px; height:20px; vertical-align: middle;'></progress>\n",
|
| 2313 |
+
" [4012/5000 01:11 < 1:57:29, 0.14 it/s, Epoch 0.00/9223372036854775807]\n",
|
| 2314 |
" </div>\n",
|
| 2315 |
" <table border=\"1\" class=\"dataframe\">\n",
|
| 2316 |
" <thead>\n",
|
|
|
|
| 2318 |
" <th>Step</th>\n",
|
| 2319 |
" <th>Training Loss</th>\n",
|
| 2320 |
" <th>Validation Loss</th>\n",
|
|
|
|
| 2321 |
" </tr>\n",
|
| 2322 |
" </thead>\n",
|
| 2323 |
" <tbody>\n",
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 2324 |
" </tbody>\n",
|
| 2325 |
"</table><p>"
|
| 2326 |
],
|
|
|
|
| 2330 |
},
|
| 2331 |
"metadata": {},
|
| 2332 |
"output_type": "display_data"
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 2333 |
}
|
| 2334 |
],
|
| 2335 |
"source": [
|
e5_interleaving-resume.ipynb
ADDED
|
The diff for this file is too large to render.
See raw diff
|
|
|
pytorch_model.bin
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 3055754841
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:8f7fdd05661053c2949f2de6138c02cb1fe501fbe43efcf806797c3e43cbf808
|
| 3 |
size 3055754841
|
runs/Dec13_21-29-08_129-146-102-49/1670966960.518305/events.out.tfevents.1670966960.129-146-102-49.882304.1
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:652c159c0a7bbc04d6c208c74e4668602cb677b0fc2d296735cd23cd3d391b2b
|
| 3 |
+
size 5916
|
runs/Dec13_21-29-08_129-146-102-49/events.out.tfevents.1670966960.129-146-102-49.882304.0
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:6c6d5d76a7999c988e99742cae5b57c5aa438dc6403c604611d0c8fd18754328
|
| 3 |
+
size 5603
|
runs/Dec13_21-57-38_129-146-102-49/1670968669.9597044/events.out.tfevents.1670968669.129-146-102-49.882304.3
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:a8668bd5e2470303db22eb81688526a881371c3506fdfeed7a6b32abc5192a1e
|
| 3 |
+
size 5916
|
runs/Dec13_21-57-38_129-146-102-49/events.out.tfevents.1670968669.129-146-102-49.882304.2
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:37a61ed2fa7d6d2ac64d6e063e35f8b5541406347236af61ace7e3f08422daea
|
| 3 |
+
size 4348
|
runs/Dec13_22-18-00_129-146-102-49/1670969892.775061/events.out.tfevents.1670969892.129-146-102-49.1014402.1
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:51450fedd70a8ed8e04dbdda335b86fff15a62346527cf67bef861a20bf39cde
|
| 3 |
+
size 5916
|
runs/Dec13_22-18-00_129-146-102-49/1670995449.379962/events.out.tfevents.1670995449.129-146-102-49.1014402.2
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:b9ad24d679255e97efd512a0e6ec44b3d1b3f9d6b9fd69a929d4f4b65635093f
|
| 3 |
+
size 5916
|
runs/Dec13_22-18-00_129-146-102-49/events.out.tfevents.1670969892.129-146-102-49.1014402.0
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:af928d9b3e795892da6df5ac604d6bb4c9799d8fbae2048212044a62e879c0fc
|
| 3 |
+
size 15254
|
runs/Dec14_05-46-08_129-146-102-49/1670996781.2697837/events.out.tfevents.1670996781.129-146-102-49.1113148.1
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:f1b3e632cba6fe6e654853b87efedea97668491d8e6906fb42ebf1c6b1f013cc
|
| 3 |
+
size 5916
|
runs/Dec14_05-46-08_129-146-102-49/events.out.tfevents.1670996781.129-146-102-49.1113148.0
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:243ca82c57c99466d5246efd3eb4dd017e04c059b7b31d2befe0ea6f22a39214
|
| 3 |
+
size 10946
|
runs/Dec14_09-33-49_129-146-102-49/1671010439.939292/events.out.tfevents.1671010439.129-146-102-49.1212260.1
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:8a3fea8291dc179c7503abc25f7377b71002351df3b2639e4e6228b997b64d90
|
| 3 |
+
size 5916
|
runs/Dec14_09-33-49_129-146-102-49/events.out.tfevents.1671010439.129-146-102-49.1212260.0
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:8ccb9309b9bb866e6e16f7627e4a4b88a932cd62d0f847514e94d0e2208d3716
|
| 3 |
+
size 4347
|
runs/Dec14_10-24-09_129-146-102-49/1671013461.8981154/events.out.tfevents.1671013461.129-146-102-49.1508853.1
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:af188c00a280a385bf7ede8ce3aea5fdf554d81e0aa7cab21884c04bcf42eb5e
|
| 3 |
+
size 5916
|
runs/Dec14_10-24-09_129-146-102-49/events.out.tfevents.1671013461.129-146-102-49.1508853.0
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:b10f8350f1923948412c9c14188fa5cb649b2bf9081f63941e3fcf5ba378701a
|
| 3 |
+
size 10945
|
training_args.bin
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 3643
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:eeadae68908ede5e3241ff2195c01ad92b5ee3a7db47d3a44b664270809ad8db
|
| 3 |
size 3643
|