Training in progress, step 2000
Browse files- asr.ipynb +19 -235
- generation_config.json +263 -0
- model.safetensors +1 -1
- runs/Dec07_01-11-40_smurf/events.out.tfevents.1701904301.smurf.965337.0 +3 -0
- training_args.bin +1 -1
asr.ipynb
CHANGED
|
@@ -5,17 +5,10 @@
|
|
| 5 |
"execution_count": 1,
|
| 6 |
"metadata": {},
|
| 7 |
"outputs": [
|
| 8 |
-
{
|
| 9 |
-
"name": "stdout",
|
| 10 |
-
"output_type": "stream",
|
| 11 |
-
"text": [
|
| 12 |
-
"The history saving thread hit an unexpected error (OperationalError('disk I/O error')).History will not be written to the database.\n"
|
| 13 |
-
]
|
| 14 |
-
},
|
| 15 |
{
|
| 16 |
"data": {
|
| 17 |
"application/vnd.jupyter.widget-view+json": {
|
| 18 |
-
"model_id": "
|
| 19 |
"version_major": 2,
|
| 20 |
"version_minor": 0
|
| 21 |
},
|
|
@@ -370,16 +363,16 @@
|
|
| 370 |
},
|
| 371 |
{
|
| 372 |
"cell_type": "code",
|
| 373 |
-
"execution_count":
|
| 374 |
"metadata": {},
|
| 375 |
"outputs": [],
|
| 376 |
"source": [
|
| 377 |
"from transformers import Seq2SeqTrainingArguments\n",
|
| 378 |
"\n",
|
| 379 |
"training_args = Seq2SeqTrainingArguments(\n",
|
| 380 |
-
" output_dir=\"./\", # change to a repo name of your choice\n",
|
| 381 |
" per_device_train_batch_size=4,\n",
|
| 382 |
-
" gradient_accumulation_steps=
|
| 383 |
" learning_rate=1e-5,\n",
|
| 384 |
" warmup_steps=500,\n",
|
| 385 |
" max_steps=1000,\n",
|
|
@@ -389,8 +382,8 @@
|
|
| 389 |
" per_device_eval_batch_size=2,\n",
|
| 390 |
" predict_with_generate=True,\n",
|
| 391 |
" generation_max_length=225,\n",
|
| 392 |
-
" save_steps=
|
| 393 |
-
" eval_steps=
|
| 394 |
" logging_steps=25,\n",
|
| 395 |
" report_to=[\"tensorboard\"],\n",
|
| 396 |
" load_best_model_at_end=True,\n",
|
|
@@ -402,7 +395,7 @@
|
|
| 402 |
},
|
| 403 |
{
|
| 404 |
"cell_type": "code",
|
| 405 |
-
"execution_count":
|
| 406 |
"metadata": {},
|
| 407 |
"outputs": [],
|
| 408 |
"source": [
|
|
@@ -421,25 +414,24 @@
|
|
| 421 |
},
|
| 422 |
{
|
| 423 |
"cell_type": "code",
|
| 424 |
-
"execution_count":
|
| 425 |
"metadata": {},
|
| 426 |
"outputs": [
|
| 427 |
{
|
| 428 |
"ename": "ValueError",
|
| 429 |
-
"evalue": "
|
| 430 |
"output_type": "error",
|
| 431 |
"traceback": [
|
| 432 |
"\u001b[0;31m---------------------------------------------------------------------------\u001b[0m",
|
| 433 |
"\u001b[0;31mValueError\u001b[0m Traceback (most recent call last)",
|
| 434 |
-
"\u001b[1;32m/u/11/zhangz13/unix/zipei/ID2223_NEW/ID2223_TopGaming/Lab2/whisper_hi_test/asr.ipynb Cell 19\u001b[0m line \u001b[0;36m1\n\u001b[0;32m----> <a href='vscode-notebook-cell://ssh-remote%
|
| 435 |
-
"File \u001b[0;32m~/.conda/envs/id23/lib/python3.8/site-packages/transformers/trainer.py:
|
| 436 |
-
"
|
| 437 |
-
"\u001b[0;31mValueError\u001b[0m: Can't find a valid checkpoint at ./checkpoint-800"
|
| 438 |
]
|
| 439 |
}
|
| 440 |
],
|
| 441 |
"source": [
|
| 442 |
-
"trainer.train(resume_from_checkpoint=
|
| 443 |
]
|
| 444 |
},
|
| 445 |
{
|
|
@@ -447,99 +439,6 @@
|
|
| 447 |
"execution_count": null,
|
| 448 |
"metadata": {},
|
| 449 |
"outputs": [],
|
| 450 |
-
"source": []
|
| 451 |
-
},
|
| 452 |
-
{
|
| 453 |
-
"cell_type": "code",
|
| 454 |
-
"execution_count": 38,
|
| 455 |
-
"metadata": {},
|
| 456 |
-
"outputs": [
|
| 457 |
-
{
|
| 458 |
-
"data": {
|
| 459 |
-
"text/plain": [
|
| 460 |
-
"('whisper-small-hi/tokenizer_config.json',\n",
|
| 461 |
-
" 'whisper-small-hi/special_tokens_map.json',\n",
|
| 462 |
-
" 'whisper-small-hi/vocab.json',\n",
|
| 463 |
-
" 'whisper-small-hi/merges.txt',\n",
|
| 464 |
-
" 'whisper-small-hi/normalizer.json',\n",
|
| 465 |
-
" 'whisper-small-hi/added_tokens.json')"
|
| 466 |
-
]
|
| 467 |
-
},
|
| 468 |
-
"execution_count": 38,
|
| 469 |
-
"metadata": {},
|
| 470 |
-
"output_type": "execute_result"
|
| 471 |
-
}
|
| 472 |
-
],
|
| 473 |
-
"source": [
|
| 474 |
-
"save_directory = 'zipei/ID2223_NEW/ID2223_TopGaming/Lab2/whisper_hi_test/whisper-small-hi'\n",
|
| 475 |
-
"tokenizer.save_pretrained('whisper-small-hi')"
|
| 476 |
-
]
|
| 477 |
-
},
|
| 478 |
-
{
|
| 479 |
-
"cell_type": "code",
|
| 480 |
-
"execution_count": null,
|
| 481 |
-
"metadata": {},
|
| 482 |
-
"outputs": [],
|
| 483 |
-
"source": []
|
| 484 |
-
},
|
| 485 |
-
{
|
| 486 |
-
"cell_type": "code",
|
| 487 |
-
"execution_count": 20,
|
| 488 |
-
"metadata": {},
|
| 489 |
-
"outputs": [
|
| 490 |
-
{
|
| 491 |
-
"data": {
|
| 492 |
-
"application/vnd.jupyter.widget-view+json": {
|
| 493 |
-
"model_id": "84635a07e5714975a3b3e597745d4475",
|
| 494 |
-
"version_major": 2,
|
| 495 |
-
"version_minor": 0
|
| 496 |
-
},
|
| 497 |
-
"text/plain": [
|
| 498 |
-
"model.safetensors: 0%| | 0.00/967M [00:00<?, ?B/s]"
|
| 499 |
-
]
|
| 500 |
-
},
|
| 501 |
-
"metadata": {},
|
| 502 |
-
"output_type": "display_data"
|
| 503 |
-
},
|
| 504 |
-
{
|
| 505 |
-
"data": {
|
| 506 |
-
"application/vnd.jupyter.widget-view+json": {
|
| 507 |
-
"model_id": "b452f2feb12346cfb790a8503ddcf338",
|
| 508 |
-
"version_major": 2,
|
| 509 |
-
"version_minor": 0
|
| 510 |
-
},
|
| 511 |
-
"text/plain": [
|
| 512 |
-
"Upload 2 LFS files: 0%| | 0/2 [00:00<?, ?it/s]"
|
| 513 |
-
]
|
| 514 |
-
},
|
| 515 |
-
"metadata": {},
|
| 516 |
-
"output_type": "display_data"
|
| 517 |
-
},
|
| 518 |
-
{
|
| 519 |
-
"data": {
|
| 520 |
-
"application/vnd.jupyter.widget-view+json": {
|
| 521 |
-
"model_id": "30ea510a97454ff1bbb2cb3ad89e6a5e",
|
| 522 |
-
"version_major": 2,
|
| 523 |
-
"version_minor": 0
|
| 524 |
-
},
|
| 525 |
-
"text/plain": [
|
| 526 |
-
"training_args.bin: 0%| | 0.00/4.73k [00:00<?, ?B/s]"
|
| 527 |
-
]
|
| 528 |
-
},
|
| 529 |
-
"metadata": {},
|
| 530 |
-
"output_type": "display_data"
|
| 531 |
-
},
|
| 532 |
-
{
|
| 533 |
-
"data": {
|
| 534 |
-
"text/plain": [
|
| 535 |
-
"'https://huggingface.co/Zipei-KTH/whisper-small-hi/tree/main/'"
|
| 536 |
-
]
|
| 537 |
-
},
|
| 538 |
-
"execution_count": 20,
|
| 539 |
-
"metadata": {},
|
| 540 |
-
"output_type": "execute_result"
|
| 541 |
-
}
|
| 542 |
-
],
|
| 543 |
"source": [
|
| 544 |
"kwargs = {\n",
|
| 545 |
" \"dataset_tags\": \"mozilla-foundation/common_voice_11_0\",\n",
|
|
@@ -559,129 +458,14 @@
|
|
| 559 |
},
|
| 560 |
{
|
| 561 |
"cell_type": "code",
|
| 562 |
-
"execution_count":
|
| 563 |
"metadata": {},
|
| 564 |
-
"outputs": [
|
| 565 |
-
{
|
| 566 |
-
"data": {
|
| 567 |
-
"application/vnd.jupyter.widget-view+json": {
|
| 568 |
-
"model_id": "42153c06c029428e965a889029e38309",
|
| 569 |
-
"version_major": 2,
|
| 570 |
-
"version_minor": 0
|
| 571 |
-
},
|
| 572 |
-
"text/plain": [
|
| 573 |
-
"model.safetensors: 0%| | 0.00/967M [00:00<?, ?B/s]"
|
| 574 |
-
]
|
| 575 |
-
},
|
| 576 |
-
"metadata": {},
|
| 577 |
-
"output_type": "display_data"
|
| 578 |
-
},
|
| 579 |
-
{
|
| 580 |
-
"data": {
|
| 581 |
-
"application/vnd.jupyter.widget-view+json": {
|
| 582 |
-
"model_id": "eb251857ff3d4ab18e5c58e82735d97d",
|
| 583 |
-
"version_major": 2,
|
| 584 |
-
"version_minor": 0
|
| 585 |
-
},
|
| 586 |
-
"text/plain": [
|
| 587 |
-
"preprocessor_config.json: 0%| | 0.00/339 [00:00<?, ?B/s]"
|
| 588 |
-
]
|
| 589 |
-
},
|
| 590 |
-
"metadata": {},
|
| 591 |
-
"output_type": "display_data"
|
| 592 |
-
},
|
| 593 |
-
{
|
| 594 |
-
"data": {
|
| 595 |
-
"application/vnd.jupyter.widget-view+json": {
|
| 596 |
-
"model_id": "84d90e9074864b3ab818e6293595882e",
|
| 597 |
-
"version_major": 2,
|
| 598 |
-
"version_minor": 0
|
| 599 |
-
},
|
| 600 |
-
"text/plain": [
|
| 601 |
-
"tokenizer_config.json: 0%| | 0.00/283k [00:00<?, ?B/s]"
|
| 602 |
-
]
|
| 603 |
-
},
|
| 604 |
-
"metadata": {},
|
| 605 |
-
"output_type": "display_data"
|
| 606 |
-
},
|
| 607 |
-
{
|
| 608 |
-
"data": {
|
| 609 |
-
"application/vnd.jupyter.widget-view+json": {
|
| 610 |
-
"model_id": "ea9fda628bb44dadadc000213fe5ee03",
|
| 611 |
-
"version_major": 2,
|
| 612 |
-
"version_minor": 0
|
| 613 |
-
},
|
| 614 |
-
"text/plain": [
|
| 615 |
-
"vocab.json: 0%| | 0.00/1.04M [00:00<?, ?B/s]"
|
| 616 |
-
]
|
| 617 |
-
},
|
| 618 |
-
"metadata": {},
|
| 619 |
-
"output_type": "display_data"
|
| 620 |
-
},
|
| 621 |
-
{
|
| 622 |
-
"data": {
|
| 623 |
-
"application/vnd.jupyter.widget-view+json": {
|
| 624 |
-
"model_id": "8d6eb5580e334be6aadc646e59f467b1",
|
| 625 |
-
"version_major": 2,
|
| 626 |
-
"version_minor": 0
|
| 627 |
-
},
|
| 628 |
-
"text/plain": [
|
| 629 |
-
"normalizer.json: 0%| | 0.00/52.7k [00:00<?, ?B/s]"
|
| 630 |
-
]
|
| 631 |
-
},
|
| 632 |
-
"metadata": {},
|
| 633 |
-
"output_type": "display_data"
|
| 634 |
-
},
|
| 635 |
-
{
|
| 636 |
-
"data": {
|
| 637 |
-
"application/vnd.jupyter.widget-view+json": {
|
| 638 |
-
"model_id": "68286349166b4fd4bfba369fb8e9540a",
|
| 639 |
-
"version_major": 2,
|
| 640 |
-
"version_minor": 0
|
| 641 |
-
},
|
| 642 |
-
"text/plain": [
|
| 643 |
-
"added_tokens.json: 0%| | 0.00/34.6k [00:00<?, ?B/s]"
|
| 644 |
-
]
|
| 645 |
-
},
|
| 646 |
-
"metadata": {},
|
| 647 |
-
"output_type": "display_data"
|
| 648 |
-
},
|
| 649 |
-
{
|
| 650 |
-
"data": {
|
| 651 |
-
"application/vnd.jupyter.widget-view+json": {
|
| 652 |
-
"model_id": "86bd824130ab4f85af758b62f365f739",
|
| 653 |
-
"version_major": 2,
|
| 654 |
-
"version_minor": 0
|
| 655 |
-
},
|
| 656 |
-
"text/plain": [
|
| 657 |
-
"special_tokens_map.json: 0%| | 0.00/2.19k [00:00<?, ?B/s]"
|
| 658 |
-
]
|
| 659 |
-
},
|
| 660 |
-
"metadata": {},
|
| 661 |
-
"output_type": "display_data"
|
| 662 |
-
},
|
| 663 |
-
{
|
| 664 |
-
"ename": "TypeError",
|
| 665 |
-
"evalue": "expected str, bytes or os.PathLike object, not NoneType",
|
| 666 |
-
"output_type": "error",
|
| 667 |
-
"traceback": [
|
| 668 |
-
"\u001b[0;31m---------------------------------------------------------------------------\u001b[0m",
|
| 669 |
-
"\u001b[0;31mTypeError\u001b[0m Traceback (most recent call last)",
|
| 670 |
-
"\u001b[1;32m/u/11/zhangz13/unix/zipei/ID2223_NEW/ID2223_TopGaming/Lab2/whisper_hi_test/whisper-small-hi/asr.ipynb Cell 24\u001b[0m line \u001b[0;36m4\n\u001b[1;32m <a href='vscode-notebook-cell://ssh-remote%2Bwake/u/11/zhangz13/unix/zipei/ID2223_NEW/ID2223_TopGaming/Lab2/whisper_hi_test/whisper-small-hi/asr.ipynb#X32sdnNjb2RlLXJlbW90ZQ%3D%3D?line=0'>1</a>\u001b[0m \u001b[39mfrom\u001b[39;00m \u001b[39mtransformers\u001b[39;00m \u001b[39mimport\u001b[39;00m WhisperForConditionalGeneration, WhisperProcessor\n\u001b[1;32m <a href='vscode-notebook-cell://ssh-remote%2Bwake/u/11/zhangz13/unix/zipei/ID2223_NEW/ID2223_TopGaming/Lab2/whisper_hi_test/whisper-small-hi/asr.ipynb#X32sdnNjb2RlLXJlbW90ZQ%3D%3D?line=2'>3</a>\u001b[0m model \u001b[39m=\u001b[39m WhisperForConditionalGeneration\u001b[39m.\u001b[39mfrom_pretrained(\u001b[39m\"\u001b[39m\u001b[39mZipei-KTH/whisper_hi_test\u001b[39m\u001b[39m\"\u001b[39m)\n\u001b[0;32m----> <a href='vscode-notebook-cell://ssh-remote%2Bwake/u/11/zhangz13/unix/zipei/ID2223_NEW/ID2223_TopGaming/Lab2/whisper_hi_test/whisper-small-hi/asr.ipynb#X32sdnNjb2RlLXJlbW90ZQ%3D%3D?line=3'>4</a>\u001b[0m processor \u001b[39m=\u001b[39m WhisperProcessor\u001b[39m.\u001b[39;49mfrom_pretrained(\u001b[39m\"\u001b[39;49m\u001b[39mZipei-KTH/whisper_hi_test\u001b[39;49m\u001b[39m\"\u001b[39;49m)\n",
|
| 671 |
-
"File \u001b[0;32m~/.conda/envs/id23/lib/python3.8/site-packages/transformers/processing_utils.py:228\u001b[0m, in \u001b[0;36mProcessorMixin.from_pretrained\u001b[0;34m(cls, pretrained_model_name_or_path, cache_dir, force_download, local_files_only, token, revision, **kwargs)\u001b[0m\n\u001b[1;32m 225\u001b[0m \u001b[39mif\u001b[39;00m token \u001b[39mis\u001b[39;00m \u001b[39mnot\u001b[39;00m \u001b[39mNone\u001b[39;00m:\n\u001b[1;32m 226\u001b[0m kwargs[\u001b[39m\"\u001b[39m\u001b[39mtoken\u001b[39m\u001b[39m\"\u001b[39m] \u001b[39m=\u001b[39m token\n\u001b[0;32m--> 228\u001b[0m args \u001b[39m=\u001b[39m \u001b[39mcls\u001b[39;49m\u001b[39m.\u001b[39;49m_get_arguments_from_pretrained(pretrained_model_name_or_path, \u001b[39m*\u001b[39;49m\u001b[39m*\u001b[39;49mkwargs)\n\u001b[1;32m 229\u001b[0m \u001b[39mreturn\u001b[39;00m \u001b[39mcls\u001b[39m(\u001b[39m*\u001b[39margs)\n",
|
| 672 |
-
"File \u001b[0;32m~/.conda/envs/id23/lib/python3.8/site-packages/transformers/processing_utils.py:272\u001b[0m, in \u001b[0;36mProcessorMixin._get_arguments_from_pretrained\u001b[0;34m(cls, pretrained_model_name_or_path, **kwargs)\u001b[0m\n\u001b[1;32m 269\u001b[0m \u001b[39melse\u001b[39;00m:\n\u001b[1;32m 270\u001b[0m attribute_class \u001b[39m=\u001b[39m \u001b[39mgetattr\u001b[39m(transformers_module, class_name)\n\u001b[0;32m--> 272\u001b[0m args\u001b[39m.\u001b[39mappend(attribute_class\u001b[39m.\u001b[39;49mfrom_pretrained(pretrained_model_name_or_path, \u001b[39m*\u001b[39;49m\u001b[39m*\u001b[39;49mkwargs))\n\u001b[1;32m 273\u001b[0m \u001b[39mreturn\u001b[39;00m args\n",
|
| 673 |
-
"File \u001b[0;32m~/.conda/envs/id23/lib/python3.8/site-packages/transformers/tokenization_utils_base.py:2024\u001b[0m, in \u001b[0;36mPreTrainedTokenizerBase.from_pretrained\u001b[0;34m(cls, pretrained_model_name_or_path, cache_dir, force_download, local_files_only, token, revision, *init_inputs, **kwargs)\u001b[0m\n\u001b[1;32m 2021\u001b[0m \u001b[39melse\u001b[39;00m:\n\u001b[1;32m 2022\u001b[0m logger\u001b[39m.\u001b[39minfo(\u001b[39mf\u001b[39m\u001b[39m\"\u001b[39m\u001b[39mloading file \u001b[39m\u001b[39m{\u001b[39;00mfile_path\u001b[39m}\u001b[39;00m\u001b[39m from cache at \u001b[39m\u001b[39m{\u001b[39;00mresolved_vocab_files[file_id]\u001b[39m}\u001b[39;00m\u001b[39m\"\u001b[39m)\n\u001b[0;32m-> 2024\u001b[0m \u001b[39mreturn\u001b[39;00m \u001b[39mcls\u001b[39;49m\u001b[39m.\u001b[39;49m_from_pretrained(\n\u001b[1;32m 2025\u001b[0m resolved_vocab_files,\n\u001b[1;32m 2026\u001b[0m pretrained_model_name_or_path,\n\u001b[1;32m 2027\u001b[0m init_configuration,\n\u001b[1;32m 2028\u001b[0m \u001b[39m*\u001b[39;49minit_inputs,\n\u001b[1;32m 2029\u001b[0m token\u001b[39m=\u001b[39;49mtoken,\n\u001b[1;32m 2030\u001b[0m cache_dir\u001b[39m=\u001b[39;49mcache_dir,\n\u001b[1;32m 2031\u001b[0m local_files_only\u001b[39m=\u001b[39;49mlocal_files_only,\n\u001b[1;32m 2032\u001b[0m _commit_hash\u001b[39m=\u001b[39;49mcommit_hash,\n\u001b[1;32m 2033\u001b[0m _is_local\u001b[39m=\u001b[39;49mis_local,\n\u001b[1;32m 2034\u001b[0m \u001b[39m*\u001b[39;49m\u001b[39m*\u001b[39;49mkwargs,\n\u001b[1;32m 2035\u001b[0m )\n",
|
| 674 |
-
"File \u001b[0;32m~/.conda/envs/id23/lib/python3.8/site-packages/transformers/tokenization_utils_base.py:2256\u001b[0m, in \u001b[0;36mPreTrainedTokenizerBase._from_pretrained\u001b[0;34m(cls, resolved_vocab_files, pretrained_model_name_or_path, init_configuration, token, cache_dir, local_files_only, _commit_hash, _is_local, *init_inputs, **kwargs)\u001b[0m\n\u001b[1;32m 2254\u001b[0m \u001b[39m# Instantiate the tokenizer.\u001b[39;00m\n\u001b[1;32m 2255\u001b[0m \u001b[39mtry\u001b[39;00m:\n\u001b[0;32m-> 2256\u001b[0m tokenizer \u001b[39m=\u001b[39m \u001b[39mcls\u001b[39;49m(\u001b[39m*\u001b[39;49minit_inputs, \u001b[39m*\u001b[39;49m\u001b[39m*\u001b[39;49minit_kwargs)\n\u001b[1;32m 2257\u001b[0m \u001b[39mexcept\u001b[39;00m \u001b[39mOSError\u001b[39;00m:\n\u001b[1;32m 2258\u001b[0m \u001b[39mraise\u001b[39;00m \u001b[39mOSError\u001b[39;00m(\n\u001b[1;32m 2259\u001b[0m \u001b[39m\"\u001b[39m\u001b[39mUnable to load vocabulary from file. \u001b[39m\u001b[39m\"\u001b[39m\n\u001b[1;32m 2260\u001b[0m \u001b[39m\"\u001b[39m\u001b[39mPlease check that the provided vocabulary is accessible and not corrupted.\u001b[39m\u001b[39m\"\u001b[39m\n\u001b[1;32m 2261\u001b[0m )\n",
|
| 675 |
-
"File \u001b[0;32m~/.conda/envs/id23/lib/python3.8/site-packages/transformers/models/whisper/tokenization_whisper.py:304\u001b[0m, in \u001b[0;36mWhisperTokenizer.__init__\u001b[0;34m(self, vocab_file, merges_file, normalizer_file, errors, unk_token, bos_token, eos_token, pad_token, add_prefix_space, language, task, predict_timestamps, **kwargs)\u001b[0m\n\u001b[1;32m 302\u001b[0m \u001b[39mself\u001b[39m\u001b[39m.\u001b[39mbyte_encoder \u001b[39m=\u001b[39m bytes_to_unicode()\n\u001b[1;32m 303\u001b[0m \u001b[39mself\u001b[39m\u001b[39m.\u001b[39mbyte_decoder \u001b[39m=\u001b[39m {v: k \u001b[39mfor\u001b[39;00m k, v \u001b[39min\u001b[39;00m \u001b[39mself\u001b[39m\u001b[39m.\u001b[39mbyte_encoder\u001b[39m.\u001b[39mitems()}\n\u001b[0;32m--> 304\u001b[0m \u001b[39mwith\u001b[39;00m \u001b[39mopen\u001b[39;49m(merges_file, encoding\u001b[39m=\u001b[39;49m\u001b[39m\"\u001b[39;49m\u001b[39mutf-8\u001b[39;49m\u001b[39m\"\u001b[39;49m) \u001b[39mas\u001b[39;00m merges_handle:\n\u001b[1;32m 305\u001b[0m bpe_merges \u001b[39m=\u001b[39m merges_handle\u001b[39m.\u001b[39mread()\u001b[39m.\u001b[39msplit(\u001b[39m\"\u001b[39m\u001b[39m\\n\u001b[39;00m\u001b[39m\"\u001b[39m)[\u001b[39m1\u001b[39m:\u001b[39m-\u001b[39m\u001b[39m1\u001b[39m]\n\u001b[1;32m 306\u001b[0m bpe_merges \u001b[39m=\u001b[39m [\u001b[39mtuple\u001b[39m(merge\u001b[39m.\u001b[39msplit()) \u001b[39mfor\u001b[39;00m merge \u001b[39min\u001b[39;00m bpe_merges]\n",
|
| 676 |
-
"\u001b[0;31mTypeError\u001b[0m: expected str, bytes or os.PathLike object, not NoneType"
|
| 677 |
-
]
|
| 678 |
-
}
|
| 679 |
-
],
|
| 680 |
"source": [
|
| 681 |
"from transformers import WhisperForConditionalGeneration, WhisperProcessor\n",
|
| 682 |
"\n",
|
| 683 |
-
"model = WhisperForConditionalGeneration.from_pretrained(\"Zipei-KTH/
|
| 684 |
-
"processor = WhisperProcessor.from_pretrained(\"Zipei-KTH/
|
| 685 |
]
|
| 686 |
},
|
| 687 |
{
|
|
@@ -727,9 +511,9 @@
|
|
| 727 |
],
|
| 728 |
"metadata": {
|
| 729 |
"kernelspec": {
|
| 730 |
-
"display_name": "
|
| 731 |
"language": "python",
|
| 732 |
-
"name": "
|
| 733 |
},
|
| 734 |
"language_info": {
|
| 735 |
"codemirror_mode": {
|
|
|
|
| 5 |
"execution_count": 1,
|
| 6 |
"metadata": {},
|
| 7 |
"outputs": [
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 8 |
{
|
| 9 |
"data": {
|
| 10 |
"application/vnd.jupyter.widget-view+json": {
|
| 11 |
+
"model_id": "442a2279299a4727a8f0fcf086cdd356",
|
| 12 |
"version_major": 2,
|
| 13 |
"version_minor": 0
|
| 14 |
},
|
|
|
|
| 363 |
},
|
| 364 |
{
|
| 365 |
"cell_type": "code",
|
| 366 |
+
"execution_count": 17,
|
| 367 |
"metadata": {},
|
| 368 |
"outputs": [],
|
| 369 |
"source": [
|
| 370 |
"from transformers import Seq2SeqTrainingArguments\n",
|
| 371 |
"\n",
|
| 372 |
"training_args = Seq2SeqTrainingArguments(\n",
|
| 373 |
+
" output_dir=\"./whisper-small-hi\", # change to a repo name of your choice\n",
|
| 374 |
" per_device_train_batch_size=4,\n",
|
| 375 |
+
" gradient_accumulation_steps=4, # increase by 2x for every 2x decrease in batch size\n",
|
| 376 |
" learning_rate=1e-5,\n",
|
| 377 |
" warmup_steps=500,\n",
|
| 378 |
" max_steps=1000,\n",
|
|
|
|
| 382 |
" per_device_eval_batch_size=2,\n",
|
| 383 |
" predict_with_generate=True,\n",
|
| 384 |
" generation_max_length=225,\n",
|
| 385 |
+
" save_steps=500,\n",
|
| 386 |
+
" eval_steps=500,\n",
|
| 387 |
" logging_steps=25,\n",
|
| 388 |
" report_to=[\"tensorboard\"],\n",
|
| 389 |
" load_best_model_at_end=True,\n",
|
|
|
|
| 395 |
},
|
| 396 |
{
|
| 397 |
"cell_type": "code",
|
| 398 |
+
"execution_count": 18,
|
| 399 |
"metadata": {},
|
| 400 |
"outputs": [],
|
| 401 |
"source": [
|
|
|
|
| 414 |
},
|
| 415 |
{
|
| 416 |
"cell_type": "code",
|
| 417 |
+
"execution_count": 19,
|
| 418 |
"metadata": {},
|
| 419 |
"outputs": [
|
| 420 |
{
|
| 421 |
"ename": "ValueError",
|
| 422 |
+
"evalue": "No valid checkpoint found in output directory (./whisper-small-hi)",
|
| 423 |
"output_type": "error",
|
| 424 |
"traceback": [
|
| 425 |
"\u001b[0;31m---------------------------------------------------------------------------\u001b[0m",
|
| 426 |
"\u001b[0;31mValueError\u001b[0m Traceback (most recent call last)",
|
| 427 |
+
"\u001b[1;32m/u/11/zhangz13/unix/zipei/ID2223_NEW/ID2223_TopGaming/Lab2/whisper_hi_test/asr.ipynb Cell 19\u001b[0m line \u001b[0;36m1\n\u001b[0;32m----> <a href='vscode-notebook-cell://ssh-remote%2Bsmurf/u/11/zhangz13/unix/zipei/ID2223_NEW/ID2223_TopGaming/Lab2/whisper_hi_test/asr.ipynb#X24sdnNjb2RlLXJlbW90ZQ%3D%3D?line=0'>1</a>\u001b[0m trainer\u001b[39m.\u001b[39;49mtrain(resume_from_checkpoint\u001b[39m=\u001b[39;49m\u001b[39mTrue\u001b[39;49;00m)\n",
|
| 428 |
+
"File \u001b[0;32m~/.conda/envs/id23/lib/python3.8/site-packages/transformers/trainer.py:1523\u001b[0m, in \u001b[0;36mTrainer.train\u001b[0;34m(self, resume_from_checkpoint, trial, ignore_keys_for_eval, **kwargs)\u001b[0m\n\u001b[1;32m 1521\u001b[0m resume_from_checkpoint \u001b[39m=\u001b[39m get_last_checkpoint(args\u001b[39m.\u001b[39moutput_dir)\n\u001b[1;32m 1522\u001b[0m \u001b[39mif\u001b[39;00m resume_from_checkpoint \u001b[39mis\u001b[39;00m \u001b[39mNone\u001b[39;00m:\n\u001b[0;32m-> 1523\u001b[0m \u001b[39mraise\u001b[39;00m \u001b[39mValueError\u001b[39;00m(\u001b[39mf\u001b[39m\u001b[39m\"\u001b[39m\u001b[39mNo valid checkpoint found in output directory (\u001b[39m\u001b[39m{\u001b[39;00margs\u001b[39m.\u001b[39moutput_dir\u001b[39m}\u001b[39;00m\u001b[39m)\u001b[39m\u001b[39m\"\u001b[39m)\n\u001b[1;32m 1525\u001b[0m \u001b[39mif\u001b[39;00m (\n\u001b[1;32m 1526\u001b[0m resume_from_checkpoint \u001b[39mis\u001b[39;00m \u001b[39mnot\u001b[39;00m \u001b[39mNone\u001b[39;00m\n\u001b[1;32m 1527\u001b[0m \u001b[39mand\u001b[39;00m \u001b[39mnot\u001b[39;00m is_sagemaker_mp_enabled()\n\u001b[1;32m 1528\u001b[0m \u001b[39mand\u001b[39;00m \u001b[39mnot\u001b[39;00m \u001b[39mself\u001b[39m\u001b[39m.\u001b[39mis_deepspeed_enabled\n\u001b[1;32m 1529\u001b[0m \u001b[39mand\u001b[39;00m \u001b[39mnot\u001b[39;00m \u001b[39mself\u001b[39m\u001b[39m.\u001b[39mis_fsdp_enabled\n\u001b[1;32m 1530\u001b[0m ):\n\u001b[1;32m 1531\u001b[0m \u001b[39mself\u001b[39m\u001b[39m.\u001b[39m_load_from_checkpoint(resume_from_checkpoint)\n",
|
| 429 |
+
"\u001b[0;31mValueError\u001b[0m: No valid checkpoint found in output directory (./whisper-small-hi)"
|
|
|
|
| 430 |
]
|
| 431 |
}
|
| 432 |
],
|
| 433 |
"source": [
|
| 434 |
+
"trainer.train(resume_from_checkpoint=True)"
|
| 435 |
]
|
| 436 |
},
|
| 437 |
{
|
|
|
|
| 439 |
"execution_count": null,
|
| 440 |
"metadata": {},
|
| 441 |
"outputs": [],
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 442 |
"source": [
|
| 443 |
"kwargs = {\n",
|
| 444 |
" \"dataset_tags\": \"mozilla-foundation/common_voice_11_0\",\n",
|
|
|
|
| 458 |
},
|
| 459 |
{
|
| 460 |
"cell_type": "code",
|
| 461 |
+
"execution_count": null,
|
| 462 |
"metadata": {},
|
| 463 |
+
"outputs": [],
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 464 |
"source": [
|
| 465 |
"from transformers import WhisperForConditionalGeneration, WhisperProcessor\n",
|
| 466 |
"\n",
|
| 467 |
+
"model = WhisperForConditionalGeneration.from_pretrained(\"Zipei-KTH/whisper-small-hi\")\n",
|
| 468 |
+
"processor = WhisperProcessor.from_pretrained(\"Zipei-KTH/whisper-small-hi\")\n"
|
| 469 |
]
|
| 470 |
},
|
| 471 |
{
|
|
|
|
| 511 |
],
|
| 512 |
"metadata": {
|
| 513 |
"kernelspec": {
|
| 514 |
+
"display_name": "dladenv",
|
| 515 |
"language": "python",
|
| 516 |
+
"name": "python3"
|
| 517 |
},
|
| 518 |
"language_info": {
|
| 519 |
"codemirror_mode": {
|
generation_config.json
ADDED
|
@@ -0,0 +1,263 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
{
|
| 2 |
+
"alignment_heads": [
|
| 3 |
+
[
|
| 4 |
+
5,
|
| 5 |
+
3
|
| 6 |
+
],
|
| 7 |
+
[
|
| 8 |
+
5,
|
| 9 |
+
9
|
| 10 |
+
],
|
| 11 |
+
[
|
| 12 |
+
8,
|
| 13 |
+
0
|
| 14 |
+
],
|
| 15 |
+
[
|
| 16 |
+
8,
|
| 17 |
+
4
|
| 18 |
+
],
|
| 19 |
+
[
|
| 20 |
+
8,
|
| 21 |
+
7
|
| 22 |
+
],
|
| 23 |
+
[
|
| 24 |
+
8,
|
| 25 |
+
8
|
| 26 |
+
],
|
| 27 |
+
[
|
| 28 |
+
9,
|
| 29 |
+
0
|
| 30 |
+
],
|
| 31 |
+
[
|
| 32 |
+
9,
|
| 33 |
+
7
|
| 34 |
+
],
|
| 35 |
+
[
|
| 36 |
+
9,
|
| 37 |
+
9
|
| 38 |
+
],
|
| 39 |
+
[
|
| 40 |
+
10,
|
| 41 |
+
5
|
| 42 |
+
]
|
| 43 |
+
],
|
| 44 |
+
"begin_suppress_tokens": [
|
| 45 |
+
220,
|
| 46 |
+
50257
|
| 47 |
+
],
|
| 48 |
+
"bos_token_id": 50257,
|
| 49 |
+
"decoder_start_token_id": 50258,
|
| 50 |
+
"eos_token_id": 50257,
|
| 51 |
+
"forced_decoder_ids": [
|
| 52 |
+
[
|
| 53 |
+
1,
|
| 54 |
+
null
|
| 55 |
+
],
|
| 56 |
+
[
|
| 57 |
+
2,
|
| 58 |
+
50359
|
| 59 |
+
]
|
| 60 |
+
],
|
| 61 |
+
"is_multilingual": true,
|
| 62 |
+
"lang_to_id": {
|
| 63 |
+
"<|af|>": 50327,
|
| 64 |
+
"<|am|>": 50334,
|
| 65 |
+
"<|ar|>": 50272,
|
| 66 |
+
"<|as|>": 50350,
|
| 67 |
+
"<|az|>": 50304,
|
| 68 |
+
"<|ba|>": 50355,
|
| 69 |
+
"<|be|>": 50330,
|
| 70 |
+
"<|bg|>": 50292,
|
| 71 |
+
"<|bn|>": 50302,
|
| 72 |
+
"<|bo|>": 50347,
|
| 73 |
+
"<|br|>": 50309,
|
| 74 |
+
"<|bs|>": 50315,
|
| 75 |
+
"<|ca|>": 50270,
|
| 76 |
+
"<|cs|>": 50283,
|
| 77 |
+
"<|cy|>": 50297,
|
| 78 |
+
"<|da|>": 50285,
|
| 79 |
+
"<|de|>": 50261,
|
| 80 |
+
"<|el|>": 50281,
|
| 81 |
+
"<|en|>": 50259,
|
| 82 |
+
"<|es|>": 50262,
|
| 83 |
+
"<|et|>": 50307,
|
| 84 |
+
"<|eu|>": 50310,
|
| 85 |
+
"<|fa|>": 50300,
|
| 86 |
+
"<|fi|>": 50277,
|
| 87 |
+
"<|fo|>": 50338,
|
| 88 |
+
"<|fr|>": 50265,
|
| 89 |
+
"<|gl|>": 50319,
|
| 90 |
+
"<|gu|>": 50333,
|
| 91 |
+
"<|haw|>": 50352,
|
| 92 |
+
"<|ha|>": 50354,
|
| 93 |
+
"<|he|>": 50279,
|
| 94 |
+
"<|hi|>": 50276,
|
| 95 |
+
"<|hr|>": 50291,
|
| 96 |
+
"<|ht|>": 50339,
|
| 97 |
+
"<|hu|>": 50286,
|
| 98 |
+
"<|hy|>": 50312,
|
| 99 |
+
"<|id|>": 50275,
|
| 100 |
+
"<|is|>": 50311,
|
| 101 |
+
"<|it|>": 50274,
|
| 102 |
+
"<|ja|>": 50266,
|
| 103 |
+
"<|jw|>": 50356,
|
| 104 |
+
"<|ka|>": 50329,
|
| 105 |
+
"<|kk|>": 50316,
|
| 106 |
+
"<|km|>": 50323,
|
| 107 |
+
"<|kn|>": 50306,
|
| 108 |
+
"<|ko|>": 50264,
|
| 109 |
+
"<|la|>": 50294,
|
| 110 |
+
"<|lb|>": 50345,
|
| 111 |
+
"<|ln|>": 50353,
|
| 112 |
+
"<|lo|>": 50336,
|
| 113 |
+
"<|lt|>": 50293,
|
| 114 |
+
"<|lv|>": 50301,
|
| 115 |
+
"<|mg|>": 50349,
|
| 116 |
+
"<|mi|>": 50295,
|
| 117 |
+
"<|mk|>": 50308,
|
| 118 |
+
"<|ml|>": 50296,
|
| 119 |
+
"<|mn|>": 50314,
|
| 120 |
+
"<|mr|>": 50320,
|
| 121 |
+
"<|ms|>": 50282,
|
| 122 |
+
"<|mt|>": 50343,
|
| 123 |
+
"<|my|>": 50346,
|
| 124 |
+
"<|ne|>": 50313,
|
| 125 |
+
"<|nl|>": 50271,
|
| 126 |
+
"<|nn|>": 50342,
|
| 127 |
+
"<|no|>": 50288,
|
| 128 |
+
"<|oc|>": 50328,
|
| 129 |
+
"<|pa|>": 50321,
|
| 130 |
+
"<|pl|>": 50269,
|
| 131 |
+
"<|ps|>": 50340,
|
| 132 |
+
"<|pt|>": 50267,
|
| 133 |
+
"<|ro|>": 50284,
|
| 134 |
+
"<|ru|>": 50263,
|
| 135 |
+
"<|sa|>": 50344,
|
| 136 |
+
"<|sd|>": 50332,
|
| 137 |
+
"<|si|>": 50322,
|
| 138 |
+
"<|sk|>": 50298,
|
| 139 |
+
"<|sl|>": 50305,
|
| 140 |
+
"<|sn|>": 50324,
|
| 141 |
+
"<|so|>": 50326,
|
| 142 |
+
"<|sq|>": 50317,
|
| 143 |
+
"<|sr|>": 50303,
|
| 144 |
+
"<|su|>": 50357,
|
| 145 |
+
"<|sv|>": 50273,
|
| 146 |
+
"<|sw|>": 50318,
|
| 147 |
+
"<|ta|>": 50287,
|
| 148 |
+
"<|te|>": 50299,
|
| 149 |
+
"<|tg|>": 50331,
|
| 150 |
+
"<|th|>": 50289,
|
| 151 |
+
"<|tk|>": 50341,
|
| 152 |
+
"<|tl|>": 50348,
|
| 153 |
+
"<|tr|>": 50268,
|
| 154 |
+
"<|tt|>": 50351,
|
| 155 |
+
"<|uk|>": 50280,
|
| 156 |
+
"<|ur|>": 50290,
|
| 157 |
+
"<|uz|>": 50337,
|
| 158 |
+
"<|vi|>": 50278,
|
| 159 |
+
"<|yi|>": 50335,
|
| 160 |
+
"<|yo|>": 50325,
|
| 161 |
+
"<|zh|>": 50260
|
| 162 |
+
},
|
| 163 |
+
"max_initial_timestamp_index": 1,
|
| 164 |
+
"max_length": 448,
|
| 165 |
+
"no_timestamps_token_id": 50363,
|
| 166 |
+
"pad_token_id": 50257,
|
| 167 |
+
"return_timestamps": false,
|
| 168 |
+
"suppress_tokens": [
|
| 169 |
+
1,
|
| 170 |
+
2,
|
| 171 |
+
7,
|
| 172 |
+
8,
|
| 173 |
+
9,
|
| 174 |
+
10,
|
| 175 |
+
14,
|
| 176 |
+
25,
|
| 177 |
+
26,
|
| 178 |
+
27,
|
| 179 |
+
28,
|
| 180 |
+
29,
|
| 181 |
+
31,
|
| 182 |
+
58,
|
| 183 |
+
59,
|
| 184 |
+
60,
|
| 185 |
+
61,
|
| 186 |
+
62,
|
| 187 |
+
63,
|
| 188 |
+
90,
|
| 189 |
+
91,
|
| 190 |
+
92,
|
| 191 |
+
93,
|
| 192 |
+
359,
|
| 193 |
+
503,
|
| 194 |
+
522,
|
| 195 |
+
542,
|
| 196 |
+
873,
|
| 197 |
+
893,
|
| 198 |
+
902,
|
| 199 |
+
918,
|
| 200 |
+
922,
|
| 201 |
+
931,
|
| 202 |
+
1350,
|
| 203 |
+
1853,
|
| 204 |
+
1982,
|
| 205 |
+
2460,
|
| 206 |
+
2627,
|
| 207 |
+
3246,
|
| 208 |
+
3253,
|
| 209 |
+
3268,
|
| 210 |
+
3536,
|
| 211 |
+
3846,
|
| 212 |
+
3961,
|
| 213 |
+
4183,
|
| 214 |
+
4667,
|
| 215 |
+
6585,
|
| 216 |
+
6647,
|
| 217 |
+
7273,
|
| 218 |
+
9061,
|
| 219 |
+
9383,
|
| 220 |
+
10428,
|
| 221 |
+
10929,
|
| 222 |
+
11938,
|
| 223 |
+
12033,
|
| 224 |
+
12331,
|
| 225 |
+
12562,
|
| 226 |
+
13793,
|
| 227 |
+
14157,
|
| 228 |
+
14635,
|
| 229 |
+
15265,
|
| 230 |
+
15618,
|
| 231 |
+
16553,
|
| 232 |
+
16604,
|
| 233 |
+
18362,
|
| 234 |
+
18956,
|
| 235 |
+
20075,
|
| 236 |
+
21675,
|
| 237 |
+
22520,
|
| 238 |
+
26130,
|
| 239 |
+
26161,
|
| 240 |
+
26435,
|
| 241 |
+
28279,
|
| 242 |
+
29464,
|
| 243 |
+
31650,
|
| 244 |
+
32302,
|
| 245 |
+
32470,
|
| 246 |
+
36865,
|
| 247 |
+
42863,
|
| 248 |
+
47425,
|
| 249 |
+
49870,
|
| 250 |
+
50254,
|
| 251 |
+
50258,
|
| 252 |
+
50358,
|
| 253 |
+
50359,
|
| 254 |
+
50360,
|
| 255 |
+
50361,
|
| 256 |
+
50362
|
| 257 |
+
],
|
| 258 |
+
"task_to_id": {
|
| 259 |
+
"transcribe": 50359,
|
| 260 |
+
"translate": 50358
|
| 261 |
+
},
|
| 262 |
+
"transformers_version": "4.35.2"
|
| 263 |
+
}
|
model.safetensors
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 966995080
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:fea79cc5083d62d74deb57dacf19ff302c9e320e987f7dccfc49d55b2b84c2da
|
| 3 |
size 966995080
|
runs/Dec07_01-11-40_smurf/events.out.tfevents.1701904301.smurf.965337.0
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:df55c01598422289195729096a6050f903a812c34a2e6bf0c288e901b730855c
|
| 3 |
+
size 17893
|
training_args.bin
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 4728
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:e29181f470382fce52e35a2769c9ed58dabf92a7ebfe37f86e4a495bbe2dd96a
|
| 3 |
size 4728
|