Commit ·
56112cf
1
Parent(s): 376067a
End of training
Browse files- trainv1.ipynb +22 -36
trainv1.ipynb
CHANGED
|
@@ -62007,14 +62007,14 @@
|
|
| 62007 |
},
|
| 62008 |
{
|
| 62009 |
"cell_type": "code",
|
| 62010 |
-
"execution_count":
|
| 62011 |
"id": "606258de-cd15-43e4-8960-52ee02b9cab5",
|
| 62012 |
"metadata": {},
|
| 62013 |
"outputs": [],
|
| 62014 |
"source": [
|
| 62015 |
"kwargs = {\n",
|
| 62016 |
-
" \"dataset_tags\": \"mozilla-foundation/common_voice_11_0, google/fleurs, openslr, collectivat/tv3_parla, projecte-aina/parlament_parla\",\n",
|
| 62017 |
-
" \"dataset\": \"Common Voice 11.0, Fleurs, SLR69, tb3_parla, parlament_parla\", \n",
|
| 62018 |
" \"language\": \"ca\",\n",
|
| 62019 |
" \"model_name\": \"Whisper Medium Ca\",\n",
|
| 62020 |
" \"finetuned_from\": \"openai/whisper-medium\",\n",
|
|
@@ -62025,7 +62025,7 @@
|
|
| 62025 |
},
|
| 62026 |
{
|
| 62027 |
"cell_type": "code",
|
| 62028 |
-
"execution_count":
|
| 62029 |
"id": "31305933-9906-4131-aa4e-6a6a53f4b7cb",
|
| 62030 |
"metadata": {},
|
| 62031 |
"outputs": [
|
|
@@ -62040,18 +62040,8 @@
|
|
| 62040 |
"tokenizer config file saved in ./tokenizer_config.json\n",
|
| 62041 |
"Special tokens file saved in ./special_tokens_map.json\n",
|
| 62042 |
"added tokens file saved in ./added_tokens.json\n",
|
| 62043 |
-
"
|
| 62044 |
-
"
|
| 62045 |
-
"remote: LFS file scan complete. \n",
|
| 62046 |
-
"To https://huggingface.co/JulioCastro/whisper-medium-ca\n",
|
| 62047 |
-
" 5f39e50..d5bf59f main -> main\n",
|
| 62048 |
-
"\n",
|
| 62049 |
-
"Upload file pytorch_model.bin: 100%|██████████| 2.85G/2.85G [01:10<00:00, 43.4MB/s]\n",
|
| 62050 |
-
"\n",
|
| 62051 |
-
"Upload file runs/Dec17_13-19-25_129-146-107-233/events.out.tfevents.1671283218.129-146-107-233.68679.0: 100%|██████████| 18.9k/18.9k [01:10<?, ?B/s]\u001b[A\n",
|
| 62052 |
-
"Upload file runs/Dec17_13-19-25_129-146-107-233/events.out.tfevents.1671283218.129-146-107-233.68679.0: 100%|██████████| 18.9k/18.9k [01:10<?, ?B/s]\u001b[A\n",
|
| 62053 |
-
"Dropping the following result as it does not have all the necessary fields:\n",
|
| 62054 |
-
"{'task': {'name': 'Automatic Speech Recognition', 'type': 'automatic-speech-recognition'}, 'dataset': {'name': 'Common Voice 11.0, Fleurs, SLR69, tb3_parla, parlament_parla', 'type': 'mozilla-foundation/common_voice_11_0, google/fleurs, openslr, collectivat/tv3_parla, projecte-aina/parlament_parla', 'config': 'ca', 'split': 'test', 'args': 'ca'}}\n",
|
| 62055 |
"remote: ----------------------------------------------------------\u001b[0;31m \n",
|
| 62056 |
"remote: Sorry, your push was rejected during YAML metadata verification: \n",
|
| 62057 |
"remote: - Error: \"datasets[0]\" with value \"mozilla-foundation/common_voice_11_0, google/fleurs, openslr, collectivat/tv3_parla, projecte-aina/parlament_parla\" is not valid. It should not contain any whitespace. If possible, use a dataset id from the huggingface Hub.\u001b[0;32m \n",
|
|
@@ -62062,30 +62052,26 @@
|
|
| 62062 |
"To https://huggingface.co/JulioCastro/whisper-medium-ca\n",
|
| 62063 |
" ! [remote rejected] main -> main (pre-receive hook declined)\n",
|
| 62064 |
"error: failed to push some refs to 'https://huggingface.co/JulioCastro/whisper-medium-ca'\n",
|
| 62065 |
-
"\n",
|
| 62066 |
-
"Error pushing update to the model card. Please read logs and retry.\n",
|
| 62067 |
-
"$remote: ----------------------------------------------------------\u001b[0;31m \n",
|
| 62068 |
-
"remote: Sorry, your push was rejected during YAML metadata verification: \n",
|
| 62069 |
-
"remote: - Error: \"datasets[0]\" with value \"mozilla-foundation/common_voice_11_0, google/fleurs, openslr, collectivat/tv3_parla, projecte-aina/parlament_parla\" is not valid. It should not contain any whitespace. If possible, use a dataset id from the huggingface Hub.\u001b[0;32m \n",
|
| 62070 |
-
"remote: ---------------------------------------------------------- \n",
|
| 62071 |
-
"remote: Please find the documentation at: \n",
|
| 62072 |
-
"remote: https://huggingface.co/docs/hub/model-cards#model-card-metadata\u001b[0;0m \n",
|
| 62073 |
-
"remote: ---------------------------------------------------------- \n",
|
| 62074 |
-
"To https://huggingface.co/JulioCastro/whisper-medium-ca\n",
|
| 62075 |
-
" ! [remote rejected] main -> main (pre-receive hook declined)\n",
|
| 62076 |
-
"error: failed to push some refs to 'https://huggingface.co/JulioCastro/whisper-medium-ca'\n",
|
| 62077 |
"\n"
|
| 62078 |
]
|
| 62079 |
},
|
| 62080 |
{
|
| 62081 |
-
"
|
| 62082 |
-
|
| 62083 |
-
|
| 62084 |
-
|
| 62085 |
-
|
| 62086 |
-
|
| 62087 |
-
|
| 62088 |
-
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 62089 |
}
|
| 62090 |
],
|
| 62091 |
"source": [
|
|
|
|
| 62007 |
},
|
| 62008 |
{
|
| 62009 |
"cell_type": "code",
|
| 62010 |
+
"execution_count": 39,
|
| 62011 |
"id": "606258de-cd15-43e4-8960-52ee02b9cab5",
|
| 62012 |
"metadata": {},
|
| 62013 |
"outputs": [],
|
| 62014 |
"source": [
|
| 62015 |
"kwargs = {\n",
|
| 62016 |
+
" \"dataset_tags\": [\"mozilla-foundation/common_voice_11_0\", \"google/fleurs\", \"openslr\", \"collectivat/tv3_parla\", \"projecte-aina/parlament_parla\"],\n",
|
| 62017 |
+
" \"dataset\": [\"Common Voice 11.0\", \"Fleurs\", \"SLR69\", \"tb3_parla\", \"parlament_parla\"], \n",
|
| 62018 |
" \"language\": \"ca\",\n",
|
| 62019 |
" \"model_name\": \"Whisper Medium Ca\",\n",
|
| 62020 |
" \"finetuned_from\": \"openai/whisper-medium\",\n",
|
|
|
|
| 62025 |
},
|
| 62026 |
{
|
| 62027 |
"cell_type": "code",
|
| 62028 |
+
"execution_count": 40,
|
| 62029 |
"id": "31305933-9906-4131-aa4e-6a6a53f4b7cb",
|
| 62030 |
"metadata": {},
|
| 62031 |
"outputs": [
|
|
|
|
| 62040 |
"tokenizer config file saved in ./tokenizer_config.json\n",
|
| 62041 |
"Special tokens file saved in ./special_tokens_map.json\n",
|
| 62042 |
"added tokens file saved in ./added_tokens.json\n",
|
| 62043 |
+
"Several commits (2) will be pushed upstream.\n",
|
| 62044 |
+
"The progress bars may be unreliable.\n",
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 62045 |
"remote: ----------------------------------------------------------\u001b[0;31m \n",
|
| 62046 |
"remote: Sorry, your push was rejected during YAML metadata verification: \n",
|
| 62047 |
"remote: - Error: \"datasets[0]\" with value \"mozilla-foundation/common_voice_11_0, google/fleurs, openslr, collectivat/tv3_parla, projecte-aina/parlament_parla\" is not valid. It should not contain any whitespace. If possible, use a dataset id from the huggingface Hub.\u001b[0;32m \n",
|
|
|
|
| 62052 |
"To https://huggingface.co/JulioCastro/whisper-medium-ca\n",
|
| 62053 |
" ! [remote rejected] main -> main (pre-receive hook declined)\n",
|
| 62054 |
"error: failed to push some refs to 'https://huggingface.co/JulioCastro/whisper-medium-ca'\n",
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 62055 |
"\n"
|
| 62056 |
]
|
| 62057 |
},
|
| 62058 |
{
|
| 62059 |
+
"ename": "OSError",
|
| 62060 |
+
"evalue": "remote: ----------------------------------------------------------\u001b[0;31m \nremote: Sorry, your push was rejected during YAML metadata verification: \nremote: - Error: \"datasets[0]\" with value \"mozilla-foundation/common_voice_11_0, google/fleurs, openslr, collectivat/tv3_parla, projecte-aina/parlament_parla\" is not valid. It should not contain any whitespace. If possible, use a dataset id from the huggingface Hub.\u001b[0;32m \nremote: ---------------------------------------------------------- \nremote: Please find the documentation at: \nremote: https://huggingface.co/docs/hub/model-cards#model-card-metadata\u001b[0;0m \nremote: ---------------------------------------------------------- \nTo https://huggingface.co/JulioCastro/whisper-medium-ca\n ! [remote rejected] main -> main (pre-receive hook declined)\nerror: failed to push some refs to 'https://huggingface.co/JulioCastro/whisper-medium-ca'\n",
|
| 62061 |
+
"output_type": "error",
|
| 62062 |
+
"traceback": [
|
| 62063 |
+
"\u001b[0;31m---------------------------------------------------------------------------\u001b[0m",
|
| 62064 |
+
"\u001b[0;31mCalledProcessError\u001b[0m Traceback (most recent call last)",
|
| 62065 |
+
"File \u001b[0;32m~/hf_env/lib/python3.8/site-packages/huggingface_hub/repository.py:1207\u001b[0m, in \u001b[0;36mRepository.git_push\u001b[0;34m(self, upstream, blocking, auto_lfs_prune)\u001b[0m\n\u001b[1;32m 1206\u001b[0m \u001b[38;5;28;01mif\u001b[39;00m return_code:\n\u001b[0;32m-> 1207\u001b[0m \u001b[38;5;28;01mraise\u001b[39;00m subprocess\u001b[38;5;241m.\u001b[39mCalledProcessError(\n\u001b[1;32m 1208\u001b[0m return_code, process\u001b[38;5;241m.\u001b[39margs, output\u001b[38;5;241m=\u001b[39mstdout, stderr\u001b[38;5;241m=\u001b[39mstderr\n\u001b[1;32m 1209\u001b[0m )\n\u001b[1;32m 1211\u001b[0m \u001b[38;5;28;01mexcept\u001b[39;00m subprocess\u001b[38;5;241m.\u001b[39mCalledProcessError \u001b[38;5;28;01mas\u001b[39;00m exc:\n",
|
| 62066 |
+
"\u001b[0;31mCalledProcessError\u001b[0m: Command '['git', 'push', '--set-upstream', 'origin', 'main']' returned non-zero exit status 1.",
|
| 62067 |
+
"\nDuring handling of the above exception, another exception occurred:\n",
|
| 62068 |
+
"\u001b[0;31mOSError\u001b[0m Traceback (most recent call last)",
|
| 62069 |
+
"Cell \u001b[0;32mIn[40], line 1\u001b[0m\n\u001b[0;32m----> 1\u001b[0m \u001b[43mtrainer\u001b[49m\u001b[38;5;241;43m.\u001b[39;49m\u001b[43mpush_to_hub\u001b[49m\u001b[43m(\u001b[49m\u001b[38;5;241;43m*\u001b[39;49m\u001b[38;5;241;43m*\u001b[39;49m\u001b[43mkwargs\u001b[49m\u001b[43m)\u001b[49m\n",
|
| 62070 |
+
"File \u001b[0;32m~/hf_env/lib/python3.8/site-packages/transformers/trainer.py:3491\u001b[0m, in \u001b[0;36mTrainer.push_to_hub\u001b[0;34m(self, commit_message, blocking, **kwargs)\u001b[0m\n\u001b[1;32m 3488\u001b[0m \u001b[38;5;28mself\u001b[39m\u001b[38;5;241m.\u001b[39mpush_in_progress\u001b[38;5;241m.\u001b[39m_process\u001b[38;5;241m.\u001b[39mkill()\n\u001b[1;32m 3489\u001b[0m \u001b[38;5;28mself\u001b[39m\u001b[38;5;241m.\u001b[39mpush_in_progress \u001b[38;5;241m=\u001b[39m \u001b[38;5;28;01mNone\u001b[39;00m\n\u001b[0;32m-> 3491\u001b[0m git_head_commit_url \u001b[38;5;241m=\u001b[39m \u001b[38;5;28;43mself\u001b[39;49m\u001b[38;5;241;43m.\u001b[39;49m\u001b[43mrepo\u001b[49m\u001b[38;5;241;43m.\u001b[39;49m\u001b[43mpush_to_hub\u001b[49m\u001b[43m(\u001b[49m\n\u001b[1;32m 3492\u001b[0m \u001b[43m \u001b[49m\u001b[43mcommit_message\u001b[49m\u001b[38;5;241;43m=\u001b[39;49m\u001b[43mcommit_message\u001b[49m\u001b[43m,\u001b[49m\u001b[43m \u001b[49m\u001b[43mblocking\u001b[49m\u001b[38;5;241;43m=\u001b[39;49m\u001b[43mblocking\u001b[49m\u001b[43m,\u001b[49m\u001b[43m \u001b[49m\u001b[43mauto_lfs_prune\u001b[49m\u001b[38;5;241;43m=\u001b[39;49m\u001b[38;5;28;43;01mTrue\u001b[39;49;00m\n\u001b[1;32m 3493\u001b[0m \u001b[43m\u001b[49m\u001b[43m)\u001b[49m\n\u001b[1;32m 3494\u001b[0m \u001b[38;5;66;03m# push separately the model card to be independant from the rest of the model\u001b[39;00m\n\u001b[1;32m 3495\u001b[0m \u001b[38;5;28;01mif\u001b[39;00m \u001b[38;5;28mself\u001b[39m\u001b[38;5;241m.\u001b[39margs\u001b[38;5;241m.\u001b[39mshould_save:\n",
|
| 62071 |
+
"File \u001b[0;32m~/hf_env/lib/python3.8/site-packages/huggingface_hub/repository.py:1432\u001b[0m, in \u001b[0;36mRepository.push_to_hub\u001b[0;34m(self, commit_message, blocking, clean_ok, auto_lfs_prune)\u001b[0m\n\u001b[1;32m 1430\u001b[0m \u001b[38;5;28mself\u001b[39m\u001b[38;5;241m.\u001b[39mgit_add(auto_lfs_track\u001b[38;5;241m=\u001b[39m\u001b[38;5;28;01mTrue\u001b[39;00m)\n\u001b[1;32m 1431\u001b[0m \u001b[38;5;28mself\u001b[39m\u001b[38;5;241m.\u001b[39mgit_commit(commit_message)\n\u001b[0;32m-> 1432\u001b[0m \u001b[38;5;28;01mreturn\u001b[39;00m \u001b[38;5;28;43mself\u001b[39;49m\u001b[38;5;241;43m.\u001b[39;49m\u001b[43mgit_push\u001b[49m\u001b[43m(\u001b[49m\n\u001b[1;32m 1433\u001b[0m \u001b[43m \u001b[49m\u001b[43mupstream\u001b[49m\u001b[38;5;241;43m=\u001b[39;49m\u001b[38;5;124;43mf\u001b[39;49m\u001b[38;5;124;43m\"\u001b[39;49m\u001b[38;5;124;43morigin \u001b[39;49m\u001b[38;5;132;43;01m{\u001b[39;49;00m\u001b[38;5;28;43mself\u001b[39;49m\u001b[38;5;241;43m.\u001b[39;49m\u001b[43mcurrent_branch\u001b[49m\u001b[38;5;132;43;01m}\u001b[39;49;00m\u001b[38;5;124;43m\"\u001b[39;49m\u001b[43m,\u001b[49m\n\u001b[1;32m 1434\u001b[0m \u001b[43m \u001b[49m\u001b[43mblocking\u001b[49m\u001b[38;5;241;43m=\u001b[39;49m\u001b[43mblocking\u001b[49m\u001b[43m,\u001b[49m\n\u001b[1;32m 1435\u001b[0m \u001b[43m \u001b[49m\u001b[43mauto_lfs_prune\u001b[49m\u001b[38;5;241;43m=\u001b[39;49m\u001b[43mauto_lfs_prune\u001b[49m\u001b[43m,\u001b[49m\n\u001b[1;32m 1436\u001b[0m \u001b[43m\u001b[49m\u001b[43m)\u001b[49m\n",
|
| 62072 |
+
"File \u001b[0;32m~/hf_env/lib/python3.8/site-packages/huggingface_hub/repository.py:1212\u001b[0m, in \u001b[0;36mRepository.git_push\u001b[0;34m(self, upstream, blocking, auto_lfs_prune)\u001b[0m\n\u001b[1;32m 1207\u001b[0m \u001b[38;5;28;01mraise\u001b[39;00m subprocess\u001b[38;5;241m.\u001b[39mCalledProcessError(\n\u001b[1;32m 1208\u001b[0m return_code, process\u001b[38;5;241m.\u001b[39margs, output\u001b[38;5;241m=\u001b[39mstdout, stderr\u001b[38;5;241m=\u001b[39mstderr\n\u001b[1;32m 1209\u001b[0m )\n\u001b[1;32m 1211\u001b[0m \u001b[38;5;28;01mexcept\u001b[39;00m subprocess\u001b[38;5;241m.\u001b[39mCalledProcessError \u001b[38;5;28;01mas\u001b[39;00m exc:\n\u001b[0;32m-> 1212\u001b[0m \u001b[38;5;28;01mraise\u001b[39;00m \u001b[38;5;167;01mEnvironmentError\u001b[39;00m(exc\u001b[38;5;241m.\u001b[39mstderr)\n\u001b[1;32m 1214\u001b[0m \u001b[38;5;28;01mif\u001b[39;00m \u001b[38;5;129;01mnot\u001b[39;00m blocking:\n\u001b[1;32m 1216\u001b[0m \u001b[38;5;28;01mdef\u001b[39;00m \u001b[38;5;21mstatus_method\u001b[39m():\n",
|
| 62073 |
+
"\u001b[0;31mOSError\u001b[0m: remote: ----------------------------------------------------------\u001b[0;31m \nremote: Sorry, your push was rejected during YAML metadata verification: \nremote: - Error: \"datasets[0]\" with value \"mozilla-foundation/common_voice_11_0, google/fleurs, openslr, collectivat/tv3_parla, projecte-aina/parlament_parla\" is not valid. It should not contain any whitespace. If possible, use a dataset id from the huggingface Hub.\u001b[0;32m \nremote: ---------------------------------------------------------- \nremote: Please find the documentation at: \nremote: https://huggingface.co/docs/hub/model-cards#model-card-metadata\u001b[0;0m \nremote: ---------------------------------------------------------- \nTo https://huggingface.co/JulioCastro/whisper-medium-ca\n ! [remote rejected] main -> main (pre-receive hook declined)\nerror: failed to push some refs to 'https://huggingface.co/JulioCastro/whisper-medium-ca'\n"
|
| 62074 |
+
]
|
| 62075 |
}
|
| 62076 |
],
|
| 62077 |
"source": [
|