JulioCastro committed on
Commit
56112cf
·
1 Parent(s): 376067a

End of training

Browse files
Files changed (1) hide show
  1. trainv1.ipynb +22 -36
trainv1.ipynb CHANGED
@@ -62007,14 +62007,14 @@
62007
  },
62008
  {
62009
  "cell_type": "code",
62010
- "execution_count": 36,
62011
  "id": "606258de-cd15-43e4-8960-52ee02b9cab5",
62012
  "metadata": {},
62013
  "outputs": [],
62014
  "source": [
62015
  "kwargs = {\n",
62016
- " \"dataset_tags\": \"mozilla-foundation/common_voice_11_0, google/fleurs, openslr, collectivat/tv3_parla, projecte-aina/parlament_parla\",\n",
62017
- " \"dataset\": \"Common Voice 11.0, Fleurs, SLR69, tb3_parla, parlament_parla\", \n",
62018
  " \"language\": \"ca\",\n",
62019
  " \"model_name\": \"Whisper Medium Ca\",\n",
62020
  " \"finetuned_from\": \"openai/whisper-medium\",\n",
@@ -62025,7 +62025,7 @@
62025
  },
62026
  {
62027
  "cell_type": "code",
62028
- "execution_count": 37,
62029
  "id": "31305933-9906-4131-aa4e-6a6a53f4b7cb",
62030
  "metadata": {},
62031
  "outputs": [
@@ -62040,18 +62040,8 @@
62040
  "tokenizer config file saved in ./tokenizer_config.json\n",
62041
  "Special tokens file saved in ./special_tokens_map.json\n",
62042
  "added tokens file saved in ./added_tokens.json\n",
62043
- "Upload file pytorch_model.bin: 0%| | 32.0k/2.85G [00:00<?, ?B/s]\n",
62044
- "Upload file pytorch_model.bin: 100%|█████████▉| 2.84G/2.85G [01:06<00:00, 55.2MB/s]146-107-233.68679.0: 100%|██████████| 18.9k/18.9k [00:00<?, ?B/s]\u001b[Aremote: Scanning LFS files for validity, may be slow... \n",
62045
- "remote: LFS file scan complete. \n",
62046
- "To https://huggingface.co/JulioCastro/whisper-medium-ca\n",
62047
- " 5f39e50..d5bf59f main -> main\n",
62048
- "\n",
62049
- "Upload file pytorch_model.bin: 100%|██████████| 2.85G/2.85G [01:10<00:00, 43.4MB/s]\n",
62050
- "\n",
62051
- "Upload file runs/Dec17_13-19-25_129-146-107-233/events.out.tfevents.1671283218.129-146-107-233.68679.0: 100%|██████████| 18.9k/18.9k [01:10<?, ?B/s]\u001b[A\n",
62052
- "Upload file runs/Dec17_13-19-25_129-146-107-233/events.out.tfevents.1671283218.129-146-107-233.68679.0: 100%|██████████| 18.9k/18.9k [01:10<?, ?B/s]\u001b[A\n",
62053
- "Dropping the following result as it does not have all the necessary fields:\n",
62054
- "{'task': {'name': 'Automatic Speech Recognition', 'type': 'automatic-speech-recognition'}, 'dataset': {'name': 'Common Voice 11.0, Fleurs, SLR69, tb3_parla, parlament_parla', 'type': 'mozilla-foundation/common_voice_11_0, google/fleurs, openslr, collectivat/tv3_parla, projecte-aina/parlament_parla', 'config': 'ca', 'split': 'test', 'args': 'ca'}}\n",
62055
  "remote: ----------------------------------------------------------\u001b[0;31m \n",
62056
  "remote: Sorry, your push was rejected during YAML metadata verification: \n",
62057
  "remote: - Error: \"datasets[0]\" with value \"mozilla-foundation/common_voice_11_0, google/fleurs, openslr, collectivat/tv3_parla, projecte-aina/parlament_parla\" is not valid. It should not contain any whitespace. If possible, use a dataset id from the huggingface Hub.\u001b[0;32m \n",
@@ -62062,30 +62052,26 @@
62062
  "To https://huggingface.co/JulioCastro/whisper-medium-ca\n",
62063
  " ! [remote rejected] main -> main (pre-receive hook declined)\n",
62064
  "error: failed to push some refs to 'https://huggingface.co/JulioCastro/whisper-medium-ca'\n",
62065
- "\n",
62066
- "Error pushing update to the model card. Please read logs and retry.\n",
62067
- "$remote: ----------------------------------------------------------\u001b[0;31m \n",
62068
- "remote: Sorry, your push was rejected during YAML metadata verification: \n",
62069
- "remote: - Error: \"datasets[0]\" with value \"mozilla-foundation/common_voice_11_0, google/fleurs, openslr, collectivat/tv3_parla, projecte-aina/parlament_parla\" is not valid. It should not contain any whitespace. If possible, use a dataset id from the huggingface Hub.\u001b[0;32m \n",
62070
- "remote: ---------------------------------------------------------- \n",
62071
- "remote: Please find the documentation at: \n",
62072
- "remote: https://huggingface.co/docs/hub/model-cards#model-card-metadata\u001b[0;0m \n",
62073
- "remote: ---------------------------------------------------------- \n",
62074
- "To https://huggingface.co/JulioCastro/whisper-medium-ca\n",
62075
- " ! [remote rejected] main -> main (pre-receive hook declined)\n",
62076
- "error: failed to push some refs to 'https://huggingface.co/JulioCastro/whisper-medium-ca'\n",
62077
  "\n"
62078
  ]
62079
  },
62080
  {
62081
- "data": {
62082
- "text/plain": [
62083
- "'https://huggingface.co/JulioCastro/whisper-medium-ca/commit/d5bf59fe2836dc4c05f6961d7fbfb66fb0800b51'"
62084
- ]
62085
- },
62086
- "execution_count": 37,
62087
- "metadata": {},
62088
- "output_type": "execute_result"
 
 
 
 
 
 
 
 
62089
  }
62090
  ],
62091
  "source": [
 
62007
  },
62008
  {
62009
  "cell_type": "code",
62010
+ "execution_count": 39,
62011
  "id": "606258de-cd15-43e4-8960-52ee02b9cab5",
62012
  "metadata": {},
62013
  "outputs": [],
62014
  "source": [
62015
  "kwargs = {\n",
62016
+ " \"dataset_tags\": [\"mozilla-foundation/common_voice_11_0\", \"google/fleurs\", \"openslr\", \"collectivat/tv3_parla\", \"projecte-aina/parlament_parla\"],\n",
62017
+ " \"dataset\": [\"Common Voice 11.0\", \"Fleurs\", \"SLR69\", \"tb3_parla\", \"parlament_parla\"], \n",
62018
  " \"language\": \"ca\",\n",
62019
  " \"model_name\": \"Whisper Medium Ca\",\n",
62020
  " \"finetuned_from\": \"openai/whisper-medium\",\n",
 
62025
  },
62026
  {
62027
  "cell_type": "code",
62028
+ "execution_count": 40,
62029
  "id": "31305933-9906-4131-aa4e-6a6a53f4b7cb",
62030
  "metadata": {},
62031
  "outputs": [
 
62040
  "tokenizer config file saved in ./tokenizer_config.json\n",
62041
  "Special tokens file saved in ./special_tokens_map.json\n",
62042
  "added tokens file saved in ./added_tokens.json\n",
62043
+ "Several commits (2) will be pushed upstream.\n",
62044
+ "The progress bars may be unreliable.\n",
 
 
 
 
 
 
 
 
 
 
62045
  "remote: ----------------------------------------------------------\u001b[0;31m \n",
62046
  "remote: Sorry, your push was rejected during YAML metadata verification: \n",
62047
  "remote: - Error: \"datasets[0]\" with value \"mozilla-foundation/common_voice_11_0, google/fleurs, openslr, collectivat/tv3_parla, projecte-aina/parlament_parla\" is not valid. It should not contain any whitespace. If possible, use a dataset id from the huggingface Hub.\u001b[0;32m \n",
 
62052
  "To https://huggingface.co/JulioCastro/whisper-medium-ca\n",
62053
  " ! [remote rejected] main -> main (pre-receive hook declined)\n",
62054
  "error: failed to push some refs to 'https://huggingface.co/JulioCastro/whisper-medium-ca'\n",
 
 
 
 
 
 
 
 
 
 
 
 
62055
  "\n"
62056
  ]
62057
  },
62058
  {
62059
+ "ename": "OSError",
62060
+ "evalue": "remote: ----------------------------------------------------------\u001b[0;31m \nremote: Sorry, your push was rejected during YAML metadata verification: \nremote: - Error: \"datasets[0]\" with value \"mozilla-foundation/common_voice_11_0, google/fleurs, openslr, collectivat/tv3_parla, projecte-aina/parlament_parla\" is not valid. It should not contain any whitespace. If possible, use a dataset id from the huggingface Hub.\u001b[0;32m \nremote: ---------------------------------------------------------- \nremote: Please find the documentation at: \nremote: https://huggingface.co/docs/hub/model-cards#model-card-metadata\u001b[0;0m \nremote: ---------------------------------------------------------- \nTo https://huggingface.co/JulioCastro/whisper-medium-ca\n ! [remote rejected] main -> main (pre-receive hook declined)\nerror: failed to push some refs to 'https://huggingface.co/JulioCastro/whisper-medium-ca'\n",
62061
+ "output_type": "error",
62062
+ "traceback": [
62063
+ "\u001b[0;31m---------------------------------------------------------------------------\u001b[0m",
62064
+ "\u001b[0;31mCalledProcessError\u001b[0m Traceback (most recent call last)",
62065
+ "File \u001b[0;32m~/hf_env/lib/python3.8/site-packages/huggingface_hub/repository.py:1207\u001b[0m, in \u001b[0;36mRepository.git_push\u001b[0;34m(self, upstream, blocking, auto_lfs_prune)\u001b[0m\n\u001b[1;32m 1206\u001b[0m \u001b[38;5;28;01mif\u001b[39;00m return_code:\n\u001b[0;32m-> 1207\u001b[0m \u001b[38;5;28;01mraise\u001b[39;00m subprocess\u001b[38;5;241m.\u001b[39mCalledProcessError(\n\u001b[1;32m 1208\u001b[0m return_code, process\u001b[38;5;241m.\u001b[39margs, output\u001b[38;5;241m=\u001b[39mstdout, stderr\u001b[38;5;241m=\u001b[39mstderr\n\u001b[1;32m 1209\u001b[0m )\n\u001b[1;32m 1211\u001b[0m \u001b[38;5;28;01mexcept\u001b[39;00m subprocess\u001b[38;5;241m.\u001b[39mCalledProcessError \u001b[38;5;28;01mas\u001b[39;00m exc:\n",
62066
+ "\u001b[0;31mCalledProcessError\u001b[0m: Command '['git', 'push', '--set-upstream', 'origin', 'main']' returned non-zero exit status 1.",
62067
+ "\nDuring handling of the above exception, another exception occurred:\n",
62068
+ "\u001b[0;31mOSError\u001b[0m Traceback (most recent call last)",
62069
+ "Cell \u001b[0;32mIn[40], line 1\u001b[0m\n\u001b[0;32m----> 1\u001b[0m \u001b[43mtrainer\u001b[49m\u001b[38;5;241;43m.\u001b[39;49m\u001b[43mpush_to_hub\u001b[49m\u001b[43m(\u001b[49m\u001b[38;5;241;43m*\u001b[39;49m\u001b[38;5;241;43m*\u001b[39;49m\u001b[43mkwargs\u001b[49m\u001b[43m)\u001b[49m\n",
62070
+ "File \u001b[0;32m~/hf_env/lib/python3.8/site-packages/transformers/trainer.py:3491\u001b[0m, in \u001b[0;36mTrainer.push_to_hub\u001b[0;34m(self, commit_message, blocking, **kwargs)\u001b[0m\n\u001b[1;32m 3488\u001b[0m \u001b[38;5;28mself\u001b[39m\u001b[38;5;241m.\u001b[39mpush_in_progress\u001b[38;5;241m.\u001b[39m_process\u001b[38;5;241m.\u001b[39mkill()\n\u001b[1;32m 3489\u001b[0m \u001b[38;5;28mself\u001b[39m\u001b[38;5;241m.\u001b[39mpush_in_progress \u001b[38;5;241m=\u001b[39m \u001b[38;5;28;01mNone\u001b[39;00m\n\u001b[0;32m-> 3491\u001b[0m git_head_commit_url \u001b[38;5;241m=\u001b[39m \u001b[38;5;28;43mself\u001b[39;49m\u001b[38;5;241;43m.\u001b[39;49m\u001b[43mrepo\u001b[49m\u001b[38;5;241;43m.\u001b[39;49m\u001b[43mpush_to_hub\u001b[49m\u001b[43m(\u001b[49m\n\u001b[1;32m 3492\u001b[0m \u001b[43m \u001b[49m\u001b[43mcommit_message\u001b[49m\u001b[38;5;241;43m=\u001b[39;49m\u001b[43mcommit_message\u001b[49m\u001b[43m,\u001b[49m\u001b[43m \u001b[49m\u001b[43mblocking\u001b[49m\u001b[38;5;241;43m=\u001b[39;49m\u001b[43mblocking\u001b[49m\u001b[43m,\u001b[49m\u001b[43m \u001b[49m\u001b[43mauto_lfs_prune\u001b[49m\u001b[38;5;241;43m=\u001b[39;49m\u001b[38;5;28;43;01mTrue\u001b[39;49;00m\n\u001b[1;32m 3493\u001b[0m \u001b[43m\u001b[49m\u001b[43m)\u001b[49m\n\u001b[1;32m 3494\u001b[0m \u001b[38;5;66;03m# push separately the model card to be independant from the rest of the model\u001b[39;00m\n\u001b[1;32m 3495\u001b[0m \u001b[38;5;28;01mif\u001b[39;00m \u001b[38;5;28mself\u001b[39m\u001b[38;5;241m.\u001b[39margs\u001b[38;5;241m.\u001b[39mshould_save:\n",
62071
+ "File \u001b[0;32m~/hf_env/lib/python3.8/site-packages/huggingface_hub/repository.py:1432\u001b[0m, in \u001b[0;36mRepository.push_to_hub\u001b[0;34m(self, commit_message, blocking, clean_ok, auto_lfs_prune)\u001b[0m\n\u001b[1;32m 1430\u001b[0m \u001b[38;5;28mself\u001b[39m\u001b[38;5;241m.\u001b[39mgit_add(auto_lfs_track\u001b[38;5;241m=\u001b[39m\u001b[38;5;28;01mTrue\u001b[39;00m)\n\u001b[1;32m 1431\u001b[0m \u001b[38;5;28mself\u001b[39m\u001b[38;5;241m.\u001b[39mgit_commit(commit_message)\n\u001b[0;32m-> 1432\u001b[0m \u001b[38;5;28;01mreturn\u001b[39;00m \u001b[38;5;28;43mself\u001b[39;49m\u001b[38;5;241;43m.\u001b[39;49m\u001b[43mgit_push\u001b[49m\u001b[43m(\u001b[49m\n\u001b[1;32m 1433\u001b[0m \u001b[43m \u001b[49m\u001b[43mupstream\u001b[49m\u001b[38;5;241;43m=\u001b[39;49m\u001b[38;5;124;43mf\u001b[39;49m\u001b[38;5;124;43m\"\u001b[39;49m\u001b[38;5;124;43morigin \u001b[39;49m\u001b[38;5;132;43;01m{\u001b[39;49;00m\u001b[38;5;28;43mself\u001b[39;49m\u001b[38;5;241;43m.\u001b[39;49m\u001b[43mcurrent_branch\u001b[49m\u001b[38;5;132;43;01m}\u001b[39;49;00m\u001b[38;5;124;43m\"\u001b[39;49m\u001b[43m,\u001b[49m\n\u001b[1;32m 1434\u001b[0m \u001b[43m \u001b[49m\u001b[43mblocking\u001b[49m\u001b[38;5;241;43m=\u001b[39;49m\u001b[43mblocking\u001b[49m\u001b[43m,\u001b[49m\n\u001b[1;32m 1435\u001b[0m \u001b[43m \u001b[49m\u001b[43mauto_lfs_prune\u001b[49m\u001b[38;5;241;43m=\u001b[39;49m\u001b[43mauto_lfs_prune\u001b[49m\u001b[43m,\u001b[49m\n\u001b[1;32m 1436\u001b[0m \u001b[43m\u001b[49m\u001b[43m)\u001b[49m\n",
62072
+ "File \u001b[0;32m~/hf_env/lib/python3.8/site-packages/huggingface_hub/repository.py:1212\u001b[0m, in \u001b[0;36mRepository.git_push\u001b[0;34m(self, upstream, blocking, auto_lfs_prune)\u001b[0m\n\u001b[1;32m 1207\u001b[0m \u001b[38;5;28;01mraise\u001b[39;00m subprocess\u001b[38;5;241m.\u001b[39mCalledProcessError(\n\u001b[1;32m 1208\u001b[0m return_code, process\u001b[38;5;241m.\u001b[39margs, output\u001b[38;5;241m=\u001b[39mstdout, stderr\u001b[38;5;241m=\u001b[39mstderr\n\u001b[1;32m 1209\u001b[0m )\n\u001b[1;32m 1211\u001b[0m \u001b[38;5;28;01mexcept\u001b[39;00m subprocess\u001b[38;5;241m.\u001b[39mCalledProcessError \u001b[38;5;28;01mas\u001b[39;00m exc:\n\u001b[0;32m-> 1212\u001b[0m \u001b[38;5;28;01mraise\u001b[39;00m \u001b[38;5;167;01mEnvironmentError\u001b[39;00m(exc\u001b[38;5;241m.\u001b[39mstderr)\n\u001b[1;32m 1214\u001b[0m \u001b[38;5;28;01mif\u001b[39;00m \u001b[38;5;129;01mnot\u001b[39;00m blocking:\n\u001b[1;32m 1216\u001b[0m \u001b[38;5;28;01mdef\u001b[39;00m \u001b[38;5;21mstatus_method\u001b[39m():\n",
62073
+ "\u001b[0;31mOSError\u001b[0m: remote: ----------------------------------------------------------\u001b[0;31m \nremote: Sorry, your push was rejected during YAML metadata verification: \nremote: - Error: \"datasets[0]\" with value \"mozilla-foundation/common_voice_11_0, google/fleurs, openslr, collectivat/tv3_parla, projecte-aina/parlament_parla\" is not valid. It should not contain any whitespace. If possible, use a dataset id from the huggingface Hub.\u001b[0;32m \nremote: ---------------------------------------------------------- \nremote: Please find the documentation at: \nremote: https://huggingface.co/docs/hub/model-cards#model-card-metadata\u001b[0;0m \nremote: ---------------------------------------------------------- \nTo https://huggingface.co/JulioCastro/whisper-medium-ca\n ! [remote rejected] main -> main (pre-receive hook declined)\nerror: failed to push some refs to 'https://huggingface.co/JulioCastro/whisper-medium-ca'\n"
62074
+ ]
62075
  }
62076
  ],
62077
  "source": [