End of training
Browse files
fine-tune-whisper-streaming.ipynb
CHANGED
@@ -1115,7 +1115,7 @@
|
|
1115 |
},
|
1116 |
{
|
1117 |
"cell_type": "code",
|
1118 |
-
"execution_count":
|
1119 |
"id": "6dd0e310-9b07-4133-ac14-2ed2d7524e22",
|
1120 |
"metadata": {},
|
1121 |
"outputs": [],
|
@@ -1141,7 +1141,7 @@
|
|
1141 |
},
|
1142 |
{
|
1143 |
"cell_type": "code",
|
1144 |
-
"execution_count":
|
1145 |
"id": "95737cda-c5dd-4887-a4d0-dfcb0d61d977",
|
1146 |
"metadata": {},
|
1147 |
"outputs": [
|
@@ -1155,32 +1155,20 @@
|
|
1155 |
"Feature extractor saved in ./preprocessor_config.json\n",
|
1156 |
"tokenizer config file saved in ./tokenizer_config.json\n",
|
1157 |
"Special tokens file saved in ./special_tokens_map.json\n",
|
1158 |
-
"added tokens file saved in ./added_tokens.json\n"
|
|
|
|
|
1159 |
]
|
1160 |
},
|
1161 |
{
|
1162 |
"data": {
|
1163 |
"application/vnd.jupyter.widget-view+json": {
|
1164 |
-
"model_id": "
|
1165 |
-
"version_major": 2,
|
1166 |
-
"version_minor": 0
|
1167 |
-
},
|
1168 |
-
"text/plain": [
|
1169 |
-
"Upload file pytorch_model.bin: 0%| | 32.0k/922M [00:00<?, ?B/s]"
|
1170 |
-
]
|
1171 |
-
},
|
1172 |
-
"metadata": {},
|
1173 |
-
"output_type": "display_data"
|
1174 |
-
},
|
1175 |
-
{
|
1176 |
-
"data": {
|
1177 |
-
"application/vnd.jupyter.widget-view+json": {
|
1178 |
-
"model_id": "1c58442a44e84af9a6dff915e036de83",
|
1179 |
"version_major": 2,
|
1180 |
"version_minor": 0
|
1181 |
},
|
1182 |
"text/plain": [
|
1183 |
-
"Upload file
|
1184 |
]
|
1185 |
},
|
1186 |
"metadata": {},
|
@@ -1192,11 +1180,6 @@
|
|
1192 |
"text": [
|
1193 |
"remote: Scanning LFS files for validity, may be slow... \n",
|
1194 |
"remote: LFS file scan complete. \n",
|
1195 |
-
"To https://huggingface.co/kimbochen/whisper-small-zh-tw\n",
|
1196 |
-
" 2ee4cf3..214645d main -> main\n",
|
1197 |
-
"\n",
|
1198 |
-
"Dropping the following result as it does not have all the necessary fields:\n",
|
1199 |
-
"{'task': {'name': 'Automatic Speech Recognition', 'type': 'automatic-speech-recognition'}, 'dataset': {'name': 'Common Voice 11.0', 'type': 'mozilla-foundation/common_voice_11_0', 'config': 'zh-TW', 'split': 'test', 'args': 'zh-TW'}}\n",
|
1200 |
"remote: ----------------------------------------------------------\u001b[0;31m \n",
|
1201 |
"remote: Sorry, your push was rejected during YAML metadata verification: \n",
|
1202 |
"remote: - Error: \"language[0]\" must only contain lowercase characters \n",
|
@@ -1208,31 +1191,26 @@
|
|
1208 |
"To https://huggingface.co/kimbochen/whisper-small-zh-tw\n",
|
1209 |
" ! [remote rejected] main -> main (pre-receive hook declined)\n",
|
1210 |
"error: failed to push some refs to 'https://huggingface.co/kimbochen/whisper-small-zh-tw'\n",
|
1211 |
-
"\n",
|
1212 |
-
"Error pushing update to the model card. Please read logs and retry.\n",
|
1213 |
-
"$remote: ----------------------------------------------------------\u001b[0;31m \n",
|
1214 |
-
"remote: Sorry, your push was rejected during YAML metadata verification: \n",
|
1215 |
-
"remote: - Error: \"language[0]\" must only contain lowercase characters \n",
|
1216 |
-
"remote: - Error: \"language[0]\" with value \"zh-TW\" is not valid. It must be an ISO 639-1, 639-2 or 639-3 code (two/three letters), or a special value like \"code\", \"multilingual\". If you want to use BCP-47 identifiers, you can specify them in language_bcp47.\u001b[0;32m \n",
|
1217 |
-
"remote: ---------------------------------------------------------- \n",
|
1218 |
-
"remote: Please find the documentation at: \n",
|
1219 |
-
"remote: https://huggingface.co/docs/hub/model-cards#model-card-metadata\u001b[0;0m \n",
|
1220 |
-
"remote: ---------------------------------------------------------- \n",
|
1221 |
-
"To https://huggingface.co/kimbochen/whisper-small-zh-tw\n",
|
1222 |
-
" ! [remote rejected] main -> main (pre-receive hook declined)\n",
|
1223 |
-
"error: failed to push some refs to 'https://huggingface.co/kimbochen/whisper-small-zh-tw'\n",
|
1224 |
"\n"
|
1225 |
]
|
1226 |
},
|
1227 |
{
|
1228 |
-
"
|
1229 |
-
|
1230 |
-
|
1231 |
-
|
1232 |
-
|
1233 |
-
|
1234 |
-
|
1235 |
-
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1236 |
}
|
1237 |
],
|
1238 |
"source": [
|
|
|
1115 |
},
|
1116 |
{
|
1117 |
"cell_type": "code",
|
1118 |
+
"execution_count": 25,
|
1119 |
"id": "6dd0e310-9b07-4133-ac14-2ed2d7524e22",
|
1120 |
"metadata": {},
|
1121 |
"outputs": [],
|
|
|
1141 |
},
|
1142 |
{
|
1143 |
"cell_type": "code",
|
1144 |
+
"execution_count": 26,
|
1145 |
"id": "95737cda-c5dd-4887-a4d0-dfcb0d61d977",
|
1146 |
"metadata": {},
|
1147 |
"outputs": [
|
|
|
1155 |
"Feature extractor saved in ./preprocessor_config.json\n",
|
1156 |
"tokenizer config file saved in ./tokenizer_config.json\n",
|
1157 |
"Special tokens file saved in ./special_tokens_map.json\n",
|
1158 |
+
"added tokens file saved in ./added_tokens.json\n",
|
1159 |
+
"Several commits (7) will be pushed upstream.\n",
|
1160 |
+
"The progress bars may be unreliable.\n"
|
1161 |
]
|
1162 |
},
|
1163 |
{
|
1164 |
"data": {
|
1165 |
"application/vnd.jupyter.widget-view+json": {
|
1166 |
+
"model_id": "e28b4896bb24431abb53886d20f8b826",
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1167 |
"version_major": 2,
|
1168 |
"version_minor": 0
|
1169 |
},
|
1170 |
"text/plain": [
|
1171 |
+
"Upload file runs/Dec10_02-58-52_129-213-89-27/events.out.tfevents.1670641248.129-213-89-27.128858.0: 87%|####…"
|
1172 |
]
|
1173 |
},
|
1174 |
"metadata": {},
|
|
|
1180 |
"text": [
|
1181 |
"remote: Scanning LFS files for validity, may be slow... \n",
|
1182 |
"remote: LFS file scan complete. \n",
|
|
|
|
|
|
|
|
|
|
|
1183 |
"remote: ----------------------------------------------------------\u001b[0;31m \n",
|
1184 |
"remote: Sorry, your push was rejected during YAML metadata verification: \n",
|
1185 |
"remote: - Error: \"language[0]\" must only contain lowercase characters \n",
|
|
|
1191 |
"To https://huggingface.co/kimbochen/whisper-small-zh-tw\n",
|
1192 |
" ! [remote rejected] main -> main (pre-receive hook declined)\n",
|
1193 |
"error: failed to push some refs to 'https://huggingface.co/kimbochen/whisper-small-zh-tw'\n",
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1194 |
"\n"
|
1195 |
]
|
1196 |
},
|
1197 |
{
|
1198 |
+
"ename": "OSError",
|
1199 |
+
"evalue": "remote: Scanning LFS files for validity, may be slow... \nremote: LFS file scan complete. \nremote: ----------------------------------------------------------\u001b[0;31m \nremote: Sorry, your push was rejected during YAML metadata verification: \nremote: - Error: \"language[0]\" must only contain lowercase characters \nremote: - Error: \"language[0]\" with value \"zh-TW\" is not valid. It must be an ISO 639-1, 639-2 or 639-3 code (two/three letters), or a special value like \"code\", \"multilingual\". If you want to use BCP-47 identifiers, you can specify them in language_bcp47.\u001b[0;32m \nremote: ---------------------------------------------------------- \nremote: Please find the documentation at: \nremote: https://huggingface.co/docs/hub/model-cards#model-card-metadata\u001b[0;0m \nremote: ---------------------------------------------------------- \nTo https://huggingface.co/kimbochen/whisper-small-zh-tw\n ! [remote rejected] main -> main (pre-receive hook declined)\nerror: failed to push some refs to 'https://huggingface.co/kimbochen/whisper-small-zh-tw'\n",
|
1200 |
+
"output_type": "error",
|
1201 |
+
"traceback": [
|
1202 |
+
"\u001b[0;31m---------------------------------------------------------------------------\u001b[0m",
|
1203 |
+
"\u001b[0;31mCalledProcessError\u001b[0m Traceback (most recent call last)",
|
1204 |
+
"File \u001b[0;32m~/.venv/lib/python3.8/site-packages/huggingface_hub/repository.py:1207\u001b[0m, in \u001b[0;36mRepository.git_push\u001b[0;34m(self, upstream, blocking, auto_lfs_prune)\u001b[0m\n\u001b[1;32m 1206\u001b[0m \u001b[38;5;28;01mif\u001b[39;00m return_code:\n\u001b[0;32m-> 1207\u001b[0m \u001b[38;5;28;01mraise\u001b[39;00m subprocess\u001b[38;5;241m.\u001b[39mCalledProcessError(\n\u001b[1;32m 1208\u001b[0m return_code, process\u001b[38;5;241m.\u001b[39margs, output\u001b[38;5;241m=\u001b[39mstdout, stderr\u001b[38;5;241m=\u001b[39mstderr\n\u001b[1;32m 1209\u001b[0m )\n\u001b[1;32m 1211\u001b[0m \u001b[38;5;28;01mexcept\u001b[39;00m subprocess\u001b[38;5;241m.\u001b[39mCalledProcessError \u001b[38;5;28;01mas\u001b[39;00m exc:\n",
|
1205 |
+
"\u001b[0;31mCalledProcessError\u001b[0m: Command '['git', 'push', '--set-upstream', 'origin', 'main']' returned non-zero exit status 1.",
|
1206 |
+
"\nDuring handling of the above exception, another exception occurred:\n",
|
1207 |
+
"\u001b[0;31mOSError\u001b[0m Traceback (most recent call last)",
|
1208 |
+
"Cell \u001b[0;32mIn[26], line 1\u001b[0m\n\u001b[0;32m----> 1\u001b[0m \u001b[43mtrainer\u001b[49m\u001b[38;5;241;43m.\u001b[39;49m\u001b[43mpush_to_hub\u001b[49m\u001b[43m(\u001b[49m\u001b[38;5;241;43m*\u001b[39;49m\u001b[38;5;241;43m*\u001b[39;49m\u001b[43mkwargs\u001b[49m\u001b[43m)\u001b[49m\n",
|
1209 |
+
"File \u001b[0;32m~/.venv/lib/python3.8/site-packages/transformers/trainer.py:3492\u001b[0m, in \u001b[0;36mTrainer.push_to_hub\u001b[0;34m(self, commit_message, blocking, **kwargs)\u001b[0m\n\u001b[1;32m 3489\u001b[0m \u001b[38;5;28mself\u001b[39m\u001b[38;5;241m.\u001b[39mpush_in_progress\u001b[38;5;241m.\u001b[39m_process\u001b[38;5;241m.\u001b[39mkill()\n\u001b[1;32m 3490\u001b[0m \u001b[38;5;28mself\u001b[39m\u001b[38;5;241m.\u001b[39mpush_in_progress \u001b[38;5;241m=\u001b[39m \u001b[38;5;28;01mNone\u001b[39;00m\n\u001b[0;32m-> 3492\u001b[0m git_head_commit_url \u001b[38;5;241m=\u001b[39m \u001b[38;5;28;43mself\u001b[39;49m\u001b[38;5;241;43m.\u001b[39;49m\u001b[43mrepo\u001b[49m\u001b[38;5;241;43m.\u001b[39;49m\u001b[43mpush_to_hub\u001b[49m\u001b[43m(\u001b[49m\n\u001b[1;32m 3493\u001b[0m \u001b[43m \u001b[49m\u001b[43mcommit_message\u001b[49m\u001b[38;5;241;43m=\u001b[39;49m\u001b[43mcommit_message\u001b[49m\u001b[43m,\u001b[49m\u001b[43m \u001b[49m\u001b[43mblocking\u001b[49m\u001b[38;5;241;43m=\u001b[39;49m\u001b[43mblocking\u001b[49m\u001b[43m,\u001b[49m\u001b[43m \u001b[49m\u001b[43mauto_lfs_prune\u001b[49m\u001b[38;5;241;43m=\u001b[39;49m\u001b[38;5;28;43;01mTrue\u001b[39;49;00m\n\u001b[1;32m 3494\u001b[0m \u001b[43m\u001b[49m\u001b[43m)\u001b[49m\n\u001b[1;32m 3495\u001b[0m \u001b[38;5;66;03m# push separately the model card to be independant from the rest of the model\u001b[39;00m\n\u001b[1;32m 3496\u001b[0m \u001b[38;5;28;01mif\u001b[39;00m \u001b[38;5;28mself\u001b[39m\u001b[38;5;241m.\u001b[39margs\u001b[38;5;241m.\u001b[39mshould_save:\n",
|
1210 |
+
"File \u001b[0;32m~/.venv/lib/python3.8/site-packages/huggingface_hub/repository.py:1432\u001b[0m, in \u001b[0;36mRepository.push_to_hub\u001b[0;34m(self, commit_message, blocking, clean_ok, auto_lfs_prune)\u001b[0m\n\u001b[1;32m 1430\u001b[0m \u001b[38;5;28mself\u001b[39m\u001b[38;5;241m.\u001b[39mgit_add(auto_lfs_track\u001b[38;5;241m=\u001b[39m\u001b[38;5;28;01mTrue\u001b[39;00m)\n\u001b[1;32m 1431\u001b[0m \u001b[38;5;28mself\u001b[39m\u001b[38;5;241m.\u001b[39mgit_commit(commit_message)\n\u001b[0;32m-> 1432\u001b[0m \u001b[38;5;28;01mreturn\u001b[39;00m \u001b[38;5;28;43mself\u001b[39;49m\u001b[38;5;241;43m.\u001b[39;49m\u001b[43mgit_push\u001b[49m\u001b[43m(\u001b[49m\n\u001b[1;32m 1433\u001b[0m \u001b[43m \u001b[49m\u001b[43mupstream\u001b[49m\u001b[38;5;241;43m=\u001b[39;49m\u001b[38;5;124;43mf\u001b[39;49m\u001b[38;5;124;43m\"\u001b[39;49m\u001b[38;5;124;43morigin \u001b[39;49m\u001b[38;5;132;43;01m{\u001b[39;49;00m\u001b[38;5;28;43mself\u001b[39;49m\u001b[38;5;241;43m.\u001b[39;49m\u001b[43mcurrent_branch\u001b[49m\u001b[38;5;132;43;01m}\u001b[39;49;00m\u001b[38;5;124;43m\"\u001b[39;49m\u001b[43m,\u001b[49m\n\u001b[1;32m 1434\u001b[0m \u001b[43m \u001b[49m\u001b[43mblocking\u001b[49m\u001b[38;5;241;43m=\u001b[39;49m\u001b[43mblocking\u001b[49m\u001b[43m,\u001b[49m\n\u001b[1;32m 1435\u001b[0m \u001b[43m \u001b[49m\u001b[43mauto_lfs_prune\u001b[49m\u001b[38;5;241;43m=\u001b[39;49m\u001b[43mauto_lfs_prune\u001b[49m\u001b[43m,\u001b[49m\n\u001b[1;32m 1436\u001b[0m \u001b[43m\u001b[49m\u001b[43m)\u001b[49m\n",
|
1211 |
+
"File \u001b[0;32m~/.venv/lib/python3.8/site-packages/huggingface_hub/repository.py:1212\u001b[0m, in \u001b[0;36mRepository.git_push\u001b[0;34m(self, upstream, blocking, auto_lfs_prune)\u001b[0m\n\u001b[1;32m 1207\u001b[0m \u001b[38;5;28;01mraise\u001b[39;00m subprocess\u001b[38;5;241m.\u001b[39mCalledProcessError(\n\u001b[1;32m 1208\u001b[0m return_code, process\u001b[38;5;241m.\u001b[39margs, output\u001b[38;5;241m=\u001b[39mstdout, stderr\u001b[38;5;241m=\u001b[39mstderr\n\u001b[1;32m 1209\u001b[0m )\n\u001b[1;32m 1211\u001b[0m \u001b[38;5;28;01mexcept\u001b[39;00m subprocess\u001b[38;5;241m.\u001b[39mCalledProcessError \u001b[38;5;28;01mas\u001b[39;00m exc:\n\u001b[0;32m-> 1212\u001b[0m \u001b[38;5;28;01mraise\u001b[39;00m \u001b[38;5;167;01mEnvironmentError\u001b[39;00m(exc\u001b[38;5;241m.\u001b[39mstderr)\n\u001b[1;32m 1214\u001b[0m \u001b[38;5;28;01mif\u001b[39;00m \u001b[38;5;129;01mnot\u001b[39;00m blocking:\n\u001b[1;32m 1216\u001b[0m \u001b[38;5;28;01mdef\u001b[39;00m \u001b[38;5;21mstatus_method\u001b[39m():\n",
|
1212 |
+
"\u001b[0;31mOSError\u001b[0m: remote: Scanning LFS files for validity, may be slow... \nremote: LFS file scan complete. \nremote: ----------------------------------------------------------\u001b[0;31m \nremote: Sorry, your push was rejected during YAML metadata verification: \nremote: - Error: \"language[0]\" must only contain lowercase characters \nremote: - Error: \"language[0]\" with value \"zh-TW\" is not valid. It must be an ISO 639-1, 639-2 or 639-3 code (two/three letters), or a special value like \"code\", \"multilingual\". If you want to use BCP-47 identifiers, you can specify them in language_bcp47.\u001b[0;32m \nremote: ---------------------------------------------------------- \nremote: Please find the documentation at: \nremote: https://huggingface.co/docs/hub/model-cards#model-card-metadata\u001b[0;0m \nremote: ---------------------------------------------------------- \nTo https://huggingface.co/kimbochen/whisper-small-zh-tw\n ! [remote rejected] main -> main (pre-receive hook declined)\nerror: failed to push some refs to 'https://huggingface.co/kimbochen/whisper-small-zh-tw'\n"
|
1213 |
+
]
|
1214 |
}
|
1215 |
],
|
1216 |
"source": [
|