huseinzol05
commited on
Commit
•
0445aa8
1
Parent(s):
9204f13
Upload evaluate-gpu.ipynb
Browse files- evaluate-gpu.ipynb +82 -99
evaluate-gpu.ipynb
CHANGED
@@ -158,19 +158,22 @@
|
|
158 |
{
|
159 |
"data": {
|
160 |
"text/plain": [
|
161 |
-
"[('
|
162 |
-
"
|
163 |
-
" ('singlish-test/
|
164 |
-
"
|
165 |
-
" ('singlish-test/
|
166 |
-
"
|
167 |
-
"
|
168 |
-
" ('singlish-test/
|
169 |
-
"
|
170 |
-
" ('singlish-test/
|
171 |
-
"
|
172 |
-
" ('
|
173 |
-
"
|
|
|
|
|
|
|
174 |
]
|
175 |
},
|
176 |
"execution_count": 8,
|
@@ -249,7 +252,7 @@
|
|
249 |
"outputs": [],
|
250 |
"source": [
|
251 |
"model = AutoModelForCTC.from_pretrained(\n",
|
252 |
-
" './wav2vec2-mixed-v3/checkpoint-
|
253 |
" ctc_loss_reduction=\"mean\",\n",
|
254 |
" pad_token_id=tokenizer.pad_token_id,\n",
|
255 |
" vocab_size=len(tokenizer),\n",
|
@@ -300,10 +303,10 @@
|
|
300 |
{
|
301 |
"data": {
|
302 |
"text/plain": [
|
303 |
-
"['
|
304 |
-
" '
|
305 |
-
" '
|
306 |
-
" '
|
307 |
]
|
308 |
},
|
309 |
"execution_count": 14,
|
@@ -359,10 +362,10 @@
|
|
359 |
"name": "stdout",
|
360 |
"output_type": "stream",
|
361 |
"text": [
|
362 |
-
"0
|
363 |
-
"1
|
364 |
-
"2
|
365 |
-
"3
|
366 |
]
|
367 |
}
|
368 |
],
|
@@ -382,10 +385,10 @@
|
|
382 |
{
|
383 |
"data": {
|
384 |
"text/plain": [
|
385 |
-
"['
|
386 |
-
" '
|
387 |
-
" '
|
388 |
-
" '
|
389 |
]
|
390 |
},
|
391 |
"execution_count": 18,
|
@@ -440,7 +443,7 @@
|
|
440 |
"name": "stderr",
|
441 |
"output_type": "stream",
|
442 |
"text": [
|
443 |
-
"100%|██████████| 1240/1240 [
|
444 |
]
|
445 |
}
|
446 |
],
|
@@ -478,20 +481,20 @@
|
|
478 |
},
|
479 |
{
|
480 |
"cell_type": "code",
|
481 |
-
"execution_count":
|
482 |
"id": "6c6ce8ef",
|
483 |
"metadata": {},
|
484 |
"outputs": [
|
485 |
{
|
486 |
"data": {
|
487 |
"text/plain": [
|
488 |
-
"(0.
|
489 |
-
" 0.
|
490 |
-
" 0.
|
491 |
-
" 0.
|
492 |
]
|
493 |
},
|
494 |
-
"execution_count":
|
495 |
"metadata": {},
|
496 |
"output_type": "execute_result"
|
497 |
}
|
@@ -502,7 +505,7 @@
|
|
502 |
},
|
503 |
{
|
504 |
"cell_type": "code",
|
505 |
-
"execution_count":
|
506 |
"id": "cf53914e",
|
507 |
"metadata": {},
|
508 |
"outputs": [],
|
@@ -514,20 +517,20 @@
|
|
514 |
},
|
515 |
{
|
516 |
"cell_type": "code",
|
517 |
-
"execution_count":
|
518 |
"id": "b1558987",
|
519 |
"metadata": {},
|
520 |
"outputs": [
|
521 |
{
|
522 |
"data": {
|
523 |
"text/plain": [
|
524 |
-
"(0.
|
525 |
-
" 0.
|
526 |
-
" 0.
|
527 |
-
" 0.
|
528 |
]
|
529 |
},
|
530 |
-
"execution_count":
|
531 |
"metadata": {},
|
532 |
"output_type": "execute_result"
|
533 |
}
|
@@ -538,20 +541,20 @@
|
|
538 |
},
|
539 |
{
|
540 |
"cell_type": "code",
|
541 |
-
"execution_count":
|
542 |
"id": "f340cde7",
|
543 |
"metadata": {},
|
544 |
"outputs": [
|
545 |
{
|
546 |
"data": {
|
547 |
"text/plain": [
|
548 |
-
"(0.
|
549 |
-
" 0.
|
550 |
-
" 0.
|
551 |
-
" 0.
|
552 |
]
|
553 |
},
|
554 |
-
"execution_count":
|
555 |
"metadata": {},
|
556 |
"output_type": "execute_result"
|
557 |
}
|
@@ -562,20 +565,20 @@
|
|
562 |
},
|
563 |
{
|
564 |
"cell_type": "code",
|
565 |
-
"execution_count":
|
566 |
"id": "cbc2539f",
|
567 |
"metadata": {},
|
568 |
"outputs": [
|
569 |
{
|
570 |
"data": {
|
571 |
"text/plain": [
|
572 |
-
"(0.
|
573 |
-
" 0.
|
574 |
-
" 0.
|
575 |
-
" 0.
|
576 |
]
|
577 |
},
|
578 |
-
"execution_count":
|
579 |
"metadata": {},
|
580 |
"output_type": "execute_result"
|
581 |
}
|
@@ -586,27 +589,14 @@
|
|
586 |
},
|
587 |
{
|
588 |
"cell_type": "code",
|
589 |
-
"execution_count":
|
590 |
"id": "4c543d0c",
|
591 |
"metadata": {},
|
592 |
"outputs": [
|
593 |
-
{
|
594 |
-
"name": "stderr",
|
595 |
-
"output_type": "stream",
|
596 |
-
"text": [
|
597 |
-
"/home/ubuntu/.local/lib/python3.8/site-packages/huggingface_hub/utils/_deprecation.py:39: FutureWarning: Pass token='wav2vec2-xls-r-300m-mixed' as keyword args. From version 0.7 passing these as positional arguments will result in an error\n",
|
598 |
-
" warnings.warn(\n",
|
599 |
-
"/home/ubuntu/.local/lib/python3.8/site-packages/huggingface_hub/hf_api.py:79: FutureWarning: `name` and `organization` input arguments are deprecated and will be removed in v0.7. Pass `repo_id` instead.\n",
|
600 |
-
" warnings.warn(\n",
|
601 |
-
"/home/ubuntu/.local/lib/python3.8/site-packages/huggingface_hub/hf_api.py:596: FutureWarning: `create_repo` now takes `token` as an optional positional argument. Be sure to adapt your code!\n",
|
602 |
-
" warnings.warn(\n",
|
603 |
-
"Cloning https://huggingface.co/mesolitica/wav2vec2-xls-r-300m-mixed into local empty directory.\n"
|
604 |
-
]
|
605 |
-
},
|
606 |
{
|
607 |
"data": {
|
608 |
"application/vnd.jupyter.widget-view+json": {
|
609 |
-
"model_id": "
|
610 |
"version_major": 2,
|
611 |
"version_minor": 0
|
612 |
},
|
@@ -624,17 +614,17 @@
|
|
624 |
"remote: Enforcing permissions... \n",
|
625 |
"remote: Allowed refs: all \n",
|
626 |
"To https://huggingface.co/mesolitica/wav2vec2-xls-r-300m-mixed\n",
|
627 |
-
"
|
628 |
"\n"
|
629 |
]
|
630 |
},
|
631 |
{
|
632 |
"data": {
|
633 |
"text/plain": [
|
634 |
-
"'https://huggingface.co/mesolitica/wav2vec2-xls-r-300m-mixed/commit/
|
635 |
]
|
636 |
},
|
637 |
-
"execution_count":
|
638 |
"metadata": {},
|
639 |
"output_type": "execute_result"
|
640 |
}
|
@@ -645,7 +635,7 @@
|
|
645 |
},
|
646 |
{
|
647 |
"cell_type": "code",
|
648 |
-
"execution_count":
|
649 |
"id": "05ec385e",
|
650 |
"metadata": {},
|
651 |
"outputs": [
|
@@ -653,24 +643,24 @@
|
|
653 |
"name": "stderr",
|
654 |
"output_type": "stream",
|
655 |
"text": [
|
656 |
-
"2022-06-01
|
657 |
-
"2022-06-01
|
658 |
-
"2022-06-01
|
659 |
-
"2022-06-01
|
660 |
"To enable them in other operations, rebuild TensorFlow with the appropriate compiler flags.\n",
|
661 |
-
"2022-06-01
|
662 |
-
"2022-06-01
|
663 |
-
"2022-06-01
|
664 |
-
"2022-06-01
|
665 |
-
"2022-06-01
|
666 |
-
"2022-06-01
|
667 |
-
"2022-06-01
|
668 |
-
"2022-06-01
|
669 |
"\n",
|
670 |
"TFWav2Vec2ForCTC has backpropagation operations that are NOT supported on CPU. If you wish to train/fine-tine this model, you need a GPU or a TPU\n",
|
671 |
-
"2022-06-01
|
672 |
-
"2022-06-01
|
673 |
-
"2022-06-01
|
674 |
"All PyTorch model weights were used when initializing TFWav2Vec2ForCTC.\n",
|
675 |
"\n",
|
676 |
"All the weights of TFWav2Vec2ForCTC were initialized from the PyTorch model.\n",
|
@@ -680,7 +670,7 @@
|
|
680 |
],
|
681 |
"source": [
|
682 |
"model_tf = TFWav2Vec2ForCTC.from_pretrained(\n",
|
683 |
-
" './wav2vec2-mixed-v3/checkpoint-
|
684 |
" ctc_loss_reduction=\"mean\",\n",
|
685 |
" pad_token_id=tokenizer.pad_token_id,\n",
|
686 |
" vocab_size=len(tokenizer),\n",
|
@@ -690,21 +680,14 @@
|
|
690 |
},
|
691 |
{
|
692 |
"cell_type": "code",
|
693 |
-
"execution_count":
|
694 |
"id": "e0f3f749",
|
695 |
"metadata": {},
|
696 |
"outputs": [
|
697 |
-
{
|
698 |
-
"name": "stderr",
|
699 |
-
"output_type": "stream",
|
700 |
-
"text": [
|
701 |
-
"2022-06-01 09:29:38.885075: W tensorflow/core/framework/cpu_allocator_impl.cc:80] Allocation of 33554432 exceeds 10% of free system memory.\n"
|
702 |
-
]
|
703 |
-
},
|
704 |
{
|
705 |
"data": {
|
706 |
"application/vnd.jupyter.widget-view+json": {
|
707 |
-
"model_id": "
|
708 |
"version_major": 2,
|
709 |
"version_minor": 0
|
710 |
},
|
@@ -722,17 +705,17 @@
|
|
722 |
"remote: Enforcing permissions... \n",
|
723 |
"remote: Allowed refs: all \n",
|
724 |
"To https://huggingface.co/mesolitica/wav2vec2-xls-r-300m-mixed\n",
|
725 |
-
"
|
726 |
"\n"
|
727 |
]
|
728 |
},
|
729 |
{
|
730 |
"data": {
|
731 |
"text/plain": [
|
732 |
-
"'https://huggingface.co/mesolitica/wav2vec2-xls-r-300m-mixed/commit/
|
733 |
]
|
734 |
},
|
735 |
-
"execution_count":
|
736 |
"metadata": {},
|
737 |
"output_type": "execute_result"
|
738 |
}
|
|
|
158 |
{
|
159 |
"data": {
|
160 |
"text/plain": [
|
161 |
+
"[('malay-test/101.wav',\n",
|
162 |
+
" 'kenapa jews dan israelis mengejek iranian bukan agama lebih'),\n",
|
163 |
+
" ('singlish-test/978.wav',\n",
|
164 |
+
" 'but in the olympics time does not really matter what matters is winning'),\n",
|
165 |
+
" ('singlish-test/1189.wav',\n",
|
166 |
+
" 'and if joseph schooling was born with a tinier hand he might not have hit the wall first'),\n",
|
167 |
+
" ('singlish-test/1774.wav', 'melissa passed her number to the young man'),\n",
|
168 |
+
" ('singlish-test/21.wav',\n",
|
169 |
+
" 'but he really wanted to make satay and hung around satay sellers and memorized their ingredients'),\n",
|
170 |
+
" ('singlish-test/2164.wav', 'just check out their coverage'),\n",
|
171 |
+
" ('malay-test/397.wav', 'budaya cocorico french culture'),\n",
|
172 |
+
" ('mandarin-test/359.wav', 'xi shou jian deng da kai'),\n",
|
173 |
+
" ('singlish-test/1107.wav',\n",
|
174 |
+
" 'the party had a cool vibe but was for guests only'),\n",
|
175 |
+
" ('singlish-test/285.wav',\n",
|
176 |
+
" 'but in smaller towns there are not so many places and that is where they are most needed')]"
|
177 |
]
|
178 |
},
|
179 |
"execution_count": 8,
|
|
|
252 |
"outputs": [],
|
253 |
"source": [
|
254 |
"model = AutoModelForCTC.from_pretrained(\n",
|
255 |
+
" './wav2vec2-mixed-v3/checkpoint-97000',\n",
|
256 |
" ctc_loss_reduction=\"mean\",\n",
|
257 |
" pad_token_id=tokenizer.pad_token_id,\n",
|
258 |
" vocab_size=len(tokenizer),\n",
|
|
|
303 |
{
|
304 |
"data": {
|
305 |
"text/plain": [
|
306 |
+
"['kenapa jius dan israelis mengejik iranian bukan agama lebih',\n",
|
307 |
+
" 'but in the olympics time does not really matter what matters is winning',\n",
|
308 |
+
" 'and if joseph schooling was born with a tinier hand he might not have hit the world first',\n",
|
309 |
+
" 'melissa passed her number to the young man']"
|
310 |
]
|
311 |
},
|
312 |
"execution_count": 14,
|
|
|
362 |
"name": "stdout",
|
363 |
"output_type": "stream",
|
364 |
"text": [
|
365 |
+
"0 kenapa jus dan israelis mengejek iranian bukan agama lebih\n",
|
366 |
+
"1 but in the olympics time does not really matter what matters is winning\n",
|
367 |
+
"2 and if joseph schooling was born with a tinier hand he might not have hit the world first\n",
|
368 |
+
"3 melissa passed her number to the young man\n"
|
369 |
]
|
370 |
}
|
371 |
],
|
|
|
385 |
{
|
386 |
"data": {
|
387 |
"text/plain": [
|
388 |
+
"['kenapa jews dan israelis mengejek iranian bukan agama lebih',\n",
|
389 |
+
" 'but in the olympics time does not really matter what matters is winning',\n",
|
390 |
+
" 'and if joseph schooling was born with a tinier hand he might not have hit the wall first',\n",
|
391 |
+
" 'melissa passed her number to the young man']"
|
392 |
]
|
393 |
},
|
394 |
"execution_count": 18,
|
|
|
443 |
"name": "stderr",
|
444 |
"output_type": "stream",
|
445 |
"text": [
|
446 |
+
"100%|██████████| 1240/1240 [07:43<00:00, 2.67it/s]\n"
|
447 |
]
|
448 |
}
|
449 |
],
|
|
|
481 |
},
|
482 |
{
|
483 |
"cell_type": "code",
|
484 |
+
"execution_count": 26,
|
485 |
"id": "6c6ce8ef",
|
486 |
"metadata": {},
|
487 |
"outputs": [
|
488 |
{
|
489 |
"data": {
|
490 |
"text/plain": [
|
491 |
+
"(0.12446419219809059,\n",
|
492 |
+
" 0.04363189219453221,\n",
|
493 |
+
" 0.09152993800218129,\n",
|
494 |
+
" 0.03621180629932558)"
|
495 |
]
|
496 |
},
|
497 |
+
"execution_count": 26,
|
498 |
"metadata": {},
|
499 |
"output_type": "execute_result"
|
500 |
}
|
|
|
505 |
},
|
506 |
{
|
507 |
"cell_type": "code",
|
508 |
+
"execution_count": 27,
|
509 |
"id": "cf53914e",
|
510 |
"metadata": {},
|
511 |
"outputs": [],
|
|
|
517 |
},
|
518 |
{
|
519 |
"cell_type": "code",
|
520 |
+
"execution_count": 28,
|
521 |
"id": "b1558987",
|
522 |
"metadata": {},
|
523 |
"outputs": [
|
524 |
{
|
525 |
"data": {
|
526 |
"text/plain": [
|
527 |
+
"(0.22565751242221832,\n",
|
528 |
+
" 0.053659683623049854,\n",
|
529 |
+
" 0.14256712242006359,\n",
|
530 |
+
" 0.036930421149001316)"
|
531 |
]
|
532 |
},
|
533 |
+
"execution_count": 28,
|
534 |
"metadata": {},
|
535 |
"output_type": "execute_result"
|
536 |
}
|
|
|
541 |
},
|
542 |
{
|
543 |
"cell_type": "code",
|
544 |
+
"execution_count": 29,
|
545 |
"id": "f340cde7",
|
546 |
"metadata": {},
|
547 |
"outputs": [
|
548 |
{
|
549 |
"data": {
|
550 |
"text/plain": [
|
551 |
+
"(0.10734402150682842,\n",
|
552 |
+
" 0.04174804195104746,\n",
|
553 |
+
" 0.08103191123663189,\n",
|
554 |
+
" 0.03538238462620066)"
|
555 |
]
|
556 |
},
|
557 |
+
"execution_count": 29,
|
558 |
"metadata": {},
|
559 |
"output_type": "execute_result"
|
560 |
}
|
|
|
565 |
},
|
566 |
{
|
567 |
"cell_type": "code",
|
568 |
+
"execution_count": 30,
|
569 |
"id": "cbc2539f",
|
570 |
"metadata": {},
|
571 |
"outputs": [
|
572 |
{
|
573 |
"data": {
|
574 |
"text/plain": [
|
575 |
+
"(0.09817787449869257,\n",
|
576 |
+
" 0.04211892733885779,\n",
|
577 |
+
" 0.08913415903511501,\n",
|
578 |
+
" 0.040151154521006656)"
|
579 |
]
|
580 |
},
|
581 |
+
"execution_count": 30,
|
582 |
"metadata": {},
|
583 |
"output_type": "execute_result"
|
584 |
}
|
|
|
589 |
},
|
590 |
{
|
591 |
"cell_type": "code",
|
592 |
+
"execution_count": 31,
|
593 |
"id": "4c543d0c",
|
594 |
"metadata": {},
|
595 |
"outputs": [
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
596 |
{
|
597 |
"data": {
|
598 |
"application/vnd.jupyter.widget-view+json": {
|
599 |
+
"model_id": "551516109d6a418b95be6884422d853e",
|
600 |
"version_major": 2,
|
601 |
"version_minor": 0
|
602 |
},
|
|
|
614 |
"remote: Enforcing permissions... \n",
|
615 |
"remote: Allowed refs: all \n",
|
616 |
"To https://huggingface.co/mesolitica/wav2vec2-xls-r-300m-mixed\n",
|
617 |
+
" 3f5d181..7799685 main -> main\n",
|
618 |
"\n"
|
619 |
]
|
620 |
},
|
621 |
{
|
622 |
"data": {
|
623 |
"text/plain": [
|
624 |
+
"'https://huggingface.co/mesolitica/wav2vec2-xls-r-300m-mixed/commit/77996855b40213396051061d8e23b67c2616e614'"
|
625 |
]
|
626 |
},
|
627 |
+
"execution_count": 31,
|
628 |
"metadata": {},
|
629 |
"output_type": "execute_result"
|
630 |
}
|
|
|
635 |
},
|
636 |
{
|
637 |
"cell_type": "code",
|
638 |
+
"execution_count": 32,
|
639 |
"id": "05ec385e",
|
640 |
"metadata": {},
|
641 |
"outputs": [
|
|
|
643 |
"name": "stderr",
|
644 |
"output_type": "stream",
|
645 |
"text": [
|
646 |
+
"2022-06-01 19:14:20.564262: I tensorflow/stream_executor/cuda/cuda_gpu_executor.cc:937] successful NUMA node read from SysFS had negative value (-1), but there must be at least one NUMA node, so returning NUMA node zero\n",
|
647 |
+
"2022-06-01 19:14:20.603610: I tensorflow/stream_executor/cuda/cuda_gpu_executor.cc:937] successful NUMA node read from SysFS had negative value (-1), but there must be at least one NUMA node, so returning NUMA node zero\n",
|
648 |
+
"2022-06-01 19:14:20.605395: I tensorflow/stream_executor/cuda/cuda_gpu_executor.cc:937] successful NUMA node read from SysFS had negative value (-1), but there must be at least one NUMA node, so returning NUMA node zero\n",
|
649 |
+
"2022-06-01 19:14:20.607506: I tensorflow/core/platform/cpu_feature_guard.cc:142] This TensorFlow binary is optimized with oneAPI Deep Neural Network Library (oneDNN) to use the following CPU instructions in performance-critical operations: AVX2 AVX512F FMA\n",
|
650 |
"To enable them in other operations, rebuild TensorFlow with the appropriate compiler flags.\n",
|
651 |
+
"2022-06-01 19:14:20.609495: I tensorflow/stream_executor/cuda/cuda_gpu_executor.cc:937] successful NUMA node read from SysFS had negative value (-1), but there must be at least one NUMA node, so returning NUMA node zero\n",
|
652 |
+
"2022-06-01 19:14:20.610833: I tensorflow/stream_executor/cuda/cuda_gpu_executor.cc:937] successful NUMA node read from SysFS had negative value (-1), but there must be at least one NUMA node, so returning NUMA node zero\n",
|
653 |
+
"2022-06-01 19:14:20.612207: I tensorflow/stream_executor/cuda/cuda_gpu_executor.cc:937] successful NUMA node read from SysFS had negative value (-1), but there must be at least one NUMA node, so returning NUMA node zero\n",
|
654 |
+
"2022-06-01 19:14:20.615738: I tensorflow/stream_executor/cuda/cuda_gpu_executor.cc:937] successful NUMA node read from SysFS had negative value (-1), but there must be at least one NUMA node, so returning NUMA node zero\n",
|
655 |
+
"2022-06-01 19:14:20.617302: I tensorflow/stream_executor/cuda/cuda_gpu_executor.cc:937] successful NUMA node read from SysFS had negative value (-1), but there must be at least one NUMA node, so returning NUMA node zero\n",
|
656 |
+
"2022-06-01 19:14:20.618707: I tensorflow/stream_executor/cuda/cuda_gpu_executor.cc:937] successful NUMA node read from SysFS had negative value (-1), but there must be at least one NUMA node, so returning NUMA node zero\n",
|
657 |
+
"2022-06-01 19:14:20.620281: W tensorflow/core/common_runtime/gpu/gpu_bfc_allocator.cc:39] Overriding allow_growth setting because the TF_FORCE_GPU_ALLOW_GROWTH environment variable is set. Original config value was 0.\n",
|
658 |
+
"2022-06-01 19:14:20.620394: I tensorflow/core/common_runtime/gpu/gpu_device.cc:1510] Created device /job:localhost/replica:0/task:0/device:GPU:0 with 17119 MB memory: -> device: 0, name: NVIDIA GeForce RTX 3090 Ti, pci bus id: 0000:01:00.0, compute capability: 8.6\n",
|
659 |
"\n",
|
660 |
"TFWav2Vec2ForCTC has backpropagation operations that are NOT supported on CPU. If you wish to train/fine-tine this model, you need a GPU or a TPU\n",
|
661 |
+
"2022-06-01 19:14:22.857691: I tensorflow/stream_executor/cuda/cuda_dnn.cc:369] Loaded cuDNN version 8100\n",
|
662 |
+
"2022-06-01 19:14:24.326073: I tensorflow/core/platform/default/subprocess.cc:304] Start cannot spawn child process: No such file or directory\n",
|
663 |
+
"2022-06-01 19:14:25.725870: I tensorflow/stream_executor/cuda/cuda_blas.cc:1760] TensorFloat-32 will be used for the matrix multiplication. This will only be logged once.\n",
|
664 |
"All PyTorch model weights were used when initializing TFWav2Vec2ForCTC.\n",
|
665 |
"\n",
|
666 |
"All the weights of TFWav2Vec2ForCTC were initialized from the PyTorch model.\n",
|
|
|
670 |
],
|
671 |
"source": [
|
672 |
"model_tf = TFWav2Vec2ForCTC.from_pretrained(\n",
|
673 |
+
" './wav2vec2-mixed-v3/checkpoint-97000',\n",
|
674 |
" ctc_loss_reduction=\"mean\",\n",
|
675 |
" pad_token_id=tokenizer.pad_token_id,\n",
|
676 |
" vocab_size=len(tokenizer),\n",
|
|
|
680 |
},
|
681 |
{
|
682 |
"cell_type": "code",
|
683 |
+
"execution_count": 33,
|
684 |
"id": "e0f3f749",
|
685 |
"metadata": {},
|
686 |
"outputs": [
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
687 |
{
|
688 |
"data": {
|
689 |
"application/vnd.jupyter.widget-view+json": {
|
690 |
+
"model_id": "a0e5eeee5bf4499da3d5f4adbd5bfd4f",
|
691 |
"version_major": 2,
|
692 |
"version_minor": 0
|
693 |
},
|
|
|
705 |
"remote: Enforcing permissions... \n",
|
706 |
"remote: Allowed refs: all \n",
|
707 |
"To https://huggingface.co/mesolitica/wav2vec2-xls-r-300m-mixed\n",
|
708 |
+
" 7799685..0b9b0fb main -> main\n",
|
709 |
"\n"
|
710 |
]
|
711 |
},
|
712 |
{
|
713 |
"data": {
|
714 |
"text/plain": [
|
715 |
+
"'https://huggingface.co/mesolitica/wav2vec2-xls-r-300m-mixed/commit/0b9b0fb66dc68a4f71ab793274fb28df9f19764f'"
|
716 |
]
|
717 |
},
|
718 |
+
"execution_count": 33,
|
719 |
"metadata": {},
|
720 |
"output_type": "execute_result"
|
721 |
}
|