vitouphy
/

wav2vec2-xls-r-300m-khmer

@@ -3,7 +3,7 @@
   {
    "cell_type": "code",
    "execution_count": 1,
-   "id": "15d904e9",
    "metadata": {
     "collapsed": true,
     "jupyter": {
@@ -708,7 +708,7 @@
   {
    "cell_type": "code",
    "execution_count": 2,
-   "id": "68c81e1e",
    "metadata": {},
    "outputs": [],
    "source": [
@@ -721,7 +721,7 @@
   {
    "cell_type": "code",
    "execution_count": null,
-   "id": "b5f4cca5",
    "metadata": {
     "collapsed": true,
     "jupyter": {
@@ -13484,7 +13484,7 @@
   {
    "cell_type": "code",
    "execution_count": 3,
-   "id": "9b57c68d",
    "metadata": {},
    "outputs": [],
    "source": [
@@ -13505,7 +13505,7 @@
   {
    "cell_type": "code",
    "execution_count": 32,
-   "id": "6371aacf",
    "metadata": {},
    "outputs": [
     {
@@ -13527,7 +13527,7 @@
   {
    "cell_type": "code",
    "execution_count": 33,
-   "id": "214624ba",
    "metadata": {},
    "outputs": [],
    "source": [
@@ -13542,7 +13542,7 @@
   {
    "cell_type": "code",
    "execution_count": 6,
-   "id": "0c890a5b",
    "metadata": {},
    "outputs": [],
    "source": [
@@ -13558,7 +13558,7 @@
   {
    "cell_type": "code",
    "execution_count": 7,
-   "id": "9ad59bfe",
    "metadata": {},
    "outputs": [],
    "source": [
@@ -13570,7 +13570,7 @@
   {
    "cell_type": "code",
    "execution_count": 8,
-   "id": "d0b3000d",
    "metadata": {},
    "outputs": [
     {
@@ -13592,7 +13592,7 @@
   {
    "cell_type": "code",
    "execution_count": 9,
-   "id": "3067a0d2",
    "metadata": {},
    "outputs": [],
    "source": [
@@ -13602,7 +13602,7 @@
   {
    "cell_type": "code",
    "execution_count": 34,
-   "id": "be87dadf",
    "metadata": {},
    "outputs": [
     {
@@ -13650,7 +13650,7 @@
   {
    "cell_type": "code",
    "execution_count": 35,
-   "id": "42e56c1e",
    "metadata": {},
    "outputs": [],
    "source": [
@@ -13661,7 +13661,7 @@
   {
    "cell_type": "code",
    "execution_count": 36,
-   "id": "dc7ff75c",
    "metadata": {},
    "outputs": [
     {
@@ -13679,7 +13679,7 @@
   {
    "cell_type": "code",
    "execution_count": 37,
-   "id": "8132901b",
    "metadata": {},
    "outputs": [
     {
@@ -13706,7 +13706,7 @@
   {
    "cell_type": "code",
    "execution_count": 38,
-   "id": "501e426e",
    "metadata": {},
    "outputs": [],
    "source": [
@@ -13718,7 +13718,7 @@
   {
    "cell_type": "code",
    "execution_count": 39,
-   "id": "8ea339c9",
    "metadata": {},
    "outputs": [],
    "source": [
@@ -13728,7 +13728,7 @@
   {
    "cell_type": "code",
    "execution_count": 40,
-   "id": "98633ad2",
    "metadata": {},
    "outputs": [],
    "source": [
@@ -13740,7 +13740,7 @@
   {
    "cell_type": "code",
    "execution_count": 41,
-   "id": "1ec1e98a",
    "metadata": {},
    "outputs": [
     {
@@ -13761,7 +13761,7 @@
   {
    "cell_type": "code",
    "execution_count": 26,
-   "id": "9fdebef6",
    "metadata": {},
    "outputs": [],
    "source": [
@@ -13778,7 +13778,7 @@
   {
    "cell_type": "code",
    "execution_count": 27,
-   "id": "c6c32f96",
    "metadata": {},
    "outputs": [
     {
@@ -13818,7 +13818,7 @@
   {
    "cell_type": "code",
    "execution_count": 48,
-   "id": "fb722007",
    "metadata": {},
    "outputs": [],
    "source": [
@@ -13829,7 +13829,7 @@
   {
    "cell_type": "code",
    "execution_count": 50,
-   "id": "11558fd2",
    "metadata": {},
    "outputs": [
     {
@@ -13854,7 +13854,7 @@
   {
    "cell_type": "code",
    "execution_count": 51,
-   "id": "12c81313",
    "metadata": {},
    "outputs": [
     {
@@ -13901,7 +13901,7 @@
   {
    "cell_type": "code",
    "execution_count": 52,
-   "id": "1cb97a7e",
    "metadata": {},
    "outputs": [],
    "source": [
@@ -13923,7 +13923,7 @@
   {
    "cell_type": "code",
    "execution_count": 53,
-   "id": "d7bd14b2",
    "metadata": {},
    "outputs": [],
    "source": [
@@ -13934,7 +13934,7 @@
   {
    "cell_type": "code",
    "execution_count": 41,
-   "id": "00c75e3c",
    "metadata": {},
    "outputs": [],
    "source": [
@@ -13946,7 +13946,7 @@
   {
    "cell_type": "code",
    "execution_count": 54,
-   "id": "8906918e",
    "metadata": {},
    "outputs": [],
    "source": [
@@ -14005,7 +14005,7 @@
   {
    "cell_type": "code",
    "execution_count": 55,
-   "id": "40ff3940",
    "metadata": {},
    "outputs": [],
    "source": [
@@ -14015,7 +14015,7 @@
   {
    "cell_type": "code",
    "execution_count": 56,
-   "id": "2a579f5a",
    "metadata": {},
    "outputs": [],
    "source": [
@@ -14026,7 +14026,7 @@
   {
    "cell_type": "code",
    "execution_count": 57,
-   "id": "221d53c7",
    "metadata": {},
    "outputs": [],
    "source": [
@@ -14050,7 +14050,7 @@
   {
    "cell_type": "code",
    "execution_count": null,
-   "id": "87cf1d87",
    "metadata": {},
    "outputs": [],
    "source": [
@@ -14060,7 +14060,7 @@
   {
    "cell_type": "code",
    "execution_count": null,
-   "id": "d8afce23",
    "metadata": {},
    "outputs": [],
    "source": []
@@ -14068,7 +14068,7 @@
   {
    "cell_type": "code",
    "execution_count": 58,
-   "id": "22a21f3f",
    "metadata": {},
    "outputs": [
     {
@@ -14102,7 +14102,7 @@
   {
    "cell_type": "code",
    "execution_count": 59,
-   "id": "1688901e",
    "metadata": {},
    "outputs": [
     {
@@ -14120,10 +14120,19 @@
   },
   {
    "cell_type": "code",
-   "execution_count": 60,
-   "id": "e13830f8",
    "metadata": {},
-   "outputs": [],
    "source": [
     "from transformers import TrainingArguments\n",
     "\n",
@@ -14136,8 +14145,8 @@
     "  gradient_checkpointing=True,\n",
     "  fp16=True,\n",
     "  num_train_epochs=30,\n",
-    "  save_steps=100,\n",
-    "  eval_steps=100,\n",
     "  logging_steps=100,\n",
     "  learning_rate=3e-5,\n",
     "  warmup_steps=500,\n",
@@ -14148,8 +14157,8 @@
   },
   {
    "cell_type": "code",
-   "execution_count": 63,
-   "id": "2a405bb3",
    "metadata": {},
    "outputs": [
     {
@@ -14178,7 +14187,7 @@
   {
    "cell_type": "code",
    "execution_count": null,
-   "id": "e9a99c77",
    "metadata": {},
    "outputs": [
     {
@@ -14203,8 +14212,8 @@
        "\n",
        "    <div>\n",
        "      \n",
-       "      <progress value='101' max='4890' style='width:300px; height:20px; vertical-align: middle;'></progress>\n",
-       "      [ 101/4890 01:40 < 1:21:11, 0.98 it/s, Epoch 0.61/30]\n",
        "    </div>\n",
        "    <table border=\"1\" class=\"dataframe\">\n",
        "  <thead>\n",
@@ -14217,8 +14226,8 @@
        "  </thead>\n",
        "  <tbody>\n",
        "    <tr>\n",
-       "      <td>100</td>\n",
-       "      <td>16.976400</td>\n",
        "      <td>13.300326</td>\n",
        "      <td>0.989265</td>\n",
        "    </tr>\n",
@@ -14240,8 +14249,11 @@
       "***** Running Evaluation *****\n",
       "  Num examples = 291\n",
       "  Batch size = 8\n",
-      "Saving model checkpoint to ./checkpoint-100\n",
-      "Configuration saved in ./checkpoint-100/config.json\n"
      ]
     }
    ],
@@ -14252,7 +14264,7 @@
   {
    "cell_type": "code",
    "execution_count": null,
-   "id": "3629e75f",
    "metadata": {},
    "outputs": [],
    "source": []

   {
    "cell_type": "code",
    "execution_count": 1,
+   "id": "3ae82d97",
    "metadata": {
     "collapsed": true,
     "jupyter": {
   {
    "cell_type": "code",
    "execution_count": 2,
+   "id": "5082f3ca",
    "metadata": {},
    "outputs": [],
    "source": [
   {
    "cell_type": "code",
    "execution_count": null,
+   "id": "c5838f22",
    "metadata": {
     "collapsed": true,
     "jupyter": {
   {
    "cell_type": "code",
    "execution_count": 3,
+   "id": "94fea955",
    "metadata": {},
    "outputs": [],
    "source": [
   {
    "cell_type": "code",
    "execution_count": 32,
+   "id": "0bdb4556",
    "metadata": {},
    "outputs": [
     {
   {
    "cell_type": "code",
    "execution_count": 33,
+   "id": "d6645c93",
    "metadata": {},
    "outputs": [],
    "source": [
   {
    "cell_type": "code",
    "execution_count": 6,
+   "id": "b64fe901",
    "metadata": {},
    "outputs": [],
    "source": [
   {
    "cell_type": "code",
    "execution_count": 7,
+   "id": "65867ef2",
    "metadata": {},
    "outputs": [],
    "source": [
   {
    "cell_type": "code",
    "execution_count": 8,
+   "id": "beca9fac",
    "metadata": {},
    "outputs": [
     {
   {
    "cell_type": "code",
    "execution_count": 9,
+   "id": "d679de6c",
    "metadata": {},
    "outputs": [],
    "source": [
   {
    "cell_type": "code",
    "execution_count": 34,
+   "id": "eb92b2d5",
    "metadata": {},
    "outputs": [
     {
   {
    "cell_type": "code",
    "execution_count": 35,
+   "id": "7b8296e6",
    "metadata": {},
    "outputs": [],
    "source": [
   {
    "cell_type": "code",
    "execution_count": 36,
+   "id": "78dc9b6c",
    "metadata": {},
    "outputs": [
     {
   {
    "cell_type": "code",
    "execution_count": 37,
+   "id": "0f856602",
    "metadata": {},
    "outputs": [
     {
   {
    "cell_type": "code",
    "execution_count": 38,
+   "id": "c5f41740",
    "metadata": {},
    "outputs": [],
    "source": [
   {
    "cell_type": "code",
    "execution_count": 39,
+   "id": "b750d9cf",
    "metadata": {},
    "outputs": [],
    "source": [
   {
    "cell_type": "code",
    "execution_count": 40,
+   "id": "e3f563c7",
    "metadata": {},
    "outputs": [],
    "source": [
   {
    "cell_type": "code",
    "execution_count": 41,
+   "id": "8dd37836",
    "metadata": {},
    "outputs": [
     {
   {
    "cell_type": "code",
    "execution_count": 26,
+   "id": "8868a601",
    "metadata": {},
    "outputs": [],
    "source": [
   {
    "cell_type": "code",
    "execution_count": 27,
+   "id": "3503046d",
    "metadata": {},
    "outputs": [
     {
   {
    "cell_type": "code",
    "execution_count": 48,
+   "id": "895f3bfb",
    "metadata": {},
    "outputs": [],
    "source": [
   {
    "cell_type": "code",
    "execution_count": 50,
+   "id": "e5515c8d",
    "metadata": {},
    "outputs": [
     {
   {
    "cell_type": "code",
    "execution_count": 51,
+   "id": "450c5c90",
    "metadata": {},
    "outputs": [
     {
   {
    "cell_type": "code",
    "execution_count": 52,
+   "id": "b10b6aa1",
    "metadata": {},
    "outputs": [],
    "source": [
   {
    "cell_type": "code",
    "execution_count": 53,
+   "id": "a1776bef",
    "metadata": {},
    "outputs": [],
    "source": [
   {
    "cell_type": "code",
    "execution_count": 41,
+   "id": "8eea6563",
    "metadata": {},
    "outputs": [],
    "source": [
   {
    "cell_type": "code",
    "execution_count": 54,
+   "id": "f15bec0a",
    "metadata": {},
    "outputs": [],
    "source": [
   {
    "cell_type": "code",
    "execution_count": 55,
+   "id": "d30dafe4",
    "metadata": {},
    "outputs": [],
    "source": [
   {
    "cell_type": "code",
    "execution_count": 56,
+   "id": "408bcb4d",
    "metadata": {},
    "outputs": [],
    "source": [
   {
    "cell_type": "code",
    "execution_count": 57,
+   "id": "e5573fd8",
    "metadata": {},
    "outputs": [],
    "source": [
   {
    "cell_type": "code",
    "execution_count": null,
+   "id": "da8c34ad",
    "metadata": {},
    "outputs": [],
    "source": [
   {
    "cell_type": "code",
    "execution_count": null,
+   "id": "229b8ebf",
    "metadata": {},
    "outputs": [],
    "source": []
   {
    "cell_type": "code",
    "execution_count": 58,
+   "id": "7b36eee5",
    "metadata": {},
    "outputs": [
     {
   {
    "cell_type": "code",
    "execution_count": 59,
+   "id": "7ec46eca",
    "metadata": {},
    "outputs": [
     {
   },
   {
    "cell_type": "code",
+   "execution_count": 65,
+   "id": "9db5b382",
    "metadata": {},
+   "outputs": [
+    {
+     "name": "stderr",
+     "output_type": "stream",
+     "text": [
+      "PyTorch: setting up devices\n",
+      "The default value for the training argument `--report_to` will change in v5 (from all installed integrations to none). In v5, you will need to use `--report_to all` to get the same behavior as now. You should start updating your code and make this info disappear :-).\n"
+     ]
+    }
+   ],
    "source": [
     "from transformers import TrainingArguments\n",
     "\n",
     "  gradient_checkpointing=True,\n",
     "  fp16=True,\n",
     "  num_train_epochs=30,\n",
+    "  save_steps=1,\n",
+    "  eval_steps=1,\n",
     "  logging_steps=100,\n",
     "  learning_rate=3e-5,\n",
     "  warmup_steps=500,\n",
   },
   {
    "cell_type": "code",
+   "execution_count": 66,
+   "id": "96c9aeb9",
    "metadata": {},
    "outputs": [
     {
   {
    "cell_type": "code",
    "execution_count": null,
+   "id": "a3a38848",
    "metadata": {},
    "outputs": [
     {
        "\n",
        "    <div>\n",
        "      \n",
+       "      <progress value='2' max='4890' style='width:300px; height:20px; vertical-align: middle;'></progress>\n",
+       "      [   2/4890 : < :, Epoch 0.01/30]\n",
        "    </div>\n",
        "    <table border=\"1\" class=\"dataframe\">\n",
        "  <thead>\n",
        "  </thead>\n",
        "  <tbody>\n",
        "    <tr>\n",
+       "      <td>1</td>\n",
+       "      <td>No log</td>\n",
        "      <td>13.300326</td>\n",
        "      <td>0.989265</td>\n",
        "    </tr>\n",
       "***** Running Evaluation *****\n",
       "  Num examples = 291\n",
       "  Batch size = 8\n",
+      "Saving model checkpoint to ./checkpoint-1\n",
+      "Configuration saved in ./checkpoint-1/config.json\n",
+      "Model weights saved in ./checkpoint-1/pytorch_model.bin\n",
+      "Configuration saved in ./checkpoint-1/preprocessor_config.json\n",
+      "Configuration saved in ./preprocessor_config.json\n"
      ]
     }
    ],
   {
    "cell_type": "code",
    "execution_count": null,
+   "id": "e27620ac",
    "metadata": {},
    "outputs": [],
    "source": []

training_args.bin CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:f53351c36f9166d72fba05a26550d456156793a4caab264b38fc1e6437cf34a8
 size 2991

 version https://git-lfs.github.com/spec/v1
+oid sha256:9b35c85cfceecf16b9f8a4306c6c419ed33469f21c8e3b016a95fdbbcd87ddbb
 size 2991