Training in progress, step 55240

Browse files

Files changed (7) hide show

last-checkpoint/optimizer.pt +1 -1
last-checkpoint/pytorch_model.bin +1 -1
last-checkpoint/rng_state.pth +1 -1
last-checkpoint/scheduler.pt +1 -1
last-checkpoint/trainer_state.json +135 -3
pytorch_model.bin +1 -1
runs/Feb07_05-04-07_5214b674e698/events.out.tfevents.1675746342.5214b674e698.342.0 +2 -2

last-checkpoint/optimizer.pt CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:da5bf2849c0638ce07375012016d12ab0464f14c9ff2cc8e0d5c7f8102381be2
 size 2401461253

 version https://git-lfs.github.com/spec/v1
+oid sha256:4df6baefe0df3845a28abe9fc6e812fd755b1eb716adddecc1deedd7aca8278d
 size 2401461253

last-checkpoint/pytorch_model.bin CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:939362e3a8d757be29a23f167f4a01bd5557159122b0df243b3b2536127d8aac
 size 1200739717

 version https://git-lfs.github.com/spec/v1
+oid sha256:612baa21561bf04530d6eb5804833e6f0b56599c78fd0a39bacd3ac335e650d3
 size 1200739717

last-checkpoint/rng_state.pth CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:ac0761df5417402344ed3bf16bb6e3a45212b9c7f1bd6e2a6742f07a4b1bfc53
 size 14575

 version https://git-lfs.github.com/spec/v1
+oid sha256:274f4675622b5854821912e67212d43584ebb6ec4a78ba0fa35ff9cd87e972c2
 size 14575

last-checkpoint/scheduler.pt CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:cc1c6f6c18f2c362ea1ad3fddc44d9b0d7706c7038e53ba814ce42682079de6c
 size 627

 version https://git-lfs.github.com/spec/v1
+oid sha256:b09dba34704dde96f55673b0cc5c41d0a0ce45d83ad2015625ba94df43f96a45
 size 627

last-checkpoint/trainer_state.json CHANGED Viewed

@@ -1,8 +1,8 @@
 {
   "best_metric": null,
   "best_model_checkpoint": null,
-  "epoch": 0.6574038261283508,
-  "global_step": 44192,
   "is_hyper_param_search": false,
   "is_local_process_zero": true,
   "is_world_process_zero": true,
@@ -534,11 +534,143 @@
       "learning_rate": 1.5636349211071773e-05,
       "loss": 3.1734,
       "step": 44000
     }
   ],
   "max_steps": 201666,
   "num_train_epochs": 3,
-  "total_flos": 5.193969669557453e+16,
   "trial_name": null,
   "trial_params": null
 }

 {
   "best_metric": null,
   "best_model_checkpoint": null,
+  "epoch": 0.8217547826604386,
+  "global_step": 55240,
   "is_hyper_param_search": false,
   "is_local_process_zero": true,
   "is_world_process_zero": true,
       "learning_rate": 1.5636349211071773e-05,
       "loss": 3.1734,
       "step": 44000
+    },
+    {
+      "epoch": 0.66,
+      "learning_rate": 1.55867622702885e-05,
+      "loss": 3.1401,
+      "step": 44500
+    },
+    {
+      "epoch": 0.67,
+      "learning_rate": 1.5537175329505225e-05,
+      "loss": 3.1463,
+      "step": 45000
+    },
+    {
+      "epoch": 0.68,
+      "learning_rate": 1.5487588388721947e-05,
+      "loss": 3.1431,
+      "step": 45500
+    },
+    {
+      "epoch": 0.68,
+      "learning_rate": 1.5438001447938673e-05,
+      "loss": 3.1316,
+      "step": 46000
+    },
+    {
+      "epoch": 0.69,
+      "learning_rate": 1.5388414507155395e-05,
+      "loss": 3.1606,
+      "step": 46500
+    },
+    {
+      "epoch": 0.7,
+      "learning_rate": 1.533882756637212e-05,
+      "loss": 3.1362,
+      "step": 47000
+    },
+    {
+      "epoch": 0.71,
+      "learning_rate": 1.5289240625588847e-05,
+      "loss": 3.1335,
+      "step": 47500
+    },
+    {
+      "epoch": 0.71,
+      "learning_rate": 1.523965368480557e-05,
+      "loss": 3.149,
+      "step": 48000
+    },
+    {
+      "epoch": 0.72,
+      "learning_rate": 1.5190066744022297e-05,
+      "loss": 3.1293,
+      "step": 48500
+    },
+    {
+      "epoch": 0.73,
+      "learning_rate": 1.514047980323902e-05,
+      "loss": 3.1286,
+      "step": 49000
+    },
+    {
+      "epoch": 0.74,
+      "learning_rate": 1.5090892862455743e-05,
+      "loss": 3.1196,
+      "step": 49500
+    },
+    {
+      "epoch": 0.74,
+      "learning_rate": 1.5041305921672469e-05,
+      "loss": 3.1238,
+      "step": 50000
+    },
+    {
+      "epoch": 0.75,
+      "learning_rate": 1.4991718980889195e-05,
+      "loss": 3.1033,
+      "step": 50500
+    },
+    {
+      "epoch": 0.76,
+      "learning_rate": 1.4942132040105919e-05,
+      "loss": 3.1112,
+      "step": 51000
+    },
+    {
+      "epoch": 0.77,
+      "learning_rate": 1.4892545099322645e-05,
+      "loss": 3.0936,
+      "step": 51500
+    },
+    {
+      "epoch": 0.77,
+      "learning_rate": 1.4842958158539369e-05,
+      "loss": 3.107,
+      "step": 52000
+    },
+    {
+      "epoch": 0.78,
+      "learning_rate": 1.4793371217756094e-05,
+      "loss": 3.1063,
+      "step": 52500
+    },
+    {
+      "epoch": 0.79,
+      "learning_rate": 1.4743784276972817e-05,
+      "loss": 3.0639,
+      "step": 53000
+    },
+    {
+      "epoch": 0.8,
+      "learning_rate": 1.4694197336189543e-05,
+      "loss": 3.1028,
+      "step": 53500
+    },
+    {
+      "epoch": 0.8,
+      "learning_rate": 1.4644610395406267e-05,
+      "loss": 3.0821,
+      "step": 54000
+    },
+    {
+      "epoch": 0.81,
+      "learning_rate": 1.4595023454622992e-05,
+      "loss": 3.0596,
+      "step": 54500
+    },
+    {
+      "epoch": 0.82,
+      "learning_rate": 1.4545436513839717e-05,
+      "loss": 3.0787,
+      "step": 55000
     }
   ],
   "max_steps": 201666,
   "num_train_epochs": 3,
+  "total_flos": 6.497219068615066e+16,
   "trial_name": null,
   "trial_params": null
 }

pytorch_model.bin CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:939362e3a8d757be29a23f167f4a01bd5557159122b0df243b3b2536127d8aac
 size 1200739717

 version https://git-lfs.github.com/spec/v1
+oid sha256:612baa21561bf04530d6eb5804833e6f0b56599c78fd0a39bacd3ac335e650d3
 size 1200739717

runs/Feb07_05-04-07_5214b674e698/events.out.tfevents.1675746342.5214b674e698.342.0 CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:68abdf7d613e2b38ec76fd6735814e503c277a7e46fafb3f031724d696919bcd
-size 18101

 version https://git-lfs.github.com/spec/v1
+oid sha256:0b5afd134e7190bfca227464f177ede39b4d5a435161a2a45582286c96ae5885
+size 21621