sheldonxxxx
committed on
Commit
•
87a52da
1
Parent(s):
14eac22
Training in progress, epoch 13
Browse files
last-checkpoint/optimizer.pt
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 688420485
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:f417101f3829c73aa98b5cac6a7bfb363cf14ba833a4150f7aad14aa54dce3de
|
3 |
size 688420485
|
last-checkpoint/pytorch_model.bin
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 376157625
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:32a8ff0d797e86a3413589649412f2436742fa1ad824b4911f2aa9830e542a52
|
3 |
size 376157625
|
last-checkpoint/rng_state.pth
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 14575
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:dbbc2976c7f5ed05e81508b93621172099d62990182d65f94b3dd6d6bd00a274
|
3 |
size 14575
|
last-checkpoint/scheduler.pt
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 627
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:c52c096d4450959874eef46bbae98499f9cedad94c8b123c153d513137e7da05
|
3 |
size 627
|
last-checkpoint/trainer_state.json
CHANGED
@@ -1,8 +1,8 @@
|
|
1 |
{
|
2 |
-
"best_metric": 0.
|
3 |
-
"best_model_checkpoint": "/tmp/mecha-tagger/checkpoint-
|
4 |
-
"epoch":
|
5 |
-
"global_step":
|
6 |
"is_hyper_param_search": false,
|
7 |
"is_local_process_zero": true,
|
8 |
"is_world_process_zero": true,
|
@@ -222,11 +222,28 @@
|
|
222 |
"eval_samples_per_second": 50.179,
|
223 |
"eval_steps_per_second": 0.526,
|
224 |
"step": 1452
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
225 |
}
|
226 |
],
|
227 |
"max_steps": 6050,
|
228 |
"num_train_epochs": 50,
|
229 |
-
"total_flos": 6.
|
230 |
"trial_name": null,
|
231 |
"trial_params": null
|
232 |
}
|
|
|
1 |
{
|
2 |
+
"best_metric": 0.5472163817533595,
|
3 |
+
"best_model_checkpoint": "/tmp/mecha-tagger/checkpoint-1573",
|
4 |
+
"epoch": 13.0,
|
5 |
+
"global_step": 1573,
|
6 |
"is_hyper_param_search": false,
|
7 |
"is_local_process_zero": true,
|
8 |
"is_world_process_zero": true,
|
|
|
222 |
"eval_samples_per_second": 50.179,
|
223 |
"eval_steps_per_second": 0.526,
|
224 |
"step": 1452
|
225 |
+
},
|
226 |
+
{
|
227 |
+
"epoch": 12.4,
|
228 |
+
"learning_rate": 2e-05,
|
229 |
+
"loss": 0.2281,
|
230 |
+
"step": 1500
|
231 |
+
},
|
232 |
+
{
|
233 |
+
"epoch": 13.0,
|
234 |
+
"eval_accuracy": 0.07023670935195964,
|
235 |
+
"eval_f1": 0.5472163817533595,
|
236 |
+
"eval_loss": 0.2586032450199127,
|
237 |
+
"eval_roc_auc": 0.6994249977444085,
|
238 |
+
"eval_runtime": 51.2515,
|
239 |
+
"eval_samples_per_second": 50.281,
|
240 |
+
"eval_steps_per_second": 0.527,
|
241 |
+
"step": 1573
|
242 |
}
|
243 |
],
|
244 |
"max_steps": 6050,
|
245 |
"num_train_epochs": 50,
|
246 |
+
"total_flos": 6.882242130850185e+19,
|
247 |
"trial_name": null,
|
248 |
"trial_params": null
|
249 |
}
|
pytorch_model.bin
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 376157625
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:32a8ff0d797e86a3413589649412f2436742fa1ad824b4911f2aa9830e542a52
|
3 |
size 376157625
|