Training in progress, epoch 59, checkpoint
Browse files
last-checkpoint/model.safetensors
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 166496880
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:79b71bf8526feaf3fbe640362c921c3bd5d9b567af82dd4997d42973aa321991
|
3 |
size 166496880
|
last-checkpoint/optimizer.pt
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 330495866
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:c277767943f1e035c0d73c794bfd2e290cf536330fec91bf85bb7c955776135f
|
3 |
size 330495866
|
last-checkpoint/rng_state.pth
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 14244
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:7021b7f290ce2ecee8960d7d8842b39007015ec1c207fbea7eb79b547a00e6ea
|
3 |
size 14244
|
last-checkpoint/scheduler.pt
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 1064
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:cbb398868d9495d1d98703c67e6d962238241ad82fc84d6f95dd75ff664b33ec
|
3 |
size 1064
|
last-checkpoint/trainer_state.json
CHANGED
@@ -1,9 +1,9 @@
|
|
1 |
{
|
2 |
"best_metric": 0.22530820965766907,
|
3 |
"best_model_checkpoint": "joe611/chickens-60-epoch-1000-images-aug/checkpoint-25000",
|
4 |
-
"epoch":
|
5 |
"eval_steps": 500,
|
6 |
-
"global_step":
|
7 |
"is_hyper_param_search": false,
|
8 |
"is_local_process_zero": true,
|
9 |
"is_world_process_zero": true,
|
@@ -8277,6 +8277,151 @@
|
|
8277 |
"eval_samples_per_second": 10.168,
|
8278 |
"eval_steps_per_second": 1.322,
|
8279 |
"step": 29000
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
8280 |
}
|
8281 |
],
|
8282 |
"logging_steps": 30,
|
@@ -8296,7 +8441,7 @@
|
|
8296 |
"attributes": {}
|
8297 |
}
|
8298 |
},
|
8299 |
-
"total_flos":
|
8300 |
"train_batch_size": 2,
|
8301 |
"trial_name": null,
|
8302 |
"trial_params": null
|
|
|
1 |
{
|
2 |
"best_metric": 0.22530820965766907,
|
3 |
"best_model_checkpoint": "joe611/chickens-60-epoch-1000-images-aug/checkpoint-25000",
|
4 |
+
"epoch": 59.0,
|
5 |
"eval_steps": 500,
|
6 |
+
"global_step": 29500,
|
7 |
"is_hyper_param_search": false,
|
8 |
"is_local_process_zero": true,
|
9 |
"is_world_process_zero": true,
|
|
|
8277 |
"eval_samples_per_second": 10.168,
|
8278 |
"eval_steps_per_second": 1.322,
|
8279 |
"step": 29000
|
8280 |
+
},
|
8281 |
+
{
|
8282 |
+
"epoch": 58.02,
|
8283 |
+
"grad_norm": 31.76934242248535,
|
8284 |
+
"learning_rate": 2.684594004283836e-08,
|
8285 |
+
"loss": 0.2661,
|
8286 |
+
"step": 29010
|
8287 |
+
},
|
8288 |
+
{
|
8289 |
+
"epoch": 58.08,
|
8290 |
+
"grad_norm": 33.10856628417969,
|
8291 |
+
"learning_rate": 2.5244915093499134e-08,
|
8292 |
+
"loss": 0.2613,
|
8293 |
+
"step": 29040
|
8294 |
+
},
|
8295 |
+
{
|
8296 |
+
"epoch": 58.14,
|
8297 |
+
"grad_norm": 54.95156478881836,
|
8298 |
+
"learning_rate": 2.3692988968458398e-08,
|
8299 |
+
"loss": 0.3306,
|
8300 |
+
"step": 29070
|
8301 |
+
},
|
8302 |
+
{
|
8303 |
+
"epoch": 58.2,
|
8304 |
+
"grad_norm": 50.21295928955078,
|
8305 |
+
"learning_rate": 2.219017698460002e-08,
|
8306 |
+
"loss": 0.2639,
|
8307 |
+
"step": 29100
|
8308 |
+
},
|
8309 |
+
{
|
8310 |
+
"epoch": 58.26,
|
8311 |
+
"grad_norm": 34.72473907470703,
|
8312 |
+
"learning_rate": 2.0736493974071736e-08,
|
8313 |
+
"loss": 0.2776,
|
8314 |
+
"step": 29130
|
8315 |
+
},
|
8316 |
+
{
|
8317 |
+
"epoch": 58.32,
|
8318 |
+
"grad_norm": 47.885765075683594,
|
8319 |
+
"learning_rate": 1.9331954284137476e-08,
|
8320 |
+
"loss": 0.2702,
|
8321 |
+
"step": 29160
|
8322 |
+
},
|
8323 |
+
{
|
8324 |
+
"epoch": 58.38,
|
8325 |
+
"grad_norm": 48.69330978393555,
|
8326 |
+
"learning_rate": 1.7976571777038044e-08,
|
8327 |
+
"loss": 0.2764,
|
8328 |
+
"step": 29190
|
8329 |
+
},
|
8330 |
+
{
|
8331 |
+
"epoch": 58.44,
|
8332 |
+
"grad_norm": 48.01133728027344,
|
8333 |
+
"learning_rate": 1.6670359829850657e-08,
|
8334 |
+
"loss": 0.2787,
|
8335 |
+
"step": 29220
|
8336 |
+
},
|
8337 |
+
{
|
8338 |
+
"epoch": 58.5,
|
8339 |
+
"grad_norm": 38.076595306396484,
|
8340 |
+
"learning_rate": 1.541333133436018e-08,
|
8341 |
+
"loss": 0.3156,
|
8342 |
+
"step": 29250
|
8343 |
+
},
|
8344 |
+
{
|
8345 |
+
"epoch": 58.56,
|
8346 |
+
"grad_norm": 77.71937561035156,
|
8347 |
+
"learning_rate": 1.4205498696930332e-08,
|
8348 |
+
"loss": 0.2821,
|
8349 |
+
"step": 29280
|
8350 |
+
},
|
8351 |
+
{
|
8352 |
+
"epoch": 58.62,
|
8353 |
+
"grad_norm": 69.0176010131836,
|
8354 |
+
"learning_rate": 1.3046873838381546e-08,
|
8355 |
+
"loss": 0.2954,
|
8356 |
+
"step": 29310
|
8357 |
+
},
|
8358 |
+
{
|
8359 |
+
"epoch": 58.68,
|
8360 |
+
"grad_norm": 43.61737823486328,
|
8361 |
+
"learning_rate": 1.1937468193873869e-08,
|
8362 |
+
"loss": 0.2688,
|
8363 |
+
"step": 29340
|
8364 |
+
},
|
8365 |
+
{
|
8366 |
+
"epoch": 58.74,
|
8367 |
+
"grad_norm": 48.39431381225586,
|
8368 |
+
"learning_rate": 1.0877292712792586e-08,
|
8369 |
+
"loss": 0.2566,
|
8370 |
+
"step": 29370
|
8371 |
+
},
|
8372 |
+
{
|
8373 |
+
"epoch": 58.8,
|
8374 |
+
"grad_norm": 66.10430908203125,
|
8375 |
+
"learning_rate": 9.866357858642206e-09,
|
8376 |
+
"loss": 0.2634,
|
8377 |
+
"step": 29400
|
8378 |
+
},
|
8379 |
+
{
|
8380 |
+
"epoch": 58.86,
|
8381 |
+
"grad_norm": 147.0448760986328,
|
8382 |
+
"learning_rate": 8.904673608940983e-09,
|
8383 |
+
"loss": 0.3025,
|
8384 |
+
"step": 29430
|
8385 |
+
},
|
8386 |
+
{
|
8387 |
+
"epoch": 58.92,
|
8388 |
+
"grad_norm": 52.136348724365234,
|
8389 |
+
"learning_rate": 7.992249455124889e-09,
|
8390 |
+
"loss": 0.3041,
|
8391 |
+
"step": 29460
|
8392 |
+
},
|
8393 |
+
{
|
8394 |
+
"epoch": 58.98,
|
8395 |
+
"grad_norm": 63.46728515625,
|
8396 |
+
"learning_rate": 7.129094402451575e-09,
|
8397 |
+
"loss": 0.2693,
|
8398 |
+
"step": 29490
|
8399 |
+
},
|
8400 |
+
{
|
8401 |
+
"epoch": 59.0,
|
8402 |
+
"eval_loss": 0.2272312492132187,
|
8403 |
+
"eval_map": 0.8302,
|
8404 |
+
"eval_map_50": 0.9765,
|
8405 |
+
"eval_map_75": 0.9394,
|
8406 |
+
"eval_map_chicken": 0.8148,
|
8407 |
+
"eval_map_duck": 0.8005,
|
8408 |
+
"eval_map_large": 0.9097,
|
8409 |
+
"eval_map_medium": 0.8372,
|
8410 |
+
"eval_map_plant": 0.8752,
|
8411 |
+
"eval_map_small": 0.3768,
|
8412 |
+
"eval_mar_1": 0.3092,
|
8413 |
+
"eval_mar_10": 0.8633,
|
8414 |
+
"eval_mar_100": 0.8673,
|
8415 |
+
"eval_mar_100_chicken": 0.852,
|
8416 |
+
"eval_mar_100_duck": 0.832,
|
8417 |
+
"eval_mar_100_plant": 0.9179,
|
8418 |
+
"eval_mar_large": 0.9469,
|
8419 |
+
"eval_mar_medium": 0.8825,
|
8420 |
+
"eval_mar_small": 0.4523,
|
8421 |
+
"eval_runtime": 10.2822,
|
8422 |
+
"eval_samples_per_second": 9.726,
|
8423 |
+
"eval_steps_per_second": 1.264,
|
8424 |
+
"step": 29500
|
8425 |
}
|
8426 |
],
|
8427 |
"logging_steps": 30,
|
|
|
8441 |
"attributes": {}
|
8442 |
}
|
8443 |
},
|
8444 |
+
"total_flos": 1.01486818308096e+19,
|
8445 |
"train_batch_size": 2,
|
8446 |
"trial_name": null,
|
8447 |
"trial_params": null
|