joe611 commited on
Commit
5d9e46c
1 Parent(s): 35c0887

Training in progress, epoch 59, checkpoint

Browse files
last-checkpoint/model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:b392aff3a6ab84e321c0da912a52394cdf80c96d908bc82cd18229c180b3a16a
3
  size 166496880
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:79b71bf8526feaf3fbe640362c921c3bd5d9b567af82dd4997d42973aa321991
3
  size 166496880
last-checkpoint/optimizer.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:dd9a916036f1c4feb33e98f71780fdaa5eecd9c63d4096c79d97b0f84384125c
3
  size 330495866
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:c277767943f1e035c0d73c794bfd2e290cf536330fec91bf85bb7c955776135f
3
  size 330495866
last-checkpoint/rng_state.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:a728912d3338c692b48d80b79e8160131e5fa9d986b207c5ffb9444c99eab6bc
3
  size 14244
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:7021b7f290ce2ecee8960d7d8842b39007015ec1c207fbea7eb79b547a00e6ea
3
  size 14244
last-checkpoint/scheduler.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:d91fda77405c63be9ba69cfebcac04e28133f651f301ae840d5c36ddddb1529b
3
  size 1064
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:cbb398868d9495d1d98703c67e6d962238241ad82fc84d6f95dd75ff664b33ec
3
  size 1064
last-checkpoint/trainer_state.json CHANGED
@@ -1,9 +1,9 @@
1
  {
2
  "best_metric": 0.22530820965766907,
3
  "best_model_checkpoint": "joe611/chickens-60-epoch-1000-images-aug/checkpoint-25000",
4
- "epoch": 58.0,
5
  "eval_steps": 500,
6
- "global_step": 29000,
7
  "is_hyper_param_search": false,
8
  "is_local_process_zero": true,
9
  "is_world_process_zero": true,
@@ -8277,6 +8277,151 @@
8277
  "eval_samples_per_second": 10.168,
8278
  "eval_steps_per_second": 1.322,
8279
  "step": 29000
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
8280
  }
8281
  ],
8282
  "logging_steps": 30,
@@ -8296,7 +8441,7 @@
8296
  "attributes": {}
8297
  }
8298
  },
8299
- "total_flos": 9.9766702743552e+18,
8300
  "train_batch_size": 2,
8301
  "trial_name": null,
8302
  "trial_params": null
 
1
  {
2
  "best_metric": 0.22530820965766907,
3
  "best_model_checkpoint": "joe611/chickens-60-epoch-1000-images-aug/checkpoint-25000",
4
+ "epoch": 59.0,
5
  "eval_steps": 500,
6
+ "global_step": 29500,
7
  "is_hyper_param_search": false,
8
  "is_local_process_zero": true,
9
  "is_world_process_zero": true,
 
8277
  "eval_samples_per_second": 10.168,
8278
  "eval_steps_per_second": 1.322,
8279
  "step": 29000
8280
+ },
8281
+ {
8282
+ "epoch": 58.02,
8283
+ "grad_norm": 31.76934242248535,
8284
+ "learning_rate": 2.684594004283836e-08,
8285
+ "loss": 0.2661,
8286
+ "step": 29010
8287
+ },
8288
+ {
8289
+ "epoch": 58.08,
8290
+ "grad_norm": 33.10856628417969,
8291
+ "learning_rate": 2.5244915093499134e-08,
8292
+ "loss": 0.2613,
8293
+ "step": 29040
8294
+ },
8295
+ {
8296
+ "epoch": 58.14,
8297
+ "grad_norm": 54.95156478881836,
8298
+ "learning_rate": 2.3692988968458398e-08,
8299
+ "loss": 0.3306,
8300
+ "step": 29070
8301
+ },
8302
+ {
8303
+ "epoch": 58.2,
8304
+ "grad_norm": 50.21295928955078,
8305
+ "learning_rate": 2.219017698460002e-08,
8306
+ "loss": 0.2639,
8307
+ "step": 29100
8308
+ },
8309
+ {
8310
+ "epoch": 58.26,
8311
+ "grad_norm": 34.72473907470703,
8312
+ "learning_rate": 2.0736493974071736e-08,
8313
+ "loss": 0.2776,
8314
+ "step": 29130
8315
+ },
8316
+ {
8317
+ "epoch": 58.32,
8318
+ "grad_norm": 47.885765075683594,
8319
+ "learning_rate": 1.9331954284137476e-08,
8320
+ "loss": 0.2702,
8321
+ "step": 29160
8322
+ },
8323
+ {
8324
+ "epoch": 58.38,
8325
+ "grad_norm": 48.69330978393555,
8326
+ "learning_rate": 1.7976571777038044e-08,
8327
+ "loss": 0.2764,
8328
+ "step": 29190
8329
+ },
8330
+ {
8331
+ "epoch": 58.44,
8332
+ "grad_norm": 48.01133728027344,
8333
+ "learning_rate": 1.6670359829850657e-08,
8334
+ "loss": 0.2787,
8335
+ "step": 29220
8336
+ },
8337
+ {
8338
+ "epoch": 58.5,
8339
+ "grad_norm": 38.076595306396484,
8340
+ "learning_rate": 1.541333133436018e-08,
8341
+ "loss": 0.3156,
8342
+ "step": 29250
8343
+ },
8344
+ {
8345
+ "epoch": 58.56,
8346
+ "grad_norm": 77.71937561035156,
8347
+ "learning_rate": 1.4205498696930332e-08,
8348
+ "loss": 0.2821,
8349
+ "step": 29280
8350
+ },
8351
+ {
8352
+ "epoch": 58.62,
8353
+ "grad_norm": 69.0176010131836,
8354
+ "learning_rate": 1.3046873838381546e-08,
8355
+ "loss": 0.2954,
8356
+ "step": 29310
8357
+ },
8358
+ {
8359
+ "epoch": 58.68,
8360
+ "grad_norm": 43.61737823486328,
8361
+ "learning_rate": 1.1937468193873869e-08,
8362
+ "loss": 0.2688,
8363
+ "step": 29340
8364
+ },
8365
+ {
8366
+ "epoch": 58.74,
8367
+ "grad_norm": 48.39431381225586,
8368
+ "learning_rate": 1.0877292712792586e-08,
8369
+ "loss": 0.2566,
8370
+ "step": 29370
8371
+ },
8372
+ {
8373
+ "epoch": 58.8,
8374
+ "grad_norm": 66.10430908203125,
8375
+ "learning_rate": 9.866357858642206e-09,
8376
+ "loss": 0.2634,
8377
+ "step": 29400
8378
+ },
8379
+ {
8380
+ "epoch": 58.86,
8381
+ "grad_norm": 147.0448760986328,
8382
+ "learning_rate": 8.904673608940983e-09,
8383
+ "loss": 0.3025,
8384
+ "step": 29430
8385
+ },
8386
+ {
8387
+ "epoch": 58.92,
8388
+ "grad_norm": 52.136348724365234,
8389
+ "learning_rate": 7.992249455124889e-09,
8390
+ "loss": 0.3041,
8391
+ "step": 29460
8392
+ },
8393
+ {
8394
+ "epoch": 58.98,
8395
+ "grad_norm": 63.46728515625,
8396
+ "learning_rate": 7.129094402451575e-09,
8397
+ "loss": 0.2693,
8398
+ "step": 29490
8399
+ },
8400
+ {
8401
+ "epoch": 59.0,
8402
+ "eval_loss": 0.2272312492132187,
8403
+ "eval_map": 0.8302,
8404
+ "eval_map_50": 0.9765,
8405
+ "eval_map_75": 0.9394,
8406
+ "eval_map_chicken": 0.8148,
8407
+ "eval_map_duck": 0.8005,
8408
+ "eval_map_large": 0.9097,
8409
+ "eval_map_medium": 0.8372,
8410
+ "eval_map_plant": 0.8752,
8411
+ "eval_map_small": 0.3768,
8412
+ "eval_mar_1": 0.3092,
8413
+ "eval_mar_10": 0.8633,
8414
+ "eval_mar_100": 0.8673,
8415
+ "eval_mar_100_chicken": 0.852,
8416
+ "eval_mar_100_duck": 0.832,
8417
+ "eval_mar_100_plant": 0.9179,
8418
+ "eval_mar_large": 0.9469,
8419
+ "eval_mar_medium": 0.8825,
8420
+ "eval_mar_small": 0.4523,
8421
+ "eval_runtime": 10.2822,
8422
+ "eval_samples_per_second": 9.726,
8423
+ "eval_steps_per_second": 1.264,
8424
+ "step": 29500
8425
  }
8426
  ],
8427
  "logging_steps": 30,
 
8441
  "attributes": {}
8442
  }
8443
  },
8444
+ "total_flos": 1.01486818308096e+19,
8445
  "train_batch_size": 2,
8446
  "trial_name": null,
8447
  "trial_params": null