Training in progress, epoch 148, checkpoint
Browse files
last-checkpoint/model.safetensors
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 166496880
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:a47898b6387ef2cfdf4a2494cac6d643001aa350b662f1ca1cff6c6341846cae
|
3 |
size 166496880
|
last-checkpoint/optimizer.pt
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 330495866
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:9fd2c0a7bf22601834502a8f53f12a6d808f34646649b87e6eb1f54f7f0d7f05
|
3 |
size 330495866
|
last-checkpoint/rng_state.pth
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 14244
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:622595e15d8d4adca4c438019feffee921460c3fc84414d13543954d20d79148
|
3 |
size 14244
|
last-checkpoint/scheduler.pt
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 1064
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:426b4b133f941dbc1b63fbe118d222c9115fbe2fd29b895828a7fd399389ce5d
|
3 |
size 1064
|
last-checkpoint/trainer_state.json
CHANGED
@@ -1,9 +1,9 @@
|
|
1 |
{
|
2 |
"best_metric": 0.29718613624572754,
|
3 |
"best_model_checkpoint": "chickens-composite-201616161616-150-epochs-wo-transform-metrics-test-shfld/checkpoint-49500",
|
4 |
-
"epoch":
|
5 |
"eval_steps": 500,
|
6 |
-
"global_step":
|
7 |
"is_hyper_param_search": false,
|
8 |
"is_local_process_zero": true,
|
9 |
"is_world_process_zero": true,
|
@@ -20979,6 +20979,144 @@
|
|
20979 |
"eval_samples_per_second": 15.477,
|
20980 |
"eval_steps_per_second": 2.012,
|
20981 |
"step": 73500
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
20982 |
}
|
20983 |
],
|
20984 |
"logging_steps": 30,
|
@@ -20998,7 +21136,7 @@
|
|
20998 |
"attributes": {}
|
20999 |
}
|
21000 |
},
|
21001 |
-
"total_flos": 2.
|
21002 |
"train_batch_size": 2,
|
21003 |
"trial_name": null,
|
21004 |
"trial_params": null
|
|
|
1 |
{
|
2 |
"best_metric": 0.29718613624572754,
|
3 |
"best_model_checkpoint": "chickens-composite-201616161616-150-epochs-wo-transform-metrics-test-shfld/checkpoint-49500",
|
4 |
+
"epoch": 148.0,
|
5 |
"eval_steps": 500,
|
6 |
+
"global_step": 74000,
|
7 |
"is_hyper_param_search": false,
|
8 |
"is_local_process_zero": true,
|
9 |
"is_world_process_zero": true,
|
|
|
20979 |
"eval_samples_per_second": 15.477,
|
20980 |
"eval_steps_per_second": 2.012,
|
20981 |
"step": 73500
|
20982 |
+
},
|
20983 |
+
{
|
20984 |
+
"epoch": 147.06,
|
20985 |
+
"grad_norm": 48.93723678588867,
|
20986 |
+
"learning_rate": 9.475773543818345e-09,
|
20987 |
+
"loss": 0.2219,
|
20988 |
+
"step": 73530
|
20989 |
+
},
|
20990 |
+
{
|
20991 |
+
"epoch": 147.12,
|
20992 |
+
"grad_norm": 57.43806076049805,
|
20993 |
+
"learning_rate": 9.09306994793635e-09,
|
20994 |
+
"loss": 0.2339,
|
20995 |
+
"step": 73560
|
20996 |
+
},
|
20997 |
+
{
|
20998 |
+
"epoch": 147.18,
|
20999 |
+
"grad_norm": 73.41053009033203,
|
21000 |
+
"learning_rate": 8.718247675337243e-09,
|
21001 |
+
"loss": 0.1919,
|
21002 |
+
"step": 73590
|
21003 |
+
},
|
21004 |
+
{
|
21005 |
+
"epoch": 147.24,
|
21006 |
+
"grad_norm": 77.83393096923828,
|
21007 |
+
"learning_rate": 8.351307317917002e-09,
|
21008 |
+
"loss": 0.204,
|
21009 |
+
"step": 73620
|
21010 |
+
},
|
21011 |
+
{
|
21012 |
+
"epoch": 147.3,
|
21013 |
+
"grad_norm": 54.583885192871094,
|
21014 |
+
"learning_rate": 7.992249455124889e-09,
|
21015 |
+
"loss": 0.2176,
|
21016 |
+
"step": 73650
|
21017 |
+
},
|
21018 |
+
{
|
21019 |
+
"epoch": 147.36,
|
21020 |
+
"grad_norm": 33.40181350708008,
|
21021 |
+
"learning_rate": 7.641074653961244e-09,
|
21022 |
+
"loss": 0.2189,
|
21023 |
+
"step": 73680
|
21024 |
+
},
|
21025 |
+
{
|
21026 |
+
"epoch": 147.42,
|
21027 |
+
"grad_norm": 16.970766067504883,
|
21028 |
+
"learning_rate": 7.297783468980246e-09,
|
21029 |
+
"loss": 0.2093,
|
21030 |
+
"step": 73710
|
21031 |
+
},
|
21032 |
+
{
|
21033 |
+
"epoch": 147.48,
|
21034 |
+
"grad_norm": 48.121337890625,
|
21035 |
+
"learning_rate": 6.962376442284368e-09,
|
21036 |
+
"loss": 0.2144,
|
21037 |
+
"step": 73740
|
21038 |
+
},
|
21039 |
+
{
|
21040 |
+
"epoch": 147.54,
|
21041 |
+
"grad_norm": 57.12207794189453,
|
21042 |
+
"learning_rate": 6.63485410352771e-09,
|
21043 |
+
"loss": 0.2085,
|
21044 |
+
"step": 73770
|
21045 |
+
},
|
21046 |
+
{
|
21047 |
+
"epoch": 147.6,
|
21048 |
+
"grad_norm": 92.21527099609375,
|
21049 |
+
"learning_rate": 6.315216969912663e-09,
|
21050 |
+
"loss": 0.1927,
|
21051 |
+
"step": 73800
|
21052 |
+
},
|
21053 |
+
{
|
21054 |
+
"epoch": 147.66,
|
21055 |
+
"grad_norm": 33.92885208129883,
|
21056 |
+
"learning_rate": 6.003465546189358e-09,
|
21057 |
+
"loss": 0.2022,
|
21058 |
+
"step": 73830
|
21059 |
+
},
|
21060 |
+
{
|
21061 |
+
"epoch": 147.72,
|
21062 |
+
"grad_norm": 45.98738479614258,
|
21063 |
+
"learning_rate": 5.699600324657328e-09,
|
21064 |
+
"loss": 0.1957,
|
21065 |
+
"step": 73860
|
21066 |
+
},
|
21067 |
+
{
|
21068 |
+
"epoch": 147.78,
|
21069 |
+
"grad_norm": 80.80580139160156,
|
21070 |
+
"learning_rate": 5.403621785159407e-09,
|
21071 |
+
"loss": 0.2206,
|
21072 |
+
"step": 73890
|
21073 |
+
},
|
21074 |
+
{
|
21075 |
+
"epoch": 147.84,
|
21076 |
+
"grad_norm": 38.10297393798828,
|
21077 |
+
"learning_rate": 5.115530395087276e-09,
|
21078 |
+
"loss": 0.211,
|
21079 |
+
"step": 73920
|
21080 |
+
},
|
21081 |
+
{
|
21082 |
+
"epoch": 147.9,
|
21083 |
+
"grad_norm": 61.57286071777344,
|
21084 |
+
"learning_rate": 4.835326609376468e-09,
|
21085 |
+
"loss": 0.2167,
|
21086 |
+
"step": 73950
|
21087 |
+
},
|
21088 |
+
{
|
21089 |
+
"epoch": 147.96,
|
21090 |
+
"grad_norm": 37.9475212097168,
|
21091 |
+
"learning_rate": 4.5630108705063684e-09,
|
21092 |
+
"loss": 0.19,
|
21093 |
+
"step": 73980
|
21094 |
+
},
|
21095 |
+
{
|
21096 |
+
"epoch": 148.0,
|
21097 |
+
"eval_loss": 0.3058013916015625,
|
21098 |
+
"eval_map": 0.8044,
|
21099 |
+
"eval_map_50": 0.9405,
|
21100 |
+
"eval_map_75": 0.9024,
|
21101 |
+
"eval_map_chicken": 0.7936,
|
21102 |
+
"eval_map_duck": 0.7475,
|
21103 |
+
"eval_map_large": 0.7843,
|
21104 |
+
"eval_map_medium": 0.8141,
|
21105 |
+
"eval_map_plant": 0.8722,
|
21106 |
+
"eval_map_small": 0.2979,
|
21107 |
+
"eval_mar_1": 0.3221,
|
21108 |
+
"eval_mar_10": 0.8382,
|
21109 |
+
"eval_mar_100": 0.8419,
|
21110 |
+
"eval_mar_100_chicken": 0.844,
|
21111 |
+
"eval_mar_100_duck": 0.7804,
|
21112 |
+
"eval_mar_100_plant": 0.9012,
|
21113 |
+
"eval_mar_large": 0.8145,
|
21114 |
+
"eval_mar_medium": 0.8546,
|
21115 |
+
"eval_mar_small": 0.3829,
|
21116 |
+
"eval_runtime": 6.6213,
|
21117 |
+
"eval_samples_per_second": 15.103,
|
21118 |
+
"eval_steps_per_second": 1.963,
|
21119 |
+
"step": 74000
|
21120 |
}
|
21121 |
],
|
21122 |
"logging_steps": 30,
|
|
|
21136 |
"attributes": {}
|
21137 |
}
|
21138 |
},
|
21139 |
+
"total_flos": 2.54577103552512e+19,
|
21140 |
"train_batch_size": 2,
|
21141 |
"trial_name": null,
|
21142 |
"trial_params": null
|