joe611 commited on
Commit
45dd777
1 Parent(s): 0be084f

Training in progress, epoch 148, checkpoint

Browse files
last-checkpoint/model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:de0075c09765f4217cb4598585d60460dff05ad3e0e7e110b00dcc6cc35df35f
3
  size 166496880
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:a47898b6387ef2cfdf4a2494cac6d643001aa350b662f1ca1cff6c6341846cae
3
  size 166496880
last-checkpoint/optimizer.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:ae21a489ed46c86157d9abebc2ebce7ee2cf5d70cc339aa20c63463b1dec1a1c
3
  size 330495866
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:9fd2c0a7bf22601834502a8f53f12a6d808f34646649b87e6eb1f54f7f0d7f05
3
  size 330495866
last-checkpoint/rng_state.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:3c307610f491951f0cf2efdd73180e72af7240ce4aa6a43b10a13ac774ffd0e4
3
  size 14244
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:622595e15d8d4adca4c438019feffee921460c3fc84414d13543954d20d79148
3
  size 14244
last-checkpoint/scheduler.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:85f02b07cdec64767b23910029cd704b2c6b794d3aac44d543a26849f5211b68
3
  size 1064
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:426b4b133f941dbc1b63fbe118d222c9115fbe2fd29b895828a7fd399389ce5d
3
  size 1064
last-checkpoint/trainer_state.json CHANGED
@@ -1,9 +1,9 @@
1
  {
2
  "best_metric": 0.29718613624572754,
3
  "best_model_checkpoint": "chickens-composite-201616161616-150-epochs-wo-transform-metrics-test-shfld/checkpoint-49500",
4
- "epoch": 147.0,
5
  "eval_steps": 500,
6
- "global_step": 73500,
7
  "is_hyper_param_search": false,
8
  "is_local_process_zero": true,
9
  "is_world_process_zero": true,
@@ -20979,6 +20979,144 @@
20979
  "eval_samples_per_second": 15.477,
20980
  "eval_steps_per_second": 2.012,
20981
  "step": 73500
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
20982
  }
20983
  ],
20984
  "logging_steps": 30,
@@ -20998,7 +21136,7 @@
20998
  "attributes": {}
20999
  }
21000
  },
21001
- "total_flos": 2.52856987987968e+19,
21002
  "train_batch_size": 2,
21003
  "trial_name": null,
21004
  "trial_params": null
 
1
  {
2
  "best_metric": 0.29718613624572754,
3
  "best_model_checkpoint": "chickens-composite-201616161616-150-epochs-wo-transform-metrics-test-shfld/checkpoint-49500",
4
+ "epoch": 148.0,
5
  "eval_steps": 500,
6
+ "global_step": 74000,
7
  "is_hyper_param_search": false,
8
  "is_local_process_zero": true,
9
  "is_world_process_zero": true,
 
20979
  "eval_samples_per_second": 15.477,
20980
  "eval_steps_per_second": 2.012,
20981
  "step": 73500
20982
+ },
20983
+ {
20984
+ "epoch": 147.06,
20985
+ "grad_norm": 48.93723678588867,
20986
+ "learning_rate": 9.475773543818345e-09,
20987
+ "loss": 0.2219,
20988
+ "step": 73530
20989
+ },
20990
+ {
20991
+ "epoch": 147.12,
20992
+ "grad_norm": 57.43806076049805,
20993
+ "learning_rate": 9.09306994793635e-09,
20994
+ "loss": 0.2339,
20995
+ "step": 73560
20996
+ },
20997
+ {
20998
+ "epoch": 147.18,
20999
+ "grad_norm": 73.41053009033203,
21000
+ "learning_rate": 8.718247675337243e-09,
21001
+ "loss": 0.1919,
21002
+ "step": 73590
21003
+ },
21004
+ {
21005
+ "epoch": 147.24,
21006
+ "grad_norm": 77.83393096923828,
21007
+ "learning_rate": 8.351307317917002e-09,
21008
+ "loss": 0.204,
21009
+ "step": 73620
21010
+ },
21011
+ {
21012
+ "epoch": 147.3,
21013
+ "grad_norm": 54.583885192871094,
21014
+ "learning_rate": 7.992249455124889e-09,
21015
+ "loss": 0.2176,
21016
+ "step": 73650
21017
+ },
21018
+ {
21019
+ "epoch": 147.36,
21020
+ "grad_norm": 33.40181350708008,
21021
+ "learning_rate": 7.641074653961244e-09,
21022
+ "loss": 0.2189,
21023
+ "step": 73680
21024
+ },
21025
+ {
21026
+ "epoch": 147.42,
21027
+ "grad_norm": 16.970766067504883,
21028
+ "learning_rate": 7.297783468980246e-09,
21029
+ "loss": 0.2093,
21030
+ "step": 73710
21031
+ },
21032
+ {
21033
+ "epoch": 147.48,
21034
+ "grad_norm": 48.121337890625,
21035
+ "learning_rate": 6.962376442284368e-09,
21036
+ "loss": 0.2144,
21037
+ "step": 73740
21038
+ },
21039
+ {
21040
+ "epoch": 147.54,
21041
+ "grad_norm": 57.12207794189453,
21042
+ "learning_rate": 6.63485410352771e-09,
21043
+ "loss": 0.2085,
21044
+ "step": 73770
21045
+ },
21046
+ {
21047
+ "epoch": 147.6,
21048
+ "grad_norm": 92.21527099609375,
21049
+ "learning_rate": 6.315216969912663e-09,
21050
+ "loss": 0.1927,
21051
+ "step": 73800
21052
+ },
21053
+ {
21054
+ "epoch": 147.66,
21055
+ "grad_norm": 33.92885208129883,
21056
+ "learning_rate": 6.003465546189358e-09,
21057
+ "loss": 0.2022,
21058
+ "step": 73830
21059
+ },
21060
+ {
21061
+ "epoch": 147.72,
21062
+ "grad_norm": 45.98738479614258,
21063
+ "learning_rate": 5.699600324657328e-09,
21064
+ "loss": 0.1957,
21065
+ "step": 73860
21066
+ },
21067
+ {
21068
+ "epoch": 147.78,
21069
+ "grad_norm": 80.80580139160156,
21070
+ "learning_rate": 5.403621785159407e-09,
21071
+ "loss": 0.2206,
21072
+ "step": 73890
21073
+ },
21074
+ {
21075
+ "epoch": 147.84,
21076
+ "grad_norm": 38.10297393798828,
21077
+ "learning_rate": 5.115530395087276e-09,
21078
+ "loss": 0.211,
21079
+ "step": 73920
21080
+ },
21081
+ {
21082
+ "epoch": 147.9,
21083
+ "grad_norm": 61.57286071777344,
21084
+ "learning_rate": 4.835326609376468e-09,
21085
+ "loss": 0.2167,
21086
+ "step": 73950
21087
+ },
21088
+ {
21089
+ "epoch": 147.96,
21090
+ "grad_norm": 37.9475212097168,
21091
+ "learning_rate": 4.5630108705063684e-09,
21092
+ "loss": 0.19,
21093
+ "step": 73980
21094
+ },
21095
+ {
21096
+ "epoch": 148.0,
21097
+ "eval_loss": 0.3058013916015625,
21098
+ "eval_map": 0.8044,
21099
+ "eval_map_50": 0.9405,
21100
+ "eval_map_75": 0.9024,
21101
+ "eval_map_chicken": 0.7936,
21102
+ "eval_map_duck": 0.7475,
21103
+ "eval_map_large": 0.7843,
21104
+ "eval_map_medium": 0.8141,
21105
+ "eval_map_plant": 0.8722,
21106
+ "eval_map_small": 0.2979,
21107
+ "eval_mar_1": 0.3221,
21108
+ "eval_mar_10": 0.8382,
21109
+ "eval_mar_100": 0.8419,
21110
+ "eval_mar_100_chicken": 0.844,
21111
+ "eval_mar_100_duck": 0.7804,
21112
+ "eval_mar_100_plant": 0.9012,
21113
+ "eval_mar_large": 0.8145,
21114
+ "eval_mar_medium": 0.8546,
21115
+ "eval_mar_small": 0.3829,
21116
+ "eval_runtime": 6.6213,
21117
+ "eval_samples_per_second": 15.103,
21118
+ "eval_steps_per_second": 1.963,
21119
+ "step": 74000
21120
  }
21121
  ],
21122
  "logging_steps": 30,
 
21136
  "attributes": {}
21137
  }
21138
  },
21139
+ "total_flos": 2.54577103552512e+19,
21140
  "train_batch_size": 2,
21141
  "trial_name": null,
21142
  "trial_params": null