mijungkim committed on
Commit
251564b
1 Parent(s): afaa0e0

End of training

Browse files
all_results.json CHANGED
@@ -1,17 +1,17 @@
1
  {
2
  "epoch": 21.28,
3
- "eval_accuracy": 0.9908389585342333,
4
- "eval_f1": 0.9868823000898472,
5
- "eval_loss": 0.05581057444214821,
6
- "eval_precision": 0.9845822875582646,
7
  "eval_recall": 0.989193083573487,
8
- "eval_runtime": 15.2739,
9
  "eval_samples": 189,
10
- "eval_samples_per_second": 12.374,
11
- "eval_steps_per_second": 0.786,
12
- "train_loss": 0.1608761215209961,
13
- "train_runtime": 1880.5995,
14
  "train_samples": 752,
15
- "train_samples_per_second": 8.508,
16
- "train_steps_per_second": 0.532
17
  }
 
1
  {
2
  "epoch": 21.28,
3
+ "eval_accuracy": 0.9905978784956606,
4
+ "eval_f1": 0.9879474725670084,
5
+ "eval_loss": 0.058533914387226105,
6
+ "eval_precision": 0.986704994610133,
7
  "eval_recall": 0.989193083573487,
8
+ "eval_runtime": 13.9248,
9
  "eval_samples": 189,
10
+ "eval_samples_per_second": 13.573,
11
+ "eval_steps_per_second": 0.862,
12
+ "train_loss": 0.16068801975250244,
13
+ "train_runtime": 1757.2853,
14
  "train_samples": 752,
15
+ "train_samples_per_second": 9.105,
16
+ "train_steps_per_second": 0.569
17
  }
eval_results.json CHANGED
@@ -1,12 +1,12 @@
1
  {
2
  "epoch": 21.28,
3
- "eval_accuracy": 0.9908389585342333,
4
- "eval_f1": 0.9868823000898472,
5
- "eval_loss": 0.05581057444214821,
6
- "eval_precision": 0.9845822875582646,
7
  "eval_recall": 0.989193083573487,
8
- "eval_runtime": 15.2739,
9
  "eval_samples": 189,
10
- "eval_samples_per_second": 12.374,
11
- "eval_steps_per_second": 0.786
12
  }
 
1
  {
2
  "epoch": 21.28,
3
+ "eval_accuracy": 0.9905978784956606,
4
+ "eval_f1": 0.9879474725670084,
5
+ "eval_loss": 0.058533914387226105,
6
+ "eval_precision": 0.986704994610133,
7
  "eval_recall": 0.989193083573487,
8
+ "eval_runtime": 13.9248,
9
  "eval_samples": 189,
10
+ "eval_samples_per_second": 13.573,
11
+ "eval_steps_per_second": 0.862
12
  }
runs/Dec20_22-54-58_pod-pasha/events.out.tfevents.1671578896.pod-pasha.546411.2 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:8f1f54c44016fdcb07e7ab4264c1d91bc832540bcb358903a19844908e93caed
3
+ size 512
train_results.json CHANGED
@@ -1,8 +1,8 @@
1
  {
2
  "epoch": 21.28,
3
- "train_loss": 0.1608761215209961,
4
- "train_runtime": 1880.5995,
5
  "train_samples": 752,
6
- "train_samples_per_second": 8.508,
7
- "train_steps_per_second": 0.532
8
  }
 
1
  {
2
  "epoch": 21.28,
3
+ "train_loss": 0.16068801975250244,
4
+ "train_runtime": 1757.2853,
5
  "train_samples": 752,
6
+ "train_samples_per_second": 9.105,
7
+ "train_steps_per_second": 0.569
8
  }
trainer_state.json CHANGED
@@ -1,6 +1,6 @@
1
  {
2
- "best_metric": 0.9868823000898472,
3
- "best_model_checkpoint": "pasha/checkpoint-1000",
4
  "epoch": 21.27659574468085,
5
  "global_step": 1000,
6
  "is_hyper_param_search": false,
@@ -9,144 +9,144 @@
9
  "log_history": [
10
  {
11
  "epoch": 2.13,
12
- "eval_accuracy": 0.9566055930568949,
13
- "eval_f1": 0.9482633863965269,
14
- "eval_loss": 0.2661653161048889,
15
- "eval_precision": 0.9523982558139535,
16
- "eval_recall": 0.944164265129683,
17
- "eval_runtime": 15.4131,
18
- "eval_samples_per_second": 12.262,
19
- "eval_steps_per_second": 0.779,
20
  "step": 100
21
  },
22
  {
23
  "epoch": 4.26,
24
- "eval_accuracy": 0.9850530376084861,
25
- "eval_f1": 0.9795185052102047,
26
- "eval_loss": 0.1026068776845932,
27
- "eval_precision": 0.9770609318996416,
28
- "eval_recall": 0.9819884726224783,
29
- "eval_runtime": 15.204,
30
- "eval_samples_per_second": 12.431,
31
- "eval_steps_per_second": 0.789,
32
  "step": 200
33
  },
34
  {
35
  "epoch": 6.38,
36
- "eval_accuracy": 0.9884281581485053,
37
- "eval_f1": 0.9849137931034483,
38
- "eval_loss": 0.07217290997505188,
39
- "eval_precision": 0.9820916905444126,
40
- "eval_recall": 0.9877521613832853,
41
- "eval_runtime": 15.2143,
42
- "eval_samples_per_second": 12.423,
43
- "eval_steps_per_second": 0.789,
44
  "step": 300
45
  },
46
  {
47
  "epoch": 8.51,
48
- "eval_accuracy": 0.9891513982642237,
49
- "eval_f1": 0.9857785778577858,
50
- "eval_loss": 0.060767240822315216,
51
- "eval_precision": 0.9852464915437208,
52
- "eval_recall": 0.9863112391930836,
53
- "eval_runtime": 15.3275,
54
- "eval_samples_per_second": 12.331,
55
- "eval_steps_per_second": 0.783,
56
  "step": 400
57
  },
58
  {
59
  "epoch": 10.64,
60
  "learning_rate": 5e-06,
61
- "loss": 0.2962,
62
  "step": 500
63
  },
64
  {
65
  "epoch": 10.64,
66
- "eval_accuracy": 0.9889103182256509,
67
- "eval_f1": 0.9854185418541853,
68
- "eval_loss": 0.060581281781196594,
69
- "eval_precision": 0.9848866498740554,
70
- "eval_recall": 0.9859510086455331,
71
- "eval_runtime": 14.8027,
72
- "eval_samples_per_second": 12.768,
73
- "eval_steps_per_second": 0.811,
74
  "step": 500
75
  },
76
  {
77
  "epoch": 12.77,
78
- "eval_accuracy": 0.9920443587270974,
79
- "eval_f1": 0.988501616960115,
80
- "eval_loss": 0.0517994724214077,
81
- "eval_precision": 0.986021505376344,
82
- "eval_recall": 0.9909942363112392,
83
- "eval_runtime": 14.7335,
84
- "eval_samples_per_second": 12.828,
85
- "eval_steps_per_second": 0.814,
86
  "step": 600
87
  },
88
  {
89
  "epoch": 14.89,
90
- "eval_accuracy": 0.9922854387656702,
91
- "eval_f1": 0.988679245283019,
92
- "eval_loss": 0.052589546889066696,
93
- "eval_precision": 0.9863750448189316,
94
- "eval_recall": 0.9909942363112392,
95
- "eval_runtime": 14.9339,
96
- "eval_samples_per_second": 12.656,
97
- "eval_steps_per_second": 0.804,
98
  "step": 700
99
  },
100
  {
101
  "epoch": 17.02,
102
  "eval_accuracy": 0.991321118611379,
103
- "eval_f1": 0.9872416891284815,
104
- "eval_loss": 0.05428989231586456,
105
- "eval_precision": 0.984940839010398,
106
- "eval_recall": 0.9895533141210374,
107
- "eval_runtime": 14.8022,
108
- "eval_samples_per_second": 12.768,
109
- "eval_steps_per_second": 0.811,
110
  "step": 800
111
  },
112
  {
113
  "epoch": 19.15,
114
- "eval_accuracy": 0.9910800385728061,
115
- "eval_f1": 0.9867002156721782,
116
- "eval_loss": 0.05573796480894089,
117
- "eval_precision": 0.9845767575322812,
118
- "eval_recall": 0.9888328530259366,
119
- "eval_runtime": 14.7741,
120
- "eval_samples_per_second": 12.793,
121
- "eval_steps_per_second": 0.812,
122
  "step": 900
123
  },
124
  {
125
  "epoch": 21.28,
126
  "learning_rate": 0.0,
127
- "loss": 0.0255,
128
  "step": 1000
129
  },
130
  {
131
  "epoch": 21.28,
132
- "eval_accuracy": 0.9908389585342333,
133
- "eval_f1": 0.9868823000898472,
134
- "eval_loss": 0.05581057444214821,
135
- "eval_precision": 0.9845822875582646,
136
- "eval_recall": 0.989193083573487,
137
- "eval_runtime": 15.103,
138
- "eval_samples_per_second": 12.514,
139
- "eval_steps_per_second": 0.795,
140
  "step": 1000
141
  },
142
  {
143
  "epoch": 21.28,
144
  "step": 1000,
145
  "total_flos": 4247054450688000.0,
146
- "train_loss": 0.1608761215209961,
147
- "train_runtime": 1880.5995,
148
- "train_samples_per_second": 8.508,
149
- "train_steps_per_second": 0.532
150
  }
151
  ],
152
  "max_steps": 1000,
 
1
  {
2
+ "best_metric": 0.9879474725670084,
3
+ "best_model_checkpoint": "pasha/checkpoint-500",
4
  "epoch": 21.27659574468085,
5
  "global_step": 1000,
6
  "is_hyper_param_search": false,
 
9
  "log_history": [
10
  {
11
  "epoch": 2.13,
12
+ "eval_accuracy": 0.9570877531340405,
13
+ "eval_f1": 0.9485879797248371,
14
+ "eval_loss": 0.2664182484149933,
15
+ "eval_precision": 0.9534206695778749,
16
+ "eval_recall": 0.9438040345821326,
17
+ "eval_runtime": 13.9899,
18
+ "eval_samples_per_second": 13.51,
19
+ "eval_steps_per_second": 0.858,
20
  "step": 100
21
  },
22
  {
23
  "epoch": 4.26,
24
+ "eval_accuracy": 0.983847637415622,
25
+ "eval_f1": 0.9778975741239893,
26
+ "eval_loss": 0.10435084253549576,
27
+ "eval_precision": 0.9756185012549301,
28
+ "eval_recall": 0.9801873198847262,
29
+ "eval_runtime": 13.823,
30
+ "eval_samples_per_second": 13.673,
31
+ "eval_steps_per_second": 0.868,
32
  "step": 200
33
  },
34
  {
35
  "epoch": 6.38,
36
+ "eval_accuracy": 0.9903567984570878,
37
+ "eval_f1": 0.987601078167116,
38
+ "eval_loss": 0.06718672811985016,
39
+ "eval_precision": 0.9852993904625313,
40
+ "eval_recall": 0.9899135446685879,
41
+ "eval_runtime": 13.9839,
42
+ "eval_samples_per_second": 13.516,
43
+ "eval_steps_per_second": 0.858,
44
  "step": 300
45
  },
46
  {
47
  "epoch": 8.51,
48
+ "eval_accuracy": 0.9884281581485053,
49
+ "eval_f1": 0.9841783531103919,
50
+ "eval_loss": 0.06342343986034393,
51
+ "eval_precision": 0.9824120603015075,
52
+ "eval_recall": 0.9859510086455331,
53
+ "eval_runtime": 13.8826,
54
+ "eval_samples_per_second": 13.614,
55
+ "eval_steps_per_second": 0.864,
56
  "step": 400
57
  },
58
  {
59
  "epoch": 10.64,
60
  "learning_rate": 5e-06,
61
+ "loss": 0.2958,
62
  "step": 500
63
  },
64
  {
65
  "epoch": 10.64,
66
+ "eval_accuracy": 0.9905978784956606,
67
+ "eval_f1": 0.9879474725670084,
68
+ "eval_loss": 0.058533914387226105,
69
+ "eval_precision": 0.986704994610133,
70
+ "eval_recall": 0.989193083573487,
71
+ "eval_runtime": 13.739,
72
+ "eval_samples_per_second": 13.756,
73
+ "eval_steps_per_second": 0.873,
74
  "step": 500
75
  },
76
  {
77
  "epoch": 12.77,
78
+ "eval_accuracy": 0.9927675988428158,
79
+ "eval_f1": 0.9908322847384505,
80
+ "eval_loss": 0.051136456429958344,
81
+ "eval_precision": 0.9888769285970578,
82
+ "eval_recall": 0.9927953890489913,
83
+ "eval_runtime": 14.0393,
84
+ "eval_samples_per_second": 13.462,
85
+ "eval_steps_per_second": 0.855,
86
  "step": 600
87
  },
88
  {
89
  "epoch": 14.89,
90
+ "eval_accuracy": 0.992526518804243,
91
+ "eval_f1": 0.9895795903701042,
92
+ "eval_loss": 0.05025022476911545,
93
+ "eval_precision": 0.9870967741935484,
94
+ "eval_recall": 0.9920749279538905,
95
+ "eval_runtime": 14.0132,
96
+ "eval_samples_per_second": 13.487,
97
+ "eval_steps_per_second": 0.856,
98
  "step": 700
99
  },
100
  {
101
  "epoch": 17.02,
102
  "eval_accuracy": 0.991321118611379,
103
+ "eval_f1": 0.9881380301941048,
104
+ "eval_loss": 0.05291323363780975,
105
+ "eval_precision": 0.9860114777618364,
106
+ "eval_recall": 0.9902737752161384,
107
+ "eval_runtime": 13.9493,
108
+ "eval_samples_per_second": 13.549,
109
+ "eval_steps_per_second": 0.86,
110
  "step": 800
111
  },
112
  {
113
  "epoch": 19.15,
114
+ "eval_accuracy": 0.9903567984570878,
115
+ "eval_f1": 0.986704994610133,
116
+ "eval_loss": 0.0581122450530529,
117
+ "eval_precision": 0.9842293906810036,
118
+ "eval_recall": 0.989193083573487,
119
+ "eval_runtime": 13.9545,
120
+ "eval_samples_per_second": 13.544,
121
+ "eval_steps_per_second": 0.86,
122
  "step": 900
123
  },
124
  {
125
  "epoch": 21.28,
126
  "learning_rate": 0.0,
127
+ "loss": 0.0256,
128
  "step": 1000
129
  },
130
  {
131
  "epoch": 21.28,
132
+ "eval_accuracy": 0.990115718418515,
133
+ "eval_f1": 0.9868775840373899,
134
+ "eval_loss": 0.057054802775382996,
135
+ "eval_precision": 0.984930032292788,
136
+ "eval_recall": 0.9888328530259366,
137
+ "eval_runtime": 14.2093,
138
+ "eval_samples_per_second": 13.301,
139
+ "eval_steps_per_second": 0.845,
140
  "step": 1000
141
  },
142
  {
143
  "epoch": 21.28,
144
  "step": 1000,
145
  "total_flos": 4247054450688000.0,
146
+ "train_loss": 0.16068801975250244,
147
+ "train_runtime": 1757.2853,
148
+ "train_samples_per_second": 9.105,
149
+ "train_steps_per_second": 0.569
150
  }
151
  ],
152
  "max_steps": 1000,