File size: 5,931 Bytes
7e270f3
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
134
135
136
137
138
139
140
141
142
143
144
145
146
147
148
149
150
151
152
153
154
155
156
157
158
159
160
161
162
163
164
165
166
167
168
169
170
171
172
173
174
175
176
177
178
179
180
181
182
183
184
185
186
187
188
189
190
191
192
193
194
195
196
197
198
199
200
201
202
203
204
205
206
207
208
209
210
211
212
213
214
215
216
217
218
219
220
221
222
223
224
225
226
227
228
229
230
231
232
{
  "best_metric": 0.13342921435832977,
  "best_model_checkpoint": "/home/dongyeop/owan0002/revision-preference/code/preference_classifier/coedit_t5/output_r1_iter_wo_p/checkpoint-405",
  "epoch": 20.0,
  "global_step": 540,
  "is_hyper_param_search": false,
  "is_local_process_zero": true,
  "is_world_process_zero": true,
  "log_history": [
    {
      "epoch": 1.0,
      "eval_bleu": 0.0,
      "eval_gen_len": 2.9953,
      "eval_loss": 0.2727777659893036,
      "eval_runtime": 10.2846,
      "eval_samples_per_second": 164.517,
      "eval_steps_per_second": 1.361,
      "step": 27
    },
    {
      "epoch": 2.0,
      "eval_bleu": 0.0,
      "eval_gen_len": 2.6791,
      "eval_loss": 0.26499590277671814,
      "eval_runtime": 9.934,
      "eval_samples_per_second": 170.324,
      "eval_steps_per_second": 1.409,
      "step": 54
    },
    {
      "epoch": 3.0,
      "eval_bleu": 0.0,
      "eval_gen_len": 2.1874,
      "eval_loss": 0.2637251317501068,
      "eval_runtime": 9.8272,
      "eval_samples_per_second": 172.175,
      "eval_steps_per_second": 1.425,
      "step": 81
    },
    {
      "epoch": 4.0,
      "eval_bleu": 0.0,
      "eval_gen_len": 2.2973,
      "eval_loss": 0.24176451563835144,
      "eval_runtime": 9.7849,
      "eval_samples_per_second": 172.92,
      "eval_steps_per_second": 1.431,
      "step": 108
    },
    {
      "epoch": 5.0,
      "eval_bleu": 0.0,
      "eval_gen_len": 2.2494,
      "eval_loss": 0.2737601399421692,
      "eval_runtime": 10.431,
      "eval_samples_per_second": 162.209,
      "eval_steps_per_second": 1.342,
      "step": 135
    },
    {
      "epoch": 6.0,
      "eval_bleu": 0.0,
      "eval_gen_len": 2.3812,
      "eval_loss": 0.19136066734790802,
      "eval_runtime": 9.9867,
      "eval_samples_per_second": 169.425,
      "eval_steps_per_second": 1.402,
      "step": 162
    },
    {
      "epoch": 7.0,
      "eval_bleu": 0.0,
      "eval_gen_len": 2.3983,
      "eval_loss": 0.16406123340129852,
      "eval_runtime": 9.9234,
      "eval_samples_per_second": 170.505,
      "eval_steps_per_second": 1.411,
      "step": 189
    },
    {
      "epoch": 8.0,
      "eval_bleu": 0.0,
      "eval_gen_len": 2.3995,
      "eval_loss": 0.16948193311691284,
      "eval_runtime": 10.0828,
      "eval_samples_per_second": 167.811,
      "eval_steps_per_second": 1.389,
      "step": 216
    },
    {
      "epoch": 9.0,
      "eval_bleu": 0.0,
      "eval_gen_len": 2.4167,
      "eval_loss": 0.15213139355182648,
      "eval_runtime": 9.7652,
      "eval_samples_per_second": 173.268,
      "eval_steps_per_second": 1.434,
      "step": 243
    },
    {
      "epoch": 10.0,
      "eval_bleu": 0.0,
      "eval_gen_len": 2.4167,
      "eval_loss": 0.15690775215625763,
      "eval_runtime": 9.8519,
      "eval_samples_per_second": 171.743,
      "eval_steps_per_second": 1.421,
      "step": 270
    },
    {
      "epoch": 11.0,
      "eval_bleu": 0.0,
      "eval_gen_len": 2.4137,
      "eval_loss": 0.16145527362823486,
      "eval_runtime": 9.771,
      "eval_samples_per_second": 173.166,
      "eval_steps_per_second": 1.433,
      "step": 297
    },
    {
      "epoch": 12.0,
      "eval_bleu": 0.0,
      "eval_gen_len": 2.4238,
      "eval_loss": 0.1473228484392166,
      "eval_runtime": 9.9975,
      "eval_samples_per_second": 169.242,
      "eval_steps_per_second": 1.4,
      "step": 324
    },
    {
      "epoch": 13.0,
      "eval_bleu": 0.0,
      "eval_gen_len": 2.4255,
      "eval_loss": 0.13761219382286072,
      "eval_runtime": 9.8987,
      "eval_samples_per_second": 170.931,
      "eval_steps_per_second": 1.414,
      "step": 351
    },
    {
      "epoch": 14.0,
      "eval_bleu": 0.0,
      "eval_gen_len": 2.419,
      "eval_loss": 0.14949482679367065,
      "eval_runtime": 10.1968,
      "eval_samples_per_second": 165.935,
      "eval_steps_per_second": 1.373,
      "step": 378
    },
    {
      "epoch": 15.0,
      "eval_bleu": 0.0,
      "eval_gen_len": 2.432,
      "eval_loss": 0.13342921435832977,
      "eval_runtime": 9.9102,
      "eval_samples_per_second": 170.734,
      "eval_steps_per_second": 1.413,
      "step": 405
    },
    {
      "epoch": 16.0,
      "eval_bleu": 0.0,
      "eval_gen_len": 2.4214,
      "eval_loss": 0.1473984271287918,
      "eval_runtime": 9.8919,
      "eval_samples_per_second": 171.049,
      "eval_steps_per_second": 1.415,
      "step": 432
    },
    {
      "epoch": 17.0,
      "eval_bleu": 0.0,
      "eval_gen_len": 2.4291,
      "eval_loss": 0.1483658105134964,
      "eval_runtime": 9.911,
      "eval_samples_per_second": 170.72,
      "eval_steps_per_second": 1.413,
      "step": 459
    },
    {
      "epoch": 18.0,
      "eval_bleu": 0.0,
      "eval_gen_len": 2.4297,
      "eval_loss": 0.1407216191291809,
      "eval_runtime": 9.8716,
      "eval_samples_per_second": 171.4,
      "eval_steps_per_second": 1.418,
      "step": 486
    },
    {
      "epoch": 18.52,
      "learning_rate": 0.0001,
      "loss": 0.1905,
      "step": 500
    },
    {
      "epoch": 19.0,
      "eval_bleu": 0.0,
      "eval_gen_len": 2.4208,
      "eval_loss": 0.15682467818260193,
      "eval_runtime": 9.8237,
      "eval_samples_per_second": 172.237,
      "eval_steps_per_second": 1.425,
      "step": 513
    },
    {
      "epoch": 20.0,
      "eval_bleu": 0.0,
      "eval_gen_len": 2.4261,
      "eval_loss": 0.16313956677913666,
      "eval_runtime": 9.8505,
      "eval_samples_per_second": 171.767,
      "eval_steps_per_second": 1.421,
      "step": 540
    },
    {
      "epoch": 20.0,
      "step": 540,
      "total_flos": 2.4870877697304166e+17,
      "train_loss": 0.18235577079984877,
      "train_runtime": 3852.2155,
      "train_samples_per_second": 71.143,
      "train_steps_per_second": 0.14
    }
  ],
  "max_steps": 540,
  "num_train_epochs": 20,
  "total_flos": 2.4870877697304166e+17,
  "trial_name": null,
  "trial_params": null
}