rachidsaid committed on
Commit
15b6d62
1 Parent(s): 80cf076

End of training

Browse files
all_results.json CHANGED
@@ -1,8 +1,8 @@
1
  {
2
  "epoch": 3.23,
3
- "eval_accuracy": 0.7870967741935484,
4
- "eval_loss": 0.4868558943271637,
5
- "eval_runtime": 149.4696,
6
- "eval_samples_per_second": 1.037,
7
- "eval_steps_per_second": 0.134
8
  }
 
1
  {
2
  "epoch": 3.23,
3
+ "eval_accuracy": 0.8516129032258064,
4
+ "eval_loss": 0.4354906678199768,
5
+ "eval_runtime": 104.5631,
6
+ "eval_samples_per_second": 1.482,
7
+ "eval_steps_per_second": 0.191
8
  }
runs/Jul03_15-16-36_e0f8396b976e/events.out.tfevents.1688400695.e0f8396b976e.796.1 CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:eb7e9382ba8ddf43421e952986d1a49a76ab7015bd1e2b2b3ece8f20c94a2029
3
- size 411
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:47b1f245da788e2cdbbbdcb211b26336f171c77bbd4c4571879c30a2175d83e2
3
+ size 734
test_results.json CHANGED
@@ -1,8 +1,8 @@
1
  {
2
  "epoch": 3.23,
3
- "eval_accuracy": 0.7870967741935484,
4
- "eval_loss": 0.4868558943271637,
5
- "eval_runtime": 149.4696,
6
- "eval_samples_per_second": 1.037,
7
- "eval_steps_per_second": 0.134
8
  }
 
1
  {
2
  "epoch": 3.23,
3
+ "eval_accuracy": 0.8516129032258064,
4
+ "eval_loss": 0.4354906678199768,
5
+ "eval_runtime": 104.5631,
6
+ "eval_samples_per_second": 1.482,
7
+ "eval_steps_per_second": 0.191
8
  }
trainer_state.json CHANGED
@@ -10,148 +10,148 @@
10
  {
11
  "epoch": 0.07,
12
  "learning_rate": 3.3333333333333335e-05,
13
- "loss": 2.2791,
14
  "step": 10
15
  },
16
  {
17
  "epoch": 0.14,
18
  "learning_rate": 4.81203007518797e-05,
19
- "loss": 2.1704,
20
  "step": 20
21
  },
22
  {
23
  "epoch": 0.2,
24
  "learning_rate": 4.43609022556391e-05,
25
- "loss": 2.1335,
26
  "step": 30
27
  },
28
  {
29
  "epoch": 0.26,
30
- "eval_accuracy": 0.5142857142857142,
31
- "eval_loss": 1.8132479190826416,
32
- "eval_runtime": 45.5282,
33
- "eval_samples_per_second": 1.538,
34
- "eval_steps_per_second": 0.198,
35
  "step": 38
36
  },
37
  {
38
  "epoch": 1.01,
39
  "learning_rate": 4.0601503759398494e-05,
40
- "loss": 2.0233,
41
  "step": 40
42
  },
43
  {
44
  "epoch": 1.08,
45
  "learning_rate": 3.6842105263157895e-05,
46
- "loss": 1.5915,
47
  "step": 50
48
  },
49
  {
50
  "epoch": 1.15,
51
  "learning_rate": 3.3082706766917295e-05,
52
- "loss": 1.2445,
53
  "step": 60
54
  },
55
  {
56
  "epoch": 1.22,
57
  "learning_rate": 2.9323308270676693e-05,
58
- "loss": 0.9301,
59
  "step": 70
60
  },
61
  {
62
  "epoch": 1.26,
63
- "eval_accuracy": 0.7714285714285715,
64
- "eval_loss": 0.8595510125160217,
65
- "eval_runtime": 66.0517,
66
- "eval_samples_per_second": 1.06,
67
- "eval_steps_per_second": 0.136,
68
  "step": 76
69
  },
70
  {
71
  "epoch": 2.03,
72
  "learning_rate": 2.556390977443609e-05,
73
- "loss": 0.8006,
74
  "step": 80
75
  },
76
  {
77
  "epoch": 2.09,
78
  "learning_rate": 2.1804511278195487e-05,
79
- "loss": 0.664,
80
  "step": 90
81
  },
82
  {
83
  "epoch": 2.16,
84
  "learning_rate": 1.8045112781954888e-05,
85
- "loss": 0.5401,
86
  "step": 100
87
  },
88
  {
89
  "epoch": 2.23,
90
  "learning_rate": 1.4285714285714285e-05,
91
- "loss": 0.4422,
92
  "step": 110
93
  },
94
  {
95
  "epoch": 2.26,
96
- "eval_accuracy": 0.8714285714285714,
97
- "eval_loss": 0.500382125377655,
98
- "eval_runtime": 69.7054,
99
- "eval_samples_per_second": 1.004,
100
- "eval_steps_per_second": 0.129,
101
  "step": 114
102
  },
103
  {
104
  "epoch": 3.04,
105
  "learning_rate": 1.0526315789473684e-05,
106
- "loss": 0.3282,
107
  "step": 120
108
  },
109
  {
110
  "epoch": 3.11,
111
  "learning_rate": 6.766917293233083e-06,
112
- "loss": 0.3011,
113
  "step": 130
114
  },
115
  {
116
  "epoch": 3.18,
117
  "learning_rate": 3.007518796992481e-06,
118
- "loss": 0.2828,
119
  "step": 140
120
  },
121
  {
122
  "epoch": 3.23,
123
  "eval_accuracy": 0.9142857142857143,
124
- "eval_loss": 0.37309029698371887,
125
- "eval_runtime": 70.3365,
126
- "eval_samples_per_second": 0.995,
127
- "eval_steps_per_second": 0.128,
128
  "step": 148
129
  },
130
  {
131
  "epoch": 3.23,
132
  "step": 148,
133
  "total_flos": 1.460491890402263e+18,
134
- "train_loss": 1.0764089355597626,
135
- "train_runtime": 3191.3076,
136
- "train_samples_per_second": 0.371,
137
- "train_steps_per_second": 0.046
138
  },
139
  {
140
  "epoch": 3.23,
141
- "eval_accuracy": 0.7870967741935484,
142
- "eval_loss": 0.4868559241294861,
143
- "eval_runtime": 150.5785,
144
- "eval_samples_per_second": 1.029,
145
- "eval_steps_per_second": 0.133,
146
  "step": 148
147
  },
148
  {
149
  "epoch": 3.23,
150
- "eval_accuracy": 0.7870967741935484,
151
- "eval_loss": 0.4868558943271637,
152
- "eval_runtime": 149.4696,
153
- "eval_samples_per_second": 1.037,
154
- "eval_steps_per_second": 0.134,
155
  "step": 148
156
  }
157
  ],
 
10
  {
11
  "epoch": 0.07,
12
  "learning_rate": 3.3333333333333335e-05,
13
+ "loss": 2.2591,
14
  "step": 10
15
  },
16
  {
17
  "epoch": 0.14,
18
  "learning_rate": 4.81203007518797e-05,
19
+ "loss": 2.2132,
20
  "step": 20
21
  },
22
  {
23
  "epoch": 0.2,
24
  "learning_rate": 4.43609022556391e-05,
25
+ "loss": 2.1351,
26
  "step": 30
27
  },
28
  {
29
  "epoch": 0.26,
30
+ "eval_accuracy": 0.6285714285714286,
31
+ "eval_loss": 1.6582270860671997,
32
+ "eval_runtime": 48.1772,
33
+ "eval_samples_per_second": 1.453,
34
+ "eval_steps_per_second": 0.187,
35
  "step": 38
36
  },
37
  {
38
  "epoch": 1.01,
39
  "learning_rate": 4.0601503759398494e-05,
40
+ "loss": 1.9093,
41
  "step": 40
42
  },
43
  {
44
  "epoch": 1.08,
45
  "learning_rate": 3.6842105263157895e-05,
46
+ "loss": 1.5111,
47
  "step": 50
48
  },
49
  {
50
  "epoch": 1.15,
51
  "learning_rate": 3.3082706766917295e-05,
52
+ "loss": 1.1256,
53
  "step": 60
54
  },
55
  {
56
  "epoch": 1.22,
57
  "learning_rate": 2.9323308270676693e-05,
58
+ "loss": 0.7409,
59
  "step": 70
60
  },
61
  {
62
  "epoch": 1.26,
63
+ "eval_accuracy": 0.7142857142857143,
64
+ "eval_loss": 0.8406534194946289,
65
+ "eval_runtime": 39.133,
66
+ "eval_samples_per_second": 1.789,
67
+ "eval_steps_per_second": 0.23,
68
  "step": 76
69
  },
70
  {
71
  "epoch": 2.03,
72
  "learning_rate": 2.556390977443609e-05,
73
+ "loss": 0.8077,
74
  "step": 80
75
  },
76
  {
77
  "epoch": 2.09,
78
  "learning_rate": 2.1804511278195487e-05,
79
+ "loss": 0.5975,
80
  "step": 90
81
  },
82
  {
83
  "epoch": 2.16,
84
  "learning_rate": 1.8045112781954888e-05,
85
+ "loss": 0.6191,
86
  "step": 100
87
  },
88
  {
89
  "epoch": 2.23,
90
  "learning_rate": 1.4285714285714285e-05,
91
+ "loss": 0.4333,
92
  "step": 110
93
  },
94
  {
95
  "epoch": 2.26,
96
+ "eval_accuracy": 0.8142857142857143,
97
+ "eval_loss": 0.5106571316719055,
98
+ "eval_runtime": 41.2785,
99
+ "eval_samples_per_second": 1.696,
100
+ "eval_steps_per_second": 0.218,
101
  "step": 114
102
  },
103
  {
104
  "epoch": 3.04,
105
  "learning_rate": 1.0526315789473684e-05,
106
+ "loss": 0.3766,
107
  "step": 120
108
  },
109
  {
110
  "epoch": 3.11,
111
  "learning_rate": 6.766917293233083e-06,
112
+ "loss": 0.265,
113
  "step": 130
114
  },
115
  {
116
  "epoch": 3.18,
117
  "learning_rate": 3.007518796992481e-06,
118
+ "loss": 0.2766,
119
  "step": 140
120
  },
121
  {
122
  "epoch": 3.23,
123
  "eval_accuracy": 0.9142857142857143,
124
+ "eval_loss": 0.3579496741294861,
125
+ "eval_runtime": 49.2971,
126
+ "eval_samples_per_second": 1.42,
127
+ "eval_steps_per_second": 0.183,
128
  "step": 148
129
  },
130
  {
131
  "epoch": 3.23,
132
  "step": 148,
133
  "total_flos": 1.460491890402263e+18,
134
+ "train_loss": 1.0465768640105788,
135
+ "train_runtime": 3053.3069,
136
+ "train_samples_per_second": 0.388,
137
+ "train_steps_per_second": 0.048
138
  },
139
  {
140
  "epoch": 3.23,
141
+ "eval_accuracy": 0.8516129032258064,
142
+ "eval_loss": 0.43549060821533203,
143
+ "eval_runtime": 105.4615,
144
+ "eval_samples_per_second": 1.47,
145
+ "eval_steps_per_second": 0.19,
146
  "step": 148
147
  },
148
  {
149
  "epoch": 3.23,
150
+ "eval_accuracy": 0.8516129032258064,
151
+ "eval_loss": 0.4354906678199768,
152
+ "eval_runtime": 104.5631,
153
+ "eval_samples_per_second": 1.482,
154
+ "eval_steps_per_second": 0.191,
155
  "step": 148
156
  }
157
  ],