mp-02 committed on
Commit
d3d7e7a
1 Parent(s): 0e686e2

End of training

Browse files
all_results.json CHANGED
@@ -1,14 +1,14 @@
1
  {
2
- "epoch": 33.33,
3
- "eval_accuracy": 0.8486449242076252,
4
- "eval_f1": 0.8948016752894803,
5
- "eval_loss": 0.6415959000587463,
6
- "eval_precision": 0.8819815444390481,
7
- "eval_recall": 0.908,
8
- "eval_runtime": 2.3617,
9
  "eval_samples": 54,
10
- "eval_samples_per_second": 22.865,
11
- "eval_steps_per_second": 2.541,
12
  "predict_accuracy": 0.8218373936014088,
13
  "predict_f1": 0.9038133181559477,
14
  "predict_loss": 0.6888472437858582,
@@ -17,9 +17,9 @@
17
  "predict_runtime": 2.0596,
18
  "predict_samples_per_second": 8.74,
19
  "predict_steps_per_second": 0.971,
20
- "train_loss": 0.2944237976074219,
21
- "train_runtime": 336.0216,
22
  "train_samples": 150,
23
- "train_samples_per_second": 14.88,
24
- "train_steps_per_second": 1.488
25
  }
 
1
  {
2
+ "epoch": 10.0,
3
+ "eval_accuracy": 0.8104042259990814,
4
+ "eval_f1": 0.8313368471490178,
5
+ "eval_loss": 0.5929840803146362,
6
+ "eval_precision": 0.7980680772769089,
7
+ "eval_recall": 0.8675,
8
+ "eval_runtime": 2.4572,
9
  "eval_samples": 54,
10
+ "eval_samples_per_second": 21.976,
11
+ "eval_steps_per_second": 2.442,
12
  "predict_accuracy": 0.8218373936014088,
13
  "predict_f1": 0.9038133181559477,
14
  "predict_loss": 0.6888472437858582,
 
17
  "predict_runtime": 2.0596,
18
  "predict_samples_per_second": 8.74,
19
  "predict_steps_per_second": 0.971,
20
+ "train_loss": 0.7810765075683593,
21
+ "train_runtime": 94.7164,
22
  "train_samples": 150,
23
+ "train_samples_per_second": 15.837,
24
+ "train_steps_per_second": 1.584
25
  }
eval_results.json CHANGED
@@ -1,12 +1,12 @@
1
  {
2
- "epoch": 33.33,
3
- "eval_accuracy": 0.8486449242076252,
4
- "eval_f1": 0.8948016752894803,
5
- "eval_loss": 0.6415959000587463,
6
- "eval_precision": 0.8819815444390481,
7
- "eval_recall": 0.908,
8
- "eval_runtime": 2.3617,
9
  "eval_samples": 54,
10
- "eval_samples_per_second": 22.865,
11
- "eval_steps_per_second": 2.541
12
  }
 
1
  {
2
+ "epoch": 10.0,
3
+ "eval_accuracy": 0.8104042259990814,
4
+ "eval_f1": 0.8313368471490178,
5
+ "eval_loss": 0.5929840803146362,
6
+ "eval_precision": 0.7980680772769089,
7
+ "eval_recall": 0.8675,
8
+ "eval_runtime": 2.4572,
9
  "eval_samples": 54,
10
+ "eval_samples_per_second": 21.976,
11
+ "eval_steps_per_second": 2.442
12
  }
pytorch_model.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:581afe274c45186d257308d437c3b39177f22b873e3cad10cde8017af1ae1d98
3
  size 501420883
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:841506f6c6c0a194bcb07157467ddcf167f6909db9a6af7260982b8d5abc6e08
3
  size 501420883
runs/Aug24_18-18-57_bernini/1724516347.7137752/events.out.tfevents.1724516347.bernini.11667.1 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:58afa5d01e53942957c99fbb80b093bed7b1b20ce1a6dc0db13e7c827306a40f
3
+ size 4671
runs/Aug24_18-18-57_bernini/events.out.tfevents.1724516347.bernini.11667.0 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:10ee7afbe996f4a10db0be4b2ddbe3fb2f86ed738ee577f1b56295119c376792
3
+ size 7229
runs/Aug24_18-18-57_bernini/events.out.tfevents.1724516450.bernini.11667.2 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:7bb9cbc7fbead01c5392d25c8908895a62506270486c77d4eaca2eb7edb3cd25
3
+ size 512
train_results.json CHANGED
@@ -1,8 +1,8 @@
1
  {
2
- "epoch": 33.33,
3
- "train_loss": 0.2944237976074219,
4
- "train_runtime": 336.0216,
5
  "train_samples": 150,
6
- "train_samples_per_second": 14.88,
7
- "train_steps_per_second": 1.488
8
  }
 
1
  {
2
+ "epoch": 10.0,
3
+ "train_loss": 0.7810765075683593,
4
+ "train_runtime": 94.7164,
5
  "train_samples": 150,
6
+ "train_samples_per_second": 15.837,
7
+ "train_steps_per_second": 1.584
8
  }
trainer_state.json CHANGED
@@ -1,151 +1,97 @@
1
  {
2
- "best_metric": 0.8948016752894803,
3
- "best_model_checkpoint": "/media/HDD/mpizzol/Tirocinio/layoutlmv3-base-finetuned-funsd/checkpoint-500",
4
- "epoch": 33.333333333333336,
5
- "global_step": 500,
6
  "is_hyper_param_search": false,
7
  "is_local_process_zero": true,
8
  "is_world_process_zero": true,
9
  "log_history": [
10
  {
11
- "epoch": 3.33,
12
- "eval_accuracy": 0.7633210840606339,
13
- "eval_f1": 0.78394616678683,
14
- "eval_loss": 0.7809513211250305,
15
- "eval_precision": 0.7547431744562703,
16
- "eval_recall": 0.8155,
17
- "eval_runtime": 2.4166,
18
- "eval_samples_per_second": 22.346,
19
- "eval_steps_per_second": 2.483,
20
- "step": 50
21
- },
22
- {
23
- "epoch": 6.67,
24
- "eval_accuracy": 0.8060404225999082,
25
- "eval_f1": 0.8391708363116512,
26
- "eval_loss": 0.5576171278953552,
27
- "eval_precision": 0.8015475648611743,
28
- "eval_recall": 0.8805,
29
- "eval_runtime": 2.4186,
30
- "eval_samples_per_second": 22.327,
31
- "eval_steps_per_second": 2.481,
32
- "step": 100
33
  },
34
  {
35
- "epoch": 10.0,
36
- "eval_accuracy": 0.822347266881029,
37
- "eval_f1": 0.8655769699926811,
38
- "eval_loss": 0.5810444355010986,
39
- "eval_precision": 0.845164363982849,
40
- "eval_recall": 0.887,
41
- "eval_runtime": 2.3446,
42
- "eval_samples_per_second": 23.032,
43
- "eval_steps_per_second": 2.559,
44
- "step": 150
45
- },
46
- {
47
- "epoch": 13.33,
48
- "eval_accuracy": 0.8393431327514929,
49
- "eval_f1": 0.8725060827250608,
50
- "eval_loss": 0.5633729100227356,
51
- "eval_precision": 0.8497630331753554,
52
- "eval_recall": 0.8965,
53
- "eval_runtime": 2.3645,
54
- "eval_samples_per_second": 22.837,
55
- "eval_steps_per_second": 2.537,
56
- "step": 200
57
- },
58
- {
59
- "epoch": 16.67,
60
- "eval_accuracy": 0.8528938906752411,
61
- "eval_f1": 0.8940364711680631,
62
- "eval_loss": 0.5418661236763,
63
- "eval_precision": 0.8814382896015549,
64
- "eval_recall": 0.907,
65
- "eval_runtime": 2.3455,
66
- "eval_samples_per_second": 23.023,
67
- "eval_steps_per_second": 2.558,
68
- "step": 250
69
- },
70
- {
71
- "epoch": 20.0,
72
- "eval_accuracy": 0.8464630225080386,
73
- "eval_f1": 0.8880670611439841,
74
- "eval_loss": 0.5817353129386902,
75
- "eval_precision": 0.8759727626459144,
76
- "eval_recall": 0.9005,
77
- "eval_runtime": 2.3522,
78
- "eval_samples_per_second": 22.957,
79
- "eval_steps_per_second": 2.551,
80
- "step": 300
81
- },
82
- {
83
- "epoch": 23.33,
84
- "eval_accuracy": 0.8429030776297657,
85
- "eval_f1": 0.8911230995586071,
86
- "eval_loss": 0.6015072464942932,
87
- "eval_precision": 0.8743984600577478,
88
- "eval_recall": 0.9085,
89
- "eval_runtime": 2.3531,
90
- "eval_samples_per_second": 22.948,
91
- "eval_steps_per_second": 2.55,
92
- "step": 350
93
  },
94
  {
95
- "epoch": 26.67,
96
- "eval_accuracy": 0.8535829122645843,
97
- "eval_f1": 0.8996811380917341,
98
- "eval_loss": 0.5981678366661072,
99
- "eval_precision": 0.8830043331728454,
100
- "eval_recall": 0.917,
101
- "eval_runtime": 2.4921,
102
- "eval_samples_per_second": 21.669,
103
- "eval_steps_per_second": 2.408,
104
- "step": 400
105
  },
106
  {
107
- "epoch": 30.0,
108
- "eval_accuracy": 0.8493339457969683,
109
- "eval_f1": 0.8949185989146522,
110
- "eval_loss": 0.6316392421722412,
111
- "eval_precision": 0.8831548198636806,
112
- "eval_recall": 0.907,
113
- "eval_runtime": 2.359,
114
- "eval_samples_per_second": 22.891,
115
- "eval_steps_per_second": 2.543,
116
- "step": 450
117
  },
118
  {
119
- "epoch": 33.33,
120
- "learning_rate": 0.0,
121
- "loss": 0.2944,
122
- "step": 500
 
 
 
 
 
 
123
  },
124
  {
125
- "epoch": 33.33,
126
- "eval_accuracy": 0.8486449242076252,
127
- "eval_f1": 0.8948016752894803,
128
- "eval_loss": 0.6415959000587463,
129
- "eval_precision": 0.8819815444390481,
130
- "eval_recall": 0.908,
131
- "eval_runtime": 2.3662,
132
- "eval_samples_per_second": 22.821,
133
- "eval_steps_per_second": 2.536,
134
- "step": 500
135
  },
136
  {
137
- "epoch": 33.33,
138
- "step": 500,
139
- "total_flos": 1318026716160000.0,
140
- "train_loss": 0.2944237976074219,
141
- "train_runtime": 336.0216,
142
- "train_samples_per_second": 14.88,
143
- "train_steps_per_second": 1.488
144
  }
145
  ],
146
- "max_steps": 500,
147
- "num_train_epochs": 34,
148
- "total_flos": 1318026716160000.0,
149
  "trial_name": null,
150
  "trial_params": null
151
  }
 
1
  {
2
+ "best_metric": null,
3
+ "best_model_checkpoint": null,
4
+ "epoch": 10.0,
5
+ "global_step": 150,
6
  "is_hyper_param_search": false,
7
  "is_local_process_zero": true,
8
  "is_world_process_zero": true,
9
  "log_history": [
10
  {
11
+ "epoch": 1.67,
12
+ "eval_accuracy": 0.6559485530546624,
13
+ "eval_f1": 0.48850983179341384,
14
+ "eval_loss": 1.2209023237228394,
15
+ "eval_precision": 0.46420531292210715,
16
+ "eval_recall": 0.5155,
17
+ "eval_runtime": 2.3635,
18
+ "eval_samples_per_second": 22.848,
19
+ "eval_steps_per_second": 2.539,
20
+ "step": 25
 
 
 
 
 
 
 
 
 
 
 
 
21
  },
22
  {
23
+ "epoch": 3.33,
24
+ "eval_accuracy": 0.7619430408819476,
25
+ "eval_f1": 0.7535809662539452,
26
+ "eval_loss": 0.8171831965446472,
27
+ "eval_precision": 0.732420953279849,
28
+ "eval_recall": 0.776,
29
+ "eval_runtime": 2.3634,
30
+ "eval_samples_per_second": 22.849,
31
+ "eval_steps_per_second": 2.539,
32
+ "step": 50
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
33
  },
34
  {
35
+ "epoch": 5.0,
36
+ "eval_accuracy": 0.8125861276986679,
37
+ "eval_f1": 0.8145823273780782,
38
+ "eval_loss": 0.6125288605690002,
39
+ "eval_precision": 0.7875816993464052,
40
+ "eval_recall": 0.8435,
41
+ "eval_runtime": 2.3662,
42
+ "eval_samples_per_second": 22.821,
43
+ "eval_steps_per_second": 2.536,
44
+ "step": 75
45
  },
46
  {
47
+ "epoch": 6.67,
48
+ "eval_accuracy": 0.8107487367937529,
49
+ "eval_f1": 0.8347784200385356,
50
+ "eval_loss": 0.5983520150184631,
51
+ "eval_precision": 0.8052973977695167,
52
+ "eval_recall": 0.8665,
53
+ "eval_runtime": 2.4636,
54
+ "eval_samples_per_second": 21.92,
55
+ "eval_steps_per_second": 2.436,
56
+ "step": 100
57
  },
58
  {
59
+ "epoch": 8.33,
60
+ "eval_accuracy": 0.8216582452916859,
61
+ "eval_f1": 0.8363723608445298,
62
+ "eval_loss": 0.5673876404762268,
63
+ "eval_precision": 0.8039667896678967,
64
+ "eval_recall": 0.8715,
65
+ "eval_runtime": 2.3684,
66
+ "eval_samples_per_second": 22.8,
67
+ "eval_steps_per_second": 2.533,
68
+ "step": 125
69
  },
70
  {
71
+ "epoch": 10.0,
72
+ "eval_accuracy": 0.8104042259990814,
73
+ "eval_f1": 0.8313368471490178,
74
+ "eval_loss": 0.5929840803146362,
75
+ "eval_precision": 0.7980680772769089,
76
+ "eval_recall": 0.8675,
77
+ "eval_runtime": 2.4505,
78
+ "eval_samples_per_second": 22.036,
79
+ "eval_steps_per_second": 2.448,
80
+ "step": 150
81
  },
82
  {
83
+ "epoch": 10.0,
84
+ "step": 150,
85
+ "total_flos": 395408014848000.0,
86
+ "train_loss": 0.7810765075683593,
87
+ "train_runtime": 94.7164,
88
+ "train_samples_per_second": 15.837,
89
+ "train_steps_per_second": 1.584
90
  }
91
  ],
92
+ "max_steps": 150,
93
+ "num_train_epochs": 10,
94
+ "total_flos": 395408014848000.0,
95
  "trial_name": null,
96
  "trial_params": null
97
  }
training_args.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:adc75eed38996e422651fb9e6e4b3f368310b1c9ad2de49c697d8cc53283e4b5
3
  size 2927
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:67e671d048c6381947443975ece3fe1b7ffa48552b826dcbe8f9155c1dca716d
3
  size 2927