HorcruxNo13 committed on
Commit
a6553e0
1 Parent(s): 5215552

Training in progress, epoch 1

Browse files
all_results.json CHANGED
@@ -1,8 +1,8 @@
1
  {
2
  "epoch": 7.0,
3
  "total_flos": 1.73991922900992e+17,
4
- "train_loss": 0.5463650396892002,
5
- "train_runtime": 159.2288,
6
- "train_samples_per_second": 43.962,
7
- "train_steps_per_second": 0.352
8
  }
 
1
  {
2
  "epoch": 7.0,
3
  "total_flos": 1.73991922900992e+17,
4
+ "train_loss": 0.5857737362384796,
5
+ "train_runtime": 257.742,
6
+ "train_samples_per_second": 27.159,
7
+ "train_steps_per_second": 0.217
8
  }
pytorch_model.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:3767eccbee6326874ee4ee31faf86b112c49f69226fb388dad681c5c9a0ad176
3
  size 110394865
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:12b05e450262fc68a5119dd5a3fb702fe0f750f289d47e5fd3597756068b0481
3
  size 110394865
train_results.json CHANGED
@@ -1,8 +1,8 @@
1
  {
2
  "epoch": 7.0,
3
  "total_flos": 1.73991922900992e+17,
4
- "train_loss": 0.5463650396892002,
5
- "train_runtime": 159.2288,
6
- "train_samples_per_second": 43.962,
7
- "train_steps_per_second": 0.352
8
  }
 
1
  {
2
  "epoch": 7.0,
3
  "total_flos": 1.73991922900992e+17,
4
+ "train_loss": 0.5857737362384796,
5
+ "train_runtime": 257.742,
6
+ "train_samples_per_second": 27.159,
7
+ "train_steps_per_second": 0.217
8
  }
trainer_state.json CHANGED
@@ -1,5 +1,5 @@
1
  {
2
- "best_metric": 0.7583333333333333,
3
  "best_model_checkpoint": "swin-tiny-patch4-window7-224/checkpoint-48",
4
  "epoch": 7.0,
5
  "eval_steps": 500,
@@ -11,112 +11,136 @@
11
  {
12
  "epoch": 1.0,
13
  "eval_accuracy": 0.7333333333333333,
14
- "eval_loss": 0.58155757188797,
15
- "eval_runtime": 1.8232,
16
- "eval_samples_per_second": 131.637,
17
- "eval_steps_per_second": 4.388,
 
 
 
18
  "step": 8
19
  },
20
  {
21
  "epoch": 1.25,
22
  "learning_rate": 4.600000000000001e-05,
23
- "loss": 0.6478,
24
  "step": 10
25
  },
26
  {
27
  "epoch": 2.0,
28
  "eval_accuracy": 0.7333333333333333,
29
- "eval_loss": 0.5633648037910461,
30
- "eval_runtime": 1.8405,
31
- "eval_samples_per_second": 130.396,
32
- "eval_steps_per_second": 4.347,
 
 
 
33
  "step": 16
34
  },
35
  {
36
  "epoch": 2.5,
37
  "learning_rate": 3.6e-05,
38
- "loss": 0.5746,
39
  "step": 20
40
  },
41
  {
42
  "epoch": 3.0,
43
- "eval_accuracy": 0.7375,
44
- "eval_loss": 0.5526280999183655,
45
- "eval_runtime": 1.8724,
46
- "eval_samples_per_second": 128.178,
47
- "eval_steps_per_second": 4.273,
 
 
 
48
  "step": 24
49
  },
50
  {
51
  "epoch": 3.75,
52
  "learning_rate": 2.6000000000000002e-05,
53
- "loss": 0.5414,
54
  "step": 30
55
  },
56
  {
57
  "epoch": 4.0,
58
  "eval_accuracy": 0.7333333333333333,
59
- "eval_loss": 0.6044233441352844,
60
- "eval_runtime": 3.3038,
61
- "eval_samples_per_second": 72.644,
62
- "eval_steps_per_second": 2.421,
 
 
 
63
  "step": 32
64
  },
65
  {
66
  "epoch": 5.0,
67
  "learning_rate": 1.6000000000000003e-05,
68
- "loss": 0.5159,
69
  "step": 40
70
  },
71
  {
72
  "epoch": 5.0,
73
- "eval_accuracy": 0.7541666666666667,
74
- "eval_loss": 0.5310245156288147,
75
- "eval_runtime": 2.8227,
76
- "eval_samples_per_second": 85.024,
77
- "eval_steps_per_second": 2.834,
 
 
 
78
  "step": 40
79
  },
80
  {
81
  "epoch": 6.0,
82
- "eval_accuracy": 0.7583333333333333,
83
- "eval_loss": 0.5481430888175964,
84
- "eval_runtime": 3.9583,
85
- "eval_samples_per_second": 60.632,
86
- "eval_steps_per_second": 2.021,
 
 
 
87
  "step": 48
88
  },
89
  {
90
  "epoch": 6.25,
91
  "learning_rate": 6e-06,
92
- "loss": 0.4901,
93
  "step": 50
94
  },
95
  {
96
  "epoch": 7.0,
97
- "eval_accuracy": 0.7583333333333333,
98
- "eval_loss": 0.5410298109054565,
99
- "eval_runtime": 2.4531,
100
- "eval_samples_per_second": 97.834,
101
- "eval_steps_per_second": 3.261,
 
 
 
102
  "step": 56
103
  },
104
  {
105
  "epoch": 7.0,
106
  "step": 56,
107
  "total_flos": 1.73991922900992e+17,
108
- "train_loss": 0.5463650396892002,
109
- "train_runtime": 159.2288,
110
- "train_samples_per_second": 43.962,
111
- "train_steps_per_second": 0.352
112
  },
113
  {
114
  "epoch": 7.0,
115
  "eval_accuracy": 0.7366666666666667,
116
- "eval_loss": 0.5300371050834656,
117
- "eval_runtime": 4.2651,
118
- "eval_samples_per_second": 70.339,
119
- "eval_steps_per_second": 2.345,
 
 
 
120
  "step": 56
121
  }
122
  ],
 
1
  {
2
+ "best_metric": 0.7416666666666667,
3
  "best_model_checkpoint": "swin-tiny-patch4-window7-224/checkpoint-48",
4
  "epoch": 7.0,
5
  "eval_steps": 500,
 
11
  {
12
  "epoch": 1.0,
13
  "eval_accuracy": 0.7333333333333333,
14
+ "eval_f1_score": 0.6205128205128204,
15
+ "eval_loss": 0.5834997296333313,
16
+ "eval_precision": 0.5377777777777778,
17
+ "eval_recall": 0.7333333333333333,
18
+ "eval_runtime": 33.1193,
19
+ "eval_samples_per_second": 7.247,
20
+ "eval_steps_per_second": 0.242,
21
  "step": 8
22
  },
23
  {
24
  "epoch": 1.25,
25
  "learning_rate": 4.600000000000001e-05,
26
+ "loss": 0.6395,
27
  "step": 10
28
  },
29
  {
30
  "epoch": 2.0,
31
  "eval_accuracy": 0.7333333333333333,
32
+ "eval_f1_score": 0.6205128205128204,
33
+ "eval_loss": 0.5735692381858826,
34
+ "eval_precision": 0.5377777777777778,
35
+ "eval_recall": 0.7333333333333333,
36
+ "eval_runtime": 2.0727,
37
+ "eval_samples_per_second": 115.793,
38
+ "eval_steps_per_second": 3.86,
39
  "step": 16
40
  },
41
  {
42
  "epoch": 2.5,
43
  "learning_rate": 3.6e-05,
44
+ "loss": 0.5789,
45
  "step": 20
46
  },
47
  {
48
  "epoch": 3.0,
49
+ "eval_accuracy": 0.7333333333333333,
50
+ "eval_f1_score": 0.6205128205128204,
51
+ "eval_loss": 0.5942796468734741,
52
+ "eval_precision": 0.5377777777777778,
53
+ "eval_recall": 0.7333333333333333,
54
+ "eval_runtime": 2.0683,
55
+ "eval_samples_per_second": 116.035,
56
+ "eval_steps_per_second": 3.868,
57
  "step": 24
58
  },
59
  {
60
  "epoch": 3.75,
61
  "learning_rate": 2.6000000000000002e-05,
62
+ "loss": 0.5887,
63
  "step": 30
64
  },
65
  {
66
  "epoch": 4.0,
67
  "eval_accuracy": 0.7333333333333333,
68
+ "eval_f1_score": 0.6205128205128204,
69
+ "eval_loss": 0.5613328218460083,
70
+ "eval_precision": 0.5377777777777778,
71
+ "eval_recall": 0.7333333333333333,
72
+ "eval_runtime": 2.0585,
73
+ "eval_samples_per_second": 116.592,
74
+ "eval_steps_per_second": 3.886,
75
  "step": 32
76
  },
77
  {
78
  "epoch": 5.0,
79
  "learning_rate": 1.6000000000000003e-05,
80
+ "loss": 0.5791,
81
  "step": 40
82
  },
83
  {
84
  "epoch": 5.0,
85
+ "eval_accuracy": 0.7333333333333333,
86
+ "eval_f1_score": 0.6205128205128204,
87
+ "eval_loss": 0.5557453036308289,
88
+ "eval_precision": 0.5377777777777778,
89
+ "eval_recall": 0.7333333333333333,
90
+ "eval_runtime": 2.0897,
91
+ "eval_samples_per_second": 114.847,
92
+ "eval_steps_per_second": 3.828,
93
  "step": 40
94
  },
95
  {
96
  "epoch": 6.0,
97
+ "eval_accuracy": 0.7416666666666667,
98
+ "eval_f1_score": 0.6396720831503441,
99
+ "eval_loss": 0.5535091161727905,
100
+ "eval_precision": 0.8089635854341737,
101
+ "eval_recall": 0.7416666666666667,
102
+ "eval_runtime": 1.9813,
103
+ "eval_samples_per_second": 121.134,
104
+ "eval_steps_per_second": 4.038,
105
  "step": 48
106
  },
107
  {
108
  "epoch": 6.25,
109
  "learning_rate": 6e-06,
110
+ "loss": 0.5717,
111
  "step": 50
112
  },
113
  {
114
  "epoch": 7.0,
115
+ "eval_accuracy": 0.7333333333333333,
116
+ "eval_f1_score": 0.6205128205128204,
117
+ "eval_loss": 0.5456091165542603,
118
+ "eval_precision": 0.5377777777777778,
119
+ "eval_recall": 0.7333333333333333,
120
+ "eval_runtime": 2.0655,
121
+ "eval_samples_per_second": 116.197,
122
+ "eval_steps_per_second": 3.873,
123
  "step": 56
124
  },
125
  {
126
  "epoch": 7.0,
127
  "step": 56,
128
  "total_flos": 1.73991922900992e+17,
129
+ "train_loss": 0.5857737362384796,
130
+ "train_runtime": 257.742,
131
+ "train_samples_per_second": 27.159,
132
+ "train_steps_per_second": 0.217
133
  },
134
  {
135
  "epoch": 7.0,
136
  "eval_accuracy": 0.7366666666666667,
137
+ "eval_f1_score": 0.6314646594113398,
138
+ "eval_loss": 0.5486770868301392,
139
+ "eval_precision": 0.8064765100671142,
140
+ "eval_recall": 0.7366666666666667,
141
+ "eval_runtime": 109.0657,
142
+ "eval_samples_per_second": 2.751,
143
+ "eval_steps_per_second": 0.092,
144
  "step": 56
145
  }
146
  ],
training_args.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:5aff4bdc67ae077b0bf7d175151eed746c480633a9d9571a02c41d85a9abb5f2
3
  size 4091
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:fb7e8116dbe569fb96ff854b905cb0bc3ae5795528e7afede2c8328a68bddc7d
3
  size 4091