Leeyuyu committed on
Commit
f4d8397
1 Parent(s): 705604a

Training in progress, epoch 1

Browse files
all_results.json CHANGED
@@ -1,8 +1,13 @@
1
  {
2
  "epoch": 8.0,
 
 
 
 
 
3
  "total_flos": 7.078985663171789e+16,
4
- "train_loss": 0.5772393196821213,
5
- "train_runtime": 61.0545,
6
- "train_samples_per_second": 46.647,
7
- "train_steps_per_second": 0.393
8
  }
 
1
  {
2
  "epoch": 8.0,
3
+ "eval_loss": 0.446413516998291,
4
+ "eval_roc_auc": 0.7681704260651628,
5
+ "eval_runtime": 0.4149,
6
+ "eval_samples_per_second": 96.41,
7
+ "eval_steps_per_second": 4.821,
8
  "total_flos": 7.078985663171789e+16,
9
+ "train_loss": 0.4116581827402115,
10
+ "train_runtime": 69.7528,
11
+ "train_samples_per_second": 40.83,
12
+ "train_steps_per_second": 0.344
13
  }
eval_results.json ADDED
@@ -0,0 +1,8 @@
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "epoch": 8.0,
3
+ "eval_loss": 0.446413516998291,
4
+ "eval_roc_auc": 0.7681704260651628,
5
+ "eval_runtime": 0.4149,
6
+ "eval_samples_per_second": 96.41,
7
+ "eval_steps_per_second": 4.821
8
+ }
pytorch_model.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:cacf0d6edf3dc7b8e2f8686a95e060e12d60468ed93f4ee6899c2c548e5baa96
3
  size 110394865
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:3c1106773d6025eb34315bde144095028f612768318d1f1761ab93a0a934f1ec
3
  size 110394865
train_results.json CHANGED
@@ -1,8 +1,8 @@
1
  {
2
  "epoch": 8.0,
3
  "total_flos": 7.078985663171789e+16,
4
- "train_loss": 0.5772393196821213,
5
- "train_runtime": 61.0545,
6
- "train_samples_per_second": 46.647,
7
- "train_steps_per_second": 0.393
8
  }
 
1
  {
2
  "epoch": 8.0,
3
  "total_flos": 7.078985663171789e+16,
4
+ "train_loss": 0.4116581827402115,
5
+ "train_runtime": 69.7528,
6
+ "train_samples_per_second": 40.83,
7
+ "train_steps_per_second": 0.344
8
  }
trainer_state.json CHANGED
@@ -1,6 +1,6 @@
1
  {
2
- "best_metric": 0.7631578947368421,
3
- "best_model_checkpoint": "swin-tiny-patch4-window7-224-finetunedo/checkpoint-24",
4
  "epoch": 8.0,
5
  "eval_steps": 500,
6
  "global_step": 24,
@@ -10,96 +10,96 @@
10
  "log_history": [
11
  {
12
  "epoch": 1.0,
13
- "eval_loss": 0.7092229723930359,
14
- "eval_roc_auc": 0.581453634085213,
15
- "eval_runtime": 0.3335,
16
- "eval_samples_per_second": 119.954,
17
- "eval_steps_per_second": 5.998,
18
  "step": 3
19
  },
20
  {
21
  "epoch": 2.0,
22
- "eval_loss": 0.6675325632095337,
23
- "eval_roc_auc": 0.5526315789473684,
24
- "eval_runtime": 0.2781,
25
- "eval_samples_per_second": 143.82,
26
- "eval_steps_per_second": 7.191,
27
  "step": 6
28
  },
29
  {
30
  "epoch": 3.0,
31
- "eval_loss": 0.6448550224304199,
32
- "eval_roc_auc": 0.5789473684210527,
33
- "eval_runtime": 0.3227,
34
- "eval_samples_per_second": 123.942,
35
- "eval_steps_per_second": 6.197,
36
  "step": 9
37
  },
38
  {
39
  "epoch": 3.33,
40
- "learning_rate": 2.6666666666666667e-05,
41
- "loss": 0.6541,
42
  "step": 10
43
  },
44
  {
45
  "epoch": 4.0,
46
- "eval_loss": 0.6078753471374512,
47
- "eval_roc_auc": 0.7105263157894737,
48
- "eval_runtime": 0.2706,
49
- "eval_samples_per_second": 147.82,
50
- "eval_steps_per_second": 7.391,
51
  "step": 12
52
  },
53
  {
54
  "epoch": 5.0,
55
- "eval_loss": 0.5968624353408813,
56
- "eval_roc_auc": 0.7105263157894737,
57
- "eval_runtime": 0.3291,
58
- "eval_samples_per_second": 121.557,
59
- "eval_steps_per_second": 6.078,
60
  "step": 15
61
  },
62
  {
63
  "epoch": 6.0,
64
- "eval_loss": 0.564300537109375,
65
- "eval_roc_auc": 0.7105263157894737,
66
- "eval_runtime": 0.2928,
67
- "eval_samples_per_second": 136.627,
68
- "eval_steps_per_second": 6.831,
69
  "step": 18
70
  },
71
  {
72
  "epoch": 6.67,
73
- "learning_rate": 7.61904761904762e-06,
74
- "loss": 0.5334,
75
  "step": 20
76
  },
77
  {
78
  "epoch": 7.0,
79
- "eval_loss": 0.5328788161277771,
80
- "eval_roc_auc": 0.7105263157894737,
81
- "eval_runtime": 0.2769,
82
- "eval_samples_per_second": 144.431,
83
- "eval_steps_per_second": 7.222,
84
  "step": 21
85
  },
86
  {
87
  "epoch": 8.0,
88
- "eval_loss": 0.5234358906745911,
89
- "eval_roc_auc": 0.7631578947368421,
90
- "eval_runtime": 0.2763,
91
- "eval_samples_per_second": 144.791,
92
- "eval_steps_per_second": 7.24,
93
  "step": 24
94
  },
95
  {
96
  "epoch": 8.0,
97
  "step": 24,
98
  "total_flos": 7.078985663171789e+16,
99
- "train_loss": 0.5772393196821213,
100
- "train_runtime": 61.0545,
101
- "train_samples_per_second": 46.647,
102
- "train_steps_per_second": 0.393
103
  }
104
  ],
105
  "logging_steps": 10,
 
1
  {
2
+ "best_metric": 0.7681704260651628,
3
+ "best_model_checkpoint": "swin-tiny-patch4-window7-224-finetunedo/checkpoint-12",
4
  "epoch": 8.0,
5
  "eval_steps": 500,
6
  "global_step": 24,
 
10
  "log_history": [
11
  {
12
  "epoch": 1.0,
13
+ "eval_loss": 0.5081062316894531,
14
+ "eval_roc_auc": 0.736842105263158,
15
+ "eval_runtime": 0.5379,
16
+ "eval_samples_per_second": 74.363,
17
+ "eval_steps_per_second": 3.718,
18
  "step": 3
19
  },
20
  {
21
  "epoch": 2.0,
22
+ "eval_loss": 0.43417197465896606,
23
+ "eval_roc_auc": 0.7631578947368421,
24
+ "eval_runtime": 0.5781,
25
+ "eval_samples_per_second": 69.192,
26
+ "eval_steps_per_second": 3.46,
27
  "step": 6
28
  },
29
  {
30
  "epoch": 3.0,
31
+ "eval_loss": 0.43640345335006714,
32
+ "eval_roc_auc": 0.7493734335839599,
33
+ "eval_runtime": 0.3468,
34
+ "eval_samples_per_second": 115.327,
35
+ "eval_steps_per_second": 5.766,
36
  "step": 9
37
  },
38
  {
39
  "epoch": 3.33,
40
+ "learning_rate": 3.3333333333333335e-05,
41
+ "loss": 0.4067,
42
  "step": 10
43
  },
44
  {
45
  "epoch": 4.0,
46
+ "eval_loss": 0.446413516998291,
47
+ "eval_roc_auc": 0.7681704260651628,
48
+ "eval_runtime": 0.2866,
49
+ "eval_samples_per_second": 139.576,
50
+ "eval_steps_per_second": 6.979,
51
  "step": 12
52
  },
53
  {
54
  "epoch": 5.0,
55
+ "eval_loss": 0.46299201250076294,
56
+ "eval_roc_auc": 0.7656641604010025,
57
+ "eval_runtime": 0.2863,
58
+ "eval_samples_per_second": 139.701,
59
+ "eval_steps_per_second": 6.985,
60
  "step": 15
61
  },
62
  {
63
  "epoch": 6.0,
64
+ "eval_loss": 0.45169758796691895,
65
+ "eval_roc_auc": 0.744360902255639,
66
+ "eval_runtime": 0.3942,
67
+ "eval_samples_per_second": 101.474,
68
+ "eval_steps_per_second": 5.074,
69
  "step": 18
70
  },
71
  {
72
  "epoch": 6.67,
73
+ "learning_rate": 9.523809523809523e-06,
74
+ "loss": 0.4211,
75
  "step": 20
76
  },
77
  {
78
  "epoch": 7.0,
79
+ "eval_loss": 0.4539761543273926,
80
+ "eval_roc_auc": 0.7180451127819549,
81
+ "eval_runtime": 0.2978,
82
+ "eval_samples_per_second": 134.324,
83
+ "eval_steps_per_second": 6.716,
84
  "step": 21
85
  },
86
  {
87
  "epoch": 8.0,
88
+ "eval_loss": 0.45407772064208984,
89
+ "eval_roc_auc": 0.7180451127819549,
90
+ "eval_runtime": 0.2973,
91
+ "eval_samples_per_second": 134.55,
92
+ "eval_steps_per_second": 6.728,
93
  "step": 24
94
  },
95
  {
96
  "epoch": 8.0,
97
  "step": 24,
98
  "total_flos": 7.078985663171789e+16,
99
+ "train_loss": 0.4116581827402115,
100
+ "train_runtime": 69.7528,
101
+ "train_samples_per_second": 40.83,
102
+ "train_steps_per_second": 0.344
103
  }
104
  ],
105
  "logging_steps": 10,
training_args.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:2ba6304179519bcbae92d5008c20f1e1ef48f8904f31d69f6a4e4cadb6285358
3
  size 4091
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:1279cbb2da12d0b87c1cb3f82e87a85c6eda9e64d36cfe842b264fd4214434f9
3
  size 4091