dima806 commited on
Commit
18e2042
1 Parent(s): 8768da0

Upload folder using huggingface_hub

Browse files
checkpoint-7623/model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:cce8ab6dbce6287960ea5fdf6432aa92c141bb2348dd8f398cd88288f69143a4
3
  size 343365480
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:b6dc632b36bf1d57de1137187ecb65d61f8d0e7e44da4ff1872166954cf1b27e
3
  size 343365480
checkpoint-7623/optimizer.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:0d2d6db04e237478c0203eb0fc447ab351526e0c29985b727d7453dab5a5cad2
3
  size 686851461
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:937e06b36df80b42a99a4fca22ca99b899519df98d0040ceffc85f07a3aefc3e
3
  size 686851461
checkpoint-7623/trainer_state.json CHANGED
@@ -1,5 +1,5 @@
1
  {
2
- "best_metric": 1.488718032836914,
3
  "best_model_checkpoint": "cat_breed_image_detection/checkpoint-7623",
4
  "epoch": 3.0,
5
  "eval_steps": 500,
@@ -10,137 +10,137 @@
10
  "log_history": [
11
  {
12
  "epoch": 0.19677292404565133,
13
- "grad_norm": 8.220705032348633,
14
  "learning_rate": 8.465205334741845e-07,
15
- "loss": 1.4752,
16
  "step": 500
17
  },
18
  {
19
  "epoch": 0.39354584809130266,
20
- "grad_norm": 7.696910858154297,
21
  "learning_rate": 7.870989040010564e-07,
22
- "loss": 1.4833,
23
  "step": 1000
24
  },
25
  {
26
  "epoch": 0.5903187721369539,
27
- "grad_norm": 7.823228359222412,
28
  "learning_rate": 7.276772745279281e-07,
29
- "loss": 1.4728,
30
  "step": 1500
31
  },
32
  {
33
  "epoch": 0.7870916961826053,
34
- "grad_norm": 6.080297946929932,
35
  "learning_rate": 6.682556450547999e-07,
36
- "loss": 1.4901,
37
  "step": 2000
38
  },
39
  {
40
  "epoch": 0.9838646202282566,
41
- "grad_norm": 7.583363056182861,
42
  "learning_rate": 6.088340155816718e-07,
43
- "loss": 1.4755,
44
  "step": 2500
45
  },
46
  {
47
  "epoch": 1.0,
48
- "eval_accuracy": 0.6088537053439622,
49
- "eval_loss": 1.5104930400848389,
50
- "eval_model_preparation_time": 0.0053,
51
- "eval_runtime": 1216.8858,
52
- "eval_samples_per_second": 89.067,
53
- "eval_steps_per_second": 2.783,
54
  "step": 2541
55
  },
56
  {
57
  "epoch": 1.1806375442739079,
58
- "grad_norm": 9.293631553649902,
59
  "learning_rate": 5.494123861085435e-07,
60
- "loss": 1.4665,
61
  "step": 3000
62
  },
63
  {
64
  "epoch": 1.3774104683195592,
65
- "grad_norm": 8.063645362854004,
66
  "learning_rate": 4.899907566354153e-07,
67
- "loss": 1.4613,
68
  "step": 3500
69
  },
70
  {
71
  "epoch": 1.5741833923652107,
72
- "grad_norm": 6.942551612854004,
73
  "learning_rate": 4.3056912716228705e-07,
74
- "loss": 1.4569,
75
  "step": 4000
76
  },
77
  {
78
  "epoch": 1.770956316410862,
79
- "grad_norm": 11.436430931091309,
80
  "learning_rate": 3.7114749768915883e-07,
81
- "loss": 1.4412,
82
  "step": 4500
83
  },
84
  {
85
  "epoch": 1.9677292404565132,
86
- "grad_norm": 6.971865177154541,
87
  "learning_rate": 3.117258682160306e-07,
88
- "loss": 1.4428,
89
  "step": 5000
90
  },
91
  {
92
  "epoch": 2.0,
93
- "eval_accuracy": 0.6121660023619723,
94
- "eval_loss": 1.4942480325698853,
95
- "eval_model_preparation_time": 0.0053,
96
- "eval_runtime": 1210.5473,
97
- "eval_samples_per_second": 89.533,
98
- "eval_steps_per_second": 2.798,
99
  "step": 5082
100
  },
101
  {
102
  "epoch": 2.1645021645021645,
103
- "grad_norm": 7.25930643081665,
104
  "learning_rate": 2.523042387429024e-07,
105
- "loss": 1.4412,
106
  "step": 5500
107
  },
108
  {
109
  "epoch": 2.3612750885478158,
110
- "grad_norm": 8.07095718383789,
111
  "learning_rate": 1.928826092697742e-07,
112
- "loss": 1.4362,
113
  "step": 6000
114
  },
115
  {
116
  "epoch": 2.558048012593467,
117
- "grad_norm": 8.908621788024902,
118
  "learning_rate": 1.3346097979664598e-07,
119
- "loss": 1.4375,
120
  "step": 6500
121
  },
122
  {
123
  "epoch": 2.7548209366391183,
124
- "grad_norm": 8.16598129272461,
125
  "learning_rate": 7.403935032351777e-08,
126
- "loss": 1.4397,
127
  "step": 7000
128
  },
129
  {
130
  "epoch": 2.9515938606847696,
131
- "grad_norm": 9.264542579650879,
132
  "learning_rate": 1.4617720850389543e-08,
133
- "loss": 1.437,
134
  "step": 7500
135
  },
136
  {
137
  "epoch": 3.0,
138
- "eval_accuracy": 0.6130332890463537,
139
- "eval_loss": 1.488718032836914,
140
- "eval_model_preparation_time": 0.0053,
141
- "eval_runtime": 1205.355,
142
- "eval_samples_per_second": 89.919,
143
- "eval_steps_per_second": 2.81,
144
  "step": 7623
145
  }
146
  ],
 
1
  {
2
+ "best_metric": 1.4409993886947632,
3
  "best_model_checkpoint": "cat_breed_image_detection/checkpoint-7623",
4
  "epoch": 3.0,
5
  "eval_steps": 500,
 
10
  "log_history": [
11
  {
12
  "epoch": 0.19677292404565133,
13
+ "grad_norm": 8.759430885314941,
14
  "learning_rate": 8.465205334741845e-07,
15
+ "loss": 1.4398,
16
  "step": 500
17
  },
18
  {
19
  "epoch": 0.39354584809130266,
20
+ "grad_norm": 8.932340621948242,
21
  "learning_rate": 7.870989040010564e-07,
22
+ "loss": 1.4352,
23
  "step": 1000
24
  },
25
  {
26
  "epoch": 0.5903187721369539,
27
+ "grad_norm": 9.20963191986084,
28
  "learning_rate": 7.276772745279281e-07,
29
+ "loss": 1.4189,
30
  "step": 1500
31
  },
32
  {
33
  "epoch": 0.7870916961826053,
34
+ "grad_norm": 8.43055534362793,
35
  "learning_rate": 6.682556450547999e-07,
36
+ "loss": 1.4281,
37
  "step": 2000
38
  },
39
  {
40
  "epoch": 0.9838646202282566,
41
+ "grad_norm": 7.581571578979492,
42
  "learning_rate": 6.088340155816718e-07,
43
+ "loss": 1.4212,
44
  "step": 2500
45
  },
46
  {
47
  "epoch": 1.0,
48
+ "eval_accuracy": 0.6224073664009447,
49
+ "eval_loss": 1.4633311033248901,
50
+ "eval_model_preparation_time": 0.0052,
51
+ "eval_runtime": 1196.6375,
52
+ "eval_samples_per_second": 90.574,
53
+ "eval_steps_per_second": 2.83,
54
  "step": 2541
55
  },
56
  {
57
  "epoch": 1.1806375442739079,
58
+ "grad_norm": 8.631559371948242,
59
  "learning_rate": 5.494123861085435e-07,
60
+ "loss": 1.416,
61
  "step": 3000
62
  },
63
  {
64
  "epoch": 1.3774104683195592,
65
+ "grad_norm": 7.313708305358887,
66
  "learning_rate": 4.899907566354153e-07,
67
+ "loss": 1.3983,
68
  "step": 3500
69
  },
70
  {
71
  "epoch": 1.5741833923652107,
72
+ "grad_norm": 8.412739753723145,
73
  "learning_rate": 4.3056912716228705e-07,
74
+ "loss": 1.4022,
75
  "step": 4000
76
  },
77
  {
78
  "epoch": 1.770956316410862,
79
+ "grad_norm": 8.88099479675293,
80
  "learning_rate": 3.7114749768915883e-07,
81
+ "loss": 1.4047,
82
  "step": 4500
83
  },
84
  {
85
  "epoch": 1.9677292404565132,
86
+ "grad_norm": 6.803462505340576,
87
  "learning_rate": 3.117258682160306e-07,
88
+ "loss": 1.3919,
89
  "step": 5000
90
  },
91
  {
92
  "epoch": 2.0,
93
+ "eval_accuracy": 0.6274911426040743,
94
+ "eval_loss": 1.4468485116958618,
95
+ "eval_model_preparation_time": 0.0052,
96
+ "eval_runtime": 1503.5311,
97
+ "eval_samples_per_second": 72.086,
98
+ "eval_steps_per_second": 2.253,
99
  "step": 5082
100
  },
101
  {
102
  "epoch": 2.1645021645021645,
103
+ "grad_norm": 8.684732437133789,
104
  "learning_rate": 2.523042387429024e-07,
105
+ "loss": 1.4015,
106
  "step": 5500
107
  },
108
  {
109
  "epoch": 2.3612750885478158,
110
+ "grad_norm": 9.197487831115723,
111
  "learning_rate": 1.928826092697742e-07,
112
+ "loss": 1.3821,
113
  "step": 6000
114
  },
115
  {
116
  "epoch": 2.558048012593467,
117
+ "grad_norm": 8.341646194458008,
118
  "learning_rate": 1.3346097979664598e-07,
119
+ "loss": 1.3932,
120
  "step": 6500
121
  },
122
  {
123
  "epoch": 2.7548209366391183,
124
+ "grad_norm": 11.383636474609375,
125
  "learning_rate": 7.403935032351777e-08,
126
+ "loss": 1.3943,
127
  "step": 7000
128
  },
129
  {
130
  "epoch": 2.9515938606847696,
131
+ "grad_norm": 7.704733371734619,
132
  "learning_rate": 1.4617720850389543e-08,
133
+ "loss": 1.387,
134
  "step": 7500
135
  },
136
  {
137
  "epoch": 3.0,
138
+ "eval_accuracy": 0.6277218039563035,
139
+ "eval_loss": 1.4409993886947632,
140
+ "eval_model_preparation_time": 0.0052,
141
+ "eval_runtime": 1211.7556,
142
+ "eval_samples_per_second": 89.444,
143
+ "eval_steps_per_second": 2.795,
144
  "step": 7623
145
  }
146
  ],
model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:cce8ab6dbce6287960ea5fdf6432aa92c141bb2348dd8f398cd88288f69143a4
3
  size 343365480
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:b6dc632b36bf1d57de1137187ecb65d61f8d0e7e44da4ff1872166954cf1b27e
3
  size 343365480