rijusougata13 committed on
Commit
94aa354
1 Parent(s): dcdfb48

Training in progress, epoch 6

Browse files
all_results.json CHANGED
@@ -1,13 +1,13 @@
1
  {
2
- "epoch": 3.0,
3
- "eval_accuracy": 0.7880986937590712,
4
- "eval_loss": 0.5690365433692932,
5
- "eval_runtime": 34.5814,
6
- "eval_samples_per_second": 39.848,
7
- "eval_steps_per_second": 1.272,
8
- "total_flos": 9.244220036417372e+17,
9
- "train_loss": 0.4883061381140116,
10
- "train_runtime": 824.2717,
11
- "train_samples_per_second": 45.116,
12
- "train_steps_per_second": 0.353
13
  }
 
1
  {
2
+ "epoch": 5.0,
3
+ "eval_accuracy": 0.8084179970972424,
4
+ "eval_loss": 0.5213053226470947,
5
+ "eval_runtime": 34.1734,
6
+ "eval_samples_per_second": 40.324,
7
+ "eval_steps_per_second": 1.288,
8
+ "total_flos": 1.5407033394028954e+18,
9
+ "train_loss": 0.25417212948356704,
10
+ "train_runtime": 754.4258,
11
+ "train_samples_per_second": 82.155,
12
+ "train_steps_per_second": 0.643
13
  }
eval_results.json CHANGED
@@ -1,8 +1,8 @@
1
  {
2
- "epoch": 3.0,
3
- "eval_accuracy": 0.7880986937590712,
4
- "eval_loss": 0.5690365433692932,
5
- "eval_runtime": 34.5814,
6
- "eval_samples_per_second": 39.848,
7
- "eval_steps_per_second": 1.272
8
  }
 
1
  {
2
+ "epoch": 5.0,
3
+ "eval_accuracy": 0.8084179970972424,
4
+ "eval_loss": 0.5213053226470947,
5
+ "eval_runtime": 34.1734,
6
+ "eval_samples_per_second": 40.324,
7
+ "eval_steps_per_second": 1.288
8
  }
model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:904ab153a33d8ef1bfe0e4766d15493636392f11a420eec77d91ab1e1343fa78
3
  size 110352060
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:319ff3acee313dc8a0ac65b91528f4931298f23767e217e3f39b64886437b1bb
3
  size 110352060
train_results.json CHANGED
@@ -1,8 +1,8 @@
1
  {
2
- "epoch": 3.0,
3
- "total_flos": 9.244220036417372e+17,
4
- "train_loss": 0.4883061381140116,
5
- "train_runtime": 824.2717,
6
- "train_samples_per_second": 45.116,
7
- "train_steps_per_second": 0.353
8
  }
 
1
  {
2
+ "epoch": 5.0,
3
+ "total_flos": 1.5407033394028954e+18,
4
+ "train_loss": 0.25417212948356704,
5
+ "train_runtime": 754.4258,
6
+ "train_samples_per_second": 82.155,
7
+ "train_steps_per_second": 0.643
8
  }
trainer_state.json CHANGED
@@ -1,9 +1,9 @@
1
  {
2
- "best_metric": 0.7880986937590712,
3
- "best_model_checkpoint": "swin-tiny-patch4-window7-224-finetuned-eurosat/checkpoint-291",
4
- "epoch": 3.0,
5
  "eval_steps": 500,
6
- "global_step": 291,
7
  "is_hyper_param_search": false,
8
  "is_local_process_zero": true,
9
  "is_world_process_zero": true,
@@ -210,20 +210,152 @@
210
  "step": 291
211
  },
212
  {
213
- "epoch": 3.0,
214
- "step": 291,
215
- "total_flos": 9.244220036417372e+17,
216
- "train_loss": 0.4883061381140116,
217
- "train_runtime": 824.2717,
218
- "train_samples_per_second": 45.116,
219
- "train_steps_per_second": 0.353
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
220
  }
221
  ],
222
  "logging_steps": 10,
223
- "max_steps": 291,
224
- "num_train_epochs": 3,
225
  "save_steps": 500,
226
- "total_flos": 9.244220036417372e+17,
227
  "trial_name": null,
228
  "trial_params": null
229
  }
 
1
  {
2
+ "best_metric": 0.8084179970972424,
3
+ "best_model_checkpoint": "swin-tiny-patch4-window7-224-finetuned-eurosat/checkpoint-485",
4
+ "epoch": 5.0,
5
  "eval_steps": 500,
6
+ "global_step": 485,
7
  "is_hyper_param_search": false,
8
  "is_local_process_zero": true,
9
  "is_world_process_zero": true,
 
210
  "step": 291
211
  },
212
  {
213
+ "epoch": 3.09,
214
+ "learning_rate": 2.1215596330275232e-05,
215
+ "loss": 0.6839,
216
+ "step": 300
217
+ },
218
+ {
219
+ "epoch": 3.2,
220
+ "learning_rate": 2.006880733944954e-05,
221
+ "loss": 0.6814,
222
+ "step": 310
223
+ },
224
+ {
225
+ "epoch": 3.3,
226
+ "learning_rate": 1.8922018348623855e-05,
227
+ "loss": 0.6358,
228
+ "step": 320
229
+ },
230
+ {
231
+ "epoch": 3.4,
232
+ "learning_rate": 1.7775229357798164e-05,
233
+ "loss": 0.6343,
234
+ "step": 330
235
+ },
236
+ {
237
+ "epoch": 3.51,
238
+ "learning_rate": 1.662844036697248e-05,
239
+ "loss": 0.6434,
240
+ "step": 340
241
+ },
242
+ {
243
+ "epoch": 3.61,
244
+ "learning_rate": 1.548165137614679e-05,
245
+ "loss": 0.6701,
246
+ "step": 350
247
+ },
248
+ {
249
+ "epoch": 3.71,
250
+ "learning_rate": 1.4334862385321102e-05,
251
+ "loss": 0.6605,
252
+ "step": 360
253
+ },
254
+ {
255
+ "epoch": 3.81,
256
+ "learning_rate": 1.3188073394495412e-05,
257
+ "loss": 0.6269,
258
+ "step": 370
259
+ },
260
+ {
261
+ "epoch": 3.92,
262
+ "learning_rate": 1.2041284403669725e-05,
263
+ "loss": 0.6522,
264
+ "step": 380
265
+ },
266
+ {
267
+ "epoch": 4.0,
268
+ "eval_accuracy": 0.7968069666182874,
269
+ "eval_loss": 0.5324537754058838,
270
+ "eval_runtime": 34.108,
271
+ "eval_samples_per_second": 40.401,
272
+ "eval_steps_per_second": 1.29,
273
+ "step": 388
274
+ },
275
+ {
276
+ "epoch": 4.02,
277
+ "learning_rate": 1.0894495412844036e-05,
278
+ "loss": 0.6545,
279
+ "step": 390
280
+ },
281
+ {
282
+ "epoch": 4.12,
283
+ "learning_rate": 9.74770642201835e-06,
284
+ "loss": 0.6333,
285
+ "step": 400
286
+ },
287
+ {
288
+ "epoch": 4.23,
289
+ "learning_rate": 8.600917431192661e-06,
290
+ "loss": 0.5846,
291
+ "step": 410
292
+ },
293
+ {
294
+ "epoch": 4.33,
295
+ "learning_rate": 7.454128440366973e-06,
296
+ "loss": 0.6449,
297
+ "step": 420
298
+ },
299
+ {
300
+ "epoch": 4.43,
301
+ "learning_rate": 6.3073394495412846e-06,
302
+ "loss": 0.586,
303
+ "step": 430
304
+ },
305
+ {
306
+ "epoch": 4.54,
307
+ "learning_rate": 5.160550458715597e-06,
308
+ "loss": 0.6197,
309
+ "step": 440
310
+ },
311
+ {
312
+ "epoch": 4.64,
313
+ "learning_rate": 4.013761467889909e-06,
314
+ "loss": 0.5752,
315
+ "step": 450
316
+ },
317
+ {
318
+ "epoch": 4.74,
319
+ "learning_rate": 2.8669724770642206e-06,
320
+ "loss": 0.6203,
321
+ "step": 460
322
+ },
323
+ {
324
+ "epoch": 4.85,
325
+ "learning_rate": 1.7201834862385322e-06,
326
+ "loss": 0.6595,
327
+ "step": 470
328
+ },
329
+ {
330
+ "epoch": 4.95,
331
+ "learning_rate": 5.733944954128441e-07,
332
+ "loss": 0.6189,
333
+ "step": 480
334
+ },
335
+ {
336
+ "epoch": 5.0,
337
+ "eval_accuracy": 0.8084179970972424,
338
+ "eval_loss": 0.5213053226470947,
339
+ "eval_runtime": 34.2264,
340
+ "eval_samples_per_second": 40.261,
341
+ "eval_steps_per_second": 1.286,
342
+ "step": 485
343
+ },
344
+ {
345
+ "epoch": 5.0,
346
+ "step": 485,
347
+ "total_flos": 1.5407033394028954e+18,
348
+ "train_loss": 0.25417212948356704,
349
+ "train_runtime": 754.4258,
350
+ "train_samples_per_second": 82.155,
351
+ "train_steps_per_second": 0.643
352
  }
353
  ],
354
  "logging_steps": 10,
355
+ "max_steps": 485,
356
+ "num_train_epochs": 5,
357
  "save_steps": 500,
358
+ "total_flos": 1.5407033394028954e+18,
359
  "trial_name": null,
360
  "trial_params": null
361
  }
training_args.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:b731c7fb02690e62840d5fde0f3f479264c690e9befb062d41e3f9d1b5f143a1
3
  size 4219
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:f699c4d6e1218ced6a2b6d295a8eaf205ad55fdd9d20805536e894a146aad539
3
  size 4219