jvadlamudi2 committed on
Commit
dbc8f5e
1 Parent(s): bc9e388

Training in progress, epoch 1

Browse files
all_results.json CHANGED
@@ -1,8 +1,13 @@
1
  {
2
  "epoch": 3.0,
3
- "total_flos": 6.644005855919309e+16,
4
- "train_loss": 0.6010840450014386,
5
- "train_runtime": 82.3084,
6
- "train_samples_per_second": 32.475,
7
- "train_steps_per_second": 0.255
 
 
 
 
 
8
  }
 
1
  {
2
  "epoch": 3.0,
3
+ "eval_accuracy": 0.6071428571428571,
4
+ "eval_loss": 0.6862359046936035,
5
+ "eval_runtime": 0.8492,
6
+ "eval_samples_per_second": 131.885,
7
+ "eval_steps_per_second": 4.71,
8
+ "total_flos": 7.471710289148314e+16,
9
+ "train_loss": 0.6844675143559774,
10
+ "train_runtime": 103.9833,
11
+ "train_samples_per_second": 28.908,
12
+ "train_steps_per_second": 0.231
13
  }
eval_results.json ADDED
@@ -0,0 +1,8 @@
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "epoch": 3.0,
3
+ "eval_accuracy": 0.6071428571428571,
4
+ "eval_loss": 0.6862359046936035,
5
+ "eval_runtime": 0.8492,
6
+ "eval_samples_per_second": 131.885,
7
+ "eval_steps_per_second": 4.71
8
+ }
pytorch_model.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:93819f614ab1a7071e3e3d55ec9a7d4ace4d0c3a0a1c70ade6fc49224fb6448c
3
  size 110394865
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:a25a101dde9f32f27810cad590e197ed56f0b94aa1f6df21db8d1ec277f16959
3
  size 110394865
runs/Jul20_19-45-58_fcbe542fc008/events.out.tfevents.1689882673.fcbe542fc008.344.2 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:508742c08776fe84217d5e5e06b76f830cccabe34dca5a59b176a3e83f86190e
3
+ size 405
runs/Jul20_19-45-58_fcbe542fc008/events.out.tfevents.1689884242.fcbe542fc008.344.3 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:bd9df98b3146add3883dcb1fa6f9b09cba1b37fec446a89d5dbe27af2a8de5df
3
+ size 4839
train_results.json CHANGED
@@ -1,8 +1,8 @@
1
  {
2
  "epoch": 3.0,
3
- "total_flos": 6.644005855919309e+16,
4
- "train_loss": 0.6010840450014386,
5
- "train_runtime": 82.3084,
6
- "train_samples_per_second": 32.475,
7
- "train_steps_per_second": 0.255
8
  }
 
1
  {
2
  "epoch": 3.0,
3
+ "total_flos": 7.471710289148314e+16,
4
+ "train_loss": 0.6844675143559774,
5
+ "train_runtime": 103.9833,
6
+ "train_samples_per_second": 28.908,
7
+ "train_steps_per_second": 0.231
8
  }
trainer_state.json CHANGED
@@ -1,64 +1,64 @@
1
  {
2
- "best_metric": 0.7130044843049327,
3
- "best_model_checkpoint": "swin-tiny-patch4-window7-224-jvadlamudi2/checkpoint-14",
4
  "epoch": 3.0,
5
- "global_step": 21,
6
  "is_hyper_param_search": false,
7
  "is_local_process_zero": true,
8
  "is_world_process_zero": true,
9
  "log_history": [
10
  {
11
  "epoch": 1.0,
12
- "eval_accuracy": 0.6860986547085202,
13
- "eval_loss": 0.5776408314704895,
14
- "eval_runtime": 1.5327,
15
- "eval_samples_per_second": 145.496,
16
- "eval_steps_per_second": 4.567,
17
- "step": 7
18
  },
19
  {
20
- "epoch": 1.43,
21
- "learning_rate": 3.055555555555556e-05,
22
- "loss": 0.6176,
23
  "step": 10
24
  },
25
  {
26
  "epoch": 2.0,
27
- "eval_accuracy": 0.7130044843049327,
28
- "eval_loss": 0.5827417969703674,
29
- "eval_runtime": 1.532,
30
- "eval_samples_per_second": 145.559,
31
- "eval_steps_per_second": 4.569,
32
- "step": 14
33
  },
34
  {
35
- "epoch": 2.86,
36
- "learning_rate": 2.777777777777778e-06,
37
- "loss": 0.5847,
38
  "step": 20
39
  },
40
  {
41
  "epoch": 3.0,
42
- "eval_accuracy": 0.7040358744394619,
43
- "eval_loss": 0.586353063583374,
44
- "eval_runtime": 1.5413,
45
- "eval_samples_per_second": 144.679,
46
- "eval_steps_per_second": 4.541,
47
- "step": 21
48
  },
49
  {
50
  "epoch": 3.0,
51
- "step": 21,
52
- "total_flos": 6.644005855919309e+16,
53
- "train_loss": 0.6010840450014386,
54
- "train_runtime": 82.3084,
55
- "train_samples_per_second": 32.475,
56
- "train_steps_per_second": 0.255
57
  }
58
  ],
59
- "max_steps": 21,
60
  "num_train_epochs": 3,
61
- "total_flos": 6.644005855919309e+16,
62
  "trial_name": null,
63
  "trial_params": null
64
  }
 
1
  {
2
+ "best_metric": 0.6071428571428571,
3
+ "best_model_checkpoint": "swin-tiny-patch4-window7-224-jvadlamudi2/checkpoint-24",
4
  "epoch": 3.0,
5
+ "global_step": 24,
6
  "is_hyper_param_search": false,
7
  "is_local_process_zero": true,
8
  "is_world_process_zero": true,
9
  "log_history": [
10
  {
11
  "epoch": 1.0,
12
+ "eval_accuracy": 0.5892857142857143,
13
+ "eval_loss": 0.7051630616188049,
14
+ "eval_runtime": 0.9526,
15
+ "eval_samples_per_second": 117.567,
16
+ "eval_steps_per_second": 4.199,
17
+ "step": 8
18
  },
19
  {
20
+ "epoch": 1.25,
21
+ "learning_rate": 3.3333333333333335e-05,
22
+ "loss": 0.7036,
23
  "step": 10
24
  },
25
  {
26
  "epoch": 2.0,
27
+ "eval_accuracy": 0.5803571428571429,
28
+ "eval_loss": 0.6873636245727539,
29
+ "eval_runtime": 0.7758,
30
+ "eval_samples_per_second": 144.369,
31
+ "eval_steps_per_second": 5.156,
32
+ "step": 16
33
  },
34
  {
35
+ "epoch": 2.5,
36
+ "learning_rate": 9.523809523809523e-06,
37
+ "loss": 0.6691,
38
  "step": 20
39
  },
40
  {
41
  "epoch": 3.0,
42
+ "eval_accuracy": 0.6071428571428571,
43
+ "eval_loss": 0.6862359046936035,
44
+ "eval_runtime": 0.8007,
45
+ "eval_samples_per_second": 139.883,
46
+ "eval_steps_per_second": 4.996,
47
+ "step": 24
48
  },
49
  {
50
  "epoch": 3.0,
51
+ "step": 24,
52
+ "total_flos": 7.471710289148314e+16,
53
+ "train_loss": 0.6844675143559774,
54
+ "train_runtime": 103.9833,
55
+ "train_samples_per_second": 28.908,
56
+ "train_steps_per_second": 0.231
57
  }
58
  ],
59
+ "max_steps": 24,
60
  "num_train_epochs": 3,
61
+ "total_flos": 7.471710289148314e+16,
62
  "trial_name": null,
63
  "trial_params": null
64
  }