ChristosSevastopoulos committed on
Commit
846705b
1 Parent(s): b76fbed

Training in progress, epoch 0

Browse files
all_results.json CHANGED
@@ -1,12 +1,12 @@
1
  {
2
- "epoch": 1.0,
3
- "eval_accuracy": 0.9322033898305084,
4
- "eval_loss": 0.1975485384464264,
5
- "eval_runtime": 6.5685,
6
- "eval_samples_per_second": 107.787,
7
- "eval_steps_per_second": 3.502,
8
- "train_loss": 0.39651955127716065,
9
- "train_runtime": 125.6812,
10
- "train_samples_per_second": 50.692,
11
- "train_steps_per_second": 0.398
12
  }
 
1
  {
2
+ "epoch": 0.96,
3
+ "eval_accuracy": 0.7808988764044944,
4
+ "eval_loss": 0.42015063762664795,
5
+ "eval_runtime": 1.8074,
6
+ "eval_samples_per_second": 98.482,
7
+ "eval_steps_per_second": 3.32,
8
+ "train_loss": 0.536445160706838,
9
+ "train_runtime": 48.1684,
10
+ "train_samples_per_second": 33.072,
11
+ "train_steps_per_second": 0.249
12
  }
eval_results.json CHANGED
@@ -1,8 +1,8 @@
1
  {
2
- "epoch": 1.0,
3
- "eval_accuracy": 0.9322033898305084,
4
- "eval_loss": 0.1975485384464264,
5
- "eval_runtime": 6.5685,
6
- "eval_samples_per_second": 107.787,
7
- "eval_steps_per_second": 3.502
8
  }
 
1
  {
2
+ "epoch": 0.96,
3
+ "eval_accuracy": 0.7808988764044944,
4
+ "eval_loss": 0.42015063762664795,
5
+ "eval_runtime": 1.8074,
6
+ "eval_samples_per_second": 98.482,
7
+ "eval_steps_per_second": 3.32
8
  }
pytorch_model.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:5a0ca78bcd9a1e3f369d1ad91d1db89e3258756e7ac76884012504904eeb444d
3
  size 110392879
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:79f51e55e8676b8121a2da90e540a3c10d0750e9fb53933c01e7cf8b137c354f
3
  size 110392879
train_results.json CHANGED
@@ -1,7 +1,7 @@
1
  {
2
- "epoch": 1.0,
3
- "train_loss": 0.39651955127716065,
4
- "train_runtime": 125.6812,
5
- "train_samples_per_second": 50.692,
6
- "train_steps_per_second": 0.398
7
  }
 
1
  {
2
+ "epoch": 0.96,
3
+ "train_loss": 0.536445160706838,
4
+ "train_runtime": 48.1684,
5
+ "train_samples_per_second": 33.072,
6
+ "train_steps_per_second": 0.249
7
  }
trainer_state.json CHANGED
@@ -1,64 +1,40 @@
1
  {
2
- "best_metric": 0.9322033898305084,
3
- "best_model_checkpoint": "swin-tiny-patch4-window7-224-thecbbbfs/checkpoint-50",
4
- "epoch": 1.0,
5
- "global_step": 50,
6
  "is_hyper_param_search": false,
7
  "is_local_process_zero": true,
8
  "is_world_process_zero": true,
9
  "log_history": [
10
- {
11
- "epoch": 0.2,
12
- "learning_rate": 4.4444444444444447e-05,
13
- "loss": 0.6293,
14
- "step": 10
15
- },
16
- {
17
- "epoch": 0.4,
18
- "learning_rate": 3.3333333333333335e-05,
19
- "loss": 0.3964,
20
- "step": 20
21
- },
22
- {
23
- "epoch": 0.6,
24
- "learning_rate": 2.2222222222222223e-05,
25
- "loss": 0.3323,
26
- "step": 30
27
- },
28
  {
29
  "epoch": 0.8,
30
- "learning_rate": 1.1111111111111112e-05,
31
- "loss": 0.2962,
32
- "step": 40
33
- },
34
- {
35
- "epoch": 1.0,
36
- "learning_rate": 0.0,
37
- "loss": 0.3284,
38
- "step": 50
39
  },
40
  {
41
- "epoch": 1.0,
42
- "eval_accuracy": 0.9322033898305084,
43
- "eval_loss": 0.1975485384464264,
44
- "eval_runtime": 6.4765,
45
- "eval_samples_per_second": 109.318,
46
- "eval_steps_per_second": 3.551,
47
- "step": 50
48
  },
49
  {
50
- "epoch": 1.0,
51
- "step": 50,
52
- "total_flos": 1.5835750582888858e+17,
53
- "train_loss": 0.39651955127716065,
54
- "train_runtime": 125.6812,
55
- "train_samples_per_second": 50.692,
56
- "train_steps_per_second": 0.398
57
  }
58
  ],
59
- "max_steps": 50,
60
  "num_train_epochs": 1,
61
- "total_flos": 1.5835750582888858e+17,
62
  "trial_name": null,
63
  "trial_params": null
64
  }
 
1
  {
2
+ "best_metric": 0.7808988764044944,
3
+ "best_model_checkpoint": "swin-tiny-patch4-window7-224-thecbbbfs/checkpoint-12",
4
+ "epoch": 0.96,
5
+ "global_step": 12,
6
  "is_hyper_param_search": false,
7
  "is_local_process_zero": true,
8
  "is_world_process_zero": true,
9
  "log_history": [
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
10
  {
11
  "epoch": 0.8,
12
+ "learning_rate": 1e-05,
13
+ "loss": 0.5544,
14
+ "step": 10
 
 
 
 
 
 
15
  },
16
  {
17
+ "epoch": 0.96,
18
+ "eval_accuracy": 0.7808988764044944,
19
+ "eval_loss": 0.42015063762664795,
20
+ "eval_runtime": 1.717,
21
+ "eval_samples_per_second": 103.671,
22
+ "eval_steps_per_second": 3.495,
23
+ "step": 12
24
  },
25
  {
26
+ "epoch": 0.96,
27
+ "step": 12,
28
+ "total_flos": 3.817879908227482e+16,
29
+ "train_loss": 0.536445160706838,
30
+ "train_runtime": 48.1684,
31
+ "train_samples_per_second": 33.072,
32
+ "train_steps_per_second": 0.249
33
  }
34
  ],
35
+ "max_steps": 12,
36
  "num_train_epochs": 1,
37
+ "total_flos": 3.817879908227482e+16,
38
  "trial_name": null,
39
  "trial_params": null
40
  }
training_args.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:72559b464d91058686abb1be8ed40c4089986ef36b77e0529b4a827230458bad
3
  size 3375
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:f17bebf5a79b12e06ac516fe300d857f899cea5d0473210042ca6ddc4eb11b8c
3
  size 3375