pkr7098 committed on
Commit
8e29bb5
1 Parent(s): aee3386

End of training

Browse files
README.md CHANGED
@@ -3,6 +3,8 @@ library_name: transformers
3
  license: apache-2.0
4
  base_model: google/vit-base-patch16-224-in21k
5
  tags:
 
 
6
  - generated_from_trainer
7
  metrics:
8
  - accuracy
@@ -16,10 +18,10 @@ should probably proofread and complete it, then remove this comment. -->
16
 
17
  # vit-cifar100-cifar100
18
 
19
- This model is a fine-tuned version of [google/vit-base-patch16-224-in21k](https://huggingface.co/google/vit-base-patch16-224-in21k) on an unknown dataset.
20
  It achieves the following results on the evaluation set:
21
- - Accuracy: 0.9241
22
  - Loss: 0.2955
 
23
 
24
  ## Model description
25
 
 
3
  license: apache-2.0
4
  base_model: google/vit-base-patch16-224-in21k
5
  tags:
6
+ - image-classification
7
+ - vision
8
  - generated_from_trainer
9
  metrics:
10
  - accuracy
 
18
 
19
  # vit-cifar100-cifar100
20
 
21
+ This model is a fine-tuned version of [google/vit-base-patch16-224-in21k](https://huggingface.co/google/vit-base-patch16-224-in21k) on the cifar100 dataset.
22
  It achieves the following results on the evaluation set:
 
23
  - Loss: 0.2955
24
+ - Accuracy: 0.9241
25
 
26
  ## Model description
27
 
all_results.json CHANGED
@@ -2,12 +2,12 @@
2
  "epoch": 5.0,
3
  "eval_accuracy": 0.9241333333333334,
4
  "eval_loss": 0.2954551577568054,
5
- "eval_runtime": 121.8517,
6
- "eval_samples_per_second": 61.55,
7
- "eval_steps_per_second": 7.698,
8
  "total_flos": 1.64815115092992e+19,
9
- "train_loss": 1.1898613937197713,
10
- "train_runtime": 10288.1641,
11
- "train_samples_per_second": 20.655,
12
- "train_steps_per_second": 2.582
13
  }
 
2
  "epoch": 5.0,
3
  "eval_accuracy": 0.9241333333333334,
4
  "eval_loss": 0.2954551577568054,
5
+ "eval_runtime": 26.7539,
6
+ "eval_samples_per_second": 280.333,
7
+ "eval_steps_per_second": 35.06,
8
  "total_flos": 1.64815115092992e+19,
9
+ "train_loss": 0.0,
10
+ "train_runtime": 0.0821,
11
+ "train_samples_per_second": 2587573.233,
12
+ "train_steps_per_second": 323477.096
13
  }
config.json CHANGED
@@ -222,6 +222,7 @@
222
  "num_channels": 3,
223
  "num_hidden_layers": 12,
224
  "patch_size": 16,
 
225
  "qkv_bias": true,
226
  "torch_dtype": "float32",
227
  "transformers_version": "4.44.2"
 
222
  "num_channels": 3,
223
  "num_hidden_layers": 12,
224
  "patch_size": 16,
225
+ "problem_type": "single_label_classification",
226
  "qkv_bias": true,
227
  "torch_dtype": "float32",
228
  "transformers_version": "4.44.2"
eval_results.json CHANGED
@@ -2,7 +2,7 @@
2
  "epoch": 5.0,
3
  "eval_accuracy": 0.9241333333333334,
4
  "eval_loss": 0.2954551577568054,
5
- "eval_runtime": 121.8517,
6
- "eval_samples_per_second": 61.55,
7
- "eval_steps_per_second": 7.698
8
  }
 
2
  "epoch": 5.0,
3
  "eval_accuracy": 0.9241333333333334,
4
  "eval_loss": 0.2954551577568054,
5
+ "eval_runtime": 26.7539,
6
+ "eval_samples_per_second": 280.333,
7
+ "eval_steps_per_second": 35.06
8
  }
train_results.json CHANGED
@@ -1,8 +1,8 @@
1
  {
2
  "epoch": 5.0,
3
  "total_flos": 1.64815115092992e+19,
4
- "train_loss": 1.1898613937197713,
5
- "train_runtime": 10288.1641,
6
- "train_samples_per_second": 20.655,
7
- "train_steps_per_second": 2.582
8
  }
 
1
  {
2
  "epoch": 5.0,
3
  "total_flos": 1.64815115092992e+19,
4
+ "train_loss": 0.0,
5
+ "train_runtime": 0.0821,
6
+ "train_samples_per_second": 2587573.233,
7
+ "train_steps_per_second": 323477.096
8
  }
trainer_state.json CHANGED
@@ -18649,10 +18649,10 @@
18649
  "epoch": 5.0,
18650
  "step": 26565,
18651
  "total_flos": 1.64815115092992e+19,
18652
- "train_loss": 1.1898613937197713,
18653
- "train_runtime": 10288.1641,
18654
- "train_samples_per_second": 20.655,
18655
- "train_steps_per_second": 2.582
18656
  }
18657
  ],
18658
  "logging_steps": 10,
 
18649
  "epoch": 5.0,
18650
  "step": 26565,
18651
  "total_flos": 1.64815115092992e+19,
18652
+ "train_loss": 0.0,
18653
+ "train_runtime": 0.0821,
18654
+ "train_samples_per_second": 2587573.233,
18655
+ "train_steps_per_second": 323477.096
18656
  }
18657
  ],
18658
  "logging_steps": 10,