griffio committed on
Commit
4177d7f
1 Parent(s): bc57055

rotated_maps

Browse files
README.md ADDED
@@ -0,0 +1,89 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ ---
2
+ library_name: peft
3
+ license: apache-2.0
4
+ base_model: google/vit-large-patch16-224
5
+ tags:
6
+ - image-classification
7
+ - generated_from_trainer
8
+ datasets:
9
+ - imagefolder
10
+ metrics:
11
+ - accuracy
12
+ model-index:
13
+ - name: vit-large-patch16-224-testing-dungeons-lora-23Nov24-0010
14
+ results:
15
+ - task:
16
+ type: image-classification
17
+ name: Image Classification
18
+ dataset:
19
+ name: rotated_maps
20
+ type: imagefolder
21
+ config: default
22
+ split: validation
23
+ args: default
24
+ metrics:
25
+ - type: accuracy
26
+ value: 1.0
27
+ name: Accuracy
28
+ ---
29
+
30
+ <!-- This model card has been generated automatically according to the information the Trainer had access to. You
31
+ should probably proofread and complete it, then remove this comment. -->
32
+
33
+ # vit-large-patch16-224-testing-dungeons-lora-23Nov24-0010
34
+
35
+ This model is a fine-tuned version of [google/vit-large-patch16-224](https://huggingface.co/google/vit-large-patch16-224) on the rotated_maps dataset.
36
+ It achieves the following results on the evaluation set:
37
+ - Loss: 0.0977
38
+ - Accuracy: 1.0
39
+
40
+ ## Model description
41
+
42
+ More information needed
43
+
44
+ ## Intended uses & limitations
45
+
46
+ More information needed
47
+
48
+ ## Training and evaluation data
49
+
50
+ More information needed
51
+
52
+ ## Training procedure
53
+
54
+ ### Training hyperparameters
55
+
56
+ The following hyperparameters were used during training:
57
+ - learning_rate: 0.005
58
+ - train_batch_size: 8
59
+ - eval_batch_size: 8
60
+ - seed: 42
61
+ - gradient_accumulation_steps: 4
62
+ - total_train_batch_size: 32
63
+ - optimizer: adamw_torch with betas=(0.9,0.999) and epsilon=1e-08 (no additional optimizer arguments)
64
+ - lr_scheduler_type: linear
65
+ - lr_scheduler_warmup_ratio: 0.1
66
+ - num_epochs: 12 (configured value; the logged run in the results table ends at epoch 8.0, step 12)
67
+ - mixed_precision_training: Native AMP
68
+
69
+ ### Training results
70
+
71
+ | Training Loss | Epoch | Step | Validation Loss | Accuracy |
72
+ |:-------------:|:------:|:----:|:---------------:|:--------:|
73
+ | No log | 0.6667 | 1 | 1.4309 | 0.2963 |
74
+ | No log | 2.0 | 3 | 1.1590 | 0.5926 |
75
+ | No log | 2.6667 | 4 | 0.7057 | 0.8148 |
76
+ | No log | 4.0 | 6 | 0.4692 | 0.8148 |
77
+ | No log | 4.6667 | 7 | 0.2285 | 0.9630 |
78
+ | No log | 6.0 | 9 | 0.2492 | 0.8889 |
79
+ | 0.7456 | 6.6667 | 10 | 0.1295 | 1.0 |
80
+ | 0.7456 | 8.0 | 12 | 0.0977 | 1.0 |
81
+
82
+
83
+ ### Framework versions
84
+
85
+ - PEFT 0.13.2
86
+ - Transformers 4.46.2
87
+ - Pytorch 2.5.1+cu121
88
+ - Datasets 3.1.0
89
+ - Tokenizers 0.20.3
adapter_config.json ADDED
@@ -0,0 +1,34 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "alpha_pattern": {},
3
+ "auto_mapping": {
4
+ "base_model_class": "ViTForImageClassification",
5
+ "parent_library": "transformers.models.vit.modeling_vit"
6
+ },
7
+ "base_model_name_or_path": "google/vit-large-patch16-224",
8
+ "bias": "none",
9
+ "fan_in_fan_out": false,
10
+ "inference_mode": true,
11
+ "init_lora_weights": true,
12
+ "layer_replication": null,
13
+ "layers_pattern": null,
14
+ "layers_to_transform": null,
15
+ "loftq_config": {},
16
+ "lora_alpha": 16,
17
+ "lora_dropout": 0.1,
18
+ "megatron_config": null,
19
+ "megatron_core": "megatron.core",
20
+ "modules_to_save": [
21
+ "classifier"
22
+ ],
23
+ "peft_type": "LORA",
24
+ "r": 16,
25
+ "rank_pattern": {},
26
+ "revision": null,
27
+ "target_modules": [
28
+ "value",
29
+ "query"
30
+ ],
31
+ "task_type": null,
32
+ "use_dora": false,
33
+ "use_rslora": false
34
+ }
adapter_model.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:b45fee3aa8b61fa2714b9aabc42c5bbaff527e76300ae153feb0edf518e5a24f
3
+ size 6322120
all_results.json ADDED
@@ -0,0 +1,8 @@
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "epoch": 8.0,
3
+ "eval_accuracy": 1.0,
4
+ "eval_loss": 0.09772621840238571,
5
+ "eval_runtime": 0.4904,
6
+ "eval_samples_per_second": 55.057,
7
+ "eval_steps_per_second": 8.157
8
+ }
eval_results.json ADDED
@@ -0,0 +1,8 @@
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "epoch": 8.0,
3
+ "eval_accuracy": 1.0,
4
+ "eval_loss": 0.09772621840238571,
5
+ "eval_runtime": 0.4904,
6
+ "eval_samples_per_second": 55.057,
7
+ "eval_steps_per_second": 8.157
8
+ }
preprocessor_config.json ADDED
@@ -0,0 +1,22 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "do_normalize": true,
3
+ "do_rescale": false,
4
+ "do_resize": true,
5
+ "image_mean": [
6
+ 0.5,
7
+ 0.5,
8
+ 0.5
9
+ ],
10
+ "image_processor_type": "ViTImageProcessor",
11
+ "image_std": [
12
+ 0.5,
13
+ 0.5,
14
+ 0.5
15
+ ],
16
+ "resample": 2,
17
+ "rescale_factor": 0.00392156862745098,
18
+ "size": {
19
+ "height": 224,
20
+ "width": 224
21
+ }
22
+ }
runs/Nov23_19-27-38_f5335f7c91c7/events.out.tfevents.1732390070.f5335f7c91c7.462.22 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:2a46bd592549f127711201fc414a6cb98a26ed47bbde53b7e0a662bc48ca0b33
3
+ size 8346
runs/Nov23_19-28-27_f5335f7c91c7/events.out.tfevents.1732390116.f5335f7c91c7.462.23 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:21ef2542792c6ff575938955c0c424217107940891f271c284ce01aa58fb3dc2
3
+ size 8346
runs/Nov23_19-28-27_f5335f7c91c7/events.out.tfevents.1732390138.f5335f7c91c7.462.24 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:bec1eb12c87c1d855adc64685621e3ae394a5605c4ecae8266f1fb994f866bbf
3
+ size 405
training_args.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:c92968979adb1fac874017df34bd2ab561ee7041348e06298193ba690a9e5a14
3
+ size 5368