typorch committed on
Commit
01731cc
1 Parent(s): 84d6dbd

Upload 3 files

Browse files
Files changed (3) hide show
  1. README.md +12 -0
  2. config.json +40 -0
  3. pytorch_model.bin +3 -0
README.md ADDED
@@ -0,0 +1,12 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ ---
2
+ license: apache-2.0
3
+ library_name: timm
4
+ tags:
5
+ - image-feature-extraction
6
+ - timm
7
+ ---
8
+ # Model card for vit_base_patch16_224_waifumerge
9
+
10
+ A Vision Transformer (ViT) image feature model. Trained with the self-supervised DINO method.
11
+
12
+ [Model Stock](https://github.com/naver-ai/model-stock) merge of *vit_base_patch16_224.dino*, *vit_base_patch16_224.augreg2_in21k_ft_in1k* and *wd-vit-tagger-v3* just to see what would happen ¯\\\_(ツ)\_/¯
config.json ADDED
@@ -0,0 +1,40 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "architecture": "vit_base_patch16_224",
3
+ "num_classes": 10861,
4
+ "num_features": 768,
5
+ "global_pool": "avg",
6
+ "model_args": {
7
+ "img_size": 448,
8
+ "class_token": false,
9
+ "global_pool": "avg",
10
+ "fc_norm": false,
11
+ "act_layer": "gelu_tanh"
12
+ },
13
+ "pretrained_cfg": {
14
+ "tag": "waifumerge",
15
+ "custom_load": false,
16
+ "input_size": [
17
+ 3,
18
+ 448,
19
+ 448
20
+ ],
21
+ "fixed_input_size": false,
22
+ "interpolation": "bicubic",
23
+ "crop_pct": 1.0,
24
+ "crop_mode": "center",
25
+ "mean": [
26
+ 0.5,
27
+ 0.5,
28
+ 0.5
29
+ ],
30
+ "std": [
31
+ 0.5,
32
+ 0.5,
33
+ 0.5
34
+ ],
35
+ "num_classes": 10861,
36
+ "pool_size": null,
37
+ "first_conv": null,
38
+ "classifier": null
39
+ }
40
+ }
pytorch_model.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:bf570937ea78f75df7c9d95b0b8378e79f2bd90c9b6b79573439f5e0e96ec9e4
3
+ size 343250456