cvt-13-finetuned-ibird / config.json
hemlatachanne's picture
Training in progress, epoch 0
fb65410 verified
raw
history blame
2.7 kB
{
"_name_or_path": "microsoft/cvt-13",
"architectures": [
"CvtForImageClassification"
],
"attention_drop_rate": [
0.0,
0.0,
0.0
],
"cls_token": [
false,
false,
true
],
"depth": [
1,
2,
10
],
"drop_path_rate": [
0.0,
0.0,
0.1
],
"drop_rate": [
0.0,
0.0,
0.0
],
"embed_dim": [
64,
192,
384
],
"id2label": {
"0": "Asian Green Bee-Eater",
"1": "Brown-Headed Barbet",
"2": "Cattle Egret",
"3": "Common Kingfisher",
"4": "Common Myna",
"5": "Common Rosefinch",
"6": "Common Tailorbird",
"7": "Coppersmith Barbet",
"8": "Forest Wagtail",
"9": "Gray Wagtail",
"10": "Hoopoe",
"11": "House Crow",
"12": "Indian Grey Hornbill",
"13": "Indian Peacock",
"14": "Indian Pitta",
"15": "Indian Roller",
"16": "Jungle Babbler",
"17": "Northern Lapwing",
"18": "Red-Wattled Lapwing",
"19": "Ruddy Shelduck",
"20": "Rufous Treepie",
"21": "Sarus Crane",
"22": "White Wagtail",
"23": "White-Breasted Kingfisher",
"24": "White-Breasted Waterhen"
},
"image_size": 224,
"initializer_range": 0.02,
"kernel_qkv": [
3,
3,
3
],
"label2id": {
"Asian Green Bee-Eater": 0,
"Brown-Headed Barbet": 1,
"Cattle Egret": 2,
"Common Kingfisher": 3,
"Common Myna": 4,
"Common Rosefinch": 5,
"Common Tailorbird": 6,
"Coppersmith Barbet": 7,
"Forest Wagtail": 8,
"Gray Wagtail": 9,
"Hoopoe": 10,
"House Crow": 11,
"Indian Grey Hornbill": 12,
"Indian Peacock": 13,
"Indian Pitta": 14,
"Indian Roller": 15,
"Jungle Babbler": 16,
"Northern Lapwing": 17,
"Red-Wattled Lapwing": 18,
"Ruddy Shelduck": 19,
"Rufous Treepie": 20,
"Sarus Crane": 21,
"White Wagtail": 22,
"White-Breasted Kingfisher": 23,
"White-Breasted Waterhen": 24
},
"layer_norm_eps": 1e-12,
"mlp_ratio": [
4.0,
4.0,
4.0
],
"model_type": "cvt",
"num_channels": 3,
"num_heads": [
1,
3,
6
],
"num_stages": 3,
"padding_kv": [
1,
1,
1
],
"padding_q": [
1,
1,
1
],
"patch_padding": [
2,
1,
1
],
"patch_sizes": [
7,
3,
3
],
"patch_stride": [
4,
2,
2
],
"pos_embed": [
false,
false,
false
],
"problem_type": "single_label_classification",
"qkv_bias": [
true,
true,
true
],
"qkv_projection_method": [
"dw_bn",
"dw_bn",
"dw_bn"
],
"stride_kv": [
2,
2,
2
],
"stride_q": [
1,
1,
1
],
"torch_dtype": "float32",
"transformers_version": "4.38.2"
}