{ "_name_or_path": "dandelin/vilt-b32-finetuned-vqa", "architectures": [ "ViltForQuestionAnswering" ], "attention_probs_dropout_prob": 0.0, "hidden_act": "gelu", "hidden_dropout_prob": 0.0, "hidden_size": 768, "id2label": { "0": "Orange", "1": "Boys", "2": "Briefs", "3": "Men", "4": "Cream", "5": "Grey Melange", "6": "Watches", "7": "Suspenders", "8": "Necklace and Chains", "9": "Brown", "10": "Bronze", "11": "Caps", "12": "Sandals", "13": "Ties", "14": "Shirts", "15": "Taupe", "16": "Blue", "17": "Beige", "18": "Sports", "19": "Khaki", "20": "Pink", "21": "Track Pants", "22": "Casual Shoes", "23": "Lounge Shorts", "24": "Formal", "25": "Steel", "26": "Tops", "27": "Heels", "28": "Jumpsuit", "29": "Capris", "30": "Leggings", "31": "Charcoal", "32": "Turquoise Blue", "33": "Lavender", "34": "Camisoles", "35": "Winter", "36": "Navy Blue", "37": "Nightdress", "38": "Women", "39": "Coffee Brown", "40": "Skirts", "41": "Boxers", "42": "Purple", "43": "Innerwear Vests", "44": "Peach", "45": "Multi", "46": "nan", "47": "Fall", "48": "Sports Shoes", "49": "Nude", "50": "Sweaters", "51": "Gold", "52": "Gloves", "53": "Unisex", "54": "Night suits", "55": "Dresses", "56": "Maroon", "57": "Formal Shoes", "58": "Jackets", "59": "Stockings", "60": "Booties", "61": "Shorts", "62": "Tunics", "63": "Waist Pouch", "64": "Tan", "65": "Bra", "66": "Smart Casual", "67": "Tracksuits", "68": "Flip Flops", "69": "Sunglasses", "70": "Summer", "71": "Handbags", "72": "Off White", "73": "Girls", "74": "Socks", "75": "Spring", "76": "Silver", "77": "Belts", "78": "Mustard", "79": "Trousers", "80": "Jeans", "81": "Olive", "82": "Bath Robe", "83": "Bangle", "84": "Yellow", "85": "Scarves", "86": "Mauve", "87": "Sports Sandals", "88": "Trunk", "89": "Green", "90": "Blazers", "91": "Casual", "92": "Flats", "93": "Duffel Bag", "94": "Rust", "95": "Magenta", "96": "Ethnic", "97": "Sweatshirts", "98": "Jeggings", "99": "Grey", "100": "Teal", "101": "Bracelet", "102": "Tshirts", "103": "Black", "104": "White", "105": "Copper", "106": "Red" }, "image_size": 384, "initializer_range": 0.02, "intermediate_size": 3072, "label2id": { "Bangle": 83, "Bath Robe": 82, "Beige": 17, "Belts": 77, "Black": 103, "Blazers": 90, "Blue": 16, "Booties": 60, "Boxers": 41, "Boys": 1, "Bra": 65, "Bracelet": 101, "Briefs": 2, "Bronze": 10, "Brown": 9, "Camisoles": 34, "Capris": 29, "Caps": 11, "Casual": 91, "Casual Shoes": 22, "Charcoal": 31, "Coffee Brown": 39, "Copper": 105, "Cream": 4, "Dresses": 55, "Duffel Bag": 93, "Ethnic": 96, "Fall": 47, "Flats": 92, "Flip Flops": 68, "Formal": 24, "Formal Shoes": 57, "Girls": 73, "Gloves": 52, "Gold": 51, "Green": 89, "Grey": 99, "Grey Melange": 5, "Handbags": 71, "Heels": 27, "Innerwear Vests": 43, "Jackets": 58, "Jeans": 80, "Jeggings": 98, "Jumpsuit": 28, "Khaki": 19, "Lavender": 33, "Leggings": 30, "Lounge Shorts": 23, "Magenta": 95, "Maroon": 56, "Mauve": 86, "Men": 3, "Multi": 45, "Mustard": 78, "Navy Blue": 36, "Necklace and Chains": 8, "Night suits": 54, "Nightdress": 37, "Nude": 49, "Off White": 72, "Olive": 81, "Orange": 0, "Peach": 44, "Pink": 20, "Purple": 42, "Red": 106, "Rust": 94, "Sandals": 12, "Scarves": 85, "Shirts": 14, "Shorts": 61, "Silver": 76, "Skirts": 40, "Smart Casual": 66, "Socks": 74, "Sports": 18, "Sports Sandals": 87, "Sports Shoes": 48, "Spring": 75, "Steel": 25, "Stockings": 59, "Summer": 70, "Sunglasses": 69, "Suspenders": 7, "Sweaters": 50, "Sweatshirts": 97, "Tan": 64, "Taupe": 15, "Teal": 100, "Ties": 13, "Tops": 26, "Track Pants": 21, "Tracksuits": 67, "Trousers": 79, "Trunk": 88, "Tshirts": 102, "Tunics": 62, "Turquoise Blue": 32, "Unisex": 53, "Waist Pouch": 63, "Watches": 6, "White": 104, "Winter": 35, "Women": 38, "Yellow": 84, "nan": 46 }, "layer_norm_eps": 1e-12, "max_image_length": -1, "max_position_embeddings": 40, "modality_type_vocab_size": 2, "model_type": "vilt", "num_attention_heads": 12, "num_channels": 3, "num_hidden_layers": 12, "num_images": -1, "patch_size": 32, "qkv_bias": true, "tie_word_embeddings": false, "torch_dtype": "float32", "transformers_version": "4.44.2", "type_vocab_size": 2, "vocab_size": 30522 }