|
{
|
|
"_name_or_path": "dandelin/vilt-b32-mlm",
|
|
"architectures": [
|
|
"ViltForQuestionAnswering"
|
|
],
|
|
"attention_probs_dropout_prob": 0.0,
|
|
"hidden_act": "gelu",
|
|
"hidden_dropout_prob": 0.0,
|
|
"hidden_size": 768,
|
|
"id2label": {
|
|
"0": "love",
|
|
"1": "trash",
|
|
"2": "mcdonald's",
|
|
"3": "grazing",
|
|
"4": "20",
|
|
"5": "cows",
|
|
"6": "no",
|
|
"7": "2",
|
|
"8": "1",
|
|
"9": "red white and blue",
|
|
"10": "tank",
|
|
"11": "magnet",
|
|
"12": "surfing",
|
|
"13": "sun",
|
|
"14": "purse",
|
|
"15": "teddy bear",
|
|
"16": "square",
|
|
"17": "9",
|
|
"18": "cycling",
|
|
"19": "green and white",
|
|
"20": "gray and red",
|
|
"21": "lace",
|
|
"22": "uk",
|
|
"23": "warmth",
|
|
"24": "court",
|
|
"25": "green",
|
|
"26": "bus",
|
|
"27": "america",
|
|
"28": "mouse",
|
|
"29": "paddle boarding",
|
|
"30": "boat",
|
|
"31": "playing",
|
|
"32": "40",
|
|
"33": "toothbrush",
|
|
"34": "black white",
|
|
"35": "yes",
|
|
"36": "inside",
|
|
"37": "squares",
|
|
"38": "air",
|
|
"39": "refrigerator",
|
|
"40": "buildings",
|
|
"41": "several",
|
|
"42": "catch frisbee",
|
|
"43": "playing video games",
|
|
"44": "39",
|
|
"45": "bridge",
|
|
"46": "germany",
|
|
"47": "angry",
|
|
"48": "broccoli",
|
|
"49": "diamonds",
|
|
"50": "nowhere",
|
|
"51": "not",
|
|
"52": "brick",
|
|
"53": "laptops",
|
|
"54": "sand",
|
|
"55": "frame",
|
|
"56": "frisbee",
|
|
"57": "pitching",
|
|
"58": "windsurfing",
|
|
"59": "pole",
|
|
"60": "train",
|
|
"61": "bikes",
|
|
"62": "mets",
|
|
"63": "wood",
|
|
"64": "food",
|
|
"65": "tree",
|
|
"66": "curtain",
|
|
"67": "carpet",
|
|
"68": "racing",
|
|
"69": "backpack",
|
|
"70": "tile",
|
|
"71": "man",
|
|
"72": "lines",
|
|
"73": "colored",
|
|
"74": "nothing",
|
|
"75": "waiting",
|
|
"76": "room",
|
|
"77": "paint",
|
|
"78": "stuffed animal",
|
|
"79": "us",
|
|
"80": "8",
|
|
"81": "skateboard",
|
|
"82": "hallway",
|
|
"83": "don't know",
|
|
"84": "black and white",
|
|
"85": "paddling",
|
|
"86": "4",
|
|
"87": "50",
|
|
"88": "relaxing",
|
|
"89": "painting",
|
|
"90": "safety",
|
|
"91": "21",
|
|
"92": "clear",
|
|
"93": "privacy",
|
|
"94": "16",
|
|
"95": "poles",
|
|
"96": "tennis",
|
|
"97": "canopy",
|
|
"98": "never",
|
|
"99": "hexagon",
|
|
"100": "for fun",
|
|
"101": "travel",
|
|
"102": "remote",
|
|
"103": "gravel",
|
|
"104": "blue and red",
|
|
"105": "salt",
|
|
"106": "living room",
|
|
"107": "dirt",
|
|
"108": "posing",
|
|
"109": "tired",
|
|
"110": "sunny",
|
|
"111": "cold",
|
|
"112": "dog",
|
|
"113": "plane",
|
|
"114": "red",
|
|
"115": "board",
|
|
"116": "unsure",
|
|
"117": "airplane",
|
|
"118": "wall",
|
|
"119": "octagon",
|
|
"120": "standing",
|
|
"121": "hotel",
|
|
"122": "white and red",
|
|
"123": "working",
|
|
"124": "pasta",
|
|
"125": "no light",
|
|
"126": "surfboard",
|
|
"127": "airport",
|
|
"128": "white and black",
|
|
"129": "lights",
|
|
"130": "lot",
|
|
"131": "park",
|
|
"132": "tracks",
|
|
"133": "playing frisbee",
|
|
"134": "glasses",
|
|
"135": "38",
|
|
"136": "plants",
|
|
"137": "usa",
|
|
"138": "dell",
|
|
"139": "0",
|
|
"140": "can't tell",
|
|
"141": "people",
|
|
"142": "fabric",
|
|
"143": "yellow",
|
|
"144": "on sidewalk",
|
|
"145": "straw",
|
|
"146": "playing game",
|
|
"147": "concentration",
|
|
"148": "red and white",
|
|
"149": "shade",
|
|
"150": "in car",
|
|
"151": "black",
|
|
"152": "white",
|
|
"153": "sunglasses",
|
|
"154": "glass",
|
|
"155": "comfort",
|
|
"156": "gray",
|
|
"157": "remote control",
|
|
"158": "fridge",
|
|
"159": "parasailing",
|
|
"160": "sleeping",
|
|
"161": "fruit",
|
|
"162": "spoon",
|
|
"163": "skis",
|
|
"164": "many",
|
|
"165": "freezer",
|
|
"166": "25",
|
|
"167": "jeans",
|
|
"168": "branches",
|
|
"169": "looking out window",
|
|
"170": "car",
|
|
"171": "traffic",
|
|
"172": "banana",
|
|
"173": "water",
|
|
"174": "race",
|
|
"175": "15",
|
|
"176": "tennis court",
|
|
"177": "wii",
|
|
"178": "highway",
|
|
"179": "copyright",
|
|
"180": "ground",
|
|
"181": "smile",
|
|
"182": "diamond",
|
|
"183": "fun",
|
|
"184": "home",
|
|
"185": "throwing frisbee",
|
|
"186": "bush",
|
|
"187": "computers",
|
|
"188": "indoors",
|
|
"189": "kicking",
|
|
"190": "unknown",
|
|
"191": "not sure",
|
|
"192": "ski poles",
|
|
"193": "bananas",
|
|
"194": "noodles",
|
|
"195": "catching frisbee",
|
|
"196": "fruits",
|
|
"197": "net",
|
|
"198": "eating",
|
|
"199": "england",
|
|
"200": "grass",
|
|
"201": "british",
|
|
"202": "red and gray",
|
|
"203": "woods",
|
|
"204": "united states",
|
|
"205": "windows",
|
|
"206": "blue",
|
|
"207": "red and blue",
|
|
"208": "taking picture",
|
|
"209": "australia",
|
|
"210": "hay",
|
|
"211": "junk"
|
|
},
|
|
"image_size": 384,
|
|
"initializer_range": 0.02,
|
|
"intermediate_size": 3072,
|
|
"label2id": {
|
|
"0": 139,
|
|
"1": 8,
|
|
"15": 175,
|
|
"16": 94,
|
|
"2": 7,
|
|
"20": 4,
|
|
"21": 91,
|
|
"25": 166,
|
|
"38": 135,
|
|
"39": 44,
|
|
"4": 86,
|
|
"40": 32,
|
|
"50": 87,
|
|
"8": 80,
|
|
"9": 17,
|
|
"air": 38,
|
|
"airplane": 117,
|
|
"airport": 127,
|
|
"america": 27,
|
|
"angry": 47,
|
|
"australia": 209,
|
|
"backpack": 69,
|
|
"banana": 172,
|
|
"bananas": 193,
|
|
"bikes": 61,
|
|
"black": 151,
|
|
"black and white": 84,
|
|
"black white": 34,
|
|
"blue": 206,
|
|
"blue and red": 104,
|
|
"board": 115,
|
|
"boat": 30,
|
|
"branches": 168,
|
|
"brick": 52,
|
|
"bridge": 45,
|
|
"british": 201,
|
|
"broccoli": 48,
|
|
"buildings": 40,
|
|
"bus": 26,
|
|
"bush": 186,
|
|
"can't tell": 140,
|
|
"canopy": 97,
|
|
"car": 170,
|
|
"carpet": 67,
|
|
"catch frisbee": 42,
|
|
"catching frisbee": 195,
|
|
"clear": 92,
|
|
"cold": 111,
|
|
"colored": 73,
|
|
"comfort": 155,
|
|
"computers": 187,
|
|
"concentration": 147,
|
|
"copyright": 179,
|
|
"court": 24,
|
|
"cows": 5,
|
|
"curtain": 66,
|
|
"cycling": 18,
|
|
"dell": 138,
|
|
"diamond": 182,
|
|
"diamonds": 49,
|
|
"dirt": 107,
|
|
"dog": 112,
|
|
"don't know": 83,
|
|
"eating": 198,
|
|
"england": 199,
|
|
"fabric": 142,
|
|
"food": 64,
|
|
"for fun": 100,
|
|
"frame": 55,
|
|
"freezer": 165,
|
|
"fridge": 158,
|
|
"frisbee": 56,
|
|
"fruit": 161,
|
|
"fruits": 196,
|
|
"fun": 183,
|
|
"germany": 46,
|
|
"glass": 154,
|
|
"glasses": 134,
|
|
"grass": 200,
|
|
"gravel": 103,
|
|
"gray": 156,
|
|
"gray and red": 20,
|
|
"grazing": 3,
|
|
"green": 25,
|
|
"green and white": 19,
|
|
"ground": 180,
|
|
"hallway": 82,
|
|
"hay": 210,
|
|
"hexagon": 99,
|
|
"highway": 178,
|
|
"home": 184,
|
|
"hotel": 121,
|
|
"in car": 150,
|
|
"indoors": 188,
|
|
"inside": 36,
|
|
"jeans": 167,
|
|
"junk": 211,
|
|
"kicking": 189,
|
|
"lace": 21,
|
|
"laptops": 53,
|
|
"lights": 129,
|
|
"lines": 72,
|
|
"living room": 106,
|
|
"looking out window": 169,
|
|
"lot": 130,
|
|
"love": 0,
|
|
"magnet": 11,
|
|
"man": 71,
|
|
"many": 164,
|
|
"mcdonald's": 2,
|
|
"mets": 62,
|
|
"mouse": 28,
|
|
"net": 197,
|
|
"never": 98,
|
|
"no": 6,
|
|
"no light": 125,
|
|
"noodles": 194,
|
|
"not": 51,
|
|
"not sure": 191,
|
|
"nothing": 74,
|
|
"nowhere": 50,
|
|
"octagon": 119,
|
|
"on sidewalk": 144,
|
|
"paddle boarding": 29,
|
|
"paddling": 85,
|
|
"paint": 77,
|
|
"painting": 89,
|
|
"parasailing": 159,
|
|
"park": 131,
|
|
"pasta": 124,
|
|
"people": 141,
|
|
"pitching": 57,
|
|
"plane": 113,
|
|
"plants": 136,
|
|
"playing": 31,
|
|
"playing frisbee": 133,
|
|
"playing game": 146,
|
|
"playing video games": 43,
|
|
"pole": 59,
|
|
"poles": 95,
|
|
"posing": 108,
|
|
"privacy": 93,
|
|
"purse": 14,
|
|
"race": 174,
|
|
"racing": 68,
|
|
"red": 114,
|
|
"red and blue": 207,
|
|
"red and gray": 202,
|
|
"red and white": 148,
|
|
"red white and blue": 9,
|
|
"refrigerator": 39,
|
|
"relaxing": 88,
|
|
"remote": 102,
|
|
"remote control": 157,
|
|
"room": 76,
|
|
"safety": 90,
|
|
"salt": 105,
|
|
"sand": 54,
|
|
"several": 41,
|
|
"shade": 149,
|
|
"skateboard": 81,
|
|
"ski poles": 192,
|
|
"skis": 163,
|
|
"sleeping": 160,
|
|
"smile": 181,
|
|
"spoon": 162,
|
|
"square": 16,
|
|
"squares": 37,
|
|
"standing": 120,
|
|
"straw": 145,
|
|
"stuffed animal": 78,
|
|
"sun": 13,
|
|
"sunglasses": 153,
|
|
"sunny": 110,
|
|
"surfboard": 126,
|
|
"surfing": 12,
|
|
"taking picture": 208,
|
|
"tank": 10,
|
|
"teddy bear": 15,
|
|
"tennis": 96,
|
|
"tennis court": 176,
|
|
"throwing frisbee": 185,
|
|
"tile": 70,
|
|
"tired": 109,
|
|
"toothbrush": 33,
|
|
"tracks": 132,
|
|
"traffic": 171,
|
|
"train": 60,
|
|
"trash": 1,
|
|
"travel": 101,
|
|
"tree": 65,
|
|
"uk": 22,
|
|
"united states": 204,
|
|
"unknown": 190,
|
|
"unsure": 116,
|
|
"us": 79,
|
|
"usa": 137,
|
|
"waiting": 75,
|
|
"wall": 118,
|
|
"warmth": 23,
|
|
"water": 173,
|
|
"white": 152,
|
|
"white and black": 128,
|
|
"white and red": 122,
|
|
"wii": 177,
|
|
"windows": 205,
|
|
"windsurfing": 58,
|
|
"wood": 63,
|
|
"woods": 203,
|
|
"working": 123,
|
|
"yellow": 143,
|
|
"yes": 35
|
|
},
|
|
"layer_norm_eps": 1e-12,
|
|
"max_image_length": -1,
|
|
"max_position_embeddings": 40,
|
|
"modality_type_vocab_size": 2,
|
|
"model_type": "vilt",
|
|
"num_attention_heads": 12,
|
|
"num_channels": 3,
|
|
"num_hidden_layers": 12,
|
|
"num_images": -1,
|
|
"patch_size": 32,
|
|
"qkv_bias": true,
|
|
"tie_word_embeddings": false,
|
|
"torch_dtype": "float32",
|
|
"transformers_version": "4.40.1",
|
|
"type_vocab_size": 2,
|
|
"vocab_size": 30522
|
|
}
|
|
|