{ "_name_or_path": "facebook/detr-resnet-50", "activation_dropout": 0.0, "activation_function": "relu", "architectures": [ "DetrForObjectDetection" ], "attention_dropout": 0.0, "auxiliary_loss": false, "backbone": "resnet50", "backbone_config": null, "backbone_kwargs": { "in_chans": 3, "out_indices": [ 1, 2, 3, 4 ] }, "bbox_cost": 5, "bbox_loss_coefficient": 5, "class_cost": 1, "classifier_dropout": 0.0, "d_model": 256, "decoder_attention_heads": 8, "decoder_ffn_dim": 2048, "decoder_layerdrop": 0.0, "decoder_layers": 6, "dice_loss_coefficient": 1, "dilation": false, "dropout": 0.1, "encoder_attention_heads": 8, "encoder_ffn_dim": 2048, "encoder_layerdrop": 0.0, "encoder_layers": 6, "eos_coefficient": 0.1, "giou_cost": 2, "giou_loss_coefficient": 2, "id2label": { "1": 28, "2": 30, "3": 72, "4": 73, "5": 81, "6": 80, "7": 78, "8": 79, "9": 53, "10": 3, "11": 81, "12": 80, "13": 78, "14": 92, "15": 101, "16": 100, "17": 102, "18": 95, "19": 96, "20": 90, "21": 91, "22": 28, "23": 29, "24": 74, "25": 94, "26": 92, "27": 25, "28": 23, "29": 24, "30": 92, "31": 93, "32": 52, "33": 36, "34": 37, "35": 38, "36": 82, "37": 83, "38": 32, "39": 42, "40": 43, "41": 14, "42": 16, "43": 74, "44": 23, "45": 24, "46": 57, "47": 58, "48": 20, "49": 19, "50": 50, "51": 8, "52": 63, "53": 76, "54": 77, "55": 8, "56": 35, "57": 34, "58": 15, "59": 12, "60": 53, "61": 101, "62": 100, "63": 102, "64": 51, "65": 39, "66": 40, "67": 7, "68": 9, "69": 74, "70": 75, "71": 7, "72": 10, "73": 67, "74": 47, "75": 48, "76": 44, "77": 45, "78": 46, "79": 31, "80": 87, "81": 89, "82": 97, "83": 98, "84": 99, "85": 84, "86": 28, "87": 29, "88": 103, "89": 104, "90": 105, "91": 32, "92": 33, "93": 26, "94": 22, "95": 20, "96": 19, "97": 98, "98": 99, "99": 21, "100": 15, "101": 12, "102": 51, "103": 10, "104": 87, "105": 85, "106": 86, "107": 97, "108": 98, "109": 99, "110": 49, "111": 26, "112": 27, "113": 68, "114": 17, "115": 69, "116": 53, "117": 1, "118": 14, "119": 63, "120": 63, "121": 11, "122": 13, "123": 6, "124": 63, "125": 64, "126": 54, "127": 55, "128": 56, "129": 57, "130": 58, "131": 70, "132": 18, "133": 67, "134": 106, "135": 107, "136": 2, "137": 59, "138": 60, "139": 35, "140": 34, "141": 61, "142": 62, "143": 41, "144": 42, "145": 106, "146": 107, "147": 2, "148": 83, "149": 66, "150": 20, "151": 19, "152": 72, "153": 87, "154": 88, "155": 61, "156": 62, "157": 70, "158": 71, "159": 4 }, "init_std": 0.02, "init_xavier_std": 1.0, "is_encoder_decoder": true, "label2id": { "1": 117, "2": 147, "3": 10, "4": 159, "6": 123, "7": 71, "8": 55, "9": 68, "10": 103, "11": 121, "12": 101, "13": 122, "14": 118, "15": 100, "16": 42, "17": 114, "18": 132, "19": 151, "20": 150, "21": 99, "22": 94, "23": 44, "24": 45, "25": 27, "26": 111, "27": 112, "28": 86, "29": 87, "30": 2, "31": 79, "32": 91, "33": 92, "34": 140, "35": 139, "36": 33, "37": 34, "38": 35, "39": 65, "40": 66, "41": 143, "42": 144, "43": 40, "44": 76, "45": 77, "46": 78, "47": 74, "48": 75, "49": 110, "50": 50, "51": 102, "52": 32, "53": 116, "54": 126, "55": 127, "56": 128, "57": 129, "58": 130, "59": 137, "60": 138, "61": 155, "62": 156, "63": 124, "64": 125, "66": 149, "67": 133, "68": 113, "69": 115, "70": 157, "71": 158, "72": 152, "73": 4, "74": 69, "75": 70, "76": 53, "77": 54, "78": 13, "79": 8, "80": 12, "81": 11, "82": 36, "83": 148, "84": 85, "85": 105, "86": 106, "87": 153, "88": 154, "89": 81, "90": 20, "91": 21, "92": 30, "93": 31, "94": 25, "95": 18, "96": 19, "97": 107, "98": 108, "99": 109, "100": 62, "101": 61, "102": 63, "103": 88, "104": 89, "105": 90, "106": 145, "107": 146 }, "mask_loss_coefficient": 1, "max_position_embeddings": 1024, "model_type": "detr", "num_channels": 3, "num_hidden_layers": 6, "num_queries": 100, "position_embedding_type": "sine", "scale_embedding": false, "torch_dtype": "float32", "transformers_version": "4.41.0", "use_pretrained_backbone": true, "use_timm_backbone": true }