{
  "_name_or_path": "facebook/detr-resnet-50-dc5",
  "activation_dropout": 0.0,
  "activation_function": "relu",
  "architectures": [
    "DetrForObjectDetection"
  ],
  "attention_dropout": 0.0,
  "auxiliary_loss": false,
  "backbone": "resnet50",
  "backbone_config": null,
  "backbone_kwargs": {
    "in_chans": 3,
    "out_indices": [
      1,
      2,
      3,
      4
    ],
    "output_stride": 16
  },
  "bbox_cost": 5,
  "bbox_loss_coefficient": 5,
  "class_cost": 1,
  "classifier_dropout": 0.0,
  "d_model": 256,
  "decoder_attention_heads": 8,
  "decoder_ffn_dim": 2048,
  "decoder_layerdrop": 0.0,
  "decoder_layers": 6,
  "dice_loss_coefficient": 1,
  "dilation": true,
  "dropout": 0.1,
  "encoder_attention_heads": 8,
  "encoder_ffn_dim": 2048,
  "encoder_layerdrop": 0.0,
  "encoder_layers": 6,
  "eos_coefficient": 0.1,
  "giou_cost": 2,
  "giou_loss_coefficient": 2,
  "id2label": {
    "0": "N/A",
    "1": "person",
    "10": "traffic light",
    "11": "fire hydrant",
    "12": "N/A",
    "13": "stop sign",
    "14": "parking meter",
    "15": "bench",
    "16": "bird",
    "17": "cat",
    "18": "dog",
    "19": "horse",
    "2": "bicycle",
    "20": "sheep",
    "21": "cow",
    "22": "elephant",
    "23": "bear",
    "24": "zebra",
    "25": "giraffe",
    "26": "N/A",
    "27": "backpack",
    "28": "umbrella",
    "29": "N/A",
    "3": "car",
    "30": "N/A",
    "31": "handbag",
    "32": "tie",
    "33": "suitcase",
    "34": "frisbee",
    "35": "skis",
    "36": "snowboard",
    "37": "sports ball",
    "38": "kite",
    "39": "baseball bat",
    "4": "motorcycle",
    "40": "baseball glove",
    "41": "skateboard",
    "42": "surfboard",
    "43": "tennis racket",
    "44": "bottle",
    "45": "N/A",
    "46": "wine glass",
    "47": "cup",
    "48": "fork",
    "49": "knife",
    "5": "airplane",
    "50": "spoon",
    "51": "bowl",
    "52": "banana",
    "53": "apple",
    "54": "sandwich",
    "55": "orange",
    "56": "broccoli",
    "57": "carrot",
    "58": "hot dog",
    "59": "pizza",
    "6": "bus",
    "60": "donut",
    "61": "cake",
    "62": "chair",
    "63": "couch",
    "64": "potted plant",
    "65": "bed",
    "66": "N/A",
    "67": "dining table",
    "68": "N/A",
    "69": "N/A",
    "7": "train",
    "70": "toilet",
    "71": "N/A",
    "72": "tv",
    "73": "laptop",
    "74": "mouse",
    "75": "remote",
    "76": "keyboard",
    "77": "cell phone",
    "78": "microwave",
    "79": "oven",
    "8": "truck",
    "80": "toaster",
    "81": "sink",
    "82": "refrigerator",
    "83": "N/A",
    "84": "book",
    "85": "clock",
    "86": "vase",
    "87": "scissors",
    "88": "teddy bear",
    "89": "hair drier",
    "9": "boat",
    "90": "toothbrush"
  },
  "init_std": 0.02,
  "init_xavier_std": 1.0,
  "is_encoder_decoder": true,
  "label2id": {
    "N/A": 83,
    "airplane": 5,
    "apple": 53,
    "backpack": 27,
    "banana": 52,
    "baseball bat": 39,
    "baseball glove": 40,
    "bear": 23,
    "bed": 65,
    "bench": 15,
    "bicycle": 2,
    "bird": 16,
    "boat": 9,
    "book": 84,
    "bottle": 44,
    "bowl": 51,
    "broccoli": 56,
    "bus": 6,
    "cake": 61,
    "car": 3,
    "carrot": 57,
    "cat": 17,
    "cell phone": 77,
    "chair": 62,
    "clock": 85,
    "couch": 63,
    "cow": 21,
    "cup": 47,
    "dining table": 67,
    "dog": 18,
    "donut": 60,
    "elephant": 22,
    "fire hydrant": 11,
    "fork": 48,
    "frisbee": 34,
    "giraffe": 25,
    "hair drier": 89,
    "handbag": 31,
    "horse": 19,
    "hot dog": 58,
    "keyboard": 76,
    "kite": 38,
    "knife": 49,
    "laptop": 73,
    "microwave": 78,
    "motorcycle": 4,
    "mouse": 74,
    "orange": 55,
    "oven": 79,
    "parking meter": 14,
    "person": 1,
    "pizza": 59,
    "potted plant": 64,
    "refrigerator": 82,
    "remote": 75,
    "sandwich": 54,
    "scissors": 87,
    "sheep": 20,
    "sink": 81,
    "skateboard": 41,
    "skis": 35,
    "snowboard": 36,
    "spoon": 50,
    "sports ball": 37,
    "stop sign": 13,
    "suitcase": 33,
    "surfboard": 42,
    "teddy bear": 88,
    "tennis racket": 43,
    "tie": 32,
    "toaster": 80,
    "toilet": 70,
    "toothbrush": 90,
    "traffic light": 10,
    "train": 7,
    "truck": 8,
    "tv": 72,
    "umbrella": 28,
    "vase": 86,
    "wine glass": 46,
    "zebra": 24
  },
  "mask_loss_coefficient": 1,
  "max_position_embeddings": 1024,
  "model_type": "detr",
  "num_channels": 3,
  "num_hidden_layers": 6,
  "num_queries": 100,
  "position_embedding_type": "sine",
  "scale_embedding": false,
  "torch_dtype": "float32",
  "transformers_version": "4.47.1",
  "use_pretrained_backbone": true,
  "use_timm_backbone": true
}