|
|
|
import os |
|
from typing import Optional |
|
import pkg_resources |
|
import torch |
|
|
|
from annotator.oneformer.detectron2.checkpoint import DetectionCheckpointer |
|
from annotator.oneformer.detectron2.config import CfgNode, LazyConfig, get_cfg, instantiate |
|
from annotator.oneformer.detectron2.modeling import build_model |
|
|
|
|
|
class _ModelZooUrls(object): |
|
""" |
|
Mapping from names to officially released Detectron2 pre-trained models. |
|
""" |
|
|
|
S3_PREFIX = "https://dl.fbaipublicfiles.com/detectron2/" |
|
|
|
|
|
CONFIG_PATH_TO_URL_SUFFIX = { |
|
|
|
"COCO-Detection/faster_rcnn_R_50_C4_1x": "137257644/model_final_721ade.pkl", |
|
"COCO-Detection/faster_rcnn_R_50_DC5_1x": "137847829/model_final_51d356.pkl", |
|
"COCO-Detection/faster_rcnn_R_50_FPN_1x": "137257794/model_final_b275ba.pkl", |
|
"COCO-Detection/faster_rcnn_R_50_C4_3x": "137849393/model_final_f97cb7.pkl", |
|
"COCO-Detection/faster_rcnn_R_50_DC5_3x": "137849425/model_final_68d202.pkl", |
|
"COCO-Detection/faster_rcnn_R_50_FPN_3x": "137849458/model_final_280758.pkl", |
|
"COCO-Detection/faster_rcnn_R_101_C4_3x": "138204752/model_final_298dad.pkl", |
|
"COCO-Detection/faster_rcnn_R_101_DC5_3x": "138204841/model_final_3e0943.pkl", |
|
"COCO-Detection/faster_rcnn_R_101_FPN_3x": "137851257/model_final_f6e8b1.pkl", |
|
"COCO-Detection/faster_rcnn_X_101_32x8d_FPN_3x": "139173657/model_final_68b088.pkl", |
|
|
|
"COCO-Detection/retinanet_R_50_FPN_1x": "190397773/model_final_bfca0b.pkl", |
|
"COCO-Detection/retinanet_R_50_FPN_3x": "190397829/model_final_5bd44e.pkl", |
|
"COCO-Detection/retinanet_R_101_FPN_3x": "190397697/model_final_971ab9.pkl", |
|
|
|
"COCO-Detection/rpn_R_50_C4_1x": "137258005/model_final_450694.pkl", |
|
"COCO-Detection/rpn_R_50_FPN_1x": "137258492/model_final_02ce48.pkl", |
|
"COCO-Detection/fast_rcnn_R_50_FPN_1x": "137635226/model_final_e5f7ce.pkl", |
|
|
|
"COCO-InstanceSegmentation/mask_rcnn_R_50_C4_1x": "137259246/model_final_9243eb.pkl", |
|
"COCO-InstanceSegmentation/mask_rcnn_R_50_DC5_1x": "137260150/model_final_4f86c3.pkl", |
|
"COCO-InstanceSegmentation/mask_rcnn_R_50_FPN_1x": "137260431/model_final_a54504.pkl", |
|
"COCO-InstanceSegmentation/mask_rcnn_R_50_C4_3x": "137849525/model_final_4ce675.pkl", |
|
"COCO-InstanceSegmentation/mask_rcnn_R_50_DC5_3x": "137849551/model_final_84107b.pkl", |
|
"COCO-InstanceSegmentation/mask_rcnn_R_50_FPN_3x": "137849600/model_final_f10217.pkl", |
|
"COCO-InstanceSegmentation/mask_rcnn_R_101_C4_3x": "138363239/model_final_a2914c.pkl", |
|
"COCO-InstanceSegmentation/mask_rcnn_R_101_DC5_3x": "138363294/model_final_0464b7.pkl", |
|
"COCO-InstanceSegmentation/mask_rcnn_R_101_FPN_3x": "138205316/model_final_a3ec72.pkl", |
|
"COCO-InstanceSegmentation/mask_rcnn_X_101_32x8d_FPN_3x": "139653917/model_final_2d9806.pkl", |
|
|
|
"new_baselines/mask_rcnn_R_50_FPN_100ep_LSJ": "42047764/model_final_bb69de.pkl", |
|
"new_baselines/mask_rcnn_R_50_FPN_200ep_LSJ": "42047638/model_final_89a8d3.pkl", |
|
"new_baselines/mask_rcnn_R_50_FPN_400ep_LSJ": "42019571/model_final_14d201.pkl", |
|
"new_baselines/mask_rcnn_R_101_FPN_100ep_LSJ": "42025812/model_final_4f7b58.pkl", |
|
"new_baselines/mask_rcnn_R_101_FPN_200ep_LSJ": "42131867/model_final_0bb7ae.pkl", |
|
"new_baselines/mask_rcnn_R_101_FPN_400ep_LSJ": "42073830/model_final_f96b26.pkl", |
|
"new_baselines/mask_rcnn_regnetx_4gf_dds_FPN_100ep_LSJ": "42047771/model_final_b7fbab.pkl", |
|
"new_baselines/mask_rcnn_regnetx_4gf_dds_FPN_200ep_LSJ": "42132721/model_final_5d87c1.pkl", |
|
"new_baselines/mask_rcnn_regnetx_4gf_dds_FPN_400ep_LSJ": "42025447/model_final_f1362d.pkl", |
|
"new_baselines/mask_rcnn_regnety_4gf_dds_FPN_100ep_LSJ": "42047784/model_final_6ba57e.pkl", |
|
"new_baselines/mask_rcnn_regnety_4gf_dds_FPN_200ep_LSJ": "42047642/model_final_27b9c1.pkl", |
|
"new_baselines/mask_rcnn_regnety_4gf_dds_FPN_400ep_LSJ": "42045954/model_final_ef3a80.pkl", |
|
|
|
"COCO-Keypoints/keypoint_rcnn_R_50_FPN_1x": "137261548/model_final_04e291.pkl", |
|
"COCO-Keypoints/keypoint_rcnn_R_50_FPN_3x": "137849621/model_final_a6e10b.pkl", |
|
"COCO-Keypoints/keypoint_rcnn_R_101_FPN_3x": "138363331/model_final_997cc7.pkl", |
|
"COCO-Keypoints/keypoint_rcnn_X_101_32x8d_FPN_3x": "139686956/model_final_5ad38f.pkl", |
|
|
|
"COCO-PanopticSegmentation/panoptic_fpn_R_50_1x": "139514544/model_final_dbfeb4.pkl", |
|
"COCO-PanopticSegmentation/panoptic_fpn_R_50_3x": "139514569/model_final_c10459.pkl", |
|
"COCO-PanopticSegmentation/panoptic_fpn_R_101_3x": "139514519/model_final_cafdb1.pkl", |
|
|
|
"LVISv0.5-InstanceSegmentation/mask_rcnn_R_50_FPN_1x": "144219072/model_final_571f7c.pkl", |
|
"LVISv0.5-InstanceSegmentation/mask_rcnn_R_101_FPN_1x": "144219035/model_final_824ab5.pkl", |
|
"LVISv0.5-InstanceSegmentation/mask_rcnn_X_101_32x8d_FPN_1x": "144219108/model_final_5e3439.pkl", |
|
|
|
"Cityscapes/mask_rcnn_R_50_FPN": "142423278/model_final_af9cf5.pkl", |
|
"PascalVOC-Detection/faster_rcnn_R_50_C4": "142202221/model_final_b1acc2.pkl", |
|
|
|
"Misc/mask_rcnn_R_50_FPN_1x_dconv_c3-c5": "138602867/model_final_65c703.pkl", |
|
"Misc/mask_rcnn_R_50_FPN_3x_dconv_c3-c5": "144998336/model_final_821d0b.pkl", |
|
"Misc/cascade_mask_rcnn_R_50_FPN_1x": "138602847/model_final_e9d89b.pkl", |
|
"Misc/cascade_mask_rcnn_R_50_FPN_3x": "144998488/model_final_480dd8.pkl", |
|
"Misc/mask_rcnn_R_50_FPN_3x_syncbn": "169527823/model_final_3b3c51.pkl", |
|
"Misc/mask_rcnn_R_50_FPN_3x_gn": "138602888/model_final_dc5d9e.pkl", |
|
"Misc/scratch_mask_rcnn_R_50_FPN_3x_gn": "138602908/model_final_01ca85.pkl", |
|
"Misc/scratch_mask_rcnn_R_50_FPN_9x_gn": "183808979/model_final_da7b4c.pkl", |
|
"Misc/scratch_mask_rcnn_R_50_FPN_9x_syncbn": "184226666/model_final_5ce33e.pkl", |
|
"Misc/panoptic_fpn_R_101_dconv_cascade_gn_3x": "139797668/model_final_be35db.pkl", |
|
"Misc/cascade_mask_rcnn_X_152_32x8d_FPN_IN5k_gn_dconv": "18131413/model_0039999_e76410.pkl", |
|
|
|
"Detectron1-Comparisons/faster_rcnn_R_50_FPN_noaug_1x": "137781054/model_final_7ab50c.pkl", |
|
"Detectron1-Comparisons/mask_rcnn_R_50_FPN_noaug_1x": "137781281/model_final_62ca52.pkl", |
|
"Detectron1-Comparisons/keypoint_rcnn_R_50_FPN_1x": "137781195/model_final_cce136.pkl", |
|
} |
|
|
|
@staticmethod |
|
def query(config_path: str) -> Optional[str]: |
|
""" |
|
Args: |
|
config_path: relative config filename |
|
""" |
|
name = config_path.replace(".yaml", "").replace(".py", "") |
|
if name in _ModelZooUrls.CONFIG_PATH_TO_URL_SUFFIX: |
|
suffix = _ModelZooUrls.CONFIG_PATH_TO_URL_SUFFIX[name] |
|
return _ModelZooUrls.S3_PREFIX + name + "/" + suffix |
|
return None |
|
|
|
|
|
def get_checkpoint_url(config_path): |
|
""" |
|
Returns the URL to the model trained using the given config |
|
|
|
Args: |
|
config_path (str): config file name relative to detectron2's "configs/" |
|
directory, e.g., "COCO-InstanceSegmentation/mask_rcnn_R_50_FPN_1x.yaml" |
|
|
|
Returns: |
|
str: a URL to the model |
|
""" |
|
url = _ModelZooUrls.query(config_path) |
|
if url is None: |
|
raise RuntimeError("Pretrained model for {} is not available!".format(config_path)) |
|
return url |
|
|
|
|
|
def get_config_file(config_path): |
|
""" |
|
Returns path to a builtin config file. |
|
|
|
Args: |
|
config_path (str): config file name relative to detectron2's "configs/" |
|
directory, e.g., "COCO-InstanceSegmentation/mask_rcnn_R_50_FPN_1x.yaml" |
|
|
|
Returns: |
|
str: the real path to the config file. |
|
""" |
|
cfg_file = pkg_resources.resource_filename( |
|
"detectron2.model_zoo", os.path.join("configs", config_path) |
|
) |
|
if not os.path.exists(cfg_file): |
|
raise RuntimeError("{} not available in Model Zoo!".format(config_path)) |
|
return cfg_file |
|
|
|
|
|
def get_config(config_path, trained: bool = False): |
|
""" |
|
Returns a config object for a model in model zoo. |
|
|
|
Args: |
|
config_path (str): config file name relative to detectron2's "configs/" |
|
directory, e.g., "COCO-InstanceSegmentation/mask_rcnn_R_50_FPN_1x.yaml" |
|
trained (bool): If True, will set ``MODEL.WEIGHTS`` to trained model zoo weights. |
|
If False, the checkpoint specified in the config file's ``MODEL.WEIGHTS`` is used |
|
instead; this will typically (though not always) initialize a subset of weights using |
|
an ImageNet pre-trained model, while randomly initializing the other weights. |
|
|
|
Returns: |
|
CfgNode or omegaconf.DictConfig: a config object |
|
""" |
|
cfg_file = get_config_file(config_path) |
|
if cfg_file.endswith(".yaml"): |
|
cfg = get_cfg() |
|
cfg.merge_from_file(cfg_file) |
|
if trained: |
|
cfg.MODEL.WEIGHTS = get_checkpoint_url(config_path) |
|
return cfg |
|
elif cfg_file.endswith(".py"): |
|
cfg = LazyConfig.load(cfg_file) |
|
if trained: |
|
url = get_checkpoint_url(config_path) |
|
if "train" in cfg and "init_checkpoint" in cfg.train: |
|
cfg.train.init_checkpoint = url |
|
else: |
|
raise NotImplementedError |
|
return cfg |
|
|
|
|
|
def get(config_path, trained: bool = False, device: Optional[str] = None): |
|
""" |
|
Get a model specified by relative path under Detectron2's official ``configs/`` directory. |
|
|
|
Args: |
|
config_path (str): config file name relative to detectron2's "configs/" |
|
directory, e.g., "COCO-InstanceSegmentation/mask_rcnn_R_50_FPN_1x.yaml" |
|
trained (bool): see :func:`get_config`. |
|
device (str or None): overwrite the device in config, if given. |
|
|
|
Returns: |
|
nn.Module: a detectron2 model. Will be in training mode. |
|
|
|
Example: |
|
:: |
|
from annotator.oneformer.detectron2 import model_zoo |
|
model = model_zoo.get("COCO-InstanceSegmentation/mask_rcnn_R_50_FPN_1x.yaml", trained=True) |
|
""" |
|
cfg = get_config(config_path, trained) |
|
if device is None and not torch.cuda.is_available(): |
|
device = "cpu" |
|
if device is not None and isinstance(cfg, CfgNode): |
|
cfg.MODEL.DEVICE = device |
|
|
|
if isinstance(cfg, CfgNode): |
|
model = build_model(cfg) |
|
DetectionCheckpointer(model).load(cfg.MODEL.WEIGHTS) |
|
else: |
|
model = instantiate(cfg.model) |
|
if device is not None: |
|
model = model.to(device) |
|
if "train" in cfg and "init_checkpoint" in cfg.train: |
|
DetectionCheckpointer(model).load(cfg.train.init_checkpoint) |
|
return model |
|
|