Spaces:
Runtime error
Runtime error
| # Copyright (c) Facebook, Inc. and its affiliates. All Rights Reserved. | |
| import torch | |
| from torch import nn | |
| from maskrcnn_benchmark.structures.bounding_box import BoxList | |
| from .roi_mask_feature_extractors import make_roi_mask_feature_extractor | |
| from .roi_mask_predictors import make_roi_mask_predictor | |
| from .inference import make_roi_mask_post_processor | |
| from .loss import make_roi_mask_loss_evaluator | |
| def keep_only_positive_boxes(boxes): | |
| """ | |
| Given a set of BoxList containing the `labels` field, | |
| return a set of BoxList for which `labels > 0`. | |
| Arguments: | |
| boxes (list of BoxList) | |
| """ | |
| assert isinstance(boxes, (list, tuple)) | |
| assert isinstance(boxes[0], BoxList) | |
| assert boxes[0].has_field("labels") | |
| positive_boxes = [] | |
| positive_inds = [] | |
| num_boxes = 0 | |
| for boxes_per_image in boxes: | |
| labels = boxes_per_image.get_field("labels") | |
| inds_mask = labels > 0 | |
| inds = inds_mask.nonzero().squeeze(1) | |
| positive_boxes.append(boxes_per_image[inds]) | |
| positive_inds.append(inds_mask) | |
| return positive_boxes, positive_inds | |
| class ROIMaskHead(torch.nn.Module): | |
| def __init__(self, cfg): | |
| super(ROIMaskHead, self).__init__() | |
| self.cfg = cfg.clone() | |
| self.feature_extractor = make_roi_mask_feature_extractor(cfg) | |
| self.predictor = make_roi_mask_predictor(cfg) | |
| self.post_processor = make_roi_mask_post_processor(cfg) | |
| self.loss_evaluator = make_roi_mask_loss_evaluator(cfg) | |
| def forward(self, features, proposals, targets=None, | |
| language_dict_features=None, | |
| positive_map_label_to_token=None | |
| ): | |
| """ | |
| Arguments: | |
| features (list[Tensor]): feature-maps from possibly several levels | |
| proposals (list[BoxList]): proposal boxes | |
| targets (list[BoxList], optional): the ground-truth targets. | |
| language_dict_features: language features: hidden, embedding, mask, ... | |
| Returns: | |
| x (Tensor): the result of the feature extractor | |
| proposals (list[BoxList]): during training, the original proposals | |
| are returned. During testing, the predicted boxlists are returned | |
| with the `mask` field set | |
| losses (dict[Tensor]): During training, returns the losses for the | |
| head. During testing, returns an empty dict. | |
| """ | |
| if self.training: | |
| # during training, only focus on positive boxes | |
| all_proposals = proposals | |
| proposals, positive_inds = keep_only_positive_boxes(proposals) | |
| if self.training and self.cfg.MODEL.ROI_MASK_HEAD.SHARE_BOX_FEATURE_EXTRACTOR: | |
| x = features | |
| x = x[torch.cat(positive_inds, dim=0)] | |
| else: | |
| x = self.feature_extractor(features, proposals) | |
| if self.cfg.MODEL.ROI_MASK_HEAD.PREDICTOR.startswith("VL"): | |
| mask_logits = self.predictor(x, language_dict_features) | |
| else: | |
| mask_logits = self.predictor(x) | |
| if not self.training: | |
| result = self.post_processor(mask_logits, proposals, positive_map_label_to_token) | |
| return x, result, {} | |
| loss_mask = self.loss_evaluator(proposals, mask_logits, targets) | |
| return x, all_proposals, dict(loss_mask=loss_mask) | |
| def build_roi_mask_head(cfg): | |
| return ROIMaskHead(cfg) | |