Spaces:

Pinwheel
/

GLIP-BLIP-Object-Detection-VQA

Runtime error

App Files Files Community

GLIP-BLIP-Object-Detection-VQA / maskrcnn_benchmark /modeling /roi_heads /mask_head /mask_head.py

Pinwheel

HF Demo

128757a about 3 years ago

raw

history blame contribute delete

3.49 kB

	# Copyright (c) Facebook, Inc. and its affiliates. All Rights Reserved.
	import torch
	from torch import nn

	from maskrcnn_benchmark.structures.bounding_box import BoxList

	from .roi_mask_feature_extractors import make_roi_mask_feature_extractor
	from .roi_mask_predictors import make_roi_mask_predictor
	from .inference import make_roi_mask_post_processor
	from .loss import make_roi_mask_loss_evaluator


	def keep_only_positive_boxes(boxes):
	"""
	Given a set of BoxList containing the `labels` field,
	return a set of BoxList for which `labels > 0`.

	Arguments:
	boxes (list of BoxList)
	"""
	assert isinstance(boxes, (list, tuple))
	assert isinstance(boxes[0], BoxList)
	assert boxes[0].has_field("labels")
	positive_boxes = []
	positive_inds = []
	num_boxes = 0
	for boxes_per_image in boxes:
	labels = boxes_per_image.get_field("labels")
	inds_mask = labels > 0
	inds = inds_mask.nonzero().squeeze(1)
	positive_boxes.append(boxes_per_image[inds])
	positive_inds.append(inds_mask)
	return positive_boxes, positive_inds


	class ROIMaskHead(torch.nn.Module):
	def __init__(self, cfg):
	super(ROIMaskHead, self).__init__()
	self.cfg = cfg.clone()
	self.feature_extractor = make_roi_mask_feature_extractor(cfg)
	self.predictor = make_roi_mask_predictor(cfg)
	self.post_processor = make_roi_mask_post_processor(cfg)
	self.loss_evaluator = make_roi_mask_loss_evaluator(cfg)

	def forward(self, features, proposals, targets=None,
	language_dict_features=None,
	positive_map_label_to_token=None
	):
	"""
	Arguments:
	features (list[Tensor]): feature-maps from possibly several levels
	proposals (list[BoxList]): proposal boxes
	targets (list[BoxList], optional): the ground-truth targets.
	language_dict_features: language features: hidden, embedding, mask, ...

	Returns:
	x (Tensor): the result of the feature extractor
	proposals (list[BoxList]): during training, the original proposals
	are returned. During testing, the predicted boxlists are returned
	with the `mask` field set
	losses (dict[Tensor]): During training, returns the losses for the
	head. During testing, returns an empty dict.
	"""
	if self.training:
	# during training, only focus on positive boxes
	all_proposals = proposals
	proposals, positive_inds = keep_only_positive_boxes(proposals)
	if self.training and self.cfg.MODEL.ROI_MASK_HEAD.SHARE_BOX_FEATURE_EXTRACTOR:
	x = features
	x = x[torch.cat(positive_inds, dim=0)]
	else:
	x = self.feature_extractor(features, proposals)
	if self.cfg.MODEL.ROI_MASK_HEAD.PREDICTOR.startswith("VL"):
	mask_logits = self.predictor(x, language_dict_features)
	else:
	mask_logits = self.predictor(x)

	if not self.training:
	result = self.post_processor(mask_logits, proposals, positive_map_label_to_token)
	return x, result, {}

	loss_mask = self.loss_evaluator(proposals, mask_logits, targets)

	return x, all_proposals, dict(loss_mask=loss_mask)


	def build_roi_mask_head(cfg):
	return ROIMaskHead(cfg)