| """
|
| Integrate numerical values for some iterations
|
| Typically used for loss computation / logging to tensorboard
|
| Call finalize and create a new Integrator when you want to display/log
|
| """
|
| from typing import Callable, Union
|
|
|
| import torch
|
|
|
| from .logger import TensorboardLogger
|
| from .tensor_utils import distribute_into_histogram
|
|
|
|
|
class Integrator:
    """Accumulate scalar metrics and binned tensors over several iterations.

    Scalars are summed per key together with a per-key call count. `finalize`
    turns each sum into an average, optionally reduces it across ranks with
    `torch.distributed`, and forwards the result to the logger. Binned tensors
    are kept as lists of flattened chunks and turned into histograms when
    `finalize` runs.
    """

    def __init__(self, logger: TensorboardLogger, distributed: bool = True):
        """Create an empty integrator.

        Args:
            logger: object whose `log_metrics` and `log_histogram` methods are
                called by `finalize`.
            distributed: when True, `finalize` reduces every value onto rank 0
                via `torch.distributed` and only rank 0 logs.
        """
        self.values = {}
        self.counts = {}
        self.hooks = []

        # Per-key lists of flattened value chunks and their matching bin indices.
        self.binned_tensors = {}
        self.binned_tensor_indices = {}

        self.logger = logger
        self.distributed = distributed

        # Only query the process group when it is required (distributed mode,
        # where a missing group should still raise) or when one happens to
        # exist. This lets a non-distributed Integrator be constructed in a
        # plain single-process run.
        group_ready = (torch.distributed.is_available()
                       and torch.distributed.is_initialized())
        if distributed or group_ready:
            self.local_rank = torch.distributed.get_rank()
            self.world_size = torch.distributed.get_world_size()
        else:
            self.local_rank = 0
            self.world_size = 1

    def add_scalar(self, key: str, x: Union[torch.Tensor, int, float]):
        """Add `x` to the running sum stored under `key` and bump its count.

        Tensors are detached first; tensors that are neither floating-point nor
        complex (integer and bool dtypes) are converted to float before being
        accumulated.
        """
        if isinstance(x, torch.Tensor):
            x = x.detach()
            if not (x.is_floating_point() or x.is_complex()):
                x = x.float()

        if key in self.values:
            self.counts[key] += 1
            # Out-of-place add: the stored sum may share storage with the first
            # tensor the caller passed in (detach() does not copy), so an
            # in-place `+=` would silently modify the caller's tensor.
            self.values[key] = self.values[key] + x
        else:
            self.counts[key] = 1
            self.values[key] = x

    def add_dict(self, tensor_dict: dict[str, torch.Tensor]):
        """Call `add_scalar` for every (key, value) pair of `tensor_dict`."""
        for k, v in tensor_dict.items():
            self.add_scalar(k, v)

    def add_binned_tensor(self, key: str, x: torch.Tensor, indices: torch.Tensor):
        """Store a detached, flattened copy of `x` and `indices` under `key`.

        The chunks are concatenated and passed to `distribute_into_histogram`
        when `finalize` runs.
        """
        self.binned_tensors.setdefault(key, []).append(x.detach().flatten())
        self.binned_tensor_indices.setdefault(key, []).append(indices.detach().flatten())

    def add_hook(self, hook: Callable[[dict], tuple[str, Union[torch.Tensor, int, float]]]):
        """
        Adds a custom hook, i.e. compute new metrics using values in the dict
        The hook takes the dict as argument, and returns a (k, v) tuple
        e.g. for computing IoU
        """
        self.hooks.append(hook)

    def reset_except_hooks(self):
        """Drop all accumulated scalars and binned tensors; keep the hooks."""
        self.values = {}
        self.counts = {}
        # Binned chunks must be cleared as well, otherwise they keep growing and
        # get logged again by every later `finalize`.
        self.binned_tensors = {}
        self.binned_tensor_indices = {}

    def finalize(self, prefix: str, it: int, ignore_timer: bool = False) -> None:
        """Average the accumulated values and send them to the logger.

        Args:
            prefix: passed to `log_metrics`, and used as `{prefix}/{key}` for
                histograms.
            it: iteration number forwarded to the logger.
            ignore_timer: forwarded to `log_metrics`.
        """
        # Hooks derive extra metrics from the raw sums; their results are
        # accumulated like any other scalar.
        for hook in self.hooks:
            k, v = hook(self.values)
            self.add_scalar(k, v)

        should_log = (not self.distributed) or (self.local_rank == 0)

        outputs = {}
        for k, v in self.values.items():
            avg = v / self.counts[k]
            if not self.distributed:
                outputs[k] = avg
                continue

            # The reduction operates on CUDA tensors, so plain numbers are
            # wrapped in a tensor first.
            if not isinstance(avg, torch.Tensor):
                avg = torch.tensor(avg)
            avg = avg.cuda()
            torch.distributed.reduce(avg, dst=0)

            # Only rank 0 holds the reduced sum; divide by the world size to
            # get the mean over ranks.
            if self.local_rank == 0:
                outputs[k] = (avg / self.world_size).cpu().item()

        if should_log:
            self.logger.log_metrics(prefix, outputs, it, ignore_timer=ignore_timer)

        for k, chunks in self.binned_tensors.items():
            x = torch.cat(chunks, dim=0)
            indices = torch.cat(self.binned_tensor_indices[k], dim=0)
            hist, count = distribute_into_histogram(x, indices)

            if self.distributed:
                torch.distributed.reduce(hist, dst=0)
                torch.distributed.reduce(count, dst=0)
                # Non-zero ranks never log, so only rank 0 needs the normalised
                # histogram.
                if self.local_rank == 0:
                    hist = hist / count
            else:
                hist = hist / count

            if should_log:
                self.logger.log_histogram(f'{prefix}/{k}', hist, it)
|
|
|