| import torch |
| import torch.nn as nn |
| import torch.nn.functional as F |
|
|
|
|
| DEFAULT_TRIVEC_CONFIG = { |
| 'dim': 8, |
| 'rank': 8, |
| } |
|
|
| DEFAULT_VOXEL_CONFIG = { |
| 'solid': False, |
| } |
|
|
| DEFAULT_DECOPOLY_CONFIG = { |
| 'degree': 8, |
| 'rank': 16, |
| } |
|
|
|
|
| class DfsOctree: |
| """ |
| Sparse Voxel Octree (SVO) implementation for PyTorch. |
| Using Depth-First Search (DFS) order to store the octree. |
| DFS order suits rendering and ray tracing. |
| |
| The structure and data are separatedly stored. |
| Structure is stored as a continuous array, each element is a 3*32 bits descriptor. |
| |-----------------------------------------| |
| | 0:3 bits | 4:31 bits | |
| | leaf num | unused | |
| |-----------------------------------------| |
| | 0:31 bits | |
| | child ptr | |
| |-----------------------------------------| |
| | 0:31 bits | |
| | data ptr | |
| |-----------------------------------------| |
| Each element represents a non-leaf node in the octree. |
| The valid mask is used to indicate whether the children are valid. |
| The leaf mask is used to indicate whether the children are leaf nodes. |
| The child ptr is used to point to the first non-leaf child. Non-leaf children descriptors are stored continuously from the child ptr. |
| The data ptr is used to point to the data of leaf children. Leaf children data are stored continuously from the data ptr. |
| |
| There are also auxiliary arrays to store the additional structural information to facilitate parallel processing. |
| - Position: the position of the octree nodes. |
| - Depth: the depth of the octree nodes. |
| |
| Args: |
| depth (int): the depth of the octree. |
| """ |
|
|
| def __init__( |
| self, |
| depth, |
| aabb=[0,0,0,1,1,1], |
| sh_degree=2, |
| primitive='voxel', |
| primitive_config={}, |
| device='cuda', |
| ): |
| self.max_depth = depth |
| self.aabb = torch.tensor(aabb, dtype=torch.float32, device=device) |
| self.device = device |
| self.sh_degree = sh_degree |
| self.active_sh_degree = sh_degree |
| self.primitive = primitive |
| self.primitive_config = primitive_config |
|
|
| self.structure = torch.tensor([[8, 1, 0]], dtype=torch.int32, device=self.device) |
| self.position = torch.zeros((8, 3), dtype=torch.float32, device=self.device) |
| self.depth = torch.zeros((8, 1), dtype=torch.uint8, device=self.device) |
| self.position[:, 0] = torch.tensor([0.25, 0.75, 0.25, 0.75, 0.25, 0.75, 0.25, 0.75], device=self.device) |
| self.position[:, 1] = torch.tensor([0.25, 0.25, 0.75, 0.75, 0.25, 0.25, 0.75, 0.75], device=self.device) |
| self.position[:, 2] = torch.tensor([0.25, 0.25, 0.25, 0.25, 0.75, 0.75, 0.75, 0.75], device=self.device) |
| self.depth[:, 0] = 1 |
|
|
| self.data = ['position', 'depth'] |
| self.param_names = [] |
|
|
| if primitive == 'voxel': |
| self.features_dc = torch.zeros((8, 1, 3), dtype=torch.float32, device=self.device) |
| self.features_ac = torch.zeros((8, (sh_degree+1)**2-1, 3), dtype=torch.float32, device=self.device) |
| self.data += ['features_dc', 'features_ac'] |
| self.param_names += ['features_dc', 'features_ac'] |
| if not primitive_config.get('solid', False): |
| self.density = torch.zeros((8, 1), dtype=torch.float32, device=self.device) |
| self.data.append('density') |
| self.param_names.append('density') |
| elif primitive == 'gaussian': |
| self.features_dc = torch.zeros((8, 1, 3), dtype=torch.float32, device=self.device) |
| self.features_ac = torch.zeros((8, (sh_degree+1)**2-1, 3), dtype=torch.float32, device=self.device) |
| self.opacity = torch.zeros((8, 1), dtype=torch.float32, device=self.device) |
| self.data += ['features_dc', 'features_ac', 'opacity'] |
| self.param_names += ['features_dc', 'features_ac', 'opacity'] |
| elif primitive == 'trivec': |
| self.trivec = torch.zeros((8, primitive_config['rank'], 3, primitive_config['dim']), dtype=torch.float32, device=self.device) |
| self.density = torch.zeros((8, primitive_config['rank']), dtype=torch.float32, device=self.device) |
| self.features_dc = torch.zeros((8, primitive_config['rank'], 1, 3), dtype=torch.float32, device=self.device) |
| self.features_ac = torch.zeros((8, primitive_config['rank'], (sh_degree+1)**2-1, 3), dtype=torch.float32, device=self.device) |
| self.density_shift = 0 |
| self.data += ['trivec', 'density', 'features_dc', 'features_ac'] |
| self.param_names += ['trivec', 'density', 'features_dc', 'features_ac'] |
| elif primitive == 'decoupoly': |
| self.decoupoly_V = torch.zeros((8, primitive_config['rank'], 3), dtype=torch.float32, device=self.device) |
| self.decoupoly_g = torch.zeros((8, primitive_config['rank'], primitive_config['degree']), dtype=torch.float32, device=self.device) |
| self.density = torch.zeros((8, primitive_config['rank']), dtype=torch.float32, device=self.device) |
| self.features_dc = torch.zeros((8, primitive_config['rank'], 1, 3), dtype=torch.float32, device=self.device) |
| self.features_ac = torch.zeros((8, primitive_config['rank'], (sh_degree+1)**2-1, 3), dtype=torch.float32, device=self.device) |
| self.density_shift = 0 |
| self.data += ['decoupoly_V', 'decoupoly_g', 'density', 'features_dc', 'features_ac'] |
| self.param_names += ['decoupoly_V', 'decoupoly_g', 'density', 'features_dc', 'features_ac'] |
|
|
| self.setup_functions() |
|
|
| def setup_functions(self): |
| self.density_activation = (lambda x: torch.exp(x - 2)) if self.primitive != 'trivec' else (lambda x: x) |
| self.opacity_activation = lambda x: torch.sigmoid(x - 6) |
| self.inverse_opacity_activation = lambda x: torch.log(x / (1 - x)) + 6 |
| self.color_activation = lambda x: torch.sigmoid(x) |
|
|
| @property |
| def num_non_leaf_nodes(self): |
| return self.structure.shape[0] |
| |
| @property |
| def num_leaf_nodes(self): |
| return self.depth.shape[0] |
|
|
| @property |
| def cur_depth(self): |
| return self.depth.max().item() |
| |
| @property |
| def occupancy(self): |
| return self.num_leaf_nodes / 8 ** self.cur_depth |
| |
| @property |
| def get_xyz(self): |
| return self.position |
|
|
| @property |
| def get_depth(self): |
| return self.depth |
|
|
| @property |
| def get_density(self): |
| if self.primitive == 'voxel' and self.voxel_config['solid']: |
| return torch.full((self.position.shape[0], 1), 1000, dtype=torch.float32, device=self.device) |
| return self.density_activation(self.density) |
| |
| @property |
| def get_opacity(self): |
| return self.opacity_activation(self.density) |
|
|
| @property |
| def get_trivec(self): |
| return self.trivec |
|
|
| @property |
| def get_decoupoly(self): |
| return F.normalize(self.decoupoly_V, dim=-1), self.decoupoly_g |
|
|
| @property |
| def get_color(self): |
| return self.color_activation(self.colors) |
|
|
| @property |
| def get_features(self): |
| if self.sh_degree == 0: |
| return self.features_dc |
| return torch.cat([self.features_dc, self.features_ac], dim=-2) |
|
|
| def state_dict(self): |
| ret = {'structure': self.structure, 'position': self.position, 'depth': self.depth, 'sh_degree': self.sh_degree, 'active_sh_degree': self.active_sh_degree, 'trivec_config': self.trivec_config, 'voxel_config': self.voxel_config, 'primitive': self.primitive} |
| if hasattr(self, 'density_shift'): |
| ret['density_shift'] = self.density_shift |
| for data in set(self.data + self.param_names): |
| if not isinstance(getattr(self, data), nn.Module): |
| ret[data] = getattr(self, data) |
| else: |
| ret[data] = getattr(self, data).state_dict() |
| return ret |
|
|
| def load_state_dict(self, state_dict): |
| keys = list(set(self.data + self.param_names + list(state_dict.keys()) + ['structure', 'position', 'depth'])) |
| for key in keys: |
| if key not in state_dict: |
| print(f"Warning: key {key} not found in the state_dict.") |
| continue |
| try: |
| if not isinstance(getattr(self, key), nn.Module): |
| setattr(self, key, state_dict[key]) |
| else: |
| getattr(self, key).load_state_dict(state_dict[key]) |
| except Exception as e: |
| print(e) |
| raise ValueError(f"Error loading key {key}.") |
|
|
| def gather_from_leaf_children(self, data): |
| """ |
| Gather the data from the leaf children. |
| |
| Args: |
| data (torch.Tensor): the data to gather. The first dimension should be the number of leaf nodes. |
| """ |
| leaf_cnt = self.structure[:, 0] |
| leaf_cnt_masks = [leaf_cnt == i for i in range(1, 9)] |
| ret = torch.zeros((self.num_non_leaf_nodes,), dtype=data.dtype, device=self.device) |
| for i in range(8): |
| if leaf_cnt_masks[i].sum() == 0: |
| continue |
| start = self.structure[leaf_cnt_masks[i], 2] |
| for j in range(i+1): |
| ret[leaf_cnt_masks[i]] += data[start + j] |
| return ret |
|
|
| def gather_from_non_leaf_children(self, data): |
| """ |
| Gather the data from the non-leaf children. |
| |
| Args: |
| data (torch.Tensor): the data to gather. The first dimension should be the number of leaf nodes. |
| """ |
| non_leaf_cnt = 8 - self.structure[:, 0] |
| non_leaf_cnt_masks = [non_leaf_cnt == i for i in range(1, 9)] |
| ret = torch.zeros_like(data, device=self.device) |
| for i in range(8): |
| if non_leaf_cnt_masks[i].sum() == 0: |
| continue |
| start = self.structure[non_leaf_cnt_masks[i], 1] |
| for j in range(i+1): |
| ret[non_leaf_cnt_masks[i]] += data[start + j] |
| return ret |
|
|
| def structure_control(self, mask): |
| """ |
| Control the structure of the octree. |
| |
| Args: |
| mask (torch.Tensor): the mask to control the structure. 1 for subdivide, -1 for merge, 0 for keep. |
| """ |
| |
| mask[self.depth.squeeze() == self.max_depth] = torch.clamp_max(mask[self.depth.squeeze() == self.max_depth], 0) |
| |
| mask[self.depth.squeeze() == 1] = torch.clamp_min(mask[self.depth.squeeze() == 1], 0) |
|
|
| |
| structre_ctrl = self.gather_from_leaf_children(mask) |
| structre_ctrl[structre_ctrl==-8] = -1 |
|
|
| new_leaf_num = self.structure[:, 0].clone() |
| |
| structre_valid = structre_ctrl >= 0 |
| new_leaf_num[structre_valid] -= structre_ctrl[structre_valid] |
| structre_delete = structre_ctrl < 0 |
| merged_nodes = self.gather_from_non_leaf_children(structre_delete.int()) |
| new_leaf_num += merged_nodes |
|
|
| |
| mem_offset = torch.zeros((self.num_non_leaf_nodes + 1,), dtype=torch.int32, device=self.device) |
| mem_offset.index_add_(0, self.structure[structre_valid, 1], structre_ctrl[structre_valid]) |
| mem_offset[:-1] -= structre_delete.int() |
| new_structre_idx = torch.arange(0, self.num_non_leaf_nodes + 1, dtype=torch.int32, device=self.device) + mem_offset.cumsum(0) |
| new_structure_length = new_structre_idx[-1].item() |
| new_structre_idx = new_structre_idx[:-1] |
| new_structure = torch.empty((new_structure_length, 3), dtype=torch.int32, device=self.device) |
| new_structure[new_structre_idx[structre_valid], 0] = new_leaf_num[structre_valid] |
|
|
| |
| new_node_mask = torch.ones((new_structure_length,), dtype=torch.bool, device=self.device) |
| new_node_mask[new_structre_idx[structre_valid]] = False |
| new_structure[new_node_mask, 0] = 8 |
| new_node_num = new_node_mask.sum().item() |
|
|
| |
| non_leaf_cnt = 8 - new_structure[:, 0] |
| new_child_ptr = torch.cat([torch.zeros((1,), dtype=torch.int32, device=self.device), non_leaf_cnt.cumsum(0)[:-1]]) |
| new_structure[:, 1] = new_child_ptr + 1 |
|
|
| |
| leaf_cnt = torch.zeros((new_structure_length,), dtype=torch.int32, device=self.device) |
| leaf_cnt.index_add_(0, new_structre_idx, self.structure[:, 0]) |
| old_data_ptr = torch.cat([torch.zeros((1,), dtype=torch.int32, device=self.device), leaf_cnt.cumsum(0)[:-1]]) |
|
|
| |
| subdivide_mask = mask == 1 |
| merge_mask = mask == -1 |
| data_valid = ~(subdivide_mask | merge_mask) |
| mem_offset = torch.zeros((self.num_leaf_nodes + 1,), dtype=torch.int32, device=self.device) |
| mem_offset.index_add_(0, old_data_ptr[new_node_mask], torch.full((new_node_num,), 8, dtype=torch.int32, device=self.device)) |
| mem_offset[:-1] -= subdivide_mask.int() |
| mem_offset[:-1] -= merge_mask.int() |
| mem_offset.index_add_(0, self.structure[structre_valid, 2], merged_nodes[structre_valid]) |
| new_data_idx = torch.arange(0, self.num_leaf_nodes + 1, dtype=torch.int32, device=self.device) + mem_offset.cumsum(0) |
| new_data_length = new_data_idx[-1].item() |
| new_data_idx = new_data_idx[:-1] |
| new_data = {data: torch.empty((new_data_length,) + getattr(self, data).shape[1:], dtype=getattr(self, data).dtype, device=self.device) for data in self.data} |
| for data in self.data: |
| new_data[data][new_data_idx[data_valid]] = getattr(self, data)[data_valid] |
|
|
| |
| leaf_cnt = new_structure[:, 0] |
| new_data_ptr = torch.cat([torch.zeros((1,), dtype=torch.int32, device=self.device), leaf_cnt.cumsum(0)[:-1]]) |
| new_structure[:, 2] = new_data_ptr |
|
|
| |
| |
| if subdivide_mask.sum() > 0: |
| subdivide_data_ptr = new_structure[new_node_mask, 2] |
| for data in self.data: |
| for i in range(8): |
| if data == 'position': |
| offset = torch.tensor([i // 4, (i // 2) % 2, i % 2], dtype=torch.float32, device=self.device) - 0.5 |
| scale = 2 ** (-1.0 - self.depth[subdivide_mask]) |
| new_data['position'][subdivide_data_ptr + i] = self.position[subdivide_mask] + offset * scale |
| elif data == 'depth': |
| new_data['depth'][subdivide_data_ptr + i] = self.depth[subdivide_mask] + 1 |
| elif data == 'opacity': |
| new_data['opacity'][subdivide_data_ptr + i] = self.inverse_opacity_activation(torch.sqrt(self.opacity_activation(self.opacity[subdivide_mask]))) |
| elif data == 'trivec': |
| offset = torch.tensor([i // 4, (i // 2) % 2, i % 2], dtype=torch.float32, device=self.device) * 0.5 |
| coord = (torch.linspace(0, 0.5, self.trivec.shape[-1], dtype=torch.float32, device=self.device)[None] + offset[:, None]).reshape(1, 3, self.trivec.shape[-1], 1) |
| axis = torch.linspace(0, 1, 3, dtype=torch.float32, device=self.device).reshape(1, 3, 1, 1).repeat(1, 1, self.trivec.shape[-1], 1) |
| coord = torch.stack([coord, axis], dim=3).reshape(1, 3, self.trivec.shape[-1], 2).expand(self.trivec[subdivide_mask].shape[0], -1, -1, -1) * 2 - 1 |
| new_data['trivec'][subdivide_data_ptr + i] = F.grid_sample(self.trivec[subdivide_mask], coord, align_corners=True) |
| else: |
| new_data[data][subdivide_data_ptr + i] = getattr(self, data)[subdivide_mask] |
| |
| if merge_mask.sum() > 0: |
| merge_data_ptr = torch.empty((merged_nodes.sum().item(),), dtype=torch.int32, device=self.device) |
| merge_nodes_cumsum = torch.cat([torch.zeros((1,), dtype=torch.int32, device=self.device), merged_nodes.cumsum(0)[:-1]]) |
| for i in range(8): |
| merge_data_ptr[merge_nodes_cumsum[merged_nodes > i] + i] = new_structure[new_structre_idx[merged_nodes > i], 2] + i |
| old_merge_data_ptr = self.structure[structre_delete, 2] |
| for data in self.data: |
| if data == 'position': |
| scale = 2 ** (1.0 - self.depth[old_merge_data_ptr]) |
| new_data['position'][merge_data_ptr] = ((self.position[old_merge_data_ptr] + 0.5) / scale).floor() * scale + 0.5 * scale - 0.5 |
| elif data == 'depth': |
| new_data['depth'][merge_data_ptr] = self.depth[old_merge_data_ptr] - 1 |
| elif data == 'opacity': |
| new_data['opacity'][subdivide_data_ptr + i] = self.inverse_opacity_activation(self.opacity_activation(self.opacity[subdivide_mask])**2) |
| elif data == 'trivec': |
| new_data['trivec'][merge_data_ptr] = self.trivec[old_merge_data_ptr] |
| else: |
| new_data[data][merge_data_ptr] = getattr(self, data)[old_merge_data_ptr] |
|
|
| |
| self.structure = new_structure |
| for data in self.data: |
| setattr(self, data, new_data[data]) |
|
|
| |
| self.data_rearrange_buffer = { |
| 'subdivide_mask': subdivide_mask, |
| 'merge_mask': merge_mask, |
| 'data_valid': data_valid, |
| 'new_data_idx': new_data_idx, |
| 'new_data_length': new_data_length, |
| 'new_data': new_data |
| } |
|
|