# HitPF_demo/src/layers/utils_training.py
# Synced from GitHub by github-actions[bot] (commits f6dbbfb, cc0720f)
from lightning.pytorch.callbacks import BaseFinetuning
import torch
import dgl
from src.layers.inference_oc import DPC_custom_CLD
from src.layers.inference_oc import match_showers
from src.layers.inference_oc import remove_bad_tracks_from_cluster
class FreezeClustering(BaseFinetuning):
    """Lightning fine-tuning callback that permanently freezes the
    clustering stage of the model before training starts."""

    def __init__(self):
        super().__init__()

    def freeze_before_training(self, pl_module):
        # Freeze every sub-module belonging to the clustering stage.
        clustering_modules = (
            pl_module.ScaledGooeyBatchNorm2_1,
            pl_module.gatr,
            pl_module.clustering,
            pl_module.beta,
        )
        for module in clustering_modules:
            self.freeze(module)
        print("CLUSTERING HAS BEEN FROOOZEN")

    def finetune_function(self, pl_module, current_epoch, optimizer):
        # Intentionally a no-op: nothing is ever unfrozen.
        print("Not finetunning")
def obtain_batch_numbers(x, g):
    """Build a per-node batch-index vector for a batched DGL graph.

    Parameters
    ----------
    x : torch.Tensor
        Any tensor on the target device; only ``x.device`` is used.
    g : dgl.DGLGraph
        Batched graph (as produced by ``dgl.batch``).

    Returns
    -------
    torch.Tensor
        1-D float tensor of length ``g.number_of_nodes()`` whose entry k
        is the index of the sub-graph that node k belongs to.
    """
    dev = x.device
    graphs_eval = dgl.unbatch(g)
    # One constant-valued chunk per sub-graph, created directly on the
    # target device (avoids a host allocation + copy per graph).
    batch_numbers = [
        torch.full((gj.number_of_nodes(),), float(index), device=dev)
        for index, gj in enumerate(graphs_eval)
    ]
    return torch.cat(batch_numbers, dim=0)
def obtain_clustering_for_matched_showers(
    batch_g, model_output, y_all, local_rank, use_gt_clusters=False, add_fakes=True
):
    """Cluster hits into showers, match them to true particles, and build one
    small edgeless graph per matched (and, optionally, fake) shower.

    Parameters
    ----------
    batch_g : dgl.DGLGraph
        Batched hit graph; node data must include "particle_number",
        "pos_hits_xyz", "h", "e_hits" and "chi_squared_tracks"
        ("pos_pxpypz" / "pos_pxpypz_at_vertex" are copied when present).
    model_output : torch.Tensor
        Per-node network output; columns 0:3 are clustering coordinates and
        column 3 the beta logit (only read when ``use_gt_clusters`` is False).
    y_all : object
        Truth container exposing ``batch_number``, ``copy()``/``mask()``, and
        per-particle fields ``E``, ``m``, ``pid``, ``coord``.
    local_rank :
        Forwarded to ``match_showers`` (presumably the device/process rank —
        TODO confirm).
    use_gt_clusters : bool
        If True, take ground-truth "particle_number" labels instead of
        running the density-peak clustering.
    add_fakes : bool
        If True, also build graphs for unmatched (fake) clusters.

    Returns
    -------
    tuple
        (batched matched+fake graphs, true energies, reco energies,
        matched pids, true daughter-corrected energies, matched coords,
        number_of_fakes, fakes_idx).
        NOTE(review): ``fakes_idx`` holds whatever the *last* event of the
        batch produced (and is undefined for an empty batch) — looks like a
        latent bug; confirm against callers.
    """
    # Accumulators over all events in the batch.
    graphs_showers_matched = []
    graphs_showers_fakes = []
    true_energy_showers = []
    reco_energy_showers = []
    reco_energy_showers_fakes = []
    energy_true_daughters = []
    y_pids_matched = []
    y_coords_matched = []
    if not use_gt_clusters:
        # Expose the model's clustering coordinates / beta logit as node data.
        batch_g.ndata["coords"] = model_output[:, 0:3]
        batch_g.ndata["beta"] = model_output[:, 3]
    graphs = dgl.unbatch(batch_g)
    batch_id = y_all.batch_number
    for i in range(0, len(graphs)):
        # Restrict the truth record to the particles of event i.
        mask = batch_id == i
        dic = {}
        dic["graph"] = graphs[i]
        y = y_all.copy()
        y.mask(mask.flatten())
        dic["part_true"] = y
        if not use_gt_clusters:
            betas = torch.sigmoid(dic["graph"].ndata["beta"])  # NOTE(review): unused below
            X = dic["graph"].ndata["coords"]
        if use_gt_clusters:
            labels = dic["graph"].ndata["particle_number"].type(torch.int64)
        else:
            # Density-peak clustering in the learned coordinate space,
            # then drop clusters built around bad tracks.
            labels = DPC_custom_CLD(X, dic["graph"], model_output.device)
            labels, _ = remove_bad_tracks_from_cluster(dic["graph"], labels)
        particle_ids = torch.unique(dic["graph"].ndata["particle_number"])
        shower_p_unique = torch.unique(labels)
        # Match predicted clusters to true particles:
        # row_ind indexes particles, col_ind indexes clusters.
        shower_p_unique, row_ind, col_ind, i_m_w, _ = match_showers(
            labels, dic, particle_ids, model_output, local_rank, i, None
        )
        row_ind = torch.Tensor(row_ind).to(model_output.device).long()
        col_ind = torch.Tensor(col_ind).to(model_output.device).long()
        if torch.sum(particle_ids == 0) > 0:
            # Particle id 0 is present (noise/background): shift so that
            # row_ind_ indexes the truth arrays, which exclude it.
            row_ind_ = row_ind - 1
        else:
            # if there is no zero then index 0 corresponds to particle 1.
            row_ind_ = row_ind
        # Cluster labels start at 1 (0 is the noise cluster), hence the +1.
        index_matches = col_ind + 1
        index_matches = index_matches.to(model_output.device).long()
        for j, unique_showers_label in enumerate(index_matches):
            # Keep only labels matched exactly once (skip duplicates).
            if torch.sum(unique_showers_label == index_matches) == 1:
                index_in_matched = torch.argmax(
                    (unique_showers_label == index_matches) * 1
                )  # NOTE(review): computed but never used
                mask = labels == unique_showers_label
                sls_graph = graphs[i].ndata["pos_hits_xyz"][mask][:, 0:3]
                # Edgeless per-shower graph carrying the hit features.
                g = dgl.graph(([], []))
                g.add_nodes(sls_graph.shape[0])
                g = g.to(sls_graph.device)
                g.ndata["h"] = graphs[i].ndata["h"][mask]
                if "pos_pxpypz" in graphs[i].ndata:
                    g.ndata["pos_pxpypz"] = graphs[i].ndata["pos_pxpypz"][mask]
                if "pos_pxpypz_at_vertex" in graphs[i].ndata:
                    g.ndata["pos_pxpypz_at_vertex"] = graphs[i].ndata[
                        "pos_pxpypz_at_vertex"
                    ][mask]
                g.ndata["chi_squared_tracks"] = graphs[i].ndata["chi_squared_tracks"][mask]
                energy_t = dic["part_true"].E.to(model_output.device)
                energy_t_corr_daughters = dic["part_true"].m.to(
                    model_output.device
                )
                true_energy_shower = energy_t[row_ind_[j]]
                y_pids_matched.append(y.pid[row_ind_[j]].item())
                y_coords_matched.append(y.coord[row_ind_[j]].detach().cpu().numpy())
                energy_true_daughters.append(energy_t_corr_daughters[row_ind_[j]])
                # Reconstructed shower energy = sum of its hit energies.
                reco_energy_shower = torch.sum(graphs[i].ndata["e_hits"][mask])
                graphs_showers_matched.append(g)
                true_energy_showers.append(true_energy_shower.view(-1))
                reco_energy_showers.append(reco_energy_shower.view(-1))
        # Mark matched clusters (and the noise cluster 0) with -1; whatever
        # remains is a fake shower.  NOTE(review): this writes through to
        # shower_p_unique (same tensor, no clone).
        pred_showers = shower_p_unique
        pred_showers[index_matches] = -1
        pred_showers[0] = -1
        mask_fakes = pred_showers != -1
        fakes_idx = torch.where(mask_fakes)[0]
        if add_fakes:
            for j in fakes_idx:
                mask = labels == j
                sls_graph = graphs[i].ndata["pos_hits_xyz"][mask][:, 0:3]
                # Same edgeless per-shower graph construction as above.
                g = dgl.graph(([], []))
                g.add_nodes(sls_graph.shape[0])
                g = g.to(sls_graph.device)
                g.ndata["h"] = graphs[i].ndata["h"][mask]
                if "pos_pxpypz" in graphs[i].ndata:
                    g.ndata["pos_pxpypz"] = graphs[i].ndata["pos_pxpypz"][mask]
                if "pos_pxpypz_at_vertex" in graphs[i].ndata:
                    g.ndata["pos_pxpypz_at_vertex"] = graphs[i].ndata[
                        "pos_pxpypz_at_vertex"
                    ][mask]
                g.ndata["chi_squared_tracks"] = graphs[i].ndata["chi_squared_tracks"][mask]
                graphs_showers_fakes.append(g)
                reco_energy_shower = torch.sum(graphs[i].ndata["e_hits"][mask])
                reco_energy_showers_fakes.append(reco_energy_shower.view(-1))
    # Fakes are appended after all matched showers in the batched output.
    graphs_showers_matched = dgl.batch(graphs_showers_matched + graphs_showers_fakes)
    true_energy_showers = torch.cat(true_energy_showers, dim=0)
    reco_energy_showers = torch.cat(reco_energy_showers + reco_energy_showers_fakes, dim=0)
    e_true_corr_daughters = torch.cat(energy_true_daughters, dim=0)
    number_of_fakes = len(reco_energy_showers_fakes)
    return (
        graphs_showers_matched,
        true_energy_showers,
        reco_energy_showers,
        y_pids_matched,
        e_true_corr_daughters,
        y_coords_matched,
        number_of_fakes,
        fakes_idx
    )