Spaces:

mohaed
/

3dAnimation

Sleeping

3dAnimation / motion_diffusion_model /data_loaders /tensors.py

megalado

Add local model code; tidy requirements

f87d582 8 months ago

3.56 kB

	import torch

	def lengths_to_mask(lengths, max_len):
	# max_len = max(lengths)
	mask = torch.arange(max_len, device=lengths.device).expand(len(lengths), max_len) < lengths.unsqueeze(1)
	return mask


	def collate_tensors(batch):
	dims = batch[0].dim()
	max_size = [max([b.size(i) for b in batch]) for i in range(dims)]
	size = (len(batch),) + tuple(max_size)
	canvas = batch[0].new_zeros(size=size)
	for i, b in enumerate(batch):
	sub_tensor = canvas[i]
	for d in range(dims):
	sub_tensor = sub_tensor.narrow(d, 0, b.size(d))
	sub_tensor.add_(b)
	return canvas


	def collate(batch):
	notnone_batches = [b for b in batch if b is not None]
	databatch = [b['inp'] for b in notnone_batches]
	if 'lengths' in notnone_batches[0]:
	lenbatch = [b['lengths'] for b in notnone_batches]
	else:
	lenbatch = [len(b['inp'][0][0]) for b in notnone_batches]


	databatchTensor = collate_tensors(databatch)
	lenbatchTensor = torch.as_tensor(lenbatch)
	maskbatchTensor = lengths_to_mask(lenbatchTensor, databatchTensor.shape[-1]).unsqueeze(1).unsqueeze(1) # unqueeze for broadcasting

	motion = databatchTensor
	cond = {'y': {'mask': maskbatchTensor, 'lengths': lenbatchTensor}}

	if 'text' in notnone_batches[0]:
	textbatch = [b['text'] for b in notnone_batches]
	cond['y'].update({'text': textbatch})

	if 'tokens' in notnone_batches[0]:
	textbatch = [b['tokens'] for b in notnone_batches]
	cond['y'].update({'tokens': textbatch})

	if 'action' in notnone_batches[0]:
	actionbatch = [b['action'] for b in notnone_batches]
	cond['y'].update({'action': torch.as_tensor(actionbatch).unsqueeze(1)})

	# collate action textual names
	if 'action_text' in notnone_batches[0]:
	action_text = [b['action_text']for b in notnone_batches]
	cond['y'].update({'action_text': action_text})

	if 'prefix' in notnone_batches[0]:
	cond['y'].update({'prefix': collate_tensors([b['prefix'] for b in notnone_batches])})

	if 'orig_lengths' in notnone_batches[0]:
	cond['y'].update({'orig_lengths': torch.as_tensor([b['orig_lengths'] for b in notnone_batches])})

	if 'key' in notnone_batches[0]:
	cond['y'].update({'db_key': [b['key'] for b in notnone_batches]})

	return motion, cond

	# an adapter to our collate func
	def t2m_collate(batch, target_batch_size):
	repeat_factor = -(-target_batch_size // len(batch)) # Ceiling division
	repeated_batch = batch * repeat_factor
	full_batch = repeated_batch[:target_batch_size] # Truncate to the target batch size
	# batch.sort(key=lambda x: x[3], reverse=True)
	adapted_batch = [{
	'inp': torch.tensor(b[4].T).float().unsqueeze(1), # [seqlen, J] -> [J, 1, seqlen]
	'text': b[2], #b[0]['caption']
	'tokens': b[6],
	'lengths': b[5],
	'key': b[7] if len(b) > 7 else None,
	} for b in full_batch]
	return collate(adapted_batch)


	def t2m_prefix_collate(batch, pred_len):
	# batch.sort(key=lambda x: x[3], reverse=True)
	adapted_batch = [{
	'inp': torch.tensor(b[4].T).float().unsqueeze(1)[..., -pred_len:], # [seqlen, J] -> [J, 1, seqlen]
	'prefix': torch.tensor(b[4].T).float().unsqueeze(1)[..., :-pred_len],
	'text': b[2], #b[0]['caption']
	'tokens': b[6],
	'lengths': pred_len, # b[5],
	'orig_lengths': b[5][0], # For evaluation
	'key': b[7] if len(b) > 7 else None,
	} for b in batch]
	return collate(adapted_batch)