# Copyright (c) 2025 FoundationVision
# SPDX-License-Identifier: MIT
import torch.distributed as dist
from torch.distributed import ReduceOp


class AsyncOpList(object):
    """Groups several async collective work handles behind a single handle-like API."""

    def __init__(self, ops):
        self.ops = ops

    def wait(self):
        # Block until every wrapped operation has finished.
        for op in self.ops:
            op.wait()

    def is_completed(self):
        # True only once every wrapped operation has finished.
        for op in self.ops:
            if not op.is_completed():
                return False
        return True


def reduce_scatter(tensor,
                   tensor_list,
                   op=ReduceOp.SUM,
                   group=dist.group.WORLD,
                   async_op=False):
    """Emulate reduce_scatter with one dist.reduce per destination rank.

    After the call, rank i holds the reduction (under ``op``) of every
    rank's ``tensor_list[i]``. On rank i the contribution for destination i
    is read from ``tensor``, so ``tensor`` must already contain this rank's
    own chunk; pass ``tensor=None`` to reduce into ``tensor_list[rank]``.
    Returns an AsyncOpList when ``async_op`` is True, otherwise blocks.
    """
    if group is None:
        # The default argument binds when the module is imported, which may
        # precede init_process_group(); resolve the default group here.
        group = dist.group.WORLD
    ranks = dist.get_process_group_ranks(group)
    rank = dist.get_rank(group)
    if tensor is None:
        tensor = tensor_list[rank]
    if tensor.dim() == 0:
        # Promote a scalar output to a one-element view and seed it with
        # this rank's own chunk so the reduce includes our contribution.
        tensor = tensor.view(-1)
        tensor[:] = tensor_list[rank]
    ops = []
    for i in range(dist.get_world_size(group)):
        # Buffers are assumed contiguous: on a non-contiguous tensor,
        # .contiguous() returns a copy and the reduce result would be lost.
        if i == rank:
            tmp = dist.reduce(tensor.contiguous(), ranks[i], op, group, async_op=True)
        else:
            tmp = dist.reduce(tensor_list[i].contiguous(), ranks[i], op, group, async_op=True)
        ops.append(tmp)
    oplist = AsyncOpList(ops)
    if async_op:
        return oplist
    else:
        oplist.wait()
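

# ---------------------------------------------------------------------------
# Minimal usage sketch (not part of the original module; the launch command,
# file name, and backend choice are assumptions). Launch with e.g.:
#   torchrun --nproc_per_node=2 reduce_scatter_demo.py
# Rank r contributes world_size chunks filled with r + 1; afterwards every
# rank holds the elementwise sum of all ranks' chunks for its slot, i.e.
# 1 + 2 + ... + world_size in every element.
# ---------------------------------------------------------------------------
if __name__ == "__main__":
    import torch

    dist.init_process_group(backend="gloo")  # gloo runs on CPU-only hosts
    rank = dist.get_rank()
    world_size = dist.get_world_size()

    tensor_list = [torch.full((4,), float(rank + 1)) for _ in range(world_size)]
    # The output buffer must start out holding this rank's own chunk, since
    # reduce_scatter reads rank i's contribution for destination i from it.
    out = tensor_list[rank].clone()

    # Pass the group explicitly: after init_process_group(), dist.group.WORLD
    # resolves to the default process group.
    handle = reduce_scatter(out, tensor_list, group=dist.group.WORLD, async_op=True)
    handle.wait()  # AsyncOpList.wait() blocks on every per-rank reduce

    expected = float(sum(range(1, world_size + 1)))
    assert torch.allclose(out, torch.full((4,), expected))
    print(f"rank {rank}: ok, out = {out.tolist()}")
    dist.destroy_process_group()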