UMMJ
/

JSX_TTS

Model card Files Files and versions

JSX_TTS / torch /distributed /pipeline /sync /_balance /blockpartition.py

UMMJ's picture

Upload 5875 files

9dd3461 about 3 years ago

history blame contribute delete

3.19 kB

	# -- coding: utf-8 --
	# Copyright 2019 Kakao Brain
	#
	# Copyright (c) Facebook, Inc. and its affiliates. All rights reserved.
	#
	# This source code is licensed under the BSD license found in the
	# LICENSE file in the root directory of this source tree.
	"""Implements "Block Partitions of Sequences" by Imre Bárány et al.

	Paper: https://arxiv.org/pdf/1308.2452.pdf

	"""
	from typing import Iterator, List, Tuple

	__all__ = ["solve"]


	def solve(sequence: List[int], partitions: int = 1) -> List[List[int]]:
	"""Splits a sequence into several partitions to minimize variance for each
	partition.

	The result might not be optimal. However, it can be done only in O(kn³),
	where k is the number of partitions and n is the length of the sequence.

	"""
	if partitions < 1:
	raise ValueError(f"partitions must be a positive integer ({partitions} < 1)")

	n = len(sequence)
	if n < partitions:
	raise ValueError(f"sequence is shorter than intended partitions ({n} < {partitions})")

	# Normalize the sequence in [0, 1].
	minimum = min(sequence)
	maximum = max(sequence) - minimum

	normal_sequence: List[float]
	if maximum == 0:
	normal_sequence = [0 for _ in sequence]
	else:
	normal_sequence = [(x - minimum) / maximum for x in sequence]

	splits = [n // partitions * (x + 1) for x in range(partitions - 1)] + [n]

	def block_size(i: int) -> float:
	start = splits[i - 1] if i > 0 else 0
	stop = splits[i]
	return sum(normal_sequence[start:stop])

	def leaderboard() -> Iterator[Tuple[float, int]]:
	return ((block_size(i), i) for i in range(partitions))

	while True:
	"""
	(1) Fix p ∈ [k] with M(P) = bp. So Bp is a maximal block of P.
	"""
	# max_size: M(P)
	max_size, p = max(leaderboard())

	while True:
	"""
	(2) If M(P) ≤ m(P) + 1, then stop.
	"""
	# min_size: m(P)
	min_size, q = min(leaderboard())

	if max_size <= min_size + 1:
	return [sequence[i:j] for i, j in zip([0] + splits[:-1], splits)]

	"""
	(3) If M(P) > m(P) + 1, then let m(P) = bq for the q ∈ [k] which is
	closest to p (ties broken arbitrarily). Thus Bq is a minimal block
	of P. Let Bh be the block next to Bq between Bp and Bq. (Note that
	Bh is a non-empty block: if it were, then m(P) = 0 and we should
	have chosen Bh instead of Bq.)
	"""
	if p < q:
	"""
	So either p < q and then h = q−1 and we define P ∗ by moving
	the last element from Bh = Bq−1 to Bq,
	"""
	h = q - 1
	splits[h] -= 1
	else:
	"""
	or q < p, and then h = q + 1 and P ∗ is obtained by moving the
	first element of Bh = Bq+1 to Bq.
	"""
	h = q + 1
	splits[q] += 1

	"""
	Set P = P ∗ . If p = h, then go to (1), else go to (2).
	"""
	if p == h:
	break