| |
| import sys |
| from collections.abc import Iterable |
| from multiprocessing import Pool |
| from shutil import get_terminal_size |
|
|
| from .timer import Timer |
|
|
|
|
class ProgressBar:
    """A text progress bar that redraws itself on a single line.

    Two display modes exist, selected by ``task_num``:

    * ``task_num > 0``: a ``[>>>   ] done/total`` bar with throughput,
      elapsed time and ETA.
    * ``task_num <= 0``: the total is unknown, so only a running
      ``completed`` counter with elapsed time and throughput is shown.

    Args:
        task_num (int): Total number of tasks, or 0 if unknown.
        bar_width (int): Preferred width of the bar in characters. The
            drawn bar may be narrower to fit the terminal.
        start (bool): Whether to print the initial line and start timing
            right away. If False, :meth:`start` must be called before
            :meth:`update`, because the timer is only created there.
        file: Object with ``write`` and ``flush`` methods that receives the
            output. Defaults to ``sys.stdout``.
    """

    def __init__(self, task_num=0, bar_width=50, start=True, file=sys.stdout):
        self.task_num = task_num
        self.bar_width = bar_width
        self.completed = 0
        self.file = file
        if start:
            self.start()

    @property
    def terminal_width(self):
        """int: Current terminal width in columns."""
        width, _ = get_terminal_size()
        return width

    def start(self):
        """Print the initial (empty) progress line and create the timer."""
        if self.task_num > 0:
            self.file.write(f'[{" " * self.bar_width}] 0/{self.task_num}, '
                            'elapsed: 0s, ETA:')
        else:
            self.file.write('completed: 0, elapsed: 0s')
        self.file.flush()
        # NOTE(review): Timer comes from the project's ``.timer`` module and
        # presumably starts counting on construction -- confirm there.
        self.timer = Timer()

    def update(self, num_tasks=1):
        """Record finished tasks and redraw the progress line.

        Args:
            num_tasks (int): Number of tasks finished since the previous
                call. Must be positive.
        """
        assert num_tasks > 0
        self.completed += num_tasks
        elapsed = self.timer.since_start()
        fps = self.completed / elapsed if elapsed > 0 else float('inf')

        if self.task_num > 0:
            percentage = self.completed / float(self.task_num)
            # More tasks than announced may complete (e.g. an approximate
            # total was supplied); never report a negative ETA in that case.
            eta = max(0, int(elapsed * (1 - percentage) / percentage + 0.5))
            msg = f'\r[{{}}] {self.completed}/{self.task_num}, ' \
                  f'{fps:.1f} task/s, elapsed: {int(elapsed + 0.5)}s, ' \
                  f'ETA: {eta:5}s'

            # Shrink the bar so the whole line fits in the terminal: the
            # ``+ 2`` gives back the two characters of the ``{}``
            # placeholder that are counted in ``len(msg)``. The bar is also
            # capped at 60% of the terminal width and kept at least 2 wide.
            bar_width = min(self.bar_width,
                            int(self.terminal_width - len(msg)) + 2,
                            int(self.terminal_width * 0.6))
            bar_width = max(2, bar_width)
            # Clamp so an over-full bar cannot grow past its brackets.
            mark_width = min(bar_width, int(bar_width * percentage))
            bar_chars = '>' * mark_width + ' ' * (bar_width - mark_width)
            self.file.write(msg.format(bar_chars))
        else:
            # Leading carriage return so the counter overwrites the previous
            # line instead of being appended to it.
            self.file.write(
                f'\rcompleted: {self.completed}, '
                f'elapsed: {int(elapsed + 0.5)}s,'
                f' {fps:.1f} tasks/s')
        self.file.flush()
|
|
|
|
def track_progress(func, tasks, bar_width=50, file=sys.stdout, **kwargs):
    """Track the progress of tasks execution with a progress bar.

    Tasks are done with a simple for-loop.

    Args:
        func (callable): The function to be applied to each task.
        tasks (Iterable or tuple[Iterable, int]): The tasks, or a
            ``(tasks, total num)`` pair. If a bare iterable has no length
            (e.g. a generator), the total is treated as unknown and only a
            running counter is displayed.
        bar_width (int): Width of progress bar.
        file: Writable object the progress bar is printed to. Defaults to
            ``sys.stdout``.
        **kwargs: Extra keyword arguments forwarded to every ``func`` call.

    Returns:
        list: The task results.

    Raises:
        TypeError: If ``tasks`` is neither an iterable nor a 2-tuple.
    """
    if isinstance(tasks, tuple):
        assert len(tasks) == 2
        assert isinstance(tasks[0], Iterable)
        assert isinstance(tasks[1], int)
        task_num = tasks[1]
        tasks = tasks[0]
    elif isinstance(tasks, Iterable):
        try:
            task_num = len(tasks)
        except TypeError:
            # Being iterable does not imply being sized; fall back to the
            # progress bar's unknown-total mode instead of crashing.
            task_num = 0
    else:
        raise TypeError(
            '"tasks" must be an iterable object or a (iterator, int) tuple')
    prog_bar = ProgressBar(task_num, bar_width, file=file)
    results = []
    for task in tasks:
        results.append(func(task, **kwargs))
        prog_bar.update()
    # Finish the in-place progress line so later output starts on a new line.
    prog_bar.file.write('\n')
    return results
|
|
|
|
def init_pool(process_num, initializer=None, initargs=None):
    """Create a :class:`multiprocessing.Pool` with optional initializer.

    Args:
        process_num (int): Number of worker processes.
        initializer (None or callable): Passed to the pool when given.
        initargs (None or tuple): Arguments for ``initializer``. Only used
            (and only validated) when ``initializer`` is given.

    Returns:
        multiprocessing.Pool: The newly created pool.

    Raises:
        TypeError: If ``initializer`` is given and ``initargs`` is neither
            None nor a tuple.
    """
    pool_args = [process_num]
    if initializer is not None:
        pool_args.append(initializer)
        if initargs is not None:
            if not isinstance(initargs, tuple):
                raise TypeError('"initargs" must be a tuple')
            pool_args.append(initargs)
    return Pool(*pool_args)
|
|
|
|
def track_parallel_progress(func,
                            tasks,
                            nproc,
                            initializer=None,
                            initargs=None,
                            bar_width=50,
                            chunksize=1,
                            skip_first=False,
                            keep_order=True,
                            file=sys.stdout):
    """Track the progress of parallel task execution with a progress bar.

    The built-in :mod:`multiprocessing` module is used for process pools and
    tasks are done with :func:`Pool.imap` or :func:`Pool.imap_unordered`.

    Args:
        func (callable): The function to be applied to each task.
        tasks (Iterable or tuple[Iterable, int]): The tasks, or a
            ``(tasks, total num)`` pair. If a bare iterable has no length
            (e.g. a generator), the total is treated as unknown and only a
            running counter is displayed.
        nproc (int): Process (worker) number.
        initializer (None or callable): Refer to :class:`multiprocessing.Pool`
            for details.
        initargs (None or tuple): Refer to :class:`multiprocessing.Pool` for
            details.
        chunksize (int): Refer to :class:`multiprocessing.Pool` for details.
        bar_width (int): Width of progress bar.
        skip_first (bool): Whether to skip the first sample for each worker
            when estimating fps, since the initialization step may take
            longer.
        keep_order (bool): If True, :func:`Pool.imap` is used, otherwise
            :func:`Pool.imap_unordered` is used.
        file: Writable object the progress bar is printed to. Defaults to
            ``sys.stdout``.

    Returns:
        list: The task results.

    Raises:
        TypeError: If ``tasks`` is neither an iterable nor a 2-tuple.
    """
    if isinstance(tasks, tuple):
        assert len(tasks) == 2
        assert isinstance(tasks[0], Iterable)
        assert isinstance(tasks[1], int)
        task_num = tasks[1]
        tasks = tasks[0]
    elif isinstance(tasks, Iterable):
        try:
            task_num = len(tasks)
        except TypeError:
            # Being iterable does not imply being sized; fall back to the
            # progress bar's unknown-total mode instead of crashing.
            task_num = 0
    else:
        raise TypeError(
            '"tasks" must be an iterable object or a (iterator, int) tuple')
    pool = init_pool(nproc, initializer, initargs)
    try:
        # With skip_first, the first ``nproc * chunksize`` results are
        # treated as warm-up: they are excluded from the total and the bar
        # (and its timer) only starts once they have all arrived.
        warmup = nproc * chunksize
        start = not skip_first
        task_num -= warmup * int(skip_first)
        prog_bar = ProgressBar(task_num, bar_width, start, file=file)
        results = []
        if keep_order:
            gen = pool.imap(func, tasks, chunksize)
        else:
            gen = pool.imap_unordered(func, tasks, chunksize)
        for result in gen:
            results.append(result)
            if skip_first:
                if len(results) < warmup:
                    continue
                elif len(results) == warmup:
                    prog_bar.start()
                    continue
            prog_bar.update()
        prog_bar.file.write('\n')
    except BaseException:
        # A failing task or an interrupt must not leave worker processes
        # behind; stop them immediately and let the error propagate.
        pool.terminate()
        raise
    pool.close()
    pool.join()
    return results
|
|
|
|
def track_iter_progress(tasks, bar_width=50, file=sys.stdout):
    """Track the progress of tasks iteration or enumeration with a progress
    bar.

    Tasks are yielded with a simple for-loop. The bar advances by one each
    time the consumer asks for the next task, i.e. after it has finished
    handling the previously yielded one.

    Because this is a generator function, argument validation only runs
    when iteration starts, not when the function is called.

    Args:
        tasks (Iterable or tuple[Iterable, int]): The tasks, or a
            ``(tasks, total num)`` pair. If a bare iterable has no length
            (e.g. a generator), the total is treated as unknown and only a
            running counter is displayed.
        bar_width (int): Width of progress bar.
        file: Writable object the progress bar is printed to. Defaults to
            ``sys.stdout``.

    Yields:
        object: Each task from ``tasks``, unchanged and in order.

    Raises:
        TypeError: If ``tasks`` is neither an iterable nor a 2-tuple.
    """
    if isinstance(tasks, tuple):
        assert len(tasks) == 2
        assert isinstance(tasks[0], Iterable)
        assert isinstance(tasks[1], int)
        task_num = tasks[1]
        tasks = tasks[0]
    elif isinstance(tasks, Iterable):
        try:
            task_num = len(tasks)
        except TypeError:
            # Being iterable does not imply being sized; fall back to the
            # progress bar's unknown-total mode instead of crashing.
            task_num = 0
    else:
        raise TypeError(
            '"tasks" must be an iterable object or a (iterator, int) tuple')
    prog_bar = ProgressBar(task_num, bar_width, file=file)
    for task in tasks:
        yield task
        prog_bar.update()
    # Finish the in-place progress line so later output starts on a new line.
    prog_bar.file.write('\n')
|
|