|
|
|
import sys |
|
from collections.abc import Iterable |
|
from multiprocessing import Pool |
|
from shutil import get_terminal_size |
|
|
|
from .timer import Timer |
|
|
|
|
|
class ProgressBar:
    """A progress bar which can print the progress.

    Two display modes are used depending on ``task_num``:

    * ``task_num > 0``: a ``[>>>   ] done/total`` bar with rate, elapsed
      time and ETA.
    * otherwise: the total is treated as unknown and only a running
      ``completed: N`` counter with rate and elapsed time is printed.

    Args:
        task_num (int): Total number of tasks. Values that are not positive
            select the unknown-total mode.
        bar_width (int): Maximum width of the bar, in characters.
        start (bool): Whether to call :meth:`start` during construction.
        file: Text stream the output is written to; it must provide
            ``write`` and ``flush``.
    """

    def __init__(self, task_num=0, bar_width=50, start=True, file=sys.stdout):
        self.task_num = task_num
        self.bar_width = bar_width
        self.completed = 0
        self.file = file
        if start:
            self.start()

    @property
    def terminal_width(self):
        """int: Terminal width in columns, from ``get_terminal_size()``."""
        width, _ = get_terminal_size()
        return width

    def start(self):
        """Print the initial (empty) state and create the timer.

        :meth:`update` reads the elapsed time from the timer created here,
        so this must have been called before the first :meth:`update`.
        """
        if self.task_num > 0:
            self.file.write(f'[{" " * self.bar_width}] 0/{self.task_num}, '
                            'elapsed: 0s, ETA:')
        else:
            self.file.write('completed: 0, elapsed: 0s')
        self.file.flush()
        self.timer = Timer()

    def update(self, num_tasks=1):
        """Record finished tasks and redraw the progress line.

        Args:
            num_tasks (int): Number of tasks completed since the previous
                call. Must be positive.
        """
        # A positive increment guarantees ``completed > 0`` below, which
        # keeps the ETA division well defined.
        assert num_tasks > 0
        self.completed += num_tasks
        elapsed = self.timer.since_start()
        fps = self.completed / elapsed if elapsed > 0 else float('inf')
        if self.task_num > 0:
            # Clamp to 1.0: if more tasks complete than were announced, an
            # unclamped ratio yields a negative ETA and a bar that grows
            # past its width.
            percentage = min(self.completed / float(self.task_num), 1.0)
            eta = int(elapsed * (1 - percentage) / percentage + 0.5)
            # ``{{}}`` leaves a ``{}`` placeholder that is filled with the
            # bar characters once the bar width is known.
            msg = f'\r[{{}}] {self.completed}/{self.task_num}, ' \
                  f'{fps:.1f} task/s, elapsed: {int(elapsed + 0.5)}s, ' \
                  f'ETA: {eta:5}s'

            # ``+ 2`` compensates for the ``{}`` placeholder counted by
            # ``len(msg)``; the bar is also capped at 60% of the terminal.
            bar_width = min(self.bar_width,
                            int(self.terminal_width - len(msg)) + 2,
                            int(self.terminal_width * 0.6))
            bar_width = max(2, bar_width)
            mark_width = int(bar_width * percentage)
            bar_chars = '>' * mark_width + ' ' * (bar_width - mark_width)
            self.file.write(msg.format(bar_chars))
        else:
            # Leading ``\r`` returns to the start of the line so the counter
            # is overwritten in place, matching the known-total branch,
            # instead of being appended after the previous output.
            self.file.write(
                f'\rcompleted: {self.completed}, '
                f'elapsed: {int(elapsed + 0.5)}s,'
                f' {fps:.1f} tasks/s')
        self.file.flush()
|
|
|
|
|
def track_progress(func, tasks, bar_width=50, file=sys.stdout, **kwargs):
    """Track the progress of tasks execution with a progress bar.

    Tasks are done with a simple for-loop.

    Args:
        func (callable): The function to be applied to each task.
        tasks (Iterable or tuple[Iterable, int]): An iterable of tasks or
            (tasks, total num). If a bare iterable has no length (e.g. a
            generator), the total is treated as unknown and only a
            running counter is shown.
        bar_width (int): Width of progress bar.
        file: Stream the progress bar is written to.
        **kwargs: Extra keyword arguments forwarded to every ``func`` call.

    Returns:
        list: The task results.

    Raises:
        TypeError: If ``tasks`` is neither an iterable nor a tuple.
    """
    if isinstance(tasks, tuple):
        assert len(tasks) == 2
        assert isinstance(tasks[0], Iterable)
        assert isinstance(tasks[1], int)
        tasks, task_num = tasks
    elif isinstance(tasks, Iterable):
        try:
            task_num = len(tasks)
        except TypeError:
            # Unsized iterable (generator, iterator, ...): 0 makes the
            # progress bar fall back to its unknown-total display.
            task_num = 0
    else:
        raise TypeError(
            '"tasks" must be an iterable object or a (iterator, int) tuple')
    prog_bar = ProgressBar(task_num, bar_width, file=file)
    results = []
    for task in tasks:
        results.append(func(task, **kwargs))
        prog_bar.update()
    # Finish the progress line, which was redrawn in place.
    prog_bar.file.write('\n')
    return results
|
|
|
|
|
def init_pool(process_num, initializer=None, initargs=None):
    """Create a :class:`multiprocessing.Pool`.

    Only the arguments that were actually supplied are forwarded to
    ``Pool``: ``initargs`` is passed only together with an ``initializer``.

    Args:
        process_num (int): Number of worker processes.
        initializer (None or callable): Forwarded to ``Pool`` when given.
        initargs (None or tuple): Forwarded to ``Pool`` when given along
            with ``initializer``.

    Returns:
        multiprocessing.pool.Pool: The created pool.

    Raises:
        TypeError: If ``initializer`` is given and ``initargs`` is neither
            ``None`` nor a tuple.
    """
    pool_args = [process_num]
    if initializer is not None:
        pool_args.append(initializer)
        if initargs is not None:
            if not isinstance(initargs, tuple):
                raise TypeError('"initargs" must be a tuple')
            pool_args.append(initargs)
    return Pool(*pool_args)
|
|
|
|
|
def track_parallel_progress(func,
                            tasks,
                            nproc,
                            initializer=None,
                            initargs=None,
                            bar_width=50,
                            chunksize=1,
                            skip_first=False,
                            keep_order=True,
                            file=sys.stdout):
    """Track the progress of parallel task execution with a progress bar.

    The built-in :mod:`multiprocessing` module is used for process pools and
    tasks are done with :func:`Pool.imap` or :func:`Pool.imap_unordered`.

    Args:
        func (callable): The function to be applied to each task.
        tasks (Iterable or tuple[Iterable, int]): An iterable of tasks or
            (tasks, total num). If a bare iterable has no length (e.g. a
            generator), the total is treated as unknown and only a
            running counter is shown.
        nproc (int): Process (worker) number.
        initializer (None or callable): Refer to :class:`multiprocessing.Pool`
            for details.
        initargs (None or tuple): Refer to :class:`multiprocessing.Pool` for
            details.
        chunksize (int): Refer to :class:`multiprocessing.Pool` for details.
        bar_width (int): Width of progress bar.
        skip_first (bool): Whether to skip the first sample for each worker
            when estimating fps, since the initialization step may take
            longer.
        keep_order (bool): If True, :func:`Pool.imap` is used, otherwise
            :func:`Pool.imap_unordered` is used.
        file: Stream the progress bar is written to.

    Returns:
        list: The task results.

    Raises:
        TypeError: If ``tasks`` is neither an iterable nor a tuple.
    """
    if isinstance(tasks, tuple):
        assert len(tasks) == 2
        assert isinstance(tasks[0], Iterable)
        assert isinstance(tasks[1], int)
        tasks, task_num = tasks
    elif isinstance(tasks, Iterable):
        try:
            task_num = len(tasks)
        except TypeError:
            # Unsized iterable (generator, iterator, ...): 0 makes the
            # progress bar fall back to its unknown-total display.
            task_num = 0
    else:
        raise TypeError(
            '"tasks" must be an iterable object or a (iterator, int) tuple')

    # Number of leading results excluded from the progress statistics when
    # ``skip_first`` is set (one chunk per worker).
    warmup = nproc * chunksize
    if skip_first:
        task_num -= warmup

    pool = init_pool(nproc, initializer, initargs)
    try:
        # With ``skip_first`` the bar (and its timer) is started later, once
        # the warm-up results have arrived.
        prog_bar = ProgressBar(task_num, bar_width, not skip_first, file=file)
        if keep_order:
            gen = pool.imap(func, tasks, chunksize)
        else:
            gen = pool.imap_unordered(func, tasks, chunksize)
        results = []
        for result in gen:
            results.append(result)
            if skip_first:
                if len(results) < warmup:
                    continue
                if len(results) == warmup:
                    prog_bar.start()
                    continue
            prog_bar.update()
        # Finish the progress line, which was redrawn in place.
        prog_bar.file.write('\n')
        pool.close()
    except BaseException:
        # A task raised or the run was interrupted: stop the workers right
        # away so they are not left running, then propagate the error.
        pool.terminate()
        raise
    finally:
        # Valid on both paths, since close() or terminate() was called.
        pool.join()
    return results
|
|
|
|
|
def track_iter_progress(tasks, bar_width=50, file=sys.stdout):
    """Track the progress of tasks iteration or enumeration with a progress
    bar.

    Tasks are yielded with a simple for-loop; the bar advances by one each
    time the consumer asks for the next task.

    Args:
        tasks (Iterable or tuple[Iterable, int]): An iterable of tasks or
            (tasks, total num). If a bare iterable has no length (e.g. a
            generator), the total is treated as unknown and only a
            running counter is shown.
        bar_width (int): Width of progress bar.
        file: Stream the progress bar is written to.

    Yields:
        object: Each task from ``tasks``, unchanged and in order.

    Raises:
        TypeError: If ``tasks`` is neither an iterable nor a tuple.
    """
    if isinstance(tasks, tuple):
        assert len(tasks) == 2
        assert isinstance(tasks[0], Iterable)
        assert isinstance(tasks[1], int)
        tasks, task_num = tasks
    elif isinstance(tasks, Iterable):
        try:
            task_num = len(tasks)
        except TypeError:
            # Unsized iterable (generator, iterator, ...): 0 makes the
            # progress bar fall back to its unknown-total display.
            task_num = 0
    else:
        raise TypeError(
            '"tasks" must be an iterable object or a (iterator, int) tuple')
    prog_bar = ProgressBar(task_num, bar_width, file=file)
    for task in tasks:
        yield task
        # Runs when the consumer resumes the generator, i.e. after it has
        # finished handling ``task``.
        prog_bar.update()
    # Finish the progress line, which was redrawn in place.
    prog_bar.file.write('\n')
|
|