Spaces:

LINC-BIT
/

EdgeTA

Running

App Files Files Community

EdgeTA / utils /dl /common /model.py

LINC-BIT

Upload 1912 files

b84549f verified 12 months ago

raw

history blame contribute delete

21.1 kB

	import enum
	import time
	from typing import List, Tuple, Type
	import torch
	import warnings
	import os
	import thop

	from ...common.others import get_cur_time_str


	class ModelSaveMethod(enum.Enum):
	"""
	- WEIGHT: save model by `torch.save(model.state_dict(), ...)`
	- FULL: save model by `torch.save(model, ...)`
	- JIT: convert model to JIT format and save it by `torch.jit.save(jit_model, ...)`
	"""
	WEIGHT = 0
	FULL = 1
	JIT = 2


	def save_model(model: torch.nn.Module,
	model_file_path: str,
	save_method: ModelSaveMethod,
	model_input_size: Tuple[int]=None):
	"""Save a PyTorch model.

	Args:
	model (torch.nn.Module): A PyTorch model.
	model_file_path (str): Target model file path.
	save_method (ModelSaveMethod): The method to save model.
	model_input_size (Tuple[int], optional): \
	This is required if :attr:`save_method` is :attr:`ModelSaveMethod.JIT`. \
	Typically be `(1, 3, 32, 32)` or `(1, 3, 224, 224)`. \
	Defaults to None.
	"""

	model.eval()
	if save_method == ModelSaveMethod.WEIGHT:
	torch.save(model.state_dict(), model_file_path)

	elif save_method == ModelSaveMethod.FULL:
	with warnings.catch_warnings():
	warnings.simplefilter("ignore")
	torch.save(model, model_file_path)

	elif save_method == ModelSaveMethod.JIT:
	assert model_input_size is not None
	dummy_input = torch.ones(model_input_size, device=get_model_device(model))
	new_model = torch.jit.trace(model, dummy_input, check_trace=False)
	torch.jit.save(new_model, model_file_path)


	def get_model_size(model: torch.nn.Module, return_MB=False):
	"""Get size of a PyTorch model (default in Byte).

	Args:
	model (torch.nn.Module): A PyTorch model.
	return_MB (bool, optional): Return result in MB (/= 1024**2). Defaults to False.

	Returns:
	int: Model size.
	"""
	pid = os.getpid()
	tmp_model_file_path = './tmp-get-model-size-{}-{}.model'.format(pid, get_cur_time_str())
	save_model(model, tmp_model_file_path, ModelSaveMethod.WEIGHT)

	model_size = os.path.getsize(tmp_model_file_path)
	os.remove(tmp_model_file_path)

	if return_MB:
	model_size /= 1024**2

	return model_size


	def get_model_device(model: torch.nn.Module):
	"""Get device of a PyTorch model.

	Args:
	model (torch.nn.Module): A PyTorch model.

	Returns:
	str: The device of :attr:`model` ('cpu' or 'cuda:x').
	"""
	return list(model.parameters())[0].device


	def get_model_latency(model: torch.nn.Module, model_input_size: Tuple[int], sample_num: int,
	device: str, warmup_sample_num: int, return_detail=False):
	"""Get the latency (inference time) of a PyTorch model.

	Reference: https://deci.ai/resources/blog/measure-inference-time-deep-neural-networks/

	Args:
	model (torch.nn.Module): A PyTorch model.
	model_input_size (Tuple[int]): Typically be `(1, 3, 32, 32)` or `(1, 3, 224, 224)`.
	sample_num (int): How many inputs which size is :attr:`model_input_size` will be tested and compute the average latency as result.
	device (str): Typically be 'cpu' or 'cuda'.
	warmup_sample_num (int): Let model perform some dummy inference to warm up the test environment to avoid measurement loss.
	return_detail (bool, optional): Beside the average latency, return all result measured. Defaults to False.

	Returns:
	Union[float, Tuple[float, List[float]]]: The average latency (and all lantecy data) of :attr:`model`.
	"""
	if isinstance(model_input_size, tuple):
	dummy_input = torch.rand(model_input_size).to(device)
	else:
	dummy_input = model_input_size

	model = model.to(device)
	model.eval()

	# warm up
	with torch.no_grad():
	for _ in range(warmup_sample_num):
	model(dummy_input)

	infer_time_list = []

	if device == 'cuda' or 'cuda' in str(device):
	with torch.no_grad():
	for _ in range(sample_num):
	s, e = torch.cuda.Event(enable_timing=True), torch.cuda.Event(enable_timing=True)
	s.record()
	model(dummy_input)
	e.record()
	torch.cuda.synchronize()
	cur_model_infer_time = s.elapsed_time(e) / 1000.
	infer_time_list += [cur_model_infer_time]

	else:
	with torch.no_grad():
	for _ in range(sample_num):
	start = time.time()
	model(dummy_input)
	cur_model_infer_time = time.time() - start
	infer_time_list += [cur_model_infer_time]

	avg_infer_time = sum(infer_time_list) / sample_num

	if return_detail:
	return avg_infer_time, infer_time_list
	return avg_infer_time


	def get_model_flops_and_params(model: torch.nn.Module, model_input_size: Tuple[int], return_M=False):
	"""Get FLOPs and number of parameters of a PyTorch model.

	Args:
	model (torch.nn.Module): A PyTorch model.
	model_input_size (Tuple[int]): Typically be `(1, 3, 32, 32)` or `(1, 3, 224, 224)`.

	Returns:
	Tuple[float, float]: FLOPs and number of parameters of :attr:`model`.
	"""
	device = get_model_device(model)
	ops, param = thop.profile(model, (torch.ones(model_input_size).to(device), ), verbose=False)
	ops, param = ops * 2, param
	if return_M:
	ops, param = ops / 1e6, param / 1e6
	return ops, param


	def get_module(model: torch.nn.Module, module_name: str):
	"""Get a module from a PyTorch model.

	Example:
	>>> from torchvision.models import resnet18
	>>> model = resnet18()
	>>> get_module(model, 'layer1.0')
	BasicBlock(
	(conv1): Conv2d(64, 64, kernel_size=(3, 3), stride=(1, 1), padding=(1, 1), bias=False)
	(bn1): BatchNorm2d(64, eps=1e-05, momentum=0.1, affine=True, track_running_stats=True)
	(relu): ReLU(inplace=True)
	(conv2): Conv2d(64, 64, kernel_size=(3, 3), stride=(1, 1), padding=(1, 1), bias=False)
	(bn2): BatchNorm2d(64, eps=1e-05, momentum=0.1, affine=True, track_running_stats=True)
	)

	Args:
	model (torch.nn.Module): A PyTorch model.
	module_name (str): Module name.

	Returns:
	torch.nn.Module: Corrsponding module.
	"""
	for name, module in model.named_modules():
	if name == module_name:
	return module

	return None


	def get_parameter(model: torch.nn.Module, param_name: str):
	return getattr(
	get_module(model, '.'.join(param_name.split('.')[0: -1])),
	param_name.split('.')[-1]
	)


	def get_super_module(model: torch.nn.Module, module_name: str):
	"""Get the super module of a module in a PyTorch model.

	Example:
	>>> from torchvision.models import resnet18
	>>> model = resnet18()
	>>> get_super_module(model, 'layer1.0.conv1')
	BasicBlock(
	(conv1): Conv2d(64, 64, kernel_size=(3, 3), stride=(1, 1), padding=(1, 1), bias=False)
	(bn1): BatchNorm2d(64, eps=1e-05, momentum=0.1, affine=True, track_running_stats=True)
	(relu): ReLU(inplace=True)
	(conv2): Conv2d(64, 64, kernel_size=(3, 3), stride=(1, 1), padding=(1, 1), bias=False)
	(bn2): BatchNorm2d(64, eps=1e-05, momentum=0.1, affine=True, track_running_stats=True)
	)

	Args:
	model (torch.nn.Module): A PyTorch model.
	module_name (str): Module name.

	Returns:
	torch.nn.Module: Super module of module :attr:`module_name`.
	"""
	super_module_name = '.'.join(module_name.split('.')[0:-1])
	return get_module(model, super_module_name)


	def set_module(model: torch.nn.Module, module_name: str, module: torch.nn.Module):
	"""Set module in a PyTorch model.

	Example:
	>>> from torchvision.models import resnet18
	>>> model = resnet18()
	>>> set_module(model, 'layer1.0', torch.nn.Conv2d(64, 64, 3))
	>>> model
	ResNet(
	(conv1): Conv2d(3, 64, kernel_size=(7, 7), stride=(2, 2), padding=(3, 3), bias=False)
	(bn1): BatchNorm2d(64, eps=1e-05, momentum=0.1, affine=True, track_running_stats=True)
	(relu): ReLU(inplace=True)
	(maxpool): MaxPool2d(kernel_size=3, stride=2, padding=1, dilation=1, ceil_mode=False)
	(layer1): Sequential(
	--> (0): Conv2d(64, 64, kernel_size=(3, 3), stride=(1, 1), padding=(1, 1), bias=False)
	(1): BasicBlock(
	...
	)
	...
	)
	...
	)

	Args:
	model (torch.nn.Module): A PyTorch model.
	module_name (str): Module name.
	module (torch.nn.Module): Target module which will be set into :attr:`model`.
	"""
	super_module = get_super_module(model, module_name)
	setattr(super_module, module_name.split('.')[-1], module)


	def get_ith_layer(model: torch.nn.Module, i: int):
	"""Get i-th layer in a PyTorch model.

	Example:
	>>> from torchvision.models import vgg16
	>>> model = vgg16()
	>>> get_ith_layer(model, 5)
	Conv2d(64, 128, kernel_size=(3, 3), stride=(1, 1), padding=(1, 1))

	Args:
	model (torch.nn.Module): A PyTorch model.
	i (int): Index of target layer.

	Returns:
	torch.nn.Module: i-th layer in :attr:`model`.
	"""
	j = 0
	for module in model.modules():
	if len(list(module.children())) > 0:
	continue
	if j == i:
	return module
	j += 1
	return None


	def get_ith_layer_name(model: torch.nn.Module, i: int):
	"""Get the name of i-th layer in a PyTorch model.

	Example:
	>>> from torchvision.models import vgg16
	>>> model = vgg16()
	>>> get_ith_layer_name(model, 5)
	'features.5'

	Args:
	model (torch.nn.Module): A PyTorch model.
	i (int): Index of target layer.

	Returns:
	str: The name of i-th layer in :attr:`model`.
	"""
	j = 0
	for name, module in model.named_modules():
	if len(list(module.children())) > 0:
	continue
	if j == i:
	return name
	j += 1
	return None


	def set_ith_layer(model: torch.nn.Module, i: int, layer: torch.nn.Module):
	"""Set i-th layer in a PyTorch model.

	Example:
	>>> from torchvision.models import vgg16
	>>> model = vgg16()
	>>> model
	VGG(
	(features): Sequential(
	(0): Conv2d(3, 64, kernel_size=(3, 3), stride=(1, 1), padding=(1, 1))
	(1): ReLU(inplace=True)
	(2): Conv2d(64, 64, kernel_size=(3, 3), stride=(1, 1), padding=(1, 1))
	...
	)
	...
	)
	>>> set_ith_layer(model, 2, torch.nn.Conv2d(64, 128, 3))
	VGG(
	(features): Sequential(
	(0): Conv2d(3, 64, kernel_size=(3, 3), stride=(1, 1), padding=(1, 1))
	(1): ReLU(inplace=True)
	--> (2): Conv2d(64, 128, kernel_size=(3, 3), stride=(1, 1), padding=(1, 1))
	...
	)
	...
	)

	Args:
	model (torch.nn.Module): A PyTorch model.
	i (int): Index of target layer.
	layer (torch.nn.Module): The layer which will be set into :attr:`model`.
	"""
	j = 0
	for name, module in model.named_modules():
	if len(list(module.children())) > 0:
	continue
	if j == i:
	set_module(model, name, layer)
	return
	j += 1


	def get_all_specific_type_layers_name(model: torch.nn.Module, types: Tuple[Type[torch.nn.Module]]):
	"""Get names of all layers which are give types in a PyTorch model. (e.g. `Conv2d`, `Linear`)

	Example:
	>>> from torchvision.models import vgg16
	>>> model = vgg16()
	>>> get_all_specific_type_layers_name(model, (torch.nn.Conv2d))
	['features.0', 'features.2', 'features.5', ...]

	Args:
	model (torch.nn.Module): A PyTorch model.
	types (Tuple[Type[torch.nn.Module]]): Target types, e.g. `(e.g. torch.nn.Conv2d, torch.nn.Linear)`

	Returns:
	List[str]: Names of all layers which are give types.
	"""
	res = []
	for name, m in model.named_modules():
	if isinstance(m, types):
	res += [name]
	return res


	class LayerActivation:
	"""Collect the input and output of a middle module of a PyTorch model during inference.

	Layer is a wide concept in this class. A module (e.g. ResBlock in ResNet) can be also regarded as a "layer".

	Example:
	>>> from torchvision.models import vgg16
	>>> model = vgg16()
	>>> # collect the input and output of 5th layer in VGG16
	>>> layer_activation = LayerActivation(get_ith_layer(model, 5), 'cuda')
	>>> model(torch.rand((1, 3, 224, 224)))
	>>> layer_activation.input
	tensor([[...]])
	>>> layer_activation.output
	tensor([[...]])
	>>> layer_activation.remove()
	"""
	def __init__(self, layer: torch.nn.Module, detach: bool, device: str):
	"""Register forward hook on corresponding layer.

	Args:
	layer (torch.nn.Module): Target layer.
	device (str): Where the collected data is located.
	"""
	self.hook = layer.register_forward_hook(self._hook_fn)
	self.detach = detach
	self.device = device
	self.input: torch.Tensor = None
	self.output: torch.Tensor = None
	self.layer = layer

	def __str__(self):
	return '- ' + str(self.layer)

	def _hook_fn(self, module, input, output):
	# TODO: input or output may be a tuple
	if isinstance(input, tuple):
	self.input = input[0].to(self.device)
	else:
	self.input = input.to(self.device)

	if isinstance(output, tuple):
	self.output = output[0].to(self.device)
	else:
	self.output = output.to(self.device)

	if self.detach:
	self.input = self.input.detach()
	self.output = self.output.detach()

	def remove(self):
	"""Remove the hook in the model to avoid performance effect.
	Use this after using the collected data.
	"""
	self.hook.remove()


	class LayerActivation2:
	"""Collect the input and output of a middle module of a PyTorch model during inference.

	Layer is a wide concept in this class. A module (e.g. ResBlock in ResNet) can be also regarded as a "layer".

	Example:
	>>> from torchvision.models import vgg16
	>>> model = vgg16()
	>>> # collect the input and output of 5th layer in VGG16
	>>> layer_activation = LayerActivation(get_ith_layer(model, 5), 'cuda')
	>>> model(torch.rand((1, 3, 224, 224)))
	>>> layer_activation.input
	tensor([[...]])
	>>> layer_activation.output
	tensor([[...]])
	>>> layer_activation.remove()
	"""
	def __init__(self, layer: torch.nn.Module):
	"""Register forward hook on corresponding layer.

	Args:
	layer (torch.nn.Module): Target layer.
	device (str): Where the collected data is located.
	"""
	assert layer is not None

	self.hook = layer.register_forward_hook(self._hook_fn)
	self.input: torch.Tensor = None
	self.output: torch.Tensor = None
	self.layer = layer

	def __str__(self):
	return '- ' + str(self.layer)

	def _hook_fn(self, module, input, output):
	self.input = input
	self.output = output

	def remove(self):
	"""Remove the hook in the model to avoid performance effect.
	Use this after using the collected data.
	"""
	self.hook.remove()

	class LayerActivation3:
	"""Collect the input and output of a middle module of a PyTorch model during inference.

	Layer is a wide concept in this class. A module (e.g. ResBlock in ResNet) can be also regarded as a "layer".

	Example:
	>>> from torchvision.models import vgg16
	>>> model = vgg16()
	>>> # collect the input and output of 5th layer in VGG16
	>>> layer_activation = LayerActivation(get_ith_layer(model, 5), 'cuda')
	>>> model(torch.rand((1, 3, 224, 224)))
	>>> layer_activation.input
	tensor([[...]])
	>>> layer_activation.output
	tensor([[...]])
	>>> layer_activation.remove()
	"""
	def __init__(self, layer: torch.nn.Module, detach: bool, device: str):
	"""Register forward hook on corresponding layer.

	Args:
	layer (torch.nn.Module): Target layer.
	device (str): Where the collected data is located.
	"""
	self.hook = layer.register_forward_hook(self._hook_fn)
	self.detach = detach
	self.device = device
	self.input: torch.Tensor = None
	self.output: torch.Tensor = None
	self.layer = layer

	def __str__(self):
	return '- ' + str(self.layer)

	def _hook_fn(self, module, input, output):
	# TODO: input or output may be a tuple
	self.input = input
	self.output = output

	# if self.detach:
	# self.input = self.input.detach()
	# self.output = self.output.detach()

	def remove(self):
	"""Remove the hook in the model to avoid performance effect.
	Use this after using the collected data.
	"""
	self.hook.remove()

	class LayerActivationWrapper:
	"""A wrapper of :attr:`LayerActivation` which has the same API, but broaden the concept "layer".
	Now a series of layers can be regarded as "hyper-layer" in this class.

	Example:
	>>> from torchvision.models import vgg16
	>>> model = vgg16()
	>>> # collect the input of 5th layer, and output of 7th layer in VGG16
	>>> # i.e. regard 5th~7th layer as a whole module,
	>>> # and collect the input and output of this module
	>>> layer_activation = LayerActivationWrapper([
	LayerActivation(get_ith_layer(model, 5), 'cuda'),
	LayerActivation(get_ith_layer(model, 6), 'cuda')
	LayerActivation(get_ith_layer(model, 7), 'cuda')
	])
	>>> model(torch.rand((1, 3, 224, 224)))
	>>> layer_activation.input
	tensor([[...]])
	>>> layer_activation.output
	tensor([[...]])
	>>> layer_activation.remove()
	"""
	def __init__(self, las: List[LayerActivation]):
	"""
	Args:
	las (List[LayerActivation]): The layer activations of a series of layers.
	"""
	self.las = las

	def __str__(self):
	return '\n'.join([str(la) for la in self.las])

	@property
	def input(self):
	"""Get the collected input data of first layer.

	Returns:
	torch.Tensor: Collected input data of first layer.
	"""
	return self.las[0].input

	@property
	def output(self):
	"""Get the collected input data of last layer.

	Returns:
	torch.Tensor: Collected input data of last layer.
	"""
	return self.las[-1].output

	def remove(self):
	"""Remove all hooks in the model to avoid performance effect.
	Use this after using the collected data.
	"""
	[la.remove() for la in self.las]


	class TimeProfiler:
	""" (NOT VERIFIED. DON'T USE ME)
	"""
	def __init__(self, layer: torch.nn, device):
	self.before_infer_hook = layer.register_forward_pre_hook(self.before_hook_fn)
	self.after_infer_hook = layer.register_forward_hook(self.after_hook_fn)

	self.device = device
	self.infer_time = None
	self._start_time = None

	if self.device != 'cpu':
	self.s, self.e = torch.cuda.Event(enable_timing=True), torch.cuda.Event(enable_timing=True)

	def before_hook_fn(self, module, input):
	if self.device == 'cpu':
	self._start_time = time.time()
	else:
	self.s.record()

	def after_hook_fn(self, module, input, output):
	if self.device == 'cpu':
	self.infer_time = time.time() - self._start_time
	else:
	self.e.record()
	torch.cuda.synchronize()
	self.infer_time = self.s.elapsed_time(self.e) / 1000.

	def remove(self):
	self.before_infer_hook.remove()
	self.after_infer_hook.remove()


	class TimeProfilerWrapper:
	""" (NOT VERIFIED. DON'T USE ME)
	"""
	def __init__(self, tps: List[TimeProfiler]):
	self.tps = tps

	@property
	def infer_time(self):
	return sum([tp.infer_time for tp in self.tps])

	def remove(self):
	[tp.remove() for tp in self.tps]