# tinynn/prune/base_pruner.py
import collections
import typing
from abc import ABC, abstractmethod
from inspect import getsource
from pprint import pformat
import torch
import torch.distributed as dist
import torch.nn as nn
from torch.nn.parallel.data_parallel import DataParallel
from torch.nn.parallel.distributed import DistributedDataParallel
from tinynn.graph.modifier import is_dw_conv
from tinynn.graph.tracer import TraceGraph, trace
from tinynn.util.train_util import DLContext, get_module_device
from tinynn.util.util import conditional, get_actual_type, get_logger
try:
import ruamel_yaml as yaml
except ModuleNotFoundError:
import ruamel.yaml as yaml
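# Newer ruamel.yaml releases deprecate the module-level `yaml.load`/`yaml.dump`
# in favour of `yaml.YAML()` instances; their `load` source mentions
# `error_deprecation`, which the flag below uses to pick the right API at runtime.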
NEW_YAML_FLAG = "error_deprecation" in getsource(yaml.load)
log = get_logger(__name__)
class BasePruner(ABC):
    # Declarative hooks that subclasses override to drive `parse_config` and
    # `parse_context`:
    required_params = ()  # config keys that must be present
    required_context_params = ()  # DLContext attributes that must be set
    default_values = {}  # fallback values for optional config keys
    context_from_params_dict = {}  # context attribute -> candidate config keys
    condition_dict = {}  # config key -> predicate the value must satisfy
model: nn.Module
dummy_input: torch.Tensor
config: typing.Union[dict, collections.OrderedDict]
graph: TraceGraph
context: DLContext
def __init__(self, model, dummy_input, config):
self.model = model
self.config = config
self.dummy_input = dummy_input
self.graph = self.trace()
@abstractmethod
def prune(self):
"""The main function for pruning"""
pass
@abstractmethod
def register_mask(self):
"""Computes the mask for the parameters in the model and register them through the maskers"""
pass
@abstractmethod
def apply_mask(self):
"""Applies the masks for the parameters and updates the shape and properties of the tensors and modules"""
pass
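    # A concrete pruner is expected to implement `prune` roughly as
    # "compute masks, then apply them" -- e.g. call `register_mask()` followed
    # by `apply_mask()` -- though the exact sequence is left to the subclass.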
def parse_config(self):
"""Parses the config and init the parameters of the pruner"""
if isinstance(self.config, str):
self.config = self.load_config(self.config)
        if not isinstance(self.config, dict):
            raise Exception('The `config` argument expects a parsed mapping (e.g. dict or OrderedDict) or a path to a YAML config file')
missing_params = set(self.required_params) - set(self.config)
if len(missing_params) != 0:
missing_params_str = ', '.join(missing_params)
            raise Exception(f'Missing required param(s) {missing_params_str} for {type(self).__name__}')
for param_key, default_value in self.default_values.items():
if param_key not in self.config:
self.config[param_key] = default_value
        # Collect type annotations from every subclass in the MRO (BasePruner's
        # own annotations are skipped) to type-check the config values below.
        type_dict = {}
        for cls in reversed(type(self).__mro__):
            if hasattr(cls, '__annotations__') and cls != BasePruner:
                type_dict.update(cls.__annotations__)
for param_key, param_type in type_dict.items():
if param_key not in self.config:
continue
type_expected = False
param_types = get_actual_type(param_type)
for type_cand in param_types:
if isinstance(self.config[param_key], type_cand):
type_expected = True
break
if not type_expected:
raise Exception(f'The type of `{param_key}` in {type(self).__name__} should be {param_type}')
        # Validate config values against the predicates declared by the subclass;
        # keys absent from the config are skipped rather than raising a KeyError.
        for param_key, predicate in self.condition_dict.items():
            if param_key in self.config and predicate(self.config[param_key]) is False:
                raise Exception(f'The value of `{param_key}` doesn\'t meet the requirement: {getsource(predicate)}')
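    # A minimal sketch of how a subclass would feed `parse_config` (the class
    # name `L1Pruner` and the keys `sparsity`/`metrics` are illustrative only):
    #
    #     class L1Pruner(BasePruner):
    #         required_params = ('sparsity',)
    #         default_values = {'metrics': 'l1_norm'}
    #         condition_dict = {'sparsity': lambda x: 0.0 < x < 1.0}
    #         sparsity: float
    #         metrics: str
    #
    # `parse_config` then checks that `sparsity` is present, fills in `metrics`,
    # type-checks both against the annotations, and validates the predicate.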
    def parse_context(self, context: DLContext):
        """Parses the context and copies the needed items to the pruner"""
        # Copy selected config values into the context; for each context
        # attribute, the first matching config key wins.
        for context_key, param_keys in self.context_from_params_dict.items():
            for param_key in param_keys:
                if param_key in self.config:
                    setattr(context, context_key, self.config[param_key])
                    break
        # Treat only `None` as "unset" so that legitimate falsy values
        # (e.g. 0) are not reported as missing.
        filtered_context = dict(filter(lambda x: x[1] is not None, context.__dict__.items()))
missing_context_items = list(set(self.required_context_params) - set(filtered_context))
if len(missing_context_items) != 0:
missing_context_items_str = ', '.join(missing_context_items)
raise Exception(f'Missing context items {missing_context_items_str} for {type(self).__name__}')
self.context = context
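    # For example (hypothetical keys), `context_from_params_dict =
    # {'max_epoch': ('num_epoch', 'epochs')}` would copy the first of
    # `num_epoch`/`epochs` found in the config into `context.max_epoch`
    # before the required-items check runs.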
def summary(self):
"""Dumps the parameters and possibly the related context items of the pruner"""
if len(self.required_params) > 0:
log.info('-' * 80)
log.info(f'params ({type(self).__name__}):')
for k, v in self.__dict__.items():
if k in self.required_params or k in self.default_values:
log.info(f'{k}: {pformat(v)}')
if len(self.required_context_params) > 0:
log.info('-' * 80)
log.info(f'context ({type(self).__name__}):')
log.info('\n'.join((f'{k}: {pformat(v)}' for k, v in self.context.__dict__.items())))
@classmethod
def load_config(cls, path: str) -> dict:
"""Loads the configuration file and returns it as a dictionary"""
with open(path, 'r') as f:
if NEW_YAML_FLAG:
yaml_ = yaml.YAML(typ='rt')
config = yaml_.load(f)
else:
config = yaml.load(f, Loader=yaml.RoundTripLoader)
return config
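    # The round-trip (`rt`) loader preserves comments and key order in the YAML
    # file, so a config written back by `generate_config` keeps the user's
    # annotations. The `conditional` decorator below also makes
    # `generate_config` a no-op on all but rank 0 when torch.distributed is
    # initialized, avoiding concurrent writes to the same file.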
@conditional(lambda: not dist.is_available() or not dist.is_initialized() or dist.get_rank() == 0)
def generate_config(self, path: str, config: dict = None) -> None:
"""Generates a new copy the updated configuration with the given path"""
if config is None:
config = self.config
with open(path, 'w') as f:
if NEW_YAML_FLAG:
yaml_ = yaml.YAML(typ='rt')
yaml_.default_flow_style = False
yaml_.dump(config, f)
else:
yaml.dump(config, f, default_flow_style=False, Dumper=yaml.RoundTripDumper)
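    # A minimal usage sketch (the key `sparsity` and the file name are
    # illustrative only):
    #
    #     pruner.config['sparsity'] = 0.75
    #     pruner.generate_config('pruned_config.yml')  # written on rank 0 only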
    def trace(self) -> TraceGraph:
        with torch.no_grad():
            # Unwrap (Distributed)DataParallel so the underlying module is traced.
            if isinstance(self.model, (DataParallel, DistributedDataParallel)):
                model = self.model.module
            else:
                model = self.model
            # Trace on CPU so the parameters and the dummy input live on the
            # same device, then restore the model to its original device.
            old_device = get_module_device(model)
            model.cpu()
            graph = trace(model, self.dummy_input)
            if old_device is not None:
                model.to(device=old_device)
            return graph
def reset(self):
"""Regenerate the TraceGraph when it is invalidated"""
self.graph = self.trace()
    def calc_flops(self) -> int:
        """Calculates the FLOPs of the model, taking channels already scheduled for removal into account"""
# If graph is invalidated, then we need to regenerate the graph
if not self.graph.inited:
self.reset()
graph: TraceGraph = self.graph
total_ops = 0
for node in graph.forward_nodes:
m = node.module
            # Maskers record the input/output channel indices scheduled for
            # removal ("ot" = output), so the counts below reflect the
            # post-pruning shapes.
            remove_in_channel_count = 0
            remove_out_channel_count = 0
            if hasattr(m, 'masker'):
                if m.masker.in_remove_idx is not None:
                    remove_in_channel_count = len(m.masker.in_remove_idx)
                if m.masker.ot_remove_idx is not None:
                    remove_out_channel_count = len(m.masker.ot_remove_idx)
            if type(m) in (nn.Conv2d, nn.ConvTranspose2d):
                # Per output element: (in_channels / groups) * kH * kW
                # multiply-accumulates, plus one op if there is a bias.
                kernel_ops = m.weight.shape[2:].numel()  # kH * kW
                bias_ops = 1 if m.bias is not None else 0
                in_channels = m.in_channels - remove_in_channel_count
                out_channels = m.out_channels - remove_out_channel_count
                out_elements = node.next_tensors[0].nelement() // m.out_channels * out_channels
                # A depthwise conv stays depthwise after pruning, so its group
                # count follows the surviving channel count.
                if is_dw_conv(m):
                    groups = in_channels
                else:
                    groups = m.groups
                total_ops += out_elements * (in_channels // groups * kernel_ops + bias_ops)
            elif type(m) in (nn.BatchNorm2d,):
                # Two ops per surviving element: one multiply (scale) and one
                # add (shift), with the statistics folded in at inference time.
                channels = m.num_features - remove_in_channel_count
                nelements = node.prev_tensors[0].numel() // m.num_features * channels
                total_ops += 2 * nelements
            elif type(m) in (nn.AvgPool2d, nn.AdaptiveAvgPool2d, nn.ReLU):
                # Element-wise ops: count one operation per surviving element.
                # (The pooling and ReLU branches were identical, so they share
                # one branch here.)
                channels = node.prev_tensors[0].size(1) - remove_in_channel_count
                kernel_ops = 1
                num_elements = node.prev_tensors[0].numel() // node.prev_tensors[0].size(1) * channels
                total_ops += kernel_ops * num_elements
            elif type(m) in (nn.Linear,):
                # Per output element: one multiply-accumulate per surviving
                # input feature.
                in_channels = m.in_features - remove_in_channel_count
                out_channels = m.out_features - remove_out_channel_count
                total_mul = in_channels
                num_elements = node.next_tensors[0].numel() // m.out_features * out_channels
                total_ops += total_mul * num_elements
return total_ops
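# A minimal end-to-end sketch. `OneShotChannelPruner` is the concrete pruner
# shipped with tinynn; the import path and config keys below are illustrative
# and may differ between versions:
#
#     from tinynn.prune.oneshot_pruner import OneShotChannelPruner
#
#     model = MyModel()
#     dummy_input = torch.randn(1, 3, 224, 224)
#     pruner = OneShotChannelPruner(model, dummy_input, {'sparsity': 0.5, 'metrics': 'l2_norm'})
#     flops_before = pruner.calc_flops()
#     pruner.prune()  # computes and applies the masks
#     flops_after = pruner.calc_flops()
#     print(f'FLOPs: {flops_before} -> {flops_after}')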