in optimum/quanto/nn/qmodule.py [0:0]
def _save_to_state_dict(self, destination, prefix, keep_vars):
if self.weight_qtype is None or not self.frozen:
# Save standard weight Tensor
destination[prefix + "weight"] = (
self.weight if (self.weight is None or keep_vars) else self.weight.detach()
)
else:
# Save QTensor using dedicated method
self.weight.save_to_state_dict(destination, prefix + "weight.", keep_vars)
if self.bias is not None:
destination[prefix + "bias"] = self.bias if keep_vars else self.bias.detach()
destination[prefix + "input_scale"] = self.input_scale if keep_vars else self.input_scale.detach()
destination[prefix + "output_scale"] = self.output_scale if keep_vars else self.output_scale.detach()