from __future__ import absolute_import, division, print_function, unicode_literals
import torch
from torch.nn import Module
from .observer import default_observer
from functools import partial


class FakeQuantize(Module):
    ''' Simulate the quantize and dequantize operations at training time.

    Args:
        dtype: quantized data type to simulate, e.g. `torch.quint8`
        qscheme: quantization scheme, e.g. `torch.per_tensor_affine`
        quant_min: lower bound of the simulated quantized value range
        quant_max: upper bound of the simulated quantized value range

    Attributes:
        observer: observer module that records statistics of the tensors
            passed through `forward`
        scale, zero_point: quantization parameters computed from the
            observed statistics; `None` until `forward` has run
    '''

    def __init__(self, dtype=torch.quint8, qscheme=torch.per_tensor_affine,
                 quant_min=0, quant_max=255):
        super(FakeQuantize, self).__init__()
        assert torch.iinfo(dtype).min <= quant_min, 'quant_min out of bound'
        assert quant_min <= quant_max, \
            'quant_min must be less than or equal to quant_max'
        assert quant_max <= torch.iinfo(dtype).max, 'quant_max out of bound'
        self.dtype = dtype
        self.qscheme = qscheme
        self.quant_min = quant_min
        self.quant_max = quant_max
        self.enabled = True
        # `default_observer` returns a constructor; calling it instantiates
        # the observer module for this fake-quantize instance.
        self.observer = default_observer(dtype=dtype, qscheme=qscheme)()
        # Populated on the first `forward` call.
        self.scale = None
        self.zero_point = None

    def enable(self, enabled=True):
        self.enabled = enabled
        return self

    def disable(self):
        return self.enable(False)

    def calculate_qparams(self):
        return self.observer.calculate_qparams()

    def forward(self, X):
        if self.enabled:
            self.observer(X)
            self.scale, self.zero_point = self.calculate_qparams()
            # Convert the 0-dim qparam tensors to the Python scalars that
            # torch.fake_quantize_per_tensor_affine expects. Fake quantization
            # is skipped entirely while disabled, so the module is a
            # pass-through (scale/zero_point may still be None then).
            X = torch.fake_quantize_per_tensor_affine(
                X, float(self.scale), int(self.zero_point),
                self.quant_min, self.quant_max)
        return X
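
# Illustrative usage (a sketch, not part of the original file): assumes the
# default observer records min/max stats and that `calculate_qparams` returns
# 0-dim scale/zero_point tensors.
#
#     fq = FakeQuantize()             # quint8, per-tensor affine, [0, 255]
#     y = fq(torch.randn(4, 4))       # observe stats, then fake-quantize
#     print(fq.scale, fq.zero_point)  # qparams derived from the observed range
#     fq.disable()
#     z = fq(torch.randn(4, 4))       # pass-through while disabled
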
def fake_quant(fake_quant_cls, **kwargs):
    # Returns a constructor (a `partial`) rather than an instance, so callers
    # can create a fresh fake-quantize module per layer.
    return partial(fake_quant_cls, **kwargs)


def default_fake_quant(**kwargs):
    # Default activation fake quantize: quint8, per-tensor affine, [0, 255].
    return fake_quant(FakeQuantize, **kwargs)


def default_weight_fake_quant(**kwargs):
    # Default weight fake quantize: qint8, per-tensor symmetric, [-128, 127].
    kwargs.setdefault('dtype', torch.qint8)
    kwargs.setdefault('qscheme', torch.per_tensor_symmetric)
    kwargs.setdefault('quant_min', -128)
    kwargs.setdefault('quant_max', 127)
    return fake_quant(FakeQuantize, **kwargs)
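
# Illustrative usage (a sketch; the names below are hypothetical): the
# factories return constructors rather than instances, so a later call site
# decides when each fake-quantize module is built.
#
#     weight_fq_ctor = default_weight_fake_quant()  # partial(FakeQuantize, ...)
#     weight_fq = weight_fq_ctor()                  # qint8, symmetric, [-128, 127]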