per-tensor quantize/dequantize benchmarking
Summary: Pull Request resolved: https://github.com/pytorch/pytorch/pull/29506
Test Plan: Imported from OSS
Differential Revision: D18415017
Pulled By: z-a-f
fbshipit-source-id: 92a50706aafabdcaa79dd1f226f7f4ac63606c74

commit: 5b43becfc5159668c2a46352f8f7b36b31719682 [log] [tgz]
author: Zafar Takhirov <cc.rafaz@zafar.cc> Mon Nov 11 13:14:56 2019 -0800
committer: Facebook Github Bot <facebook-github-bot@users.noreply.github.com> Mon Nov 11 13:19:46 2019 -0800
tree: 7fb090f35ae252498f7274e39697582c0076d771
parent: c49b324cbf17272d02f3811f517fe82106ce77d4 [diff]
diff --git a/benchmarks/operator_benchmark/pt/quantization_test.py b/benchmarks/operator_benchmark/pt/quantization_test.py
new file mode 100644
index 0000000..4f3b7d9
--- /dev/null
+++ b/benchmarks/operator_benchmark/pt/quantization_test.py

@@ -0,0 +1,56 @@
+from __future__ import absolute_import
+from __future__ import division
+from __future__ import print_function
+from __future__ import unicode_literals
+
+
+import operator_benchmark as op_bench
+import torch
+import torch.nn.quantized as nnq
+
+
+"""Microbenchmarks for general quantization operations."""
+
+quantize_configs_short = op_bench.config_list(
+    # 'mode' selects the direction of the benchmark:
+    # 'Q' benchmarks quantization, 'D' benchmarks dequantization.
+    attr_names=['C', 'M', 'N', 'dtype', 'mode'],
+    attrs=[
+        [3, 512, 512, torch.quint8, 'Q'],  # quantize a (3, 512, 512) input
+        [3, 512, 512, torch.quint8, 'D'],  # dequantize the same shape
+    ],
+    tags=['short']
+)
+
+quantize_configs_long = op_bench.cross_product_configs(
+    C=[1, 3, 8],  # first dimension of the random input tensor
+    M=[256, 1024],  # second dimension of the input
+    N=[256, 1024],  # third dimension of the input
+    dtype=[torch.quint8, torch.qint8, torch.qint32],  # dtype handed to nnq.Quantize
+    mode=['D', 'Q'],  # 'Q' benchmarks quantization, 'D' dequantization
+    tags=['long']
+)
+
+class QuantizePerTensorBenchmark(op_bench.TorchBenchmarkBase):
+    r"""Benchmarks nnq.Quantize (mode 'Q') or nnq.DeQuantize (mode 'D') on a random (C, M, N) tensor."""
+    def init(self, C, M, N, dtype, mode):
+        assert mode in ('Q', 'D'), "mode must be 'Q' or 'D'"
+        self.input = torch.rand(C, M, N)  # float input of shape (C, M, N)
+        self.dtype = dtype
+        self.op = nnq.Quantize(scale=1.0, zero_point=0, dtype=dtype)
+        self.set_module_name('quantize_per_tensor')
+
+        if mode == 'D':  # dequantization: swap in a pre-quantized input and the inverse op
+            self.input = self.op(self.input)  # quantized once here, not inside forward()
+            self.op = nnq.DeQuantize()
+            self.set_module_name('dequantize_per_tensor')
+
+    def forward(self):
+        return self.op(self.input)  # apply the op chosen in init() to the prepared input
+
+
+op_bench.generate_pt_test(quantize_configs_short + quantize_configs_long,  # short and long configs combined
+                          QuantizePerTensorBenchmark)
+
+if __name__ == "__main__":  # run the benchmarks only when executed as a script
+    op_bench.benchmark_runner.main()
commit	5b43becfc5159668c2a46352f8f7b36b31719682	[log] [tgz]
author	Zafar Takhirov <cc.rafaz@zafar.cc>	Mon Nov 11 13:14:56 2019 -0800
committer	Facebook Github Bot <facebook-github-bot@users.noreply.github.com>	Mon Nov 11 13:19:46 2019 -0800
tree	7fb090f35ae252498f7274e39697582c0076d771
parent	c49b324cbf17272d02f3811f517fe82106ce77d4 [diff]