
Commit 24c2bf5

Update on "add quantized layer norm implementation"
Summary:
Adds a quantized implementation of LayerNorm for server. Relevant PRs:
* #20345 (floating point LN)
* #33080 (quantized BN)

A future PR will add the Python wrapper.

Test Plan:
numerics match the floating point implementation

TODO: benchmarks

Reviewers:
Subscribers:
Tasks:
Tags:

[ghstack-poisoned]
1 parent bce59e9 commit 24c2bf5
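
The Test Plan above compares numerics against the floating point implementation. A minimal sketch of such a check (not part of this commit; it reuses the op signature shown in the benchmark file below, and the scale, zero_point, and tolerance values are illustrative assumptions):

import torch

# Random float input; normalize over all dims but the first,
# matching the benchmark below.
X = torch.randn(4, 8, 16)
normalized_shape = X.size()[1:]
weight = torch.rand(normalized_shape)
bias = torch.rand(normalized_shape)
eps = 1e-5

# Quantize the input and run the quantized op.
qX = torch.quantize_per_tensor(X, scale=0.1, zero_point=0, dtype=torch.qint8)
qY = torch.ops.quantized.layer_norm(
    qX, normalized_shape, weight=weight, bias=bias,
    eps=eps, output_scale=0.1, output_zero_point=0)

# Float reference computed on the dequantized input; agreement holds
# up to quantization error at the chosen output scale.
Y_ref = torch.nn.functional.layer_norm(
    qX.dequantize(), normalized_shape, weight=weight, bias=bias, eps=eps)
assert torch.allclose(qY.dequantize(), Y_ref, atol=0.1)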

File tree

2 files changed: +51 -0 lines changed

benchmarks/operator_benchmark/benchmark_all_quantized_test.py

Lines changed: 1 addition & 0 deletions
@@ -11,6 +11,7 @@
     qcomparators_test,
     qconv_test,
     qinterpolate_test,
+    qlayernorm_test,
     qlinear_test,
     qobserver_test,
     qpool_test,
Lines changed: 50 additions & 0 deletions
@@ -0,0 +1,50 @@
from __future__ import absolute_import
from __future__ import division
from __future__ import print_function
from __future__ import unicode_literals


import operator_benchmark as op_bench
import torch


"""Microbenchmarks for quantized layernorm operator."""

layernorm_configs_long = op_bench.cross_product_configs(
    dims=(
        (64, 224, 224),
        (128, 112, 112),
        (256, 56, 56),
    ),
    dtype=(torch.qint8,),
    tags=["short"],
)


class LayerNormBenchmark(op_bench.TorchBenchmarkBase):
    def init(self, dims, dtype):
        print(dims, dtype)

        # Quantize a random float input; layer norm runs over all
        # dims but the first.
        X = (torch.rand(*dims) - 0.5) * 256
        scale = 1.0
        zero_point = 0
        self.qX = torch.quantize_per_tensor(
            X, scale=scale, zero_point=zero_point, dtype=dtype)
        self.weight = torch.rand(*self.qX.size()[1:], dtype=torch.float)
        self.bias = torch.rand(*self.qX.size()[1:], dtype=torch.float)
        self.eps = 1e-5
        self.Y_scale = 0.1
        self.Y_zero_point = 0

    def forward(self):
        return torch.ops.quantized.layer_norm(
            self.qX, self.qX.size()[1:], weight=self.weight, bias=self.bias,
            eps=self.eps, output_scale=self.Y_scale,
            output_zero_point=self.Y_zero_point)


op_bench.generate_pt_test(layernorm_configs_long, LayerNormBenchmark)


if __name__ == "__main__":
    op_bench.benchmark_runner.main()
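
To run just this benchmark, something like the following should work (assuming the new file lands as pt/qlayernorm_test.py, consistent with the qlayernorm_test import added above, and that the runner accepts the usual operator_benchmark --tag_filter flag):

python -m pt.qlayernorm_test --tag_filter short

Running benchmark_all_quantized_test.py should also pick it up via the import added in the first file.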
