[Vulkan] Enable QInt8 and QInt32 quantization (#89788)

manuelcandales · pytorchmergebot · commit 49ccc41d57a9 · 2022-12-06T06:27:40.000Z
Summary: Enabled Vulkan quantization for dtypes QInt8 and QInt32 Test Plan: On Mac ``` cd ~/fbsource buck1 run -c pt.vulkan_full_precision=1 //xplat/caffe2:pt_vulkan_quantized_api_test_binAppleMac\#macosx-arm64 ``` On Android ``` cd ~/fbsource buck1 build -c ndk.custom_libcxx=false -c pt.enable_qpl=0 -c pt.vulkan_full_precision=1 //xplat/caffe2:pt_vulkan_quantized_api_test_binAndroid\#android-arm64 --show-output adb push buck-out/gen/xplat/caffe2/pt_vulkan_quantized_api_test_binAndroid\#android-arm64 /data/local/tmp/vulkan_quantized_api_test adb shell "/data/local/tmp/vulkan_quantized_api_test" ``` Differential Revision: D41561661 Pull Request resolved: #89788 Approved by: https://github.com/digantdesai
diff --git a/aten/src/ATen/native/vulkan/api/Resource.cpp b/aten/src/ATen/native/vulkan/api/Resource.cpp
@@ -36,6 +36,10 @@ VkFormat vk_format(const at::ScalarType dtype) {
 #endif /* USE_VULKAN_FP16_INFERENCE */
     case c10::kQUInt8:
       return VK_FORMAT_R8G8B8A8_UINT;
+    case c10::kQInt8:
+      return VK_FORMAT_R8G8B8A8_SINT;
+    case c10::kQInt32:
+      return VK_FORMAT_R32G32B32A32_SINT;
 
     default:
       TORCH_CHECK(
diff --git a/aten/src/ATen/native/vulkan/glsl/quantize_per_tensor_qint32.glsl b/aten/src/ATen/native/vulkan/glsl/quantize_per_tensor_qint32.glsl
@@ -0,0 +1,31 @@
+#version 450 core
+#define PRECISION $precision
+#define FORMAT    $format
+
+layout(std430) buffer;
+
+/* Qualifiers: layout - storage - precision - memory */
+
+layout(set = 0, binding = 0, rgba32i) uniform PRECISION restrict writeonly iimage3D   uOutput;
+layout(set = 0, binding = 1)          uniform PRECISION                    sampler3D  uInput; //input
+layout(set = 0, binding = 2)          uniform PRECISION restrict           Block {
+  ivec4 size;
+  vec2 scale;
+  ivec2 zero_point;
+} uBlock;
+
+layout(local_size_x_id = 0, local_size_y_id = 1, local_size_z_id = 2) in;
+
+// Quantizes one texel per invocation: roundEven(x / scale.x) + zero_point.x,
+// converted to ivec4 and stored at the same position in uOutput.
+void main() {
+  const ivec3 coord = ivec3(gl_GlobalInvocationID);
+  // Invocations at or beyond the extents in uBlock.size write nothing.
+  if (any(greaterThanEqual(coord, uBlock.size.xyz))) {
+    return;
+  }
+
+  const vec4 scaled = texelFetch(uInput, coord, 0) / uBlock.scale.x;
+  const ivec4 quantized = ivec4(roundEven(scaled) + uBlock.zero_point.x);
+  imageStore(uOutput, coord, quantized);
+}
diff --git a/aten/src/ATen/native/vulkan/glsl/quantize_per_tensor_qint8.glsl b/aten/src/ATen/native/vulkan/glsl/quantize_per_tensor_qint8.glsl
@@ -0,0 +1,31 @@
+#version 450 core
+#define PRECISION $precision
+#define FORMAT    $format
+
+layout(std430) buffer;
+
+/* Qualifiers: layout - storage - precision - memory */
+
+layout(set = 0, binding = 0, rgba8i) uniform PRECISION restrict writeonly iimage3D   uOutput;
+layout(set = 0, binding = 1)         uniform PRECISION                    sampler3D  uInput; //input
+layout(set = 0, binding = 2)         uniform PRECISION restrict           Block {
+  ivec4 size;
+  vec2 scale;
+  ivec2 zero_point;
+} uBlock;
+
+layout(local_size_x_id = 0, local_size_y_id = 1, local_size_z_id = 2) in;
+
+// Quantizes one texel per invocation: roundEven(x / scale.x) + zero_point.x,
+// saturated to the signed 8-bit range and stored at the same position.
+void main() {
+  const ivec3 pos = ivec3(gl_GlobalInvocationID);
+  if (all(lessThan(pos, uBlock.size.xyz))) {
+    vec4 q_res = roundEven(texelFetch(uInput, pos, 0) / uBlock.scale.x) + uBlock.zero_point.x;
+
+    // Clamp before the store: a value the rgba8i format cannot represent
+    // would otherwise be written as an undefined texel.
+    ivec4 ret = ivec4(clamp(q_res, -128.0, 127.0));
+    imageStore(uOutput, pos, ret);
+  }
+}
diff --git a/aten/src/ATen/native/vulkan/glsl/quantize_per_tensor_quint8.glsl b/aten/src/ATen/native/vulkan/glsl/quantize_per_tensor_quint8.glsl
diff --git a/aten/src/ATen/native/vulkan/ops/Copy.cpp b/aten/src/ATen/native/vulkan/ops/Copy.cpp
@@ -18,10 +18,15 @@ void memcpy_to_mapping(const Tensor& src, api::MemoryMap& dst_mapping) {
     memcpy_to_mapping_impl<c10::Half>(src, dst_mapping);
   } else if (src.dtype() == c10::kQUInt8) {
     memcpy_to_mapping_impl<c10::quint8>(src, dst_mapping);
+  } else if (src.dtype() == c10::kQInt8) {
+    memcpy_to_mapping_impl<c10::qint8>(src, dst_mapping);
+  } else if (src.dtype() == c10::kQInt32) {
+    memcpy_to_mapping_impl<c10::qint32>(src, dst_mapping);
   } else {
     TORCH_CHECK(
         false,
-        "Invalid Data Type: expected c10::QUint8, at::kHalf or at::Float but got ",
+        "Invalid Data Type: expected c10::kQInt32, c10::kQInt8, c10::kQUInt8,",
+        " at::kHalf or at::Float but got ",
         src.dtype());
   }
 }
@@ -33,10 +38,15 @@ void memcpy_from_mapping(api::MemoryMap& src_mapping, Tensor& dst) {
     memcpy_from_mapping_impl<c10::Half>(src_mapping, dst);
   } else if (dst.dtype() == c10::kQUInt8) {
     memcpy_from_mapping_impl<c10::quint8>(src_mapping, dst);
+  } else if (dst.dtype() == c10::kQInt8) {
+    memcpy_from_mapping_impl<c10::qint8>(src_mapping, dst);
+  } else if (dst.dtype() == c10::kQInt32) {
+    memcpy_from_mapping_impl<c10::qint32>(src_mapping, dst);
   } else {
     TORCH_CHECK(
         false,
-        "Invalid Data Type: expected c10::QUint8, at::kHalf or Float but got ",
+        "Invalid Data Type: expected c10::kQInt32, c10::kQInt8, c10::kQUInt8,",
+        " at::kHalf or at::Float but got ",
         dst.dtype());
   }
 }
diff --git a/aten/src/ATen/native/vulkan/ops/QuantizedTensor.cpp b/aten/src/ATen/native/vulkan/ops/QuantizedTensor.cpp
@@ -10,24 +10,37 @@ namespace ops {
 
 using namespace api::utils;
 
+// Maps a quantized dtype to its quantize_per_tensor compute shader.
+static api::ShaderSource get_quantize_per_tensor_shader(
+    const c10::ScalarType dtype) {
+  if (dtype == c10::ScalarType::QUInt8) {
+    return VK_KERNEL(quantize_per_tensor_quint8);
+  }
+  if (dtype == c10::ScalarType::QInt8) {
+    return VK_KERNEL(quantize_per_tensor_qint8);
+  }
+  if (dtype == c10::ScalarType::QInt32) {
+    return VK_KERNEL(quantize_per_tensor_qint32);
+  }
+  // Every other dtype has no shader in this mapping; fail and report it.
+  TORCH_CHECK(
+      false, "Vulkan quantization currently not supported for dtype ", dtype);
+}
+
 Tensor quantize_per_tensor(
     const at::Tensor& input_arg,
     const double scale,
     const int64_t zero_point,
     const c10::ScalarType dtype) {
-  TORCH_CHECK(dtype == c10::ScalarType::QUInt8, "Expected type c10::kQUint8");
+  api::ShaderSource compute_shader = get_quantize_per_tensor_shader(dtype);
 
   api::Context* const context = api::context();
 
   const Tensor input = input_arg.is_vulkan() ? input_arg : input_arg.vulkan();
   const vTensor& v_input = convert(input);
 
   vTensor v_output{
-      context,
-      input.sizes(),
-      input.options().dtype(c10::kQUInt8),
-      scale,
-      zero_point};
+      context, input.sizes(), input.options().dtype(dtype), scale, zero_point};
 
   const struct Block final {
     uvec3 extents;
@@ -50,7 +63,7 @@ Tensor quantize_per_tensor(
 
   context->submit_compute_job(
       // shader descriptor
-      VK_KERNEL(quantize_per_tensor),
+      compute_shader,
       // barrier
       pipeline_barrier,
       // global work group size
diff --git a/aten/src/ATen/test/vulkan_quantized_api_test.cpp b/aten/src/ATen/test/vulkan_quantized_api_test.cpp
@@ -449,66 +449,123 @@ void test_quantize_per_tensor_and_dequantize(
     const at::IntArrayRef input_shape,
     const double input_scale,
     const int input_zero_point,
-    const float tolerance = 0) {
-  at::Tensor input = at::rand(input_shape, at::device(at::kCPU).dtype(at::kFloat));
+    const c10::ScalarType dtype = c10::ScalarType::QUInt8) {
+  at::Tensor input = produce_random_tensor(input_shape);
 
   // quantize tensors
   at::Tensor out_q_cpu = at::quantize_per_tensor(
-    input, input_scale, input_zero_point, c10::ScalarType::QUInt8);
+    input, input_scale, input_zero_point, dtype);
   at::Tensor out_q_vk = at::quantize_per_tensor(
-    input.vulkan(), input_scale, input_zero_point, c10::ScalarType::QUInt8);
+    input.vulkan(), input_scale, input_zero_point, dtype);
 
   // dequantize tensors
   const auto out_cpu_deq = at::dequantize(out_q_cpu);
   const auto out_vk_deq = at::dequantize(out_q_vk);
+  const auto out_vk_deq_cpu = out_vk_deq.cpu();
 
   // check dequantized tensor are equal
-  const auto check = almostEqual(out_cpu_deq, out_vk_deq.cpu(), tolerance);
+  const float tolerance = input_scale;
+  // tolerated error = scale, to allow for precision differences after dividing
+  // by random scale, which could result in a difference of 1 unit in the
+  // quantized result.
+  const auto check = almostEqual(out_cpu_deq, out_vk_deq_cpu, tolerance);
 
   if (!check) {
+    const auto error = at::abs(out_vk_deq_cpu - out_cpu_deq).max().item<float>();
     std::cout
       << "Quantize and Dequantize failed with input shape: " << input_shape
       << " scale: " << input_scale << " and zero point: " << input_zero_point
     << std::endl;
+    std::cout << "Error: " << error << std::endl;
   }
   ASSERT_TRUE(check);
 }
 
-void test_quantize_per_tensor_and_dequantize_random() {
-  const double scale = 0.0001 + (double)rand() / (double)RAND_MAX;
-  const int zero_point = int((double)rand() / (double)RAND_MAX * 255);
-  const int n = 1 + int((double)rand() / (double)RAND_MAX * 30);
-  const int c = 1 + int((double)rand() / (double)RAND_MAX * 30);
-  const int h = 1 + int((double)rand() / (double)RAND_MAX * 100);
-  const int w = 1 + int((double)rand() / (double)RAND_MAX * 100);
-  // tolerated error = scale, to allow for precision differences after dividing
-  // by random scale, which could result on a difference of 1 unit in the
-  // quantized result.
-  test_quantize_per_tensor_and_dequantize({n, c, h, w}, scale, zero_point, scale);
+// Random-case driver. Shape is an owning vector: a braced IntArrayRef dangles.
+void test_quantize_per_tensor_and_dequantize_random(
+    const c10::ScalarType dtype) {
+  const double scale = produce_random_scale();
+  const int64_t zero_point = produce_random_zero_point(dtype);
+  const std::vector<int64_t> shape{
+      rand_pos_int(30), rand_pos_int(30), rand_pos_int(100), rand_pos_int(100)};
+  test_quantize_per_tensor_and_dequantize(shape, scale, zero_point, dtype);
+}
+
+TEST_F(VulkanAPITest, quantize_per_tensor_and_dequantize_quint8) {
+  const c10::ScalarType dtype = c10::ScalarType::QUInt8; // dtype under test
+  test_quantize_per_tensor_and_dequantize({1, 1, 1, 1}, 0.13, 21, dtype);
+  test_quantize_per_tensor_and_dequantize({1, 1, 1, 4}, 0.3, 87, dtype);
+  test_quantize_per_tensor_and_dequantize({1, 1, 4, 1}, 0.2, 120, dtype);
+  test_quantize_per_tensor_and_dequantize({1, 1, 7, 7}, 0.3, 87, dtype);
+  test_quantize_per_tensor_and_dequantize({1, 1, 8, 8}, 0.1, 10, dtype);
+  test_quantize_per_tensor_and_dequantize({3, 5, 8, 8}, 0.04, 97, dtype);
+  test_quantize_per_tensor_and_dequantize({1, 1, 11, 17}, 0.07, 15, dtype);
+  test_quantize_per_tensor_and_dequantize({1, 1, 12, 17}, 0.1, 10, dtype);
+  test_quantize_per_tensor_and_dequantize({3, 5, 12, 17}, 0.1, 10, dtype);
+  test_quantize_per_tensor_and_dequantize({1, 1, 17, 12}, 0.1, 10, dtype);
+  test_quantize_per_tensor_and_dequantize({2, 4, 17, 12}, 0.1, 10, dtype);
+  test_quantize_per_tensor_and_dequantize({1, 1, 10, 14}, 0.001, 101, dtype);
+  test_quantize_per_tensor_and_dequantize({3, 5, 10, 14}, 0.009, 43, dtype);
+  test_quantize_per_tensor_and_dequantize({3, 5, 10, 15}, 0.1, 19, dtype);
+  test_quantize_per_tensor_and_dequantize({4, 4, 9, 17}, 0.1, 19, dtype);
+  test_quantize_per_tensor_and_dequantize({3, 5, 25, 29}, 0.1, 19, dtype);
+  test_quantize_per_tensor_and_dequantize({4, 4, 25, 29}, 0.1, 19, dtype);
+  test_quantize_per_tensor_and_dequantize({11, 17, 25, 29}, 0.027, 89, dtype);
+  // The fixed (shape, scale, zero point) cases above are followed by 20 random ones.
+  for (int i = 0; i < 20; i += 1) {
+    test_quantize_per_tensor_and_dequantize_random(dtype);
+  }
+}
+
+TEST_F(VulkanAPITest, quantize_per_tensor_and_dequantize_qint8) {
+  const c10::ScalarType dtype = c10::ScalarType::QInt8; // dtype under test
+  test_quantize_per_tensor_and_dequantize({1, 1, 1, 1}, 0.13, -21, dtype);
+  test_quantize_per_tensor_and_dequantize({1, 1, 1, 4}, 0.3, 87, dtype);
+  test_quantize_per_tensor_and_dequantize({1, 1, 4, 1}, 0.2, -120, dtype);
+  test_quantize_per_tensor_and_dequantize({1, 1, 7, 7}, 0.3, 87, dtype);
+  test_quantize_per_tensor_and_dequantize({1, 1, 8, 8}, 0.1, -10, dtype);
+  test_quantize_per_tensor_and_dequantize({3, 5, 8, 8}, 0.04, 97, dtype);
+  test_quantize_per_tensor_and_dequantize({1, 1, 11, 17}, 0.07, -15, dtype);
+  test_quantize_per_tensor_and_dequantize({1, 1, 12, 17}, 0.1, 10, dtype);
+  test_quantize_per_tensor_and_dequantize({3, 5, 12, 17}, 0.1, -10, dtype);
+  test_quantize_per_tensor_and_dequantize({1, 1, 17, 12}, 0.1, 10, dtype);
+  test_quantize_per_tensor_and_dequantize({2, 4, 17, 12}, 0.1, -10, dtype);
+  test_quantize_per_tensor_and_dequantize({1, 1, 10, 14}, 0.001, 101, dtype);
+  test_quantize_per_tensor_and_dequantize({3, 5, 10, 14}, 0.009, -43, dtype);
+  test_quantize_per_tensor_and_dequantize({3, 5, 10, 15}, 0.1, 19, dtype);
+  test_quantize_per_tensor_and_dequantize({4, 4, 9, 17}, 0.1, -19, dtype);
+  test_quantize_per_tensor_and_dequantize({3, 5, 25, 29}, 0.1, 19, dtype);
+  test_quantize_per_tensor_and_dequantize({4, 4, 25, 29}, 0.1, -19, dtype);
+  test_quantize_per_tensor_and_dequantize({11, 17, 25, 29}, 0.027, 89, dtype);
+  // Fixed cases above mix negative and positive zero points; 20 random ones follow.
+  for (int i = 0; i < 20; i += 1) {
+    test_quantize_per_tensor_and_dequantize_random(dtype);
+  }
 }
 
-TEST_F(VulkanAPITest, quantize_per_tensor_and_dequantize) {
-  test_quantize_per_tensor_and_dequantize({1, 1, 1, 1}, 0.13, 21);
-  test_quantize_per_tensor_and_dequantize({1, 1, 1, 4}, 0.3, 87);
-  test_quantize_per_tensor_and_dequantize({1, 1, 4, 1}, 0.2, 120);
-  test_quantize_per_tensor_and_dequantize({1, 1, 7, 7}, 0.3, 87);
-  test_quantize_per_tensor_and_dequantize({1, 1, 8, 8}, 0.1, 10);
-  test_quantize_per_tensor_and_dequantize({3, 5, 8, 8}, 0.04, 97);
-  test_quantize_per_tensor_and_dequantize({1, 1, 11, 17}, 0.07, 15);
-  test_quantize_per_tensor_and_dequantize({1, 1, 12, 17}, 0.1, 10);
-  test_quantize_per_tensor_and_dequantize({3, 5, 12, 17}, 0.1, 10);
-  test_quantize_per_tensor_and_dequantize({1, 1, 17, 12}, 0.1, 10);
-  test_quantize_per_tensor_and_dequantize({2, 4, 17, 12}, 0.1, 10);
-  test_quantize_per_tensor_and_dequantize({1, 1, 10, 14}, 0.0001, 101);
-  test_quantize_per_tensor_and_dequantize({3, 5, 10, 14}, 0.009, 43);
-  test_quantize_per_tensor_and_dequantize({3, 5, 10, 15}, 0.1, 19);
-  test_quantize_per_tensor_and_dequantize({4, 4, 9, 17}, 0.1, 19);
-  test_quantize_per_tensor_and_dequantize({3, 5, 25, 29}, 0.1, 19);
-  test_quantize_per_tensor_and_dequantize({4, 4, 25, 29}, 0.1, 19);
-  test_quantize_per_tensor_and_dequantize({11, 17, 25, 29}, 0.027, 89);
+TEST_F(VulkanAPITest, quantize_per_tensor_and_dequantize_qint32) {
+  const c10::ScalarType dtype = c10::ScalarType::QInt32; // dtype under test
+  test_quantize_per_tensor_and_dequantize({1, 1, 1, 1}, 0.13, -21123, dtype);
+  test_quantize_per_tensor_and_dequantize({1, 1, 1, 4}, 0.339, 8734, dtype);
+  test_quantize_per_tensor_and_dequantize({1, 1, 4, 1}, 0.228, -12023, dtype);
+  test_quantize_per_tensor_and_dequantize({1, 1, 7, 7}, 0.338, 8723, dtype);
+  test_quantize_per_tensor_and_dequantize({1, 1, 8, 8}, 0.193, -1023, dtype);
+  test_quantize_per_tensor_and_dequantize({3, 5, 8, 8}, 0.0449, 972, dtype);
+  test_quantize_per_tensor_and_dequantize({1, 1, 11, 17}, 0.073, -15, dtype);
+  test_quantize_per_tensor_and_dequantize({1, 1, 12, 17}, 0.1572, 102, dtype);
+  test_quantize_per_tensor_and_dequantize({3, 5, 12, 17}, 0.147, -156, dtype);
+  test_quantize_per_tensor_and_dequantize({1, 1, 17, 12}, 0.129, 10448, dtype);
+  test_quantize_per_tensor_and_dequantize({2, 4, 17, 12}, 0.137, -10, dtype);
+  test_quantize_per_tensor_and_dequantize({1, 1, 10, 14}, 0.001, 101, dtype);
+  test_quantize_per_tensor_and_dequantize({3, 5, 10, 14}, 0.009, -43267, dtype);
+  test_quantize_per_tensor_and_dequantize({3, 5, 10, 15}, 0.1243, 19, dtype);
+  test_quantize_per_tensor_and_dequantize({4, 4, 9, 17}, 0.1889, -19784, dtype);
+  test_quantize_per_tensor_and_dequantize({3, 5, 25, 29}, 0.1345, 196, dtype);
+  test_quantize_per_tensor_and_dequantize({4, 4, 25, 29}, 0.129, -19489, dtype);
+  test_quantize_per_tensor_and_dequantize({11, 17, 25, 29}, 0.027, 89, dtype);
 
   for (int i = 0; i < 20; i += 1) {
-    test_quantize_per_tensor_and_dequantize_random();
+    test_quantize_per_tensor_and_dequantize_random(dtype); // random shape, scale, zero point
   }
 }