
Commit 691a44f

andrewor14 authored and pytorchmergebot committed
[Quant][fx][bc-breaking] Add simpler BackendConfig pattern format (#90698)
Summary: The existing BackendConfig fusion pattern uses a "reversed nested tuple" format that is highly unintuitive. For example:

```
linear-relu -> (nn.ReLU, nn.Linear)
conv-bn-relu -> (nn.ReLU, (nn.BatchNorm2d, nn.Conv2d))
```

This pattern format also complicates the signatures of the user-specified "fuser methods", which needed to accept arguments in reverse nested order to match the patterns:

```
def fuse_linear_relu(is_qat, relu, linear):
    ...

def fuse_conv_bn_relu(is_qat, relu, bn_conv):
    (bn, conv) = bn_conv
    ...
```

Instead, this commit introduces a new pattern format that simply specifies the ops in forward order with no nesting:

```
linear-relu -> (nn.Linear, nn.ReLU)
conv-bn-relu -> (nn.Conv2d, nn.BatchNorm2d, nn.ReLU)

def fuse_linear_relu(is_qat, linear, relu):
    ...

def fuse_conv_bn_relu(is_qat, conv, bn, relu):
    ...
```

Note that the legacy "reversed nested tuple" format is still used internally since it is more general. In the future, we should replace it with the format used in the subgraph rewriter in `torch.fx`, and simplify the existing pattern matching code to handle the new format added in this commit.

BC-breaking Notes:

Before:

```
import torch.nn as nn
import torch.ao.nn.intrinsic as nni
from torch.ao.quantization.backend_config import BackendPatternConfig

def fuse_conv_bn_relu(is_qat, relu, bn_conv):
    (bn, conv) = bn_conv
    return nni.ConvBnReLU2d(conv, bn, relu)

config = BackendPatternConfig((nn.ReLU, (nn.BatchNorm2d, nn.Conv2d))) \
    .set_dtype_configs(...) \
    .set_fuser_method(fuse_conv_bn_relu) \
    .set_fused_module(nni.ConvBnReLU2d)
```

After:

```
def fuse_conv_bn_relu(is_qat, conv, bn, relu):
    return nni.ConvBnReLU2d(conv, bn, relu)

config = BackendPatternConfig((nn.Conv2d, nn.BatchNorm2d, nn.ReLU)) \
    .set_dtype_configs(...) \
    .set_fuser_method(fuse_conv_bn_relu) \
    .set_fused_module(nni.ConvBnReLU2d)
```

OR (for backward compatibility):

```
def fuse_conv_bn_relu(is_qat, relu, bn_conv):
    (bn, conv) = bn_conv
    return nni.ConvBnReLU2d(conv, bn, relu)

config = BackendPatternConfig() \
    ._set_pattern_complex_format((nn.ReLU, (nn.BatchNorm2d, nn.Conv2d))) \
    .set_dtype_configs(...) \
    .set_fuser_method(fuse_conv_bn_relu) \
    .set_fused_module(nni.ConvBnReLU2d) \
    ._set_use_legacy_pattern_format(True)
```

Before:

```
backend_config.configs  # returns Dict[Pattern, BackendPatternConfig]
```

After:

```
backend_config.configs  # returns List[BackendPatternConfig]
```

Test Plan:
python test/test_quantization.py TestQuantizeFx
python test/test_quantization.py TestQuantizeFxOps
python test/test_quantization.py TestBackendConfig

Reviewers: jerryzh168, vkuzo

Subscribers: jerryzh168, vkuzo

Differential Revision: [D41954553](https://our.internmc.facebook.com/intern/diff/D41954553)

Pull Request resolved: #90698

Approved by: https://github.com/vkuzo, https://github.com/jerryzh168
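For callers that indexed `backend_config.configs` by pattern, a minimal migration sketch is shown below (the `pattern_to_config` helper dict and the `(nn.Conv2d, nn.ReLU)` lookup are illustrative and not part of this commit; they assume the native backend still registers a conv-relu pattern in the new forward-order format):

```python
import torch
from torch.ao.quantization.backend_config import get_native_backend_config

backend_config = get_native_backend_config()

# backend_config.configs now returns List[BackendPatternConfig] instead of
# Dict[Pattern, BackendPatternConfig], so pattern-keyed lookups must be
# rebuilt from each config's `pattern` attribute. Configs that use the
# complex format may have pattern=None, so filter those out.
pattern_to_config = {
    cfg.pattern: cfg for cfg in backend_config.configs if cfg.pattern is not None
}
conv_relu_config = pattern_to_config.get((torch.nn.Conv2d, torch.nn.ReLU))
```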
1 parent 1e347b7 commit 691a44f

File tree

14 files changed: +285 -161 lines changed


test/quantization/core/test_backend_config.py

Lines changed: 14 additions & 14 deletions
@@ -13,7 +13,7 @@
     DTypeWithConstraints,
     ObservationType,
 )
-from torch.ao.quantization.fuser_method_mappings import _reverse_sequential_wrapper2
+from torch.ao.quantization.fuser_method_mappings import _sequential_wrapper2
 from torch.ao.quantization.fx.quantize_handler import _default_root_node_getter
 
 
@@ -104,7 +104,7 @@ def test_dtype_config_to_dict(self):
     # BackendPatternConfig
     # ======================
 
-    _fuser_method = _reverse_sequential_wrapper2(nni.LinearReLU)
+    _fuser_method = _sequential_wrapper2(nni.LinearReLU)
 
     _num_tensor_args_to_observation_type = {
         0: ObservationType.OUTPUT_USE_DIFFERENT_OBSERVER_AS_INPUT,
@@ -121,7 +121,7 @@ def _extra_inputs_getter(self, p):
         return (torch.rand(3, 3),)
 
     def _get_backend_op_config1(self):
-        return BackendPatternConfig((torch.nn.ReLU, torch.nn.Linear)) \
+        return BackendPatternConfig((torch.nn.Linear, torch.nn.ReLU)) \
             .set_observation_type(ObservationType.OUTPUT_USE_DIFFERENT_OBSERVER_AS_INPUT) \
             .add_dtype_config(self.dtype_config1) \
             .add_dtype_config(self.dtype_config2) \
@@ -142,7 +142,7 @@ def _get_backend_op_config2(self):
 
     def _get_backend_pattern_config_dict1(self):
         return {
-            "pattern": (torch.nn.ReLU, torch.nn.Linear),
+            "pattern": (torch.nn.Linear, torch.nn.ReLU),
             "observation_type": ObservationType.OUTPUT_USE_DIFFERENT_OBSERVER_AS_INPUT,
             "dtype_configs": [self.dtype_config_dict1, self.dtype_config_dict2],
             "root_module": torch.nn.Linear,
@@ -198,19 +198,19 @@ def test_backend_op_config_set_reference_quantized_module(self):
         self.assertEqual(conf.reference_quantized_module, nnqr.Linear)
 
     def test_backend_op_config_set_fused_module(self):
-        conf = BackendPatternConfig((torch.nn.ReLU, torch.nn.Linear))
+        conf = BackendPatternConfig((torch.nn.Linear, torch.nn.ReLU))
         self.assertTrue(conf.fused_module is None)
         conf.set_fused_module(nni.LinearReLU)
         self.assertEqual(conf.fused_module, nni.LinearReLU)
 
     def test_backend_op_config_set_fuser_method(self):
-        conf = BackendPatternConfig((torch.nn.ReLU, torch.nn.Linear))
+        conf = BackendPatternConfig((torch.nn.Linear, torch.nn.ReLU))
         self.assertTrue(conf.fuser_method is None)
         conf.set_fuser_method(self._fuser_method)
         self.assertEqual(conf.fuser_method, self._fuser_method)
 
     def test_backend_op_config_set_root_node_getter(self):
-        conf = BackendPatternConfig((torch.nn.ReLU, torch.nn.Linear))
+        conf = BackendPatternConfig((torch.nn.Linear, torch.nn.ReLU))
         self.assertTrue(conf._root_node_getter is None)
         conf._set_root_node_getter(_default_root_node_getter)
         self.assertEqual(conf._root_node_getter, _default_root_node_getter)
@@ -242,7 +242,7 @@ def test_backend_op_config_set_input_output_observed(self):
     def test_backend_op_config_from_dict(self):
         conf_dict1 = self._get_backend_pattern_config_dict1()
         conf1 = BackendPatternConfig.from_dict(conf_dict1)
-        self.assertEqual(conf1.pattern, (torch.nn.ReLU, torch.nn.Linear))
+        self.assertEqual(conf1.pattern, (torch.nn.Linear, torch.nn.ReLU))
         self.assertEqual(conf1.observation_type, ObservationType.OUTPUT_USE_DIFFERENT_OBSERVER_AS_INPUT)
         self.assertEqual(conf1.root_module, torch.nn.Linear)
         self.assertEqual(conf1.qat_module, nnqat.Linear)
@@ -294,11 +294,11 @@ def test_backend_config_set_backend_pattern_config(self):
         backend_op_config1 = self._get_backend_op_config1()
         backend_op_config2 = self._get_backend_op_config2()
         conf.set_backend_pattern_config(backend_op_config1)
-        self.assertEqual(conf.configs, {
+        self.assertEqual(conf._pattern_complex_format_to_config, {
            (torch.nn.ReLU, torch.nn.Linear): backend_op_config1,
         })
         conf.set_backend_pattern_config(backend_op_config2)
-        self.assertEqual(conf.configs, {
+        self.assertEqual(conf._pattern_complex_format_to_config, {
            (torch.nn.ReLU, torch.nn.Linear): backend_op_config1,
            torch.add: backend_op_config2
         })
@@ -317,10 +317,10 @@ def test_backend_config_from_dict(self):
         self.assertEqual(len(conf.configs), 2)
         key1 = (torch.nn.ReLU, torch.nn.Linear)
         key2 = torch.add
-        self.assertTrue(key1 in conf.configs)
-        self.assertTrue(key2 in conf.configs)
-        self.assertEqual(conf.configs[key1].to_dict(), op_dict1)
-        self.assertEqual(conf.configs[key2].to_dict(), op_dict2)
+        self.assertTrue(key1 in conf._pattern_complex_format_to_config)
+        self.assertTrue(key2 in conf._pattern_complex_format_to_config)
+        self.assertEqual(conf._pattern_complex_format_to_config[key1].to_dict(), op_dict1)
+        self.assertEqual(conf._pattern_complex_format_to_config[key2].to_dict(), op_dict2)
 
     def test_backend_config_to_dict(self):
         op1 = self._get_backend_op_config1()
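The swap from `_reverse_sequential_wrapper2` to `_sequential_wrapper2` mirrors the argument-order change: the generated fuser method now receives modules in forward order. A plausible sketch of such a wrapper follows; this is an assumption about its shape, not necessarily the exact PyTorch implementation:

```python
import torch
import torch.ao.nn.intrinsic as nni

def _sequential_wrapper2(sequential):
    """Return a fuser method that combines two modules, given in forward
    order, into the provided fused (sequential) class."""
    def fuser_method(is_qat, m1, m2):
        return sequential(m1, m2)
    return fuser_method

# Mirrors the test above: fuse Linear + ReLU into nni.LinearReLU.
_fuser_method = _sequential_wrapper2(nni.LinearReLU)
fused = _fuser_method(False, torch.nn.Linear(3, 3), torch.nn.ReLU())
```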

test/quantization/fx/test_quantize_fx.py

Lines changed: 15 additions & 9 deletions
@@ -546,9 +546,11 @@ def fuse_conv_bn_relu(is_qat, relu, add_pattern):
             bn, conv = bn_pattern
             return conv
 
-        conv_bn_res_relu_config1 = BackendPatternConfig((nn.ReLU, (torch.add, MatchAllNode, (nn.BatchNorm2d, nn.Conv2d)))) \
+        conv_bn_res_relu_config1 = BackendPatternConfig() \
+            ._set_pattern_complex_format((nn.ReLU, (torch.add, MatchAllNode, (nn.BatchNorm2d, nn.Conv2d)))) \
             .set_fuser_method(fuse_conv_bn_relu)
-        conv_bn_res_relu_config2 = BackendPatternConfig((nn.ReLU, (operator.add, MatchAllNode, (nn.BatchNorm2d, nn.Conv2d)))) \
+        conv_bn_res_relu_config2 = BackendPatternConfig() \
+            ._set_pattern_complex_format((nn.ReLU, (operator.add, MatchAllNode, (nn.BatchNorm2d, nn.Conv2d)))) \
             .set_fuser_method(fuse_conv_bn_relu)
         backend_config = BackendConfig() \
             .set_backend_pattern_config(conv_bn_res_relu_config1) \
@@ -606,7 +608,8 @@ def conv_bn_res_relu_extra_inputs_getter(pattern):
             bn, conv = bn_pattern
             return [extra_input]
 
-        conv_bn_res_relu_config = BackendPatternConfig((nn.ReLU, (torch.add, (nn.BatchNorm2d, nn.Conv2d), MatchAllNode))) \
+        conv_bn_res_relu_config = BackendPatternConfig() \
+            ._set_pattern_complex_format((nn.ReLU, (torch.add, (nn.BatchNorm2d, nn.Conv2d), MatchAllNode))) \
             .set_fuser_method(fuse_conv_bn_relu) \
             ._set_root_node_getter(conv_bn_res_relu_root_node_getter) \
             ._set_extra_inputs_getter(conv_bn_res_relu_extra_inputs_getter)
@@ -654,7 +657,7 @@ def forward(self, x):
 
         m = M().eval()
 
-        def fuse_conv_relu(is_qat, relu, conv):
+        def fuse_conv_relu(is_qat, conv, relu):
             return conv
 
         def fuse_conv_res_relu(is_qat, relu, add_pattern):
@@ -669,9 +672,10 @@ def conv_res_relu_extra_inputs_getter(pattern):
             relu, (_, _, extra_input) = pattern
             return [extra_input]
 
-        conv_relu_config = BackendPatternConfig((nn.ReLU, nn.Conv2d)) \
+        conv_relu_config = BackendPatternConfig((nn.Conv2d, nn.ReLU)) \
             .set_fuser_method(fuse_conv_relu)
-        conv_res_relu_config = BackendPatternConfig((nn.ReLU, (torch.add, nn.Conv2d, MatchAllNode))) \
+        conv_res_relu_config = BackendPatternConfig() \
+            ._set_pattern_complex_format((nn.ReLU, (torch.add, nn.Conv2d, MatchAllNode))) \
             .set_fuser_method(fuse_conv_res_relu) \
             ._set_root_node_getter(conv_res_relu_root_node_getter) \
             ._set_extra_inputs_getter(conv_res_relu_extra_inputs_getter)
@@ -5545,10 +5549,12 @@ def root_node_getter(node_pattern):
                 return transpose
 
             backend_pattern_configs.append(
-                BackendPatternConfig((torch.reshape, torch.transpose, MatchAllNode))
-                .set_observation_type(observation_type)  # noqa: E131
+                BackendPatternConfig()
+                ._set_pattern_complex_format((torch.reshape, torch.transpose, MatchAllNode))  # noqa: E131
+                .set_observation_type(observation_type)
                 .set_dtype_configs(dtype_configs)
-                ._set_root_node_getter(root_node_getter))
+                ._set_root_node_getter(root_node_getter)
+            )
             return backend_pattern_configs
 
         backend_config = BackendConfig().set_backend_pattern_configs(_get_pattern_configs())
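The root node and extra inputs getters referenced in the hunks above destructure the reverse nested pattern. A standalone sketch of such getters for the `(nn.ReLU, (torch.add, (nn.BatchNorm2d, nn.Conv2d), MatchAllNode))` pattern is shown below; the function bodies are illustrative, not the literal test code:

```python
def conv_bn_res_relu_root_node_getter(pattern):
    # The pattern arrives in "reverse nested tuple" form:
    # (relu, (add, (bn, conv), extra_input))
    relu, add_pattern = pattern
    _, bn_pattern, extra_input = add_pattern
    bn, conv = bn_pattern
    return conv  # the node that replaces the matched subgraph

def conv_bn_res_relu_extra_inputs_getter(pattern):
    relu, add_pattern = pattern
    _, bn_pattern, extra_input = add_pattern
    return [extra_input]  # appended to the fused module's arguments
```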

torch/ao/ns/fx/mappings.py

Lines changed: 15 additions & 21 deletions
@@ -13,18 +13,18 @@
 import torch.nn.intrinsic as nni
 import torch.ao.nn.qat as nnqat
 import torch.ao.nn.qat.dynamic as nnqatd
-from torch.ao.quantization.backend_config import get_native_backend_config_dict
+from torch.ao.quantization.backend_config import get_native_backend_config
 import torch.ao.quantization.fx._lower_to_native_backend as \
     _lower_to_native_backend
 import torch.ao.quantization.quantization_mappings as quantization_mappings
 
 from .ns_types import NSNodeTargetType
 
-from typing import Set, Dict, List, Optional
+from typing import Callable, Dict, List, Optional, Set, Tuple
 
 
 def get_base_name_to_sets_of_related_ops() -> Dict[str, Set[NSNodeTargetType]]:
-    # note: this set is modified below by items from backend_config_dict
+    # note: this set is modified below by items from backend_config
     sets_of_related_ops: List[Set[NSNodeTargetType]] = [
         # conv modules
         set([
@@ -327,42 +327,36 @@ def get_base_name_to_sets_of_related_ops() -> Dict[str, Set[NSNodeTargetType]]:
     ]
 
     # for each floating point op, add versions of the op added by
-    # backend_config_dict
-    backend_config_dict = get_native_backend_config_dict()
+    # backend_config
+    backend_config = get_native_backend_config()
 
-    new_connections = [
+    new_connections: List[Tuple[Callable, Callable]] = [
         # technical debt edge case
         (nn.Linear, nn.modules.linear.NonDynamicallyQuantizableLinear),
     ]
 
-    for config in backend_config_dict['configs']:
+    for pattern, config in backend_config._pattern_complex_format_to_config.items():
 
-        if 'pattern' not in config:
-            continue
-
-        # format: (c, (b, a))
-        pattern = config['pattern']
+        # pattern format: (c, (b, a))
         first_element = pattern
         # look from the end, because pattern is in reverse order
         while isinstance(first_element, (list, tuple)):
             first_element = first_element[-1]
 
-        if 'fused_module' in config:
+        if config.fused_module is not None:
             # case 1: pattern fuses a pattern of ops into an op
             # example: nn.Conv1d, nn.ReLU fused into nni.ConvReLU1d
-            new_connections.append((first_element, config['fused_module']))
+            new_connections.append((first_element, config.fused_module))
 
-        if 'qat_module' in config:
+        if config.qat_module is not None:
             # case 2: pattern swaps a module into a QAT module
             # example: nni.ConvReLU1d swapped into nniqat.ConvReLU1d
-            new_connections.append((first_element, config['qat_module']))
+            new_connections.append((first_element, config.qat_module))
 
-        if 'reference_quantized_module_for_root' in config:
+        if config.reference_quantized_module is not None:
             # case 3: reference version of floating point module, such as
             # nn.Conv2d and nnqr.Conv2d
-            new_connections.append(
-                (first_element, config['reference_quantized_module_for_root'])
-            )
+            new_connections.append((first_element, config.reference_quantized_module))
 
     #
     # Add reference module swaps from default lowering path
@@ -413,7 +407,7 @@ def get_base_name_to_sets_of_related_ops() -> Dict[str, Set[NSNodeTargetType]]:
             new_connections.append((source, target))
 
 
-    # add the new connections from backend_config_dict
+    # add the new connections from backend_config
    for item1, item2 in new_connections:
        for set_of_related_ops in sets_of_related_ops:
            if item1 in set_of_related_ops or item2 in set_of_related_ops:
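The loop above extracts the first op in execution order from a reverse nested pattern by repeatedly taking the last element. A small standalone illustration of that walk (a sketch written for this note, not code from the commit):

```python
import torch.nn as nn

def first_op_in_forward_order(pattern):
    # Reverse nested patterns list ops backwards, e.g.
    # (nn.ReLU, (nn.BatchNorm2d, nn.Conv2d)) for conv -> bn -> relu,
    # so the earliest op sits at the innermost last position.
    first_element = pattern
    while isinstance(first_element, (list, tuple)):
        first_element = first_element[-1]
    return first_element

assert first_op_in_forward_order((nn.ReLU, (nn.BatchNorm2d, nn.Conv2d))) is nn.Conv2d
assert first_op_in_forward_order(nn.Linear) is nn.Linear
```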

torch/ao/quantization/backend_config/README.md

Lines changed: 16 additions & 4 deletions
@@ -22,7 +22,19 @@ Instead of hardcoding the fusion mappings, float to reference quantized module m
 
 ## Pattern Specification
 
-The operator patterns used in BackendConfig are float modules, functional operators and pytorch operators specified in reverse order:
+The operator patterns used in BackendConfig are float modules, functional operators, pytorch operators, or a tuple combination of the above. For example:
+* torch.nn.Linear
+* torch.nn.functional.linear
+* torch.add
+* operator.add
+* (torch.nn.functional.linear, torch.nn.functional.relu)
+* (torch.nn.Conv2d, torch.nn.BatchNorm2d, torch.nn.ReLU)
+
+Tuple patterns are treated as sequential patterns, and currently only tuples of 2 or 3 elements are supported.
+
+### Advanced Pattern Specification
+
+The above format should satisfy the vast majority of use cases. However, it does not handle more complex scenarios such as graph patterns. For these use cases, the BackendConfig API offers an alternative "reverse nested tuple" pattern format, enabled through `BackendPatternConfig()._set_pattern_complex_format(...)`. Note that this format is deprecated and will be replaced in a future version of PyTorch.
 ```
 operator = module_type | functional | torch op | native op | MatchAllNode
 Pattern = (operator, Pattern, Pattern, ...) | operator
@@ -62,7 +74,7 @@ weighted_int8_dtype_config = DTypeConfig(
     weight_dtype=torch.qint8,
     bias_dtype=torch.float)
 
-def fuse_conv2d_relu(is_qat, relu, conv):
+def fuse_conv2d_relu(is_qat, conv, relu):
     """Return a fused ConvReLU2d from individual conv and relu modules."""
     return torch.ao.nn.intrinsic.ConvReLU2d(conv, relu)
 
@@ -75,7 +87,7 @@ linear_config = BackendPatternConfig(torch.nn.Linear) \
     .set_reference_quantized_module(torch.ao.nn.quantized.reference.Linear)
 
 # For fusing Conv2d + ReLU into ConvReLU2d
-conv_relu_config = BackendPatternConfig((torch.nn.ReLU, torch.nn.Conv2d)) \
+conv_relu_config = BackendPatternConfig((torch.nn.Conv2d, torch.nn.ReLU)) \
     .set_observation_type(ObservationType.OUTPUT_USE_DIFFERENT_OBSERVER_AS_INPUT) \
     .add_dtype_config(weighted_int8_dtype_config) \
     .set_fused_module(torch.ao.nn.intrinsic.ConvReLU2d) \
@@ -118,7 +130,7 @@ Relevant APIs:
 * `_set_root_node_getter`
 * `_set_extra_inputs_getter`
 
-As an optimization, operator patterns such as (`torch.nn.ReLU`, `torch.nn.Linear`) may be fused into `nni.LinearReLU`. This is performed during the prepare phase according to the function specified in `set_fuser_method`, which replaces the pattern with the fused module. During the convert phase, these fused modules (identified by `set_fused_module`) will then be converted to the reference quantized versions of the modules.
+As an optimization, operator patterns such as (`torch.nn.Linear`, `torch.nn.ReLU`) may be fused into `nni.LinearReLU`. This is performed during the prepare phase according to the function specified in `set_fuser_method`, which replaces the pattern with the fused module. During the convert phase, these fused modules (identified by `set_fused_module`) will then be converted to the reference quantized versions of the modules.
 
 In FX graph mode quantization, we replace the corresponding nodes in the graph using two helper functions set by the user: `root_node_getter`, which returns the root node (typically the weighted module in the pattern like `torch.nn.Linear`) to replace the matched pattern in the graph, and `extra_inputs_getter`, which returns a list of extra input arguments that will be appended to the existing arguments of the fused module (copied over from the root node). See [this snippet](https://gist.github.com/jerryzh168/8bea7180a8ba3c279f2c9b050f2a69a6) for an example usage.
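To make the two README formats concrete, the same conv-bn-relu fusion can be declared either way. A minimal sketch follows (dtype configs omitted for brevity; the variable and helper names are illustrative):

```python
import torch.nn as nn
import torch.ao.nn.intrinsic as nni
from torch.ao.quantization.backend_config import BackendPatternConfig

# Simple format: ops listed in forward execution order,
# fuser method arguments also arrive in forward order.
def fuse_conv_bn_relu(is_qat, conv, bn, relu):
    return nni.ConvBnReLU2d(conv, bn, relu)

simple_config = BackendPatternConfig((nn.Conv2d, nn.BatchNorm2d, nn.ReLU)) \
    .set_fuser_method(fuse_conv_bn_relu) \
    .set_fused_module(nni.ConvBnReLU2d)

# Advanced "reverse nested tuple" format: kept for graph patterns,
# fuser method arguments arrive in reverse nested order.
def fuse_conv_bn_relu_legacy(is_qat, relu, bn_conv):
    bn, conv = bn_conv
    return nni.ConvBnReLU2d(conv, bn, relu)

complex_config = BackendPatternConfig() \
    ._set_pattern_complex_format((nn.ReLU, (nn.BatchNorm2d, nn.Conv2d))) \
    .set_fuser_method(fuse_conv_bn_relu_legacy) \
    .set_fused_module(nni.ConvBnReLU2d)
```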
