Commit 0c77bd7

zetyquickly authored and facebook-github-bot committed
Quantization: preserving pre and post forward hooks (#37233)
Summary:
1. convert() now preserves a module's **pre and post forward** hooks.
2. Fusion preserves only a module's **pre forward** hooks (because after fusion the output is no longer the same).

Pull Request resolved: #37233
Differential Revision: D22425141
Pulled By: jerryzh168
fbshipit-source-id: e69b81821d507dcd110d2ff3594ba94b9593c8da
1 parent c451dda commit 0c77bd7
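
For orientation, a minimal sketch of the behavior this change guarantees on the static post-training path. The toy model and hook bodies below are illustrative only and assume an x86 build where the fbgemm backend is available; prepare, convert, and the default qconfig are the existing torch.quantization APIs exercised by the tests in this commit.

import torch
import torch.nn as nn
import torch.quantization as tq

class M(nn.Module):
    def __init__(self):
        super().__init__()
        self.quant = tq.QuantStub()
        self.fc = nn.Linear(5, 5)
        self.dequant = tq.DeQuantStub()

    def forward(self, x):
        return self.dequant(self.fc(self.quant(x)))

def log_pre(module, input):            # forward pre hook signature: (module, input)
    print('pre forward on', type(module).__name__)

def log_post(module, input, output):   # forward hook signature: (module, input, output)
    print('post forward on', type(module).__name__)

model = M().eval()
model.fc.register_forward_pre_hook(log_pre)
model.fc.register_forward_hook(log_post)

model.qconfig = tq.get_default_qconfig('fbgemm')
tq.prepare(model, inplace=True)
model(torch.rand(2, 5))        # calibration; hooks fire on the float nn.Linear
tq.convert(model, inplace=True)
model(torch.rand(2, 5))        # with this patch the hooks still fire, now on the quantized Linear

Before this change, convert() swapped nn.Linear for its quantized counterpart without copying the user hooks, so the second inference would run silently without them.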

File tree

3 files changed: +196, -1 lines

test/quantization/test_quantize.py

Lines changed: 175 additions & 0 deletions
@@ -61,6 +61,7 @@
 from torch.testing._internal.common_quantized import (
     override_quantized_engine,
     supported_qengines,
+    override_qengines,
 )
 from torch.testing._internal.common_utils import TemporaryFileName
 from torch.testing._internal.common_utils import suppress_warnings
@@ -445,6 +446,55 @@ def checkQuantized(model):
                                self.calib_data)
             checkQuantized(model_oneline)

+    @override_qengines
+    def test_forward_hooks_preserved(self):
+        r"""Test post-training static quantization on preserving
+        pre forward and post forward hooks of original model
+        """
+        qengine = torch.backends.quantized.engine
+        model = QuantStubModel()
+        counter = {
+            'pre_forwards': 0,
+            'forwards': 0,
+        }
+
+        def fw_pre_hook(h_module, input):
+            counter['pre_forwards'] += 1
+
+        def fw_hook(h_module, input, output):
+            counter['forwards'] += 1
+
+        model.fc.register_forward_pre_hook(fw_pre_hook)
+        model.fc.register_forward_hook(fw_hook)
+
+        model.qconfig = torch.quantization.get_default_qconfig(qengine)
+        model = prepare(model)
+
+        def checkHooksIsPresent(model, before_convert=True):
+            num_fwd_hooks = 1
+            if before_convert:
+                self.assertEqual(len(model.quant._forward_hooks.values()), 1,
+                                 "Quantization observer hook has disappeared")
+                num_fwd_hooks = 2
+
+            self.assertObjectIn(fw_pre_hook, model.fc._forward_pre_hooks.values())
+            self.assertObjectIn(fw_hook, model.fc._forward_hooks.values())
+            self.assertEqual(len(model.fc._forward_pre_hooks.values()), 1,
+                             "Extra pre forward hooks have appeared on a layer")
+            # During static quantization non stub layers are provided with quantization observer hook too
+            self.assertEqual(len(model.fc._forward_hooks.values()), num_fwd_hooks,
+                             "Extra post forward hooks have appeared on a layer")
+            # Implicitly check that fw_hook goes after _observer_forward_hook
+            self.assertEqual(list(model.fc._forward_hooks.values())[-1], fw_hook,
+                             "_observer_forward_hook is not a first entry of the hooks list")
+
+        checkHooksIsPresent(model, True)
+        test_only_eval_fn(model, self.calib_data)
+        torch.quantization.convert(model, inplace=True)
+        checkHooksIsPresent(model, False)
+
+
+
 @skipIfNoFBGEMM
 class TestPostTrainingDynamic(QuantizationTestCase):
     def test_single_layer(self):
@@ -752,6 +802,46 @@ def checkQuantized(model, module_type):
         self.checkScriptable(model_quantized, [[x]], check_save_load=True)


+    def test_forward_hooks_preserved(self):
+        r"""Test post-training dynamic quantization on preserving
+        pre forward and post forward hooks of original model
+        """
+        for dtype in [torch.qint8, torch.float16]:
+            model = SingleLayerLinearDynamicModel().eval()
+            qconfig = float16_dynamic_qconfig if dtype == torch.float16 else default_dynamic_qconfig
+            qconfig_dict = {
+                'fc1': qconfig
+            }
+            convert_dynamic(model)
+
+            counter = {
+                'pre_forwards': 0,
+                'forwards': 0,
+            }
+
+            def fw_pre_hook(h_module, input):
+                counter['pre_forwards'] += 1
+
+            def fw_hook(h_module, input, output):
+                counter['forwards'] += 1
+
+            model.fc1.register_forward_pre_hook(fw_pre_hook)
+            model.fc1.register_forward_hook(fw_hook)
+            prepare_dynamic(model, qconfig_dict)
+
+            def checkHooksIsPresent(model):
+                self.assertObjectIn(fw_pre_hook, model.fc1._forward_pre_hooks.values())
+                self.assertObjectIn(fw_hook, model.fc1._forward_hooks.values())
+                self.assertEqual(len(model.fc1._forward_pre_hooks.values()), 1,
+                                 "Extra pre forward hooks have appeared on a layer")
+                self.assertEqual(len(model.fc1._forward_hooks.values()), 1,
+                                 "Extra post forward hooks have appeared on a layer")
+
+            checkHooksIsPresent(model)
+            test_only_eval_fn(model, self.calib_data)
+            convert_dynamic(model)
+            checkHooksIsPresent(model)
+
 class TestQuantizationAwareTraining(QuantizationTestCase):
     def test_manual(self):
         for qengine in supported_qengines:
@@ -864,6 +954,45 @@ def test_train_save_load_eval(self):
         out = model(x)
         self.assertEqual(ref, out)

+    @override_qengines
+    def test_forward_hooks_preserved(self):
+        r"""Test QAT on preserving pre forward and post forward hooks of original model
+        """
+        qengine = torch.backends.quantized.engine
+        model = QuantStubModel()
+        counter = {
+            'pre_forwards': 0,
+            'forwards': 0,
+        }
+
+        def fw_pre_hook(h_module, input):
+            counter['pre_forwards'] += 1
+
+        def fw_hook(h_module, input, output):
+            counter['forwards'] += 1
+
+        model.fc.register_forward_pre_hook(fw_pre_hook)
+        model.fc.register_forward_hook(fw_hook)
+
+        model.qconfig = torch.quantization.get_default_qat_qconfig(qengine)
+        model = prepare_qat(model)
+
+        def checkHooksIsPresent(model, before_convert=True):
+            if before_convert:
+                self.assertEqual(len(model.quant._forward_hooks.values()), 1,
+                                 "Quantization observer hook has disappeared")
+            self.assertObjectIn(fw_pre_hook, model.fc._forward_pre_hooks.values())
+            self.assertObjectIn(fw_hook, model.fc._forward_hooks.values())
+            self.assertEqual(len(model.fc._forward_pre_hooks.values()), 1,
+                             "Extra pre forward hooks have appeared on a layer")
+            self.assertEqual(len(model.fc._forward_hooks.values()), 1,
+                             "Extra post forward hooks have appeared on a layer")
+
+        checkHooksIsPresent(model, True)
+        x = torch.rand(2, 5, dtype=torch.float)
+        model(x)
+        torch.quantization.convert(model, inplace=True)
+        checkHooksIsPresent(model, False)

 class TestFunctionalModule(QuantizationTestCase):
     # Histogram Observers are slow, so have no-deadline to ensure test doesn't time out
@@ -1156,6 +1285,52 @@ def checkQAT(model):

         checkQAT(model)

+    def test_forward_hooks_preserved(self):
+        r"""Test case that checks whether forward pre hooks of the first module and
+        post forward hooks of the last module in modules list passed to fusion function preserved.
+        (e.g. before fusion: [nn.Conv2d (with pre forward hooks), nn.BatchNorm2d, nn.ReLU (with post forward hooks)]
+        after fusion: [nni.ConvBnReLU2d (with pre and post hooks), nn.Identity, nn.Identity])
+        """
+        model = ModelForFusion(default_qat_qconfig).train()
+
+        counter = {
+            'pre_forwards': 0,
+            'forwards': 0,
+        }
+        fused = False
+
+        def fw_pre_hook(fused_module_class, h_module, input):
+            if fused:
+                self.assertEqual(type(h_module), fused_module_class,
+                                 "After fusion owner of the first module's forward pre hook is not a fused module")
+            counter['pre_forwards'] += 1
+
+        def fw_hook(fused_module_class, h_module, input, output):
+            if fused:
+                self.assertEqual(type(h_module), fused_module_class,
+                                 "After fusion owner of the last module's forward hook is not a fused module")
+            counter['forwards'] += 1
+
+        # Registering two pre and two post forward hooks, thus expecting counter increment by two each inference
+        model.conv1.register_forward_pre_hook(lambda *args: fw_pre_hook(nni.ConvBnReLU2d, *args))
+        model.sub1.conv.register_forward_pre_hook(lambda *args: fw_pre_hook(nni.ConvBn2d, *args))
+        model.relu1.register_forward_hook(lambda *args: fw_hook(nni.ConvBnReLU2d, *args))
+        model.sub1.bn.register_forward_hook(lambda *args: fw_hook(nni.ConvBn2d, *args))
+
+        test_only_eval_fn(model, self.img_data_1d)
+        self.assertEqual(counter['pre_forwards'], 2 * len(self.img_data_1d))
+        self.assertEqual(counter['forwards'], 2 * len(self.img_data_1d))
+
+        model = fuse_modules(model, ['conv1', 'bn1', 'relu1'])
+        model = fuse_modules(model, ['sub1.conv', 'sub1.bn'])
+
+        fused = True
+        before_fusion_pre_count = counter['pre_forwards']
+        before_fusion_post_count = counter['forwards']
+        test_only_eval_fn(model, self.img_data_1d)
+        self.assertEqual(counter['pre_forwards'] - before_fusion_pre_count, 2 * len(self.img_data_1d))
+        self.assertEqual(counter['forwards'] - before_fusion_post_count, 2 * len(self.img_data_1d))
+
 class TestModelNumerics(QuantizationTestCase):
     def test_float_quant_compare_per_tensor(self):
         for qengine in supported_qengines:

torch/quantization/fuse_modules.py

Lines changed: 9 additions & 0 deletions
@@ -124,6 +124,15 @@ def fuse_known_modules(mod_list):
         raise NotImplementedError("Cannot fuse modules: {}".format(types))
     new_mod = [None] * len(mod_list)
     new_mod[0] = fuser_method(*mod_list)
+    # NOTE: forward hooks not processed in the two following for loops will be lost after the fusion
+    # Move pre forward hooks of the base module to resulting fused module
+    for handle_id, pre_hook_fn in mod_list[0]._forward_pre_hooks.items():
+        new_mod[0].register_forward_pre_hook(pre_hook_fn)
+        del mod_list[0]._forward_pre_hooks[handle_id]
+    # Move post forward hooks of the last module to resulting fused module
+    for handle_id, hook_fn in mod_list[-1]._forward_hooks.items():
+        new_mod[0].register_forward_hook(hook_fn)
+        del mod_list[-1]._forward_hooks[handle_id]

     for i in range(1, len(mod_list)):
         new_mod[i] = torch.nn.Identity()
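
The effect of these two loops can be seen in a small standalone sketch; the toy model and hook names are made up for illustration, while fuse_modules and nn.intrinsic.ConvReLU2d are the real APIs involved.

import torch
import torch.nn as nn
import torch.nn.intrinsic as nni
from torch.quantization import fuse_modules

class M(nn.Module):
    def __init__(self):
        super().__init__()
        self.conv = nn.Conv2d(3, 3, 1)
        self.relu = nn.ReLU()

    def forward(self, x):
        return self.relu(self.conv(x))

def pre_hook(module, input):
    print('pre forward on', type(module).__name__)

def post_hook(module, input, output):
    print('post forward on', type(module).__name__)

m = M().eval()
m.conv.register_forward_pre_hook(pre_hook)   # pre hook on the first module in the fusion list
m.relu.register_forward_hook(post_hook)      # post hook on the last module in the fusion list

m = fuse_modules(m, ['conv', 'relu'])
assert isinstance(m.conv, nni.ConvReLU2d)    # the fused module now owns both hooks
assert isinstance(m.relu, nn.Identity)       # the replaced module no longer runs any hook
m(torch.rand(1, 3, 4, 4))                    # prints both messages, attributed to ConvReLU2d

Hooks registered on modules in the middle of the fusion list, post hooks on the first module, and pre hooks on the last module are not moved by these loops and are therefore lost, as the NOTE in the patch warns.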

torch/quantization/quantize.py

Lines changed: 12 additions & 1 deletion
@@ -119,7 +119,10 @@ def add_observer_(module, non_leaf_module_list=None, device=None):
         if device is not None:
             activation.to(device)
         module.add_module('activation_post_process', activation)
-        module.register_forward_hook(_observer_forward_hook)
+        # Register observer as the first entry in the hook list
+        # All post forward hooks are preserved and will be executed after the observer before convert
+        handle = module.register_forward_hook(_observer_forward_hook)
+        module._forward_hooks.move_to_end(handle.id, last=False)

 def get_unique_devices_(module):
     return {p.device for p in module.parameters()} | \
@@ -393,6 +396,14 @@ def swap_module(mod, mapping):
             )
             device = next(iter(devices)) if len(devices) > 0 else None
             new_mod = mapping[type(mod)].from_float(mod)
+            # Preserve module's pre forward hooks. They'll be called on quantized input
+            for pre_hook_fn in mod._forward_pre_hooks.values():
+                new_mod.register_forward_pre_hook(pre_hook_fn)
+            # Preserve module's post forward hooks except _observer_forward_hook
+            # After convert they'll work with quantized output
+            for hook_fn in mod._forward_hooks.values():
+                if hook_fn is not _observer_forward_hook:
+                    new_mod.register_forward_hook(hook_fn)
             if device:
                 new_mod.to(device)
     return new_mod
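
The move_to_end(handle.id, last=False) call works because nn.Module keeps forward hooks in an OrderedDict keyed by handle id. A standalone illustration of the reordering follows; the layer and hook names are arbitrary, only the mechanism matches the patch.

import torch.nn as nn

fc = nn.Linear(4, 4)

def user_hook(module, input, output):
    pass

def observer_like_hook(module, input, output):
    pass

fc.register_forward_hook(user_hook)                    # user hook registered first
handle = fc.register_forward_hook(observer_like_hook)  # observer-style hook registered later
# Promote the later registration to the front of the OrderedDict,
# so the observer-style hook runs before any user hook during calibration.
fc._forward_hooks.move_to_end(handle.id, last=False)
assert list(fc._forward_hooks.values()) == [observer_like_hook, user_hook]

This ordering is what lets the static test above assert that fw_hook is the last entry of model.fc._forward_hooks before convert, and it lets swap_module skip _observer_forward_hook by identity when copying the remaining hooks onto the quantized module.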
