Fix bug in profiler and task init code

mannatsingh · facebook-github-bot · commit d2016efebd28 · 2020-03-10T18:51:08.000-07:00
Differential Revision:
D20342756

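Profiler update: run the profiler and the complexity computation in eval mode through a new `train_mode` context manager, which restores each module's original train/eval mode on exit. This replaces the `model.eval()` call that was previously made in `ClassificationTask.from_config`.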

fbshipit-source-id: 3e4dcb31f1cbf824fca3b74467ed8940f472029c
diff --git a/classy_vision/generic/profiler.py b/classy_vision/generic/profiler.py
@@ -10,7 +10,12 @@
 
 import torch
 import torch.nn as nn
-from classy_vision.generic.util import get_model_dummy_input, is_leaf, is_on_gpu
+from classy_vision.generic.util import (
+    get_model_dummy_input,
+    is_leaf,
+    is_on_gpu,
+    train_mode,
+)
 from torch.cuda import cudart
 
 
@@ -24,7 +29,6 @@ def profile(
     """
     Performs CPU or GPU profiling of the specified model on the specified input.
     """
-
     # assertions:
     if use_nvprof:
         raise NotImplementedError
@@ -41,18 +45,19 @@ def profile(
         batchsize=batchsize_per_replica,
         non_blocking=False,
     )
-    # perform profiling:
-    with torch.no_grad():
-        model(input)  # warm up CUDA memory allocator and profiler
-        if use_nvprof:  # nvprof profiling (TODO: Can we infer this?)
-            cudart().cudaProfilerStart()
-            model(input)
-            cudart().cudaProfilerStop()
-            exit()  # exit gracefully
-        else:  # regular profiling
-            with torch.autograd.profiler.profile(use_cuda=True) as profiler:
+    # perform profiling in eval mode
+    with train_mode(model, False):
+        with torch.no_grad():
+            model(input)  # warm up CUDA memory allocator and profiler
+            if use_nvprof:  # nvprof profiling (TODO: Can we infer this?)
+                cudart().cudaProfilerStart()
                 model(input)
-                return profiler
+                cudart().cudaProfilerStop()
+                exit()  # exit gracefully
+            else:  # regular profiling
+                with torch.autograd.profiler.profile(use_cuda=True) as profiler:
+                    model(input)
+                    return profiler
 
 
 def _get_batchsize_per_replica(x):
@@ -376,7 +381,6 @@ def compute_complexity(model, compute_fn, input_shape, input_key=None):
     """
     Compute the complexity of a forward pass.
     """
-
     # assertions, input, and upvalue in which we will perform the count:
     assert isinstance(model, nn.Module)
     if not isinstance(input_shape, abc.Sequence):
@@ -387,7 +391,10 @@ def compute_complexity(model, compute_fn, input_shape, input_key=None):
     # measure FLOPs:
     modify_forward(model, compute_list, compute_fn)
     try:
-        model.forward(input)
+        # compute complexity in eval mode
+        with train_mode(model, False):
+            with torch.no_grad():
+                model.forward(input)
     except NotImplementedError as err:
         raise err
     finally:
diff --git a/classy_vision/generic/util.py b/classy_vision/generic/util.py
@@ -774,3 +774,24 @@ def get_model_dummy_input(
         if input_key:
             input = {input_key: input}
     return input
+
+
+@contextlib.contextmanager
+def train_mode(model: nn.Module, train_mode: bool):
+    """Context manager which sets the train mode of a model. After returning, it
+    restores the state of every module inside the model individually.
+
+    Args:
+        model: module whose (recursive) train mode is switched for the context
+        train_mode: True for train mode, False for eval mode
+    """
+    # snapshot the module objects rather than their names, so that restoring
+    # cannot raise a KeyError if a submodule is added or renamed inside the
+    # context
+    saved_modes = [(module, module.training) for module in model.modules()]
+    try:
+        model.train(train_mode)
+        yield
+    finally:
+        for module, was_training in saved_modes:
+            module.training = was_training
diff --git a/classy_vision/tasks/classification_task.py b/classy_vision/tasks/classification_task.py
@@ -23,7 +23,6 @@
     recursive_copy_to_gpu,
     update_classy_state,
 )
-from classy_vision.hooks import ClassyHookFunctions
 from classy_vision.losses import ClassyLoss, build_loss
 from classy_vision.meters import build_meters
 from classy_vision.models import ClassyModel, build_model
@@ -305,9 +304,6 @@ def from_config(cls, config: Dict[str, Any]) -> "ClassificationTask":
         amp_opt_level = config.get("amp_opt_level")
         meters = build_meters(config.get("meters", {}))
         model = build_model(config["model"])
-        # put model in eval mode in case any hooks modify model states, it'll
-        # be reset to train mode before training
-        model.eval()
         optimizer = build_optimizer(optimizer_config)
 
         task = (
diff --git a/test/generic_util_test.py b/test/generic_util_test.py
@@ -4,6 +4,7 @@
 # This source code is licensed under the MIT license found in the
 # LICENSE file in the root directory of this source tree.
 
+import copy
 import shutil
 import tempfile
 import unittest
@@ -14,6 +15,7 @@
 
 import classy_vision.generic.util as util
 import torch
+import torch.nn as nn
 from classy_vision.generic.util import (
     CHECKPOINT_FILE,
     load_checkpoint,
@@ -368,6 +370,58 @@ def test_get_model_dummy_input(self):
             )
             self.assertEqual(result.size(), tuple([batchsize] + input_shape))
 
+    def _compare_model_train_mode(self, model_1, model_2):
+        """Return True if every named module of model_1 exists in model_2 with
+        the same training flag."""
+        for name_1, module_1 in model_1.named_modules():
+            found = False
+            for name_2, module_2 in model_2.named_modules():
+                if name_1 == name_2:
+                    found = True
+                    if module_1.training != module_2.training:
+                        return False
+            if not found:
+                return False
+        return True
+
+    def _check_model_train_mode(self, model, expected_mode):
+        """Return True if every module of model has training == expected_mode."""
+        for module in model.modules():
+            if module.training != expected_mode:
+                return False
+        return True
+
+    def test_train_mode(self):
+        class TestModel(nn.Module):
+            def __init__(self):
+                super().__init__()
+                self.linear = nn.Linear(1, 2)
+                self.dropout = nn.Dropout()
+                self.seq = nn.Sequential(
+                    nn.ReLU(), nn.Conv2d(1, 2, 3), nn.BatchNorm2d(2)
+                )
+
+        test_model = TestModel()
+        for train in [True, False]:
+            test_model.train(train)
+
+            # flip some of the modes
+            test_model.dropout.train(not train)
+            test_model.seq[1].train(not train)
+
+            orig_model = copy.deepcopy(test_model)
+            for context_train in [True, False]:
+                with util.train_mode(test_model, context_train):
+                    # every module must be in the requested mode inside the context
+                    self.assertTrue(
+                        self._check_model_train_mode(test_model, context_train)
+                    )
+                    # the modes should be different inside the context manager
+                    self.assertFalse(
+                        self._compare_model_train_mode(orig_model, test_model)
+                    )
+                self.assertTrue(self._compare_model_train_mode(orig_model, test_model))
+
 
 class TestUpdateStateFunctions(unittest.TestCase):
     def _compare_states(self, state_1, state_2, check_heads=True):