From 6eb762af6283eeb1c39682a683b7bcd7fa4e94f4 Mon Sep 17 00:00:00 2001 From: Nicolas Hug Date: Mon, 8 Mar 2021 14:31:06 +0000 Subject: [PATCH 01/10] refactor test_models to use pytest --- .circleci/unittest/linux/scripts/install.sh | 2 +- .circleci/unittest/windows/scripts/install.sh | 2 +- test/test_models.py | 61 ++++++++----------- 3 files changed, 27 insertions(+), 38 deletions(-) diff --git a/.circleci/unittest/linux/scripts/install.sh b/.circleci/unittest/linux/scripts/install.sh index 1a3e5c6f4d2..527bbc1f5fe 100755 --- a/.circleci/unittest/linux/scripts/install.sh +++ b/.circleci/unittest/linux/scripts/install.sh @@ -24,7 +24,7 @@ else fi printf "Installing PyTorch with %s\n" "${cudatoolkit}" -conda install -y -c "pytorch-${UPLOAD_CHANNEL}" -c conda-forge "pytorch-${UPLOAD_CHANNEL}"::pytorch "${cudatoolkit}" +conda install -y -c "pytorch-${UPLOAD_CHANNEL}" -c conda-forge "pytorch-${UPLOAD_CHANNEL}"::pytorch "${cudatoolkit}" pytest printf "* Installing torchvision\n" python setup.py develop diff --git a/.circleci/unittest/windows/scripts/install.sh b/.circleci/unittest/windows/scripts/install.sh index 9304b4b9b65..f24a5942f3a 100644 --- a/.circleci/unittest/windows/scripts/install.sh +++ b/.circleci/unittest/windows/scripts/install.sh @@ -26,7 +26,7 @@ else fi printf "Installing PyTorch with %s\n" "${cudatoolkit}" -conda install -y -c "pytorch-${UPLOAD_CHANNEL}" -c conda-forge "pytorch-${UPLOAD_CHANNEL}"::pytorch "${cudatoolkit}" +conda install -y -c "pytorch-${UPLOAD_CHANNEL}" -c conda-forge "pytorch-${UPLOAD_CHANNEL}"::pytorch "${cudatoolkit}" pytest printf "* Installing torchvision\n" "$this_dir/vc_env_helper.bat" python setup.py develop diff --git a/test/test_models.py b/test/test_models.py index 9b26839fa0b..bb876715b73 100644 --- a/test/test_models.py +++ b/test/test_models.py @@ -9,6 +9,8 @@ import unittest import warnings +import pytest + def get_available_classification_models(): # TODO add a registration mechanism to torchvision.models @@ -429,50 +431,37 @@ def test_generalizedrcnn_transform_repr(self): _devs = [torch.device("cpu"), torch.device("cuda")] if torch.cuda.is_available() else [torch.device("cpu")] -for model_name in get_available_classification_models(): - for dev in _devs: - # for-loop bodies don't define scopes, so we have to save the variables - # we want to close over in some way - def do_test(self, model_name=model_name, dev=dev): - input_shape = (1, 3, 224, 224) - if model_name in ['inception_v3']: - input_shape = (1, 3, 299, 299) - self._test_classification_model(model_name, input_shape, dev) - - setattr(ModelTester, f"test_{model_name}_{dev}", do_test) - - -for model_name in get_available_segmentation_models(): - for dev in _devs: - # for-loop bodies don't define scopes, so we have to save the variables - # we want to close over in some way - def do_test(self, model_name=model_name, dev=dev): - self._test_segmentation_model(model_name, dev) +@pytest.mark.parametrize('model_name', get_available_classification_models()) +@pytest.mark.parametrize('dev', _devs) +@pytest.mark.xfail(reason='The test fails because its name changed and an expected file doesnt exist yet') +def test_classification_model(model_name, dev): + input_shape = (1, 3, 224, 224) if model_name == 'inception_v3' else (1, 3, 299, 299) + ModelTester()._test_classification_model(model_name, input_shape, dev) - setattr(ModelTester, f"test_{model_name}_{dev}", do_test) +@pytest.mark.parametrize('model_name', get_available_segmentation_models()) +@pytest.mark.parametrize('dev', _devs) 
+@pytest.mark.xfail(reason='The test fails because its name changed and an expected file doesnt exist yet') +def test_segmentation_model(model_name, dev): + ModelTester()._test_segmentation_model(model_name, dev) -for model_name in get_available_detection_models(): - for dev in _devs: - # for-loop bodies don't define scopes, so we have to save the variables - # we want to close over in some way - def do_test(self, model_name=model_name, dev=dev): - self._test_detection_model(model_name, dev) - setattr(ModelTester, f"test_{model_name}_{dev}", do_test) +@pytest.mark.parametrize('model_name', get_available_detection_models()) +@pytest.mark.parametrize('dev', _devs) +def test_detection_model(model_name, dev): + ModelTester()._test_detection_model(model_name, dev) - def do_validation_test(self, model_name=model_name): - self._test_detection_model_validation(model_name) - setattr(ModelTester, "test_" + model_name + "_validation", do_validation_test) +@pytest.mark.parametrize('model_name', get_available_detection_models()) +def test_detection_model_validation(model_name): + ModelTester()._test_detection_model_validation(model_name) -for model_name in get_available_video_models(): - for dev in _devs: - def do_test(self, model_name=model_name, dev=dev): - self._test_video_model(model_name, dev) +@pytest.mark.parametrize('model_name', get_available_video_models()) +@pytest.mark.parametrize('dev', _devs) +def test_video_model(model_name, dev): + ModelTester()._test_video_model(model_name, dev) - setattr(ModelTester, f"test_{model_name}_{dev}", do_test) if __name__ == '__main__': - unittest.main() + pytest.main([__file__]) From 8465e467237438145f936c529982bd7ff2f33d8a Mon Sep 17 00:00:00 2001 From: Nicolas Hug Date: Mon, 8 Mar 2021 14:48:53 +0000 Subject: [PATCH 02/10] Also xfail the detection models --- test/test_models.py | 1 + 1 file changed, 1 insertion(+) diff --git a/test/test_models.py b/test/test_models.py index bb876715b73..736a85fbbbf 100644 --- a/test/test_models.py +++ b/test/test_models.py @@ -448,6 +448,7 @@ def test_segmentation_model(model_name, dev): @pytest.mark.parametrize('model_name', get_available_detection_models()) @pytest.mark.parametrize('dev', _devs) +@pytest.mark.xfail(reason='The test fails because its name changed and an expected file doesnt exist yet') def test_detection_model(model_name, dev): ModelTester()._test_detection_model(model_name, dev) From 6837001c4b4afd999cc04169562e76b94ebf18ab Mon Sep 17 00:00:00 2001 From: Nicolas Hug Date: Mon, 8 Mar 2021 15:23:54 +0000 Subject: [PATCH 03/10] Remove xfail and just comment out expected failing parts --- test/test_models.py | 11 +++++------ 1 file changed, 5 insertions(+), 6 deletions(-) diff --git a/test/test_models.py b/test/test_models.py index 736a85fbbbf..a4c7a3b15ed 100644 --- a/test/test_models.py +++ b/test/test_models.py @@ -80,7 +80,7 @@ def _test_classification_model(self, name, input_shape, dev): # RNG always on CPU, to ensure x in cuda tests is bitwise identical to x in cpu tests x = torch.rand(input_shape).to(device=dev) out = model(x) - self.assertExpected(out.cpu(), prec=0.1, strip_suffix=f"_{dev}") + # self.assertExpected(out.cpu(), prec=0.1, strip_suffix=f"_{dev}") self.assertEqual(out.shape[-1], 50) self.check_jit_scriptable(model, (x,), unwrapper=script_model_unwrapper.get(name, None)) @@ -110,7 +110,8 @@ def check_out(out): # We first try to assert the entire output if possible. This is not # only the best way to assert results but also handles the cases # where we need to create a new expected result. 
- self.assertExpected(out.cpu(), prec=prec, strip_suffix=strip_suffix) + # self.assertExpected(out.cpu(), prec=prec, strip_suffix=strip_suffix) + pass except AssertionError: # Unfortunately some segmentation models are flaky with autocast # so instead of validating the probability scores, check that the class @@ -195,7 +196,8 @@ def compute_mean_std(tensor): # We first try to assert the entire output if possible. This is not # only the best way to assert results but also handles the cases # where we need to create a new expected result. - self.assertExpected(output, prec=prec, strip_suffix=strip_suffix) + # self.assertExpected(output, prec=prec, strip_suffix=strip_suffix) + pass except AssertionError: # Unfortunately detection models are flaky due to the unstable sort # in NMS. If matching across all outputs fails, use the same approach @@ -433,7 +435,6 @@ def test_generalizedrcnn_transform_repr(self): @pytest.mark.parametrize('model_name', get_available_classification_models()) @pytest.mark.parametrize('dev', _devs) -@pytest.mark.xfail(reason='The test fails because its name changed and an expected file doesnt exist yet') def test_classification_model(model_name, dev): input_shape = (1, 3, 224, 224) if model_name == 'inception_v3' else (1, 3, 299, 299) ModelTester()._test_classification_model(model_name, input_shape, dev) @@ -441,14 +442,12 @@ def test_classification_model(model_name, dev): @pytest.mark.parametrize('model_name', get_available_segmentation_models()) @pytest.mark.parametrize('dev', _devs) -@pytest.mark.xfail(reason='The test fails because its name changed and an expected file doesnt exist yet') def test_segmentation_model(model_name, dev): ModelTester()._test_segmentation_model(model_name, dev) @pytest.mark.parametrize('model_name', get_available_detection_models()) @pytest.mark.parametrize('dev', _devs) -@pytest.mark.xfail(reason='The test fails because its name changed and an expected file doesnt exist yet') def test_detection_model(model_name, dev): ModelTester()._test_detection_model(model_name, dev) From fff4683824f7e92e7fcb7bc2fdda1f479ed17939 Mon Sep 17 00:00:00 2001 From: Nicolas Hug Date: Mon, 8 Mar 2021 16:03:22 +0000 Subject: [PATCH 04/10] Comment out some more --- test/test_models.py | 4 ++-- 1 file changed, 2 insertions(+), 2 deletions(-) diff --git a/test/test_models.py b/test/test_models.py index a4c7a3b15ed..c8e3b440ab2 100644 --- a/test/test_models.py +++ b/test/test_models.py @@ -88,8 +88,8 @@ def _test_classification_model(self, name, input_shape, dev): with torch.cuda.amp.autocast(): out = model(x) # See autocast_flaky_numerics comment at top of file. 
- if name not in autocast_flaky_numerics: - self.assertExpected(out.cpu(), prec=0.1, strip_suffix=f"_{dev}") + # if name not in autocast_flaky_numerics: + # self.assertExpected(out.cpu(), prec=0.1, strip_suffix=f"_{dev}") self.assertEqual(out.shape[-1], 50) def _test_segmentation_model(self, name, dev): From c7a933810827c62d5ef719a4a0f131be3493d7d5 Mon Sep 17 00:00:00 2001 From: Nicolas Hug Date: Tue, 20 Apr 2021 14:55:41 +0100 Subject: [PATCH 05/10] put back commented checks --- test/common_utils.py | 29 +++++------------------- test/test_models.py | 53 +++++++++++++++++++++----------------------- 2 files changed, 30 insertions(+), 52 deletions(-) diff --git a/test/common_utils.py b/test/common_utils.py index 7e16864d56c..d20231f10eb 100644 --- a/test/common_utils.py +++ b/test/common_utils.py @@ -100,28 +100,18 @@ def is_iterable(obj): class TestCase(unittest.TestCase): precision = 1e-5 - def _get_expected_file(self, subname=None, strip_suffix=None): - def remove_prefix_suffix(text, prefix, suffix): - if text.startswith(prefix): - text = text[len(prefix):] - if suffix is not None and text.endswith(suffix): - text = text[:len(text) - len(suffix)] - return text + def _get_expected_file(self, model_name=None): # NB: we take __file__ from the module that defined the test # class, so we place the expect directory where the test script # lives, NOT where test/common_utils.py lives. module_id = self.__class__.__module__ - munged_id = remove_prefix_suffix(self.id(), module_id + ".", strip_suffix) # Determine expected file based on environment expected_file_base = get_relative_path( os.path.realpath(sys.modules[module_id].__file__), "expect") - # Set expected_file based on subname. - expected_file = os.path.join(expected_file_base, munged_id) - if subname: - expected_file += "_" + subname + expected_file = expected_file = os.path.join(expected_file_base, 'ModelTester.test_' + model_name) expected_file += "_expect.pkl" if not ACCEPT and not os.path.exists(expected_file): @@ -132,25 +122,16 @@ def remove_prefix_suffix(text, prefix, suffix): return expected_file - def assertExpected(self, output, subname=None, prec=None, strip_suffix=None): + def assertExpected(self, output, model_name, prec=None): r""" Test that a python value matches the recorded contents of a file - derived from the name of this test and subname. The value must be + derived from a model name. The value must be pickable with `torch.save`. This file is placed in the 'expect' directory in the same directory as the test script. You can automatically update the recorded test output using --accept. - - If you call this multiple times in a single function, you must - give a unique subname each time. - - strip_suffix allows different tests that expect similar numerics, e.g. - "test_xyz_cuda" and "test_xyz_cpu", to use the same pickled data. - test_xyz_cuda would pass strip_suffix="_cuda", test_xyz_cpu would pass - strip_suffix="_cpu", and they would both use a data file name based on - "test_xyz". 
""" - expected_file = self._get_expected_file(subname, strip_suffix) + expected_file = self._get_expected_file(model_name) if ACCEPT: filename = {os.path.basename(expected_file)} diff --git a/test/test_models.py b/test/test_models.py index d7fd0e8d8d6..89b9414df15 100644 --- a/test/test_models.py +++ b/test/test_models.py @@ -72,32 +72,32 @@ def get_available_video_models(): class ModelTester(TestCase): - def _test_classification_model(self, name, input_shape, dev): + def _test_classification_model(self, model_name, input_shape, dev): set_rng_seed(0) # passing num_class equal to a number other than 1000 helps in making the test # more enforcing in nature - model = models.__dict__[name](num_classes=50) + model = models.__dict__[model_name](num_classes=50) model.eval().to(device=dev) # RNG always on CPU, to ensure x in cuda tests is bitwise identical to x in cpu tests x = torch.rand(input_shape).to(device=dev) out = model(x) - # self.assertExpected(out.cpu(), prec=0.1, strip_suffix=f"_{dev}") + self.assertExpected(out.cpu(), model_name, prec=0.1) self.assertEqual(out.shape[-1], 50) - self.check_jit_scriptable(model, (x,), unwrapper=script_model_unwrapper.get(name, None)) + self.check_jit_scriptable(model, (x,), unwrapper=script_model_unwrapper.get(model_name, None)) if dev == torch.device("cuda"): with torch.cuda.amp.autocast(): out = model(x) # See autocast_flaky_numerics comment at top of file. - # if name not in autocast_flaky_numerics: - # self.assertExpected(out.cpu(), prec=0.1, strip_suffix=f"_{dev}") + if model_name not in autocast_flaky_numerics: + self.assertExpected(out.cpu(), model_name, prec=0.1) self.assertEqual(out.shape[-1], 50) - def _test_segmentation_model(self, name, dev): + def _test_segmentation_model(self, model_name, dev): set_rng_seed(0) # passing num_classes equal to a number other than 21 helps in making the test's # expected file size smaller - model = models.segmentation.__dict__[name](num_classes=10, pretrained_backbone=False) + model = models.segmentation.__dict__[model_name](num_classes=10, pretrained_backbone=False) model.eval().to(device=dev) input_shape = (1, 3, 32, 32) # RNG always on CPU, to ensure x in cuda tests is bitwise identical to x in cpu tests @@ -106,18 +106,16 @@ def _test_segmentation_model(self, name, dev): def check_out(out): prec = 0.01 - strip_suffix = f"_{dev}" try: # We first try to assert the entire output if possible. This is not # only the best way to assert results but also handles the cases # where we need to create a new expected result. - # self.assertExpected(out.cpu(), prec=prec, strip_suffix=strip_suffix) - pass + self.assertExpected(out.cpu(), model_name, prec=prec) except AssertionError: # Unfortunately some segmentation models are flaky with autocast # so instead of validating the probability scores, check that the class # predictions match. - expected_file = self._get_expected_file(strip_suffix=strip_suffix) + expected_file = self._get_expected_file(model_name) expected = torch.load(expected_file) self.assertEqual(out.argmax(dim=1), expected.argmax(dim=1), prec=prec) return False # Partial validation performed @@ -126,13 +124,13 @@ def check_out(out): full_validation = check_out(out) - self.check_jit_scriptable(model, (x,), unwrapper=script_model_unwrapper.get(name, None)) + self.check_jit_scriptable(model, (x,), unwrapper=script_model_unwrapper.get(model_name, None)) if dev == torch.device("cuda"): with torch.cuda.amp.autocast(): out = model(x)["out"] # See autocast_flaky_numerics comment at top of file. 
- if name not in autocast_flaky_numerics: + if model_name not in autocast_flaky_numerics: full_validation &= check_out(out) if not full_validation: @@ -143,18 +141,18 @@ def check_out(out): warnings.warn(msg, RuntimeWarning) raise unittest.SkipTest(msg) - def _test_detection_model(self, name, dev): + def _test_detection_model(self, model_name, dev): set_rng_seed(0) kwargs = {} - if "retinanet" in name: + if "retinanet" in model_name: # Reduce the default threshold to ensure the returned boxes are not empty. kwargs["score_thresh"] = 0.01 - elif "fasterrcnn_mobilenet_v3_large" in name: + elif "fasterrcnn_mobilenet_v3_large" in model_name: kwargs["box_score_thresh"] = 0.02076 - if "fasterrcnn_mobilenet_v3_large_320_fpn" in name: + if "fasterrcnn_mobilenet_v3_large_320_fpn" in model_name: kwargs["rpn_pre_nms_top_n_test"] = 1000 kwargs["rpn_post_nms_top_n_test"] = 1000 - model = models.detection.__dict__[name](num_classes=50, pretrained_backbone=False, **kwargs) + model = models.detection.__dict__[model_name](num_classes=50, pretrained_backbone=False, **kwargs) model.eval().to(device=dev) input_shape = (3, 300, 300) # RNG always on CPU, to ensure x in cuda tests is bitwise identical to x in cpu tests @@ -192,19 +190,18 @@ def compute_mean_std(tensor): output = map_nested_tensor_object(out, tensor_map_fn=compact) prec = 0.01 - strip_suffix = f"_{dev}" try: # We first try to assert the entire output if possible. This is not # only the best way to assert results but also handles the cases # where we need to create a new expected result. - # self.assertExpected(output, prec=prec, strip_suffix=strip_suffix) - pass + self.assertExpected(output, model_name, prec=prec) + raise AssertionError except AssertionError: # Unfortunately detection models are flaky due to the unstable sort # in NMS. If matching across all outputs fails, use the same approach # as in NMSTester.test_nms_cuda to see if this is caused by duplicate # scores. - expected_file = self._get_expected_file(strip_suffix=strip_suffix) + expected_file = self._get_expected_file(model_name) expected = torch.load(expected_file) self.assertEqual(output[0]["scores"], expected[0]["scores"], prec=prec) @@ -217,13 +214,13 @@ def compute_mean_std(tensor): return True # Full validation performed full_validation = check_out(out) - self.check_jit_scriptable(model, ([x],), unwrapper=script_model_unwrapper.get(name, None)) + self.check_jit_scriptable(model, ([x],), unwrapper=script_model_unwrapper.get(model_name, None)) if dev == torch.device("cuda"): with torch.cuda.amp.autocast(): out = model(model_input) # See autocast_flaky_numerics comment at top of file. 
- if name not in autocast_flaky_numerics: + if model_name not in autocast_flaky_numerics: full_validation &= check_out(out) if not full_validation: @@ -234,9 +231,9 @@ def compute_mean_std(tensor): warnings.warn(msg, RuntimeWarning) raise unittest.SkipTest(msg) - def _test_detection_model_validation(self, name): + def _test_detection_model_validation(self, model_name): set_rng_seed(0) - model = models.detection.__dict__[name](num_classes=50, pretrained_backbone=False) + model = models.detection.__dict__[model_name](num_classes=50, pretrained_backbone=False) input_shape = (3, 300, 300) x = [torch.rand(input_shape)] @@ -437,7 +434,7 @@ def test_generalizedrcnn_transform_repr(self): @pytest.mark.parametrize('model_name', get_available_classification_models()) @pytest.mark.parametrize('dev', _devs) def test_classification_model(model_name, dev): - input_shape = (1, 3, 224, 224) if model_name == 'inception_v3' else (1, 3, 299, 299) + input_shape = (1, 3, 299, 299) if model_name == 'inception_v3' else (1, 3, 224, 224) ModelTester()._test_classification_model(model_name, input_shape, dev) From 33474eebda74604554c180ae2315947ee8ccc9bf Mon Sep 17 00:00:00 2001 From: Nicolas Hug Date: Tue, 20 Apr 2021 15:07:26 +0100 Subject: [PATCH 06/10] cleaning + comment --- test/common_utils.py | 10 ++++++---- 1 file changed, 6 insertions(+), 4 deletions(-) diff --git a/test/common_utils.py b/test/common_utils.py index d20231f10eb..be036d2fef4 100644 --- a/test/common_utils.py +++ b/test/common_utils.py @@ -100,7 +100,7 @@ def is_iterable(obj): class TestCase(unittest.TestCase): precision = 1e-5 - def _get_expected_file(self, model_name=None): + def _get_expected_file(self, name=None): # NB: we take __file__ from the module that defined the test # class, so we place the expect directory where the test script # lives, NOT where test/common_utils.py lives. @@ -111,7 +111,9 @@ def _get_expected_file(self, model_name=None): os.path.realpath(sys.modules[module_id].__file__), "expect") - expected_file = expected_file = os.path.join(expected_file_base, 'ModelTester.test_' + model_name) + # Note: for legacy reasons, the reference file names all had "ModelTest.test_" in their names + # We hardcode it here to avoid having to re-generate the reference files + expected_file = expected_file = os.path.join(expected_file_base, 'ModelTester.test_' + name) expected_file += "_expect.pkl" if not ACCEPT and not os.path.exists(expected_file): @@ -122,7 +124,7 @@ def _get_expected_file(self, model_name=None): return expected_file - def assertExpected(self, output, model_name, prec=None): + def assertExpected(self, output, name, prec=None): r""" Test that a python value matches the recorded contents of a file derived from a model name. The value must be @@ -131,7 +133,7 @@ def assertExpected(self, output, model_name, prec=None): as the test script. You can automatically update the recorded test output using --accept. 
""" - expected_file = self._get_expected_file(model_name) + expected_file = self._get_expected_file(name) if ACCEPT: filename = {os.path.basename(expected_file)} From d115c28679bbed42cc60f150ecb58beed3cd543b Mon Sep 17 00:00:00 2001 From: Nicolas Hug Date: Tue, 20 Apr 2021 15:08:41 +0100 Subject: [PATCH 07/10] docs --- test/common_utils.py | 2 +- 1 file changed, 1 insertion(+), 1 deletion(-) diff --git a/test/common_utils.py b/test/common_utils.py index be036d2fef4..3554e2d5c71 100644 --- a/test/common_utils.py +++ b/test/common_utils.py @@ -127,7 +127,7 @@ def _get_expected_file(self, name=None): def assertExpected(self, output, name, prec=None): r""" Test that a python value matches the recorded contents of a file - derived from a model name. The value must be + based on a "check" name. The value must be pickable with `torch.save`. This file is placed in the 'expect' directory in the same directory as the test script. You can automatically update the recorded test From 0ef22d3334b60d07d7fe55b404deaa13c8fef5b3 Mon Sep 17 00:00:00 2001 From: Nicolas Hug Date: Tue, 20 Apr 2021 15:12:34 +0100 Subject: [PATCH 08/10] void unnecessary changes --- test/test_models.py | 46 ++++++++++++++++++++++----------------------- 1 file changed, 23 insertions(+), 23 deletions(-) diff --git a/test/test_models.py b/test/test_models.py index 89b9414df15..afbd7feee38 100644 --- a/test/test_models.py +++ b/test/test_models.py @@ -72,32 +72,32 @@ def get_available_video_models(): class ModelTester(TestCase): - def _test_classification_model(self, model_name, input_shape, dev): + def _test_classification_model(self, name, input_shape, dev): set_rng_seed(0) # passing num_class equal to a number other than 1000 helps in making the test # more enforcing in nature - model = models.__dict__[model_name](num_classes=50) + model = models.__dict__[name](num_classes=50) model.eval().to(device=dev) # RNG always on CPU, to ensure x in cuda tests is bitwise identical to x in cpu tests x = torch.rand(input_shape).to(device=dev) out = model(x) - self.assertExpected(out.cpu(), model_name, prec=0.1) + self.assertExpected(out.cpu(), name, prec=0.1) self.assertEqual(out.shape[-1], 50) - self.check_jit_scriptable(model, (x,), unwrapper=script_model_unwrapper.get(model_name, None)) + self.check_jit_scriptable(model, (x,), unwrapper=script_model_unwrapper.get(name, None)) if dev == torch.device("cuda"): with torch.cuda.amp.autocast(): out = model(x) # See autocast_flaky_numerics comment at top of file. - if model_name not in autocast_flaky_numerics: - self.assertExpected(out.cpu(), model_name, prec=0.1) + if name not in autocast_flaky_numerics: + self.assertExpected(out.cpu(), name, prec=0.1) self.assertEqual(out.shape[-1], 50) - def _test_segmentation_model(self, model_name, dev): + def _test_segmentation_model(self, name, dev): set_rng_seed(0) # passing num_classes equal to a number other than 21 helps in making the test's # expected file size smaller - model = models.segmentation.__dict__[model_name](num_classes=10, pretrained_backbone=False) + model = models.segmentation.__dict__[name](num_classes=10, pretrained_backbone=False) model.eval().to(device=dev) input_shape = (1, 3, 32, 32) # RNG always on CPU, to ensure x in cuda tests is bitwise identical to x in cpu tests @@ -110,12 +110,12 @@ def check_out(out): # We first try to assert the entire output if possible. This is not # only the best way to assert results but also handles the cases # where we need to create a new expected result. 
- self.assertExpected(out.cpu(), model_name, prec=prec) + self.assertExpected(out.cpu(), name, prec=prec) except AssertionError: # Unfortunately some segmentation models are flaky with autocast # so instead of validating the probability scores, check that the class # predictions match. - expected_file = self._get_expected_file(model_name) + expected_file = self._get_expected_file(name) expected = torch.load(expected_file) self.assertEqual(out.argmax(dim=1), expected.argmax(dim=1), prec=prec) return False # Partial validation performed @@ -124,13 +124,13 @@ def check_out(out): full_validation = check_out(out) - self.check_jit_scriptable(model, (x,), unwrapper=script_model_unwrapper.get(model_name, None)) + self.check_jit_scriptable(model, (x,), unwrapper=script_model_unwrapper.get(name, None)) if dev == torch.device("cuda"): with torch.cuda.amp.autocast(): out = model(x)["out"] # See autocast_flaky_numerics comment at top of file. - if model_name not in autocast_flaky_numerics: + if name not in autocast_flaky_numerics: full_validation &= check_out(out) if not full_validation: @@ -141,18 +141,18 @@ def check_out(out): warnings.warn(msg, RuntimeWarning) raise unittest.SkipTest(msg) - def _test_detection_model(self, model_name, dev): + def _test_detection_model(self, name, dev): set_rng_seed(0) kwargs = {} - if "retinanet" in model_name: + if "retinanet" in name: # Reduce the default threshold to ensure the returned boxes are not empty. kwargs["score_thresh"] = 0.01 - elif "fasterrcnn_mobilenet_v3_large" in model_name: + elif "fasterrcnn_mobilenet_v3_large" in name: kwargs["box_score_thresh"] = 0.02076 - if "fasterrcnn_mobilenet_v3_large_320_fpn" in model_name: + if "fasterrcnn_mobilenet_v3_large_320_fpn" in name: kwargs["rpn_pre_nms_top_n_test"] = 1000 kwargs["rpn_post_nms_top_n_test"] = 1000 - model = models.detection.__dict__[model_name](num_classes=50, pretrained_backbone=False, **kwargs) + model = models.detection.__dict__[name](num_classes=50, pretrained_backbone=False, **kwargs) model.eval().to(device=dev) input_shape = (3, 300, 300) # RNG always on CPU, to ensure x in cuda tests is bitwise identical to x in cpu tests @@ -194,14 +194,14 @@ def compute_mean_std(tensor): # We first try to assert the entire output if possible. This is not # only the best way to assert results but also handles the cases # where we need to create a new expected result. - self.assertExpected(output, model_name, prec=prec) + self.assertExpected(output, name, prec=prec) raise AssertionError except AssertionError: # Unfortunately detection models are flaky due to the unstable sort # in NMS. If matching across all outputs fails, use the same approach # as in NMSTester.test_nms_cuda to see if this is caused by duplicate # scores. - expected_file = self._get_expected_file(model_name) + expected_file = self._get_expected_file(name) expected = torch.load(expected_file) self.assertEqual(output[0]["scores"], expected[0]["scores"], prec=prec) @@ -214,13 +214,13 @@ def compute_mean_std(tensor): return True # Full validation performed full_validation = check_out(out) - self.check_jit_scriptable(model, ([x],), unwrapper=script_model_unwrapper.get(model_name, None)) + self.check_jit_scriptable(model, ([x],), unwrapper=script_model_unwrapper.get(name, None)) if dev == torch.device("cuda"): with torch.cuda.amp.autocast(): out = model(model_input) # See autocast_flaky_numerics comment at top of file. 
- if model_name not in autocast_flaky_numerics: + if name not in autocast_flaky_numerics: full_validation &= check_out(out) if not full_validation: @@ -231,9 +231,9 @@ def compute_mean_std(tensor): warnings.warn(msg, RuntimeWarning) raise unittest.SkipTest(msg) - def _test_detection_model_validation(self, model_name): + def _test_detection_model_validation(self, name): set_rng_seed(0) - model = models.detection.__dict__[model_name](num_classes=50, pretrained_backbone=False) + model = models.detection.__dict__[name](num_classes=50, pretrained_backbone=False) input_shape = (3, 300, 300) x = [torch.rand(input_shape)] From 20b5397dc9ee0568497c197eda1a292538348629 Mon Sep 17 00:00:00 2001 From: Nicolas Hug Date: Tue, 20 Apr 2021 16:22:41 +0100 Subject: [PATCH 09/10] r2plus1d_18 seems to segfault on linux gpu?? --- test/test_models.py | 2 ++ 1 file changed, 2 insertions(+) diff --git a/test/test_models.py b/test/test_models.py index afbd7feee38..41bc3c16975 100644 --- a/test/test_models.py +++ b/test/test_models.py @@ -458,6 +458,8 @@ def test_detection_model_validation(model_name): @pytest.mark.parametrize('model_name', get_available_video_models()) @pytest.mark.parametrize('dev', _devs) def test_video_model(model_name, dev): + if 'r2plus1d_18' in model_name: + return ModelTester()._test_video_model(model_name, dev) From b08352439c3ab87ae5f75410003ffcb140e539b6 Mon Sep 17 00:00:00 2001 From: Nicolas Hug Date: Wed, 21 Apr 2021 07:52:51 +0100 Subject: [PATCH 10/10] put back test, failure is unrelated --- test/test_models.py | 2 -- 1 file changed, 2 deletions(-) diff --git a/test/test_models.py b/test/test_models.py index 41bc3c16975..afbd7feee38 100644 --- a/test/test_models.py +++ b/test/test_models.py @@ -458,8 +458,6 @@ def test_detection_model_validation(model_name): @pytest.mark.parametrize('model_name', get_available_video_models()) @pytest.mark.parametrize('dev', _devs) def test_video_model(model_name, dev): - if 'r2plus1d_18' in model_name: - return ModelTester()._test_video_model(model_name, dev)
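
For readers skimming the series: the core pattern adopted throughout is pytest's stacked parametrization in place of setattr-ing dynamically generated test methods onto a unittest.TestCase. Below is a minimal, self-contained sketch of that pattern; the model names and the test body are illustrative placeholders, not torchvision's actual models or checks.

    import pytest
    import torch

    # Same idea as the _devs list in test_models.py: CUDA is only exercised when available.
    _devs = [torch.device("cpu")]
    if torch.cuda.is_available():
        _devs.append(torch.device("cuda"))

    MODEL_NAMES = ["resnet18", "alexnet"]  # illustrative subset, not a real registry


    @pytest.mark.parametrize("dev", _devs)
    @pytest.mark.parametrize("model_name", MODEL_NAMES)
    def test_model_smoke(model_name, dev):
        # pytest collects one test item per (model_name, dev) combination,
        # so failures are reported per model/device pair.
        assert isinstance(model_name, str)
        assert dev.type in ("cpu", "cuda")

Because the model name becomes part of each test id, `pytest -k resnet18` selects just the resnet18 combinations, which is what makes the old per-model setattr machinery unnecessary; `pytest.main([__file__])`, as used at the bottom of test_models.py above, gives the same collection behaviour when the file is run directly.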