Squashed commit of the following:

awwong1 · awwong1 · commit 8b52d15862c7 · 2020-11-26T10:49:25.000-07:00
commit 08d38b3
Author: Alexander Wong <alex@udia.ca>
Date: Thu Nov 26 10:48:46 2020 -0700

    CircleCI badge to README.md

commit 64a3f8d
Author: Alexander Wong <alex@udia.ca>
Date: Thu Nov 26 10:42:32 2020 -0700

    Enforce requirements versions for test, reduced comparison strictness

commit fdcf493
Author: Alexander Wong <alex@udia.ca>
Date: Thu Nov 26 10:30:07 2020 -0700

    Test references updated to be consistent on development machine

    - torch==1.7.0
    - torchvision==0.8.1
    - TITAN Xp (12180MiB, CUDA Version 11.0, Driver Version: 450.80.02)

commit 654c87a
Author: Alexander Wong <alex@udia.ca>
Date: Thu Nov 26 09:45:42 2020 -0700

    CircleCI test configuration update

commit a8ecbff
Author: Alexander Wong <alex@udia.ca>
Date: Thu Nov 26 09:39:12 2020 -0700

    Add .circleci/config.yml
diff --git a/.circleci/config.yml b/.circleci/config.yml
@@ -0,0 +1,23 @@
+version: 2.1
+
+orbs:
+  python: circleci/python@1.2.1
+
+jobs:
+  build-and-test:
+    executor: python/default
+    steps:
+      - checkout
+      - python/install-packages:
+          pkg-manager: pip
+      - python/install-packages:
+          pip-dependency-file: requirements.txt
+          pkg-manager: pip
+      - run:
+          command: python3 -m unittest discover
+          name: Test
+
+workflows:
+  main:
+    jobs:
+      - build-and-test
diff --git a/README.md b/README.md
@@ -1,6 +1,7 @@
 # torchprof
 
 [![PyPI version](https://badge.fury.io/py/torchprof.svg)](https://pypi.org/project/torchprof/)
+[![CircleCI](https://circleci.com/gh/awwong1/torchprof.svg?style=svg)](https://circleci.com/gh/awwong1/torchprof)
 
 A minimal dependency library for layer-by-layer profiling of Pytorch models.
 
diff --git a/requirements.txt b/requirements.txt
@@ -1,2 +1,2 @@
-torch>=1.1.0
-torchvision>=0.3.0
+torch==1.7.0
+torchvision==0.8.1
diff --git a/tests/test_profile.py b/tests/test_profile.py
@@ -34,97 +34,254 @@ class TestProfile(unittest.TestCase):
     ]
 
     alexnet_cpu_ops = [
-        None,
-        None,
-        (
-            "conv2d",
-            "convolution",
-            "_convolution",
-            "contiguous",
-            "contiguous",
-            "contiguous",
-            "mkldnn_convolution",
-        ),
-        ("relu_",),
-        ("max_pool2d", "max_pool2d_with_indices"),
-        (
-            "conv2d",
-            "convolution",
-            "_convolution",
-            "contiguous",
-            "contiguous",
-            "contiguous",
-            "mkldnn_convolution",
-        ),
-        ("relu_",),
-        ("max_pool2d", "max_pool2d_with_indices"),
-        (
-            "conv2d",
-            "convolution",
-            "_convolution",
-            "contiguous",
-            "contiguous",
-            "contiguous",
-            "mkldnn_convolution",
-        ),
-        ("relu_",),
-        (
-            "conv2d",
-            "convolution",
-            "_convolution",
-            "contiguous",
-            "contiguous",
-            "contiguous",
-            "mkldnn_convolution",
-        ),
-        ("relu_",),
-        (
-            "conv2d",
-            "convolution",
-            "_convolution",
-            "contiguous",
-            "contiguous",
-            "contiguous",
-            "mkldnn_convolution",
-        ),
-        ("relu_",),
-        ("max_pool2d", "max_pool2d_with_indices"),
-        ("adaptive_avg_pool2d", "_adaptive_avg_pool2d"),
-        None,
-        ("dropout", "empty_like", "empty", "bernoulli_", "div_", "mul"),
-        ("unsigned short", "addmm"),
-        ("relu_",),
-        ("dropout", "empty_like", "empty", "bernoulli_", "div_", "mul"),
-        ("unsigned short", "addmm"),
-        ("relu_",),
-        ("unsigned short", "addmm"),
+        None,  # 0
+        None,  # 1
+        (
+            "aten::conv2d",
+            "aten::convolution",
+            "aten::_convolution",
+            "aten::contiguous",
+            "aten::contiguous",
+            "aten::contiguous",
+            "aten::mkldnn_convolution",
+            "aten::as_strided_",
+        ),  # 2
+        ("aten::relu_", "aten::threshold_"),  # 3
+        (
+            "aten::max_pool2d",
+            "aten::max_pool2d_with_indices",
+            "aten::contiguous",
+        ),  # 4
+        (
+            "aten::conv2d",
+            "aten::convolution",
+            "aten::_convolution",
+            "aten::contiguous",
+            "aten::contiguous",
+            "aten::contiguous",
+            "aten::mkldnn_convolution",
+            "aten::as_strided_",
+        ),  # 5
+        ("aten::relu_", "aten::threshold_"),  # 6
+        (
+            "aten::max_pool2d",
+            "aten::max_pool2d_with_indices",
+            "aten::contiguous",
+        ),  # 7
+        (
+            "aten::conv2d",
+            "aten::convolution",
+            "aten::_convolution",
+            "aten::contiguous",
+            "aten::contiguous",
+            "aten::contiguous",
+            "aten::mkldnn_convolution",
+            "aten::as_strided_",
+        ),  # 8
+        ("aten::relu_", "aten::threshold_"),  # 9
+        (
+            "aten::conv2d",
+            "aten::convolution",
+            "aten::_convolution",
+            "aten::contiguous",
+            "aten::contiguous",
+            "aten::contiguous",
+            "aten::mkldnn_convolution",
+            "aten::as_strided_",
+        ),  # 10
+        ("aten::relu_", "aten::threshold_"),  # 11
+        (
+            "aten::conv2d",
+            "aten::convolution",
+            "aten::_convolution",
+            "aten::contiguous",
+            "aten::contiguous",
+            "aten::contiguous",
+            "aten::mkldnn_convolution",
+            "aten::as_strided_",
+        ),  # 12
+        ("aten::relu_", "aten::threshold_"),  # 13
+        (
+            "aten::max_pool2d",
+            "aten::max_pool2d_with_indices",
+            "aten::contiguous",
+        ),  # 14
+        (
+            "aten::adaptive_avg_pool2d",
+            "aten::_adaptive_avg_pool2d",
+        ),  # 15
+        None,  # 16
+        (
+            "aten::dropout",
+            "aten::empty_like",
+            "aten::bernoulli_",
+            "aten::div_",
+            "aten::to",
+            "aten::empty_strided",
+            "aten::mul",
+        ),  # 17
+        (
+            "aten::t",
+            "aten::transpose",
+            "aten::as_strided",
+            "aten::addmm",
+            "aten::expand",
+            "aten::as_strided",
+        ),  # 18
+        ("aten::relu_", "aten::threshold_"),  # 19
+        (
+            "aten::dropout",
+            "aten::empty_like",
+            "aten::bernoulli_",
+            "aten::div_",
+            "aten::to",
+            "aten::empty_strided",
+            "aten::mul",
+        ),  # 20
+        (
+            "aten::t",
+            "aten::transpose",
+            "aten::as_strided",
+            "aten::addmm",
+            "aten::expand",
+            "aten::as_strided",
+        ),  # 21
+        ("aten::relu_", "aten::threshold_"),  # 22
+        (
+            "aten::t",
+            "aten::transpose",
+            "aten::as_strided",
+            "aten::addmm",
+            "aten::expand",
+            "aten::as_strided",
+        ),  # 23
     ]
 
     alexnet_gpu_ops = (
-        None,
-        None,
-        ("conv2d", "convolution", "_convolution", "contiguous", "cudnn_convolution"),
-        ("relu_",),
-        ("max_pool2d", "max_pool2d_with_indices"),
-        ("conv2d", "convolution", "_convolution", "contiguous", "cudnn_convolution"),
-        ("relu_",),
-        ("max_pool2d", "max_pool2d_with_indices"),
-        ("conv2d", "convolution", "_convolution", "contiguous", "cudnn_convolution"),
-        ("relu_",),
-        ("conv2d", "convolution", "_convolution", "contiguous", "cudnn_convolution"),
-        ("relu_",),
-        ("conv2d", "convolution", "_convolution", "contiguous", "cudnn_convolution"),
-        ("relu_",),
-        ("max_pool2d", "max_pool2d_with_indices"),
-        ("adaptive_avg_pool2d", "_adaptive_avg_pool2d"),
-        None,
-        ("dropout", "_fused_dropout"),
-        ("unsigned short", "addmm"),
-        ("relu_",),
-        ("dropout", "_fused_dropout"),
-        ("unsigned short", "addmm"),
-        ("relu_",),
-        ("unsigned short", "addmm"),
+        None,  # 0
+        None,  # 1
+        (
+            "aten::conv2d",
+            "aten::convolution",
+            "aten::_convolution",
+            "aten::contiguous",
+            "aten::cudnn_convolution",
+            "aten::contiguous",
+            "aten::contiguous",
+            "aten::reshape",
+            "aten::view",
+            "aten::add_",
+        ),  # 2
+        ("aten::relu_", "aten::threshold_"),  # 3
+        (
+            "aten::max_pool2d",
+            "aten::max_pool2d_with_indices",
+            "aten::contiguous",
+        ),  # 4
+        (
+            "aten::conv2d",
+            "aten::convolution",
+            "aten::_convolution",
+            "aten::contiguous",
+            "aten::cudnn_convolution",
+            "aten::contiguous",
+            "aten::contiguous",
+            "aten::reshape",
+            "aten::view",
+            "aten::add_",
+        ),  # 5
+        ("aten::relu_", "aten::threshold_"),  # 6
+        (
+            "aten::max_pool2d",
+            "aten::max_pool2d_with_indices",
+            "aten::contiguous",
+        ),  # 7
+        (
+            "aten::conv2d",
+            "aten::convolution",
+            "aten::_convolution",
+            "aten::contiguous",
+            "aten::cudnn_convolution",
+            "aten::contiguous",
+            "aten::contiguous",
+            "aten::reshape",
+            "aten::view",
+            "aten::add_",
+        ),  # 8
+        ("aten::relu_", "aten::threshold_"),  # 9
+        (
+            "aten::conv2d",
+            "aten::convolution",
+            "aten::_convolution",
+            "aten::contiguous",
+            "aten::cudnn_convolution",
+            "aten::contiguous",
+            "aten::contiguous",
+            "aten::reshape",
+            "aten::view",
+            "aten::add_",
+        ),  # 10
+        ("aten::relu_", "aten::threshold_"),  # 11
+        (
+            "aten::conv2d",
+            "aten::convolution",
+            "aten::_convolution",
+            "aten::contiguous",
+            "aten::cudnn_convolution",
+            "aten::contiguous",
+            "aten::contiguous",
+            "aten::reshape",
+            "aten::view",
+            "aten::add_",
+        ),  # 12
+        ("aten::relu_", "aten::threshold_"),  # 13
+        (
+            "aten::max_pool2d",
+            "aten::max_pool2d_with_indices",
+            "aten::contiguous",
+        ),  # 14
+        (
+            "aten::adaptive_avg_pool2d",
+            "aten::_adaptive_avg_pool2d",
+            "aten::contiguous",
+        ),  # 15
+        None,  # 16
+        (
+            "aten::dropout",
+            "aten::_fused_dropout",
+            "aten::empty_like",
+        ),  # 17
+        (
+            "aten::t",
+            "aten::transpose",
+            "aten::as_strided",
+            "aten::addmm",
+            "aten::expand",
+            "aten::as_strided",
+        ),  # 18
+        ("aten::relu_", "aten::threshold_"),  # 19
+        (
+            "aten::dropout",
+            "aten::_fused_dropout",
+            "aten::empty_like",
+        ),  # 20
+        (
+            "aten::t",
+            "aten::transpose",
+            "aten::as_strided",
+            "aten::addmm",
+            "aten::expand",
+            "aten::as_strided",
+        ),  # 21
+        ("aten::relu_", "aten::threshold_"),  # 22
+        (
+            "aten::t",
+            "aten::transpose",
+            "aten::as_strided",
+            "aten::addmm",
+            "aten::expand",
+            "aten::as_strided",
+        ),  # 23
     )
 
     def test_cpu_profile_structure(self):
@@ -155,7 +312,13 @@ def _profile_structure(self, model, x, use_cuda=False, alexnet_ops=[]):
                 self.assertEqual(len(event_lists), 1)
                 event_names = tuple(e.name for e in event_lists[0])
                 # profiler returned order is not deterministic
-                self.assertEqual(sorted(event_names), sorted(alexnet_ops[layer_idx]))
+                try:
+                    self.assertTrue(
+                        all(event_name in event_names for event_name in alexnet_ops[layer_idx]),
+                        f"Layer {layer_idx} received {event_names}, old {alexnet_ops[layer_idx]}",
+                    )
+                except IndexError:
+                    self.assertTrue(False, f"Layer {layer_idx} received {event_names}")
             else:
                 # non leaf nodes should not have event_list values
                 self.assertEqual(len(event_lists), 0)