# Owner(s): ["oncall: jit"]

import os
import sys

import torch
from torch.testing._internal.common_utils import skipIfTorchDynamo


# Make the helper files in test/ importable
pytorch_test_dir = os.path.dirname(os.path.dirname(os.path.realpath(__file__)))
sys.path.append(pytorch_test_dir)
from torch.testing._internal.jit_utils import FileCheck, JitTestCase, warmup_backward


if __name__ == "__main__":
    raise RuntimeError(
        "This test file is not meant to be run directly, use:\n\n"
        "\tpython test/test_jit.py TESTNAME\n\n"
        "instead."
    )


@skipIfTorchDynamo()
class TestProfiler(JitTestCase):
    def setUp(self):
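        # Save the current executor/fuser flags, then enable the profiling
        # executor with the TensorExpr fuser on CPU. The default dtype is
        # switched to double so specialized tensor types show up as Double(...)
        # in the IR dumps checked below.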
        self.prev_exec = torch._C._jit_set_profiling_executor(True)
        self.prev_profiling = torch._C._get_graph_executor_optimize(True)
        self.inline_autodiff = torch._C._debug_set_autodiff_subgraph_inlining(False)
        self.texpr_fuser_state = torch._C._jit_texpr_fuser_enabled()
        self.can_fuse_on_cpu = torch._C._jit_can_fuse_on_cpu()
        torch._C._jit_set_texpr_fuser_enabled(True)
        torch._C._jit_override_can_fuse_on_cpu(True)
        self.default_dtype = torch.get_default_dtype()
        self.old_reduction_enabled = torch._C._jit_set_texpr_reductions_enabled(True)
        torch.set_default_dtype(torch.double)
        self.old_fusion_inlining = torch._C._debug_get_fusion_group_inlining()
        torch._C._debug_set_fusion_group_inlining(False)
        self.old_te_must_use_llvm_cpu = torch._C._jit_get_te_must_use_llvm_cpu()
        torch._C._jit_set_te_must_use_llvm_cpu(False)

    def tearDown(self):
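        # Restore every global flag saved in setUp.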
        torch._C._jit_set_profiling_executor(self.prev_exec)
        torch._C._get_graph_executor_optimize(self.prev_profiling)
        torch._C._debug_set_autodiff_subgraph_inlining(self.inline_autodiff)
        torch._C._jit_set_texpr_fuser_enabled(self.texpr_fuser_state)
        torch._C._jit_override_can_fuse_on_cpu(self.can_fuse_on_cpu)
        torch.set_default_dtype(self.default_dtype)
        torch._C._jit_set_texpr_reductions_enabled(self.old_reduction_enabled)
        torch._C._debug_set_fusion_group_inlining(self.old_fusion_inlining)
        torch._C._jit_set_te_must_use_llvm_cpu(self.old_te_must_use_llvm_cpu)

    def test_tensor_type_not_determined_by_inputs(self):
        @torch.jit.script
        def scalar_type_input(x, y, z):
            return x + y + 4 + z.item()

        x = torch.tensor([2, 2])
        scalar_type_input(x, x, torch.tensor(1))
        scalar_type_input(x, x, torch.tensor(1))
        scalar_type_input(x, x, torch.tensor(1.0))
        g = torch.jit.last_executed_optimized_graph()

        # item & add should not get pulled into the fusion group -
        # we expect to see FusionGroup, (item / add), FusionGroup in the IR dump
        FileCheck().check("TensorExpr").check("Scalar = aten::item").check_next(
            "Tensor = aten::add"
        ).check("TensorExpr").run(g)

        @torch.jit.script
        def non_const_dtype(x, y, cond: bool):
            dtype = torch.int16 if cond else torch.int32
            return (x + y + 3).sum(dtype=dtype)

        non_const_dtype(x, x, True)
        non_const_dtype(x, x, True)
        g = torch.jit.last_executed_optimized_graph()
        # because dtype is non-const, sum should not get pulled into the Fusion Group
        FileCheck().check("TensorExpr").check("TensorExpr").check_not("aten::sum").run(
            g
        )

    def test_specialize_backward(self):
        def test_fuse(a, b):
            c = a * b
            d = c * b
            return d

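        # Disable function caching so the second torch.jit.script(test_fuse)
        # call below compiles a fresh graph instead of reusing this one.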
        test_fuse.__disable_jit_function_caching__ = True

        scripted_f = torch.jit.script(test_fuse)
        x = torch.ones(1, requires_grad=True)
        y = torch.ones(1, requires_grad=True)
        scripted_f(x, y)
        b = scripted_f(x, y)
        warmup_backward(b)
        g = torch.jit.last_executed_optimized_graph()
        # Backward has an if node guarding specializations; within the true
        # block of that if node there is only one if node, which guards a
        # tensorexpr group.
        optimized_block = next(g.findNode("prim::If").blocks())
        if_nodes = list(optimized_block.findAllNodes("prim::If"))

        self.assertEqual(len(if_nodes), 1)
        FileCheck().check("Group[Subgraph").run(str(if_nodes[0]))
        # no broadcasts occurred, so the _grad_sum_to_size calls have been specialized out
        self.assertIsNone(optimized_block.findNode("aten::_grad_sum_to_size"))

        broadcast_f = torch.jit.script(test_fuse)
        x = torch.ones([2, 2], requires_grad=True)
        y = torch.ones([1], requires_grad=True)
        broadcast_f(x, y)
        b = broadcast_f(x, y)
        b.backward(torch.ones([2, 2], dtype=torch.float), retain_graph=True)
        b.backward(torch.ones([2, 2], dtype=torch.float))
        # warmup_backward(b, torch.ones([2, 2], dtype=torch.float))
        g = torch.jit.last_executed_optimized_graph()
        optimized_block = next(g.findNode("prim::If").blocks())
        # broadcasts occurred, so we currently expect to see aten::_grad_sum_to_size
        self.assertIsNotNone(optimized_block.findNode("aten::_grad_sum_to_size"))

    def test_specialized_types(self):
        @torch.jit.script
        def test_fuse(a, b):
            c = a * b
            d = c * b
            return d

        x = torch.tensor([0.5])
        for _ in range(3):
            test_fuse(x, x)

        g = torch.jit.last_executed_optimized_graph()
        # Types should remain specialized for typecheck outputs & fusion outputs
        FileCheck().check("Double(").check_same("prim::TypeCheck").check_same(
            "\n"
        ).check("Double").check_same("TensorExpr").run(g)

        # other outputs should not be specialized
        FileCheck().check("Tensor = prim::If").run(g)

    def test_aliasing_merge(self):
        @torch.jit.script
        def foo(a, b):
            c = a * b
            d = c * b
            d.add_(b)
            e = d * b
            return d + e

        x = torch.ones(1)
        y = torch.ones(1)
        foo(x, y)
        b = foo(x, y)
        g = torch.jit.last_executed_optimized_graph()
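        # The in-place add_ aliases d, so the multiplies before and after it
        # cannot be merged into one fusion group; we expect two guarded
        # TensorExpr groups separated by aten::add_.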
        self.assertEqual(len(list(g.findAllNodes("prim::TypeCheck"))), 2)
        FileCheck().check("TensorExpr").check("aten::add_").check("TensorExpr").run(g)

    def test_use_not_profiled(self):
        def foo(t1, t2, t3, t4, t: float):
            h = t1 + t2 + t3 + t4
            if t > 0.5:
                # Putting a use of t1 in a never-executed conditional prevents
                # that use from being profiled
                return t1 + 1
            return h

        t = torch.rand(8, dtype=torch.float)

        foo_script = torch.jit.script(foo)
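        # Run once more than the number of profiling runs so the final call
        # executes the optimized plan.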
        for _ in range(torch._C._jit_get_num_profiled_runs() + 1):
            foo_script(t, t, t, t, 0.1)

        self.assertEqual(foo(t, t, t, t, 0.1), foo_script(t, t, t, t, 0.1))
        g = torch.jit.last_executed_optimized_graph()
        # all adds fused
        FileCheck().check("graph").check_not("aten::add").check("prim::If").run(g)

    def test_not_fusing_scalar_ops(self):
        @torch.jit.script
        def foo(x: int, y: int):
            return x + y + 2 + 4 + 5 + 6

        foo(1, 2)
        foo(2, 3)
        g = torch.jit.last_executed_optimized_graph()
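        # Purely scalar (int) arithmetic should not be handed to the TensorExpr fuser.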
        FileCheck().check_not("TensorExpr").run(g)

    def test_not_optimizing_property(self):
        @torch.jit.script
        def foo(x, y):
            return x + y + 1 + 2 + 3, x.size()

        x = torch.ones(1)
        foo(x, x)
        foo(x, x)
        g = torch.jit.last_executed_optimized_graph()
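        # x.size() must stay in the graph rather than being baked in from the
        # profiled shape, so foo remains correct for inputs of other sizes.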
        FileCheck().check("aten::size").run(g)
        x = torch.ones([2, 3, 5])
        self.assertEqual(foo(x, x), (x + x + 1 + 2 + 3, x.size()))

    def test_fallback_graph_not_specialized(self):
        @torch.jit.script
        def foo(a, b):
            c = a * b
            d = c * b
            e = d * b
            return d + e

        x = torch.ones(1)
        y = torch.ones(1)
        foo(x, y)
        foo(x, y)
        g = torch.jit.last_executed_optimized_graph()
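        # The fallback path goes through a function call whose unpacked outputs
        # keep the unspecialized Tensor type.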
        FileCheck().check("CallFunction").check_next("Tensor = prim::TupleUnpack").run(
            g
        )

    def test_autograd_fallback_graph(self):
        @torch.jit.script
        def foo(a, b):
            c = a * b
            d = c * b
            e = d * b
            return d + e

        x = torch.ones(1, requires_grad=True)
        y = torch.ones(1, requires_grad=True)
        foo(x, y)
        b = foo(x, y)
        b.backward(torch.ones([1], dtype=torch.float), retain_graph=True)
        b.backward(torch.ones([1], dtype=torch.float))

        g = torch.jit.last_executed_optimized_graph()
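        # After warming up backward, the optimized graph should still contain a
        # call to the autodiff fallback function.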
        FileCheck().check("fallback_function").check_next("CallFunction").run(g)

    def test_tensor_constant(self):
        def foo(a, b):
            return a + b + torch.tensor([2])

        x = torch.ones(1, requires_grad=False)
        foo_script = torch.jit.script(foo)
        foo_script(x, x)
        foo_script(x, x)

        self.assertEqual(foo_script(x, x), foo(x, x))
        g = torch.jit.last_executed_optimized_graph()
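        # Exactly the two adds written in foo should survive in the optimized
        # graph; the torch.tensor([2]) constant must not add or remove any.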
        FileCheck().check_count("aten::add", 2, exactly=True).run(g)

    def test_local_fusion_strategy(self):
        @torch.jit.script
        def foo(x):
            return x + x + x

        torch.jit.set_fusion_strategy([("STATIC", 1)])
        for _ in range(3):
            foo(torch.rand([10]))

        torch.jit.set_fusion_strategy([("STATIC", 10)])

        for i in range(10):
            foo(torch.rand([i]))
            foo(torch.rand([i]))

        g = torch.jit.last_executed_optimized_graph()
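        # foo was compiled while the ("STATIC", 1) strategy was active, so
        # raising the global limit afterwards should not grow the number of
        # TensorExprGroup nodes beyond the expected two.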
        FileCheck().check_count(":TensorExprGroup", 2, exactly=True).run(g)

    def test_iterative_fusion(self):
        @torch.jit.script
        def foo(a, b, c, d):
            a = a + b
            b.add_(3)
            c = c + b + d
            a = a + 1
            return a, c

        x = torch.ones(1, requires_grad=False)
        foo(x, x, x, x)
        foo(x, x, x, x)

        # When we iterate through the block, we start by fusing a = a + b with
        # a = a + 1. If we were to continue iterating from that fusion point, we
        # would miss the fusion opportunity of c = c + b + d.

        g = torch.jit.last_executed_optimized_graph()
        self.assertEqual(len(list(g.findAllNodes("prim::TensorExprGroup"))), 2)