Skip to content

Commit 0ee6bde

Browse files
committed
Delete torch._functorch.config.use_dynamic_shapes
As requested in #95975 (comment). Signed-off-by: Edward Z. Yang <ezyang@meta.com> [ghstack-poisoned]
1 parent 36a6e2c commit 0ee6bde

4 files changed

Lines changed: 35 additions & 65 deletions

File tree

test/functorch/test_aotdispatch.py

Lines changed: 25 additions & 37 deletions
Original file line numberDiff line numberDiff line change
@@ -245,6 +245,7 @@ def verify_aot_autograd(
245245
*,
246246
test_mutation: bool = False,
247247
decompositions: Optional[Dict] = None,
248+
dynamic: bool = False,
248249
):
249250
for keep_input_mutations in [True, False]:
250251
# Some tests pass in a callable for inp, to generate the inputs
@@ -294,15 +295,17 @@ def verify_aot_autograd(
294295
fw_compiler=partial(extract_graph, graph_cell=fw_graph_cell),
295296
bw_compiler=nop,
296297
decompositions=decompositions,
297-
keep_inference_input_mutations=keep_input_mutations
298+
keep_inference_input_mutations=keep_input_mutations,
299+
dynamic=dynamic
298300
)
299301
else:
300302
compiled_f = aot_function(
301303
f,
302304
fw_compiler=partial(extract_graph, graph_cell=fw_graph_cell),
303305
bw_compiler=nop,
304306
decompositions=decompositions,
305-
keep_inference_input_mutations=keep_input_mutations
307+
keep_inference_input_mutations=keep_input_mutations,
308+
dynamic=dynamic
306309
)
307310
ref_out, ref_grad = outs_and_grads(f, graph_inps, inp)
308311
test_out, test_grad = outs_and_grads(compiled_f, graph_inps_copy, inp_copy)
@@ -366,21 +369,17 @@ def f(a, b):
366369
self.verify_aot_autograd(f, inp)
367370

368371
# Test for bug occurring at the intersection of fake tensors & functionalization.
369-
@patch("torch._functorch.config.use_dynamic_shapes", True)
370-
@patch("torch._functorch.config.use_fake_tensor", True)
371372
def test_squeeze_mutation(self):
372373
def f(a):
373374
b = a.clone().squeeze(-1)
374375
b.add_(1.)
375376
return a + b
376377

377378
inp = [torch.randn(3, 1, requires_grad=True)]
378-
self.verify_aot_autograd(f, inp)
379+
self.verify_aot_autograd(f, inp, dynamic=True)
379380
inp = [torch.randn(3, 1, requires_grad=False)]
380-
self.verify_aot_autograd(f, inp)
381+
self.verify_aot_autograd(f, inp, dynamic=True)
381382

382-
@patch("torch._functorch.config.use_dynamic_shapes", True)
383-
@patch("torch._functorch.config.use_fake_tensor", True)
384383
def test_embedding_bag_view(self):
385384
# Backwards pass tries to wrap a sparse tensor in a FunctionalTensorWrapper;
386385
# test that this works even though the sparse tensor has no storage.
@@ -395,7 +394,7 @@ def forward(self, x, y):
395394

396395
x = torch.arange(3)
397396
y = torch.arange(3)
398-
self.verify_aot_autograd(F(), [x, y])
397+
self.verify_aot_autograd(F(), [x, y], dynamic=True)
399398

400399
@patch("functorch.compile.config.use_fake_tensor", True)
401400
def test_input_mutation_simple(self):
@@ -1714,8 +1713,6 @@ def bn(x):
17141713
for a, b in zip(ref, res):
17151714
assert torch.allclose(a, b)
17161715

1717-
@patch("functorch.compile.config.use_dynamic_shapes", True)
1718-
@patch("functorch.compile.config.use_fake_tensor", True)
17191716
def test_output_op_depending_on_symint(self):
17201717
"""
17211718
It won't be obvious from reading this test what it's testing for. We should probably make it into a more
@@ -1738,12 +1735,10 @@ def f(x):
17381735
# TODO: assert outputs of fwd graph trace to correct symint
17391736

17401737
# e2e test that fails without symint clone fix
1741-
af = aot_function(f, nop, partition_fn=partial(min_cut_rematerialization_partition, compiler="inductor"))
1738+
af = aot_function(f, nop, partition_fn=partial(min_cut_rematerialization_partition, compiler="inductor"), dynamic=True)
17421739
out = af(inp)
17431740
self.assertEqual(out, f(inp))
17441741

1745-
@patch("functorch.compile.config.use_dynamic_shapes", True)
1746-
@patch("functorch.compile.config.use_fake_tensor", True)
17471742
def test_default_partitioner_saves_symints_not_tensors_for_bw(self):
17481743
"""
17491744
In this test, the important thing is that primals_1 is **only** needed in the backward
@@ -1764,7 +1759,7 @@ def f(a):
17641759
d = b.masked_fill_(c, 0)
17651760
return d
17661761

1767-
compiled_f = aot_function(f, nop)
1762+
compiled_f = aot_function(f, nop, dynamic=True)
17681763
inp_ref = torch.ones(2, 2, requires_grad=True)
17691764
inp_test = torch.ones(2, 2, requires_grad=True)
17701765

@@ -1859,14 +1854,15 @@ def get_num_ins_outs(fx_g):
18591854
return tuple(len(i) for i in get_ins_outs(fx_g))
18601855

18611856

1862-
def get_fw_bw_graph(f, inps, partitioner=min_cut_rematerialization_partition):
1857+
def get_fw_bw_graph(f, inps, partitioner=min_cut_rematerialization_partition, dynamic=False):
18631858
fw_graph_cell = [None]
18641859
bw_graph_cell = [None]
18651860
aot_function(f,
18661861
fw_compiler=partial(extract_graph, graph_cell=fw_graph_cell),
18671862
bw_compiler=partial(extract_graph, graph_cell=bw_graph_cell),
18681863
partition_fn=partitioner,
1869-
decompositions=default_decompositions)(*inps).sum().backward()
1864+
decompositions=default_decompositions,
1865+
dynamic=dynamic)(*inps).sum().backward()
18701866
return (fw_graph_cell[0], bw_graph_cell[0])
18711867

18721868

@@ -1933,8 +1929,6 @@ def f(x, mod_weight, mod_bias):
19331929
self.assertEqual(get_num_ins_outs(fw_graph), (3, 6))
19341930
self.assertEqual(get_num_ins_outs(bw_graph), (6, 3))
19351931

1936-
@patch("functorch.compile.config.use_dynamic_shapes", True)
1937-
@patch("functorch.compile.config.use_fake_tensor", True)
19381932
@unittest.skipIf(not USE_NETWORKX, "networkx not available")
19391933
def test_min_cut_partitioner_save_shape(self):
19401934

@@ -1943,7 +1937,7 @@ def f(x):
19431937
return s
19441938

19451939
inp = [torch.ones([10, 10], requires_grad=True)]
1946-
fw_graph, bw_graph = get_fw_bw_graph(f, inp)
1940+
fw_graph, bw_graph = get_fw_bw_graph(f, inp, dynamic=True)
19471941
_, fw_output = get_ins_outs(fw_graph)
19481942
self.assertEqual(get_num_ins_outs(fw_graph), (1, 3))
19491943
self.assertEqual(get_num_ins_outs(bw_graph), (3, 1))
@@ -1968,14 +1962,12 @@ def f(a, b, c):
19681962
x = sb[0] + sc[0]
19691963
a_sz = (x, a.size(0))
19701964
return torch.cat([a.expand(a_sz), b, c])
1971-
fw_graph, bw_graph = get_fw_bw_graph(f, inp)
1965+
fw_graph, bw_graph = get_fw_bw_graph(f, inp, dynamic=True)
19721966
self.assertEqual(get_num_ins_outs(fw_graph), (3, 5))
19731967
self.assertEqual(get_num_ins_outs(bw_graph), (5, 3))
19741968
_, outs = get_ins_outs(fw_graph)
19751969
self.assertTrue(all([is_sym_node(n) for n in outs[1:]]))
19761970

1977-
@patch("functorch.compile.config.use_dynamic_shapes", True)
1978-
@patch("functorch.compile.config.use_fake_tensor", True)
19791971
def test_default_partitioner_output_tensor_shape_tensor(self):
19801972

19811973
inp = [
@@ -2004,7 +1996,8 @@ def f(a, b, c, d):
20041996
fw_compiler=partial(extract_graph, graph_cell=fw_graph_cell),
20051997
bw_compiler=partial(extract_graph, graph_cell=bw_graph_cell),
20061998
partition_fn=default_partition,
2007-
decompositions=default_decompositions)(*inp)
1999+
decompositions=default_decompositions,
2000+
dynamic=True)(*inp)
20082001
fw_graph = fw_graph_cell[0]
20092002
(compiled_outs[0].sum() + compiled_outs[2].sum()).backward()
20102003
bw_graph = bw_graph_cell[0]
@@ -2037,8 +2030,6 @@ def f(a, b, c, d):
20372030
# TODO(whc) we should learn to return torch.Sizes
20382031
self.assertFalse(isinstance(compiled_outs[1], torch.Size))
20392032

2040-
@patch("functorch.compile.config.use_dynamic_shapes", True)
2041-
@patch("functorch.compile.config.use_fake_tensor", True)
20422033
@unittest.skipIf(not USE_NETWORKX, "networkx not available")
20432034
def test_min_cut_partitioner_output_tensor_shape_tensor(self):
20442035

@@ -2068,7 +2059,8 @@ def f(a, b, c, d):
20682059
fw_compiler=partial(extract_graph, graph_cell=fw_graph_cell),
20692060
bw_compiler=partial(extract_graph, graph_cell=bw_graph_cell),
20702061
partition_fn=min_cut_rematerialization_partition,
2071-
decompositions=default_decompositions)(*inp)
2062+
decompositions=default_decompositions,
2063+
dynamic=True)(*inp)
20722064
fw_graph = fw_graph_cell[0]
20732065
(compiled_outs[0].sum() + compiled_outs[2].sum()).backward()
20742066
bw_graph = bw_graph_cell[0]
@@ -2617,7 +2609,7 @@ def create_new_arg(x):
26172609
except DynamicOutputShapeException:
26182610
self.skipTest("Dynamic output shape operation in trace")
26192611

2620-
def _test_aot_autograd_helper(self, device, dtype, op):
2612+
def _test_aot_autograd_helper(self, device, dtype, op, dynamic=False):
26212613
if not op.supports_autograd:
26222614
self.skipTest("Op does not support autograd")
26232615

@@ -2639,7 +2631,7 @@ def f(args):
26392631
c_args, c_kwargs = pytree.tree_unflatten(cur_flat_args, args_spec)
26402632
return op.op(*c_args, **c_kwargs)
26412633

2642-
compiled_f = compiled_function(f, nop, nop)
2634+
compiled_f = compiled_function(f, nop, nop, dynamic=dynamic)
26432635
try:
26442636
_test_aot_autograd_forwards_backwards_helper(self, f, compiled_f, args)
26452637
except GuardOnDataDependentSymNode:
@@ -2651,7 +2643,7 @@ def f(args):
26512643
else:
26522644
raise
26532645

2654-
def _test_aot_autograd_module_helper(self, device, dtype, training, module_info):
2646+
def _test_aot_autograd_module_helper(self, device, dtype, training, module_info, *, dynamic=False):
26552647
module_cls = module_info.module_cls
26562648
module_inputs = module_info.module_inputs_func(module_info, device=device, dtype=dtype,
26572649
requires_grad=True, training=training)
@@ -2696,7 +2688,7 @@ def f(params_buffers_args):
26962688
named_params = dict(m.named_parameters(remove_duplicate=False))
26972689
named_buffers = dict(m.named_buffers(remove_duplicate=False))
26982690
num_params_buffers = len(named_params) + len(named_buffers)
2699-
compiled_f = aot_function(f, nop, num_params_buffers=num_params_buffers)
2691+
compiled_f = aot_function(f, nop, num_params_buffers=num_params_buffers, dynamic=dynamic)
27002692
params_buffers_args = [named_params, named_buffers, args]
27012693
_test_aot_autograd_forwards_backwards_helper(self, f, compiled_f, params_buffers_args)
27022694

@@ -2708,13 +2700,11 @@ def test_aot_autograd_exhaustive(self, device, dtype, op):
27082700
_test_aot_autograd_helper(self, device, dtype, op)
27092701

27102702
@ops(op_db, allowed_dtypes=(torch.float,))
2711-
@patch("functorch.compile.config.use_dynamic_shapes", True)
2712-
@patch("functorch.compile.config.use_fake_tensor", True)
27132703
@patch("functorch.compile.config.use_functionalize", True)
27142704
@skipOps('TestEagerFusionOpInfo', 'test_aot_autograd_symbolic_exhaustive',
27152705
aot_autograd_failures | symbolic_aot_autograd_failures)
27162706
def test_aot_autograd_symbolic_exhaustive(self, device, dtype, op):
2717-
_test_aot_autograd_helper(self, device, dtype, op)
2707+
_test_aot_autograd_helper(self, device, dtype, op, dynamic=True)
27182708

27192709

27202710
aot_autograd_module_failures = set({
@@ -2754,13 +2744,11 @@ def test_aot_autograd_module_exhaustive(self, device, dtype, training, module_in
27542744
_test_aot_autograd_module_helper(self, device, dtype, training, module_info)
27552745

27562746
@modules(module_db, allowed_dtypes=(torch.float,))
2757-
@patch("functorch.compile.config.use_dynamic_shapes", True)
2758-
@patch("functorch.compile.config.use_fake_tensor", True)
27592747
@patch("functorch.compile.config.use_functionalize", True)
27602748
@decorateForModules(unittest.expectedFailure,
27612749
aot_autograd_module_failures | symbolic_aot_autograd_module_failures)
27622750
def test_aot_autograd_symbolic_module_exhaustive(self, device, dtype, training, module_info):
2763-
_test_aot_autograd_module_helper(self, device, dtype, training, module_info)
2751+
_test_aot_autograd_module_helper(self, device, dtype, training, module_info, dynamic=True)
27642752

27652753

27662754
only_for = ("cpu")

torch/_export/__init__.py

Lines changed: 2 additions & 12 deletions
Original file line numberDiff line numberDiff line change
@@ -116,19 +116,9 @@ def set_state_proxies(state_args):
116116
num_params_buffers=params_len,
117117
aot_id=-1,
118118
keep_inference_input_mutations=False,
119+
dynamic_shapes=True,
119120
)
120121

121-
@contextlib.contextmanager
122-
def setup_dynamic_shape():
123-
prev, torch._functorch.config.use_dynamic_shapes = (
124-
torch._functorch.config.use_dynamic_shapes,
125-
True,
126-
)
127-
try:
128-
yield
129-
finally:
130-
torch._functorch.config.use_dynamic_shapes = prev
131-
132122
def exported_call(*args):
133123
state_args = args[:params_len]
134124
unwrapped_state_args = _unwrap_all_tensors_from_functional(
@@ -141,7 +131,7 @@ def exported_call(*args):
141131
outputs, out_spec = pytree.tree_flatten(outputs)
142132
return outputs
143133

144-
with torch.enable_grad(), setup_dynamic_shape():
134+
with torch.enable_grad():
145135
create_aot_dispatcher_function(
146136
exported_call,
147137
full_args,

torch/_functorch/aot_autograd.py

Lines changed: 8 additions & 14 deletions
Original file line numberDiff line numberDiff line change
@@ -1272,15 +1272,7 @@ class AOTConfig:
12721272
num_params_buffers: int
12731273
aot_id: int
12741274
keep_inference_input_mutations: bool
1275-
# If None, defer to config
1276-
_dynamic_shapes: Optional[bool] = None
1277-
1278-
@property
1279-
def dynamic_shapes(self):
1280-
if self._dynamic_shapes is None:
1281-
return config.use_dynamic_shapes
1282-
else:
1283-
return self._dynamic_shapes
1275+
dynamic_shapes: bool = False
12841276

12851277
def aot_dispatch_base(flat_fn, flat_args: List[Tensor], aot_config: AOTConfig):
12861278
with enable_python_dispatcher():
@@ -2331,7 +2323,7 @@ def call_compiled_backward():
23312323
aot_config.bw_compiler, None, None,
23322324
aot_config.decompositions, 0, aot_config.aot_id,
23332325
aot_config.keep_inference_input_mutations,
2334-
aot_config._dynamic_shapes
2326+
aot_config.dynamic_shapes
23352327
)
23362328
)
23372329
else:
@@ -2563,7 +2555,10 @@ def aot_function(
25632555
num_params_buffers: int = 0,
25642556
hasher_type=None, # deprecated
25652557
static_argnums: Optional[Tuple[int]] = None, # deprecated
2566-
keep_inference_input_mutations: bool = False
2558+
keep_inference_input_mutations: bool = False,
2559+
*,
2560+
# Whether or not to trace with dynamic shapes
2561+
dynamic=False,
25672562
) -> Callable:
25682563
"""
25692564
Traces the forward and backward graph of :attr:`fn` using torch dispatch
@@ -2630,6 +2625,7 @@ def aot_function(
26302625
num_params_buffers=num_params_buffers,
26312626
aot_id=next(AOT_COUNTER),
26322627
keep_inference_input_mutations=keep_inference_input_mutations,
2628+
dynamic_shapes=dynamic,
26332629
)
26342630
cached_res = None
26352631

@@ -2822,8 +2818,6 @@ def functional_call(*args, **kwargs):
28222818
if isinstance(x, FakeTensor):
28232819
dynamic_shapes = x.fake_mode.shape_env is not None
28242820
break
2825-
else:
2826-
dynamic_shapes = config.use_dynamic_shapes
28272821

28282822
aot_config = AOTConfig(
28292823
fw_compiler=fw_compiler,
@@ -2833,7 +2827,7 @@ def functional_call(*args, **kwargs):
28332827
num_params_buffers=params_len,
28342828
aot_id=next(AOT_COUNTER),
28352829
keep_inference_input_mutations=keep_inference_input_mutations,
2836-
_dynamic_shapes=dynamic_shapes
2830+
dynamic_shapes=dynamic_shapes
28372831
)
28382832

28392833
compiled_fn = create_aot_dispatcher_function(

torch/_functorch/config.py

Lines changed: 0 additions & 2 deletions
Original file line numberDiff line numberDiff line change
@@ -31,8 +31,6 @@
3131
# Prints out joint graph traced, before partitioning
3232
debug_joint = os.environ.get("AOT_FX_GRAPHS_JOINT", False)
3333

34-
use_dynamic_shapes = os.getenv("AOT_DYNAMIC_SHAPES", False)
35-
3634
static_weight_shapes = True
3735

3836
# Applies CSE to the graph before partitioning

0 commit comments

Comments (0)