Revert "[dynamo][fsdp] Consistent behavior of int attributes (#157262)"

This reverts commit 178fe7aa98987111a73534375099f4ad255e8b59.

Reverted https://github.com/pytorch/pytorch/pull/157262 on behalf of https://github.com/huydhn due to This fails some internal tests and needs to be relanded ([comment](https://github.com/pytorch/pytorch/pull/157262#issuecomment-3059463896))
PyTorch MergeBot
2025-07-10 23:11:18 +00:00
parent 1a195bf7d6
commit e517066f41
4 changed files with 11 additions and 98 deletions

@@ -678,88 +678,6 @@ class TestMultiProc(DynamoDistributedMultiProcTestCase):
            outputs = fsdp_m(inputs)
            self.assertTrue(same(correct_outputs, outputs))

    @config.patch(enable_compiler_collectives=True)
    @skip_if_lt_x_gpu(1)
    def test_fsdp_dynamism_on_int_attr(self):
        global GUARDS_FILE
        GUARDS_FILE = StringIO()

        with _dynamo_dist_per_rank_init(self.rank, self.world_size):

            class ToyModelWithIntAttr(nn.Module):
                def __init__(self):
                    super().__init__()
                    self.attr = 2

                def forward(self, x):
                    out = x + self.attr

                    @comptime
                    def _(ctx):
                        ctx.print_guards(file=GUARDS_FILE)

                    return out

            def get_model_with_int_attr(device):
                m = ToyModelWithIntAttr().to(device)
                inputs = torch.rand(10).to(device)
                outputs = m(inputs)
                return m, inputs, outputs

            m, inputs, correct_outputs = get_model_with_int_attr(f"cuda:{self.rank}")
            fsdp_m = FSDP(m, use_orig_params=True)
            compiled_fsdp_m = torch.compile(
                fsdp_m, backend="eager", dynamic=True, fullgraph=True
            )
            outputs = compiled_fsdp_m(inputs)
            self.assertTrue(same(correct_outputs, outputs))

            FileCheck().check(
                """local_fsdp_module "L['fn']._modules['_fsdp_wrapped_module'].attr" EQUALS_MATCH"""
            ).run(GUARDS_FILE.getvalue())

    @config.patch(enable_compiler_collectives=True)
    @config.patch(allow_unspec_int_on_fsdp_module=True)
    @skip_if_lt_x_gpu(1)
    def test_fsdp_dynamism_on_int_attr_unspec(self):
        global GUARDS_FILE
        GUARDS_FILE = StringIO()

        with _dynamo_dist_per_rank_init(self.rank, self.world_size):

            class ToyModelWithIntAttr(nn.Module):
                def __init__(self):
                    super().__init__()
                    self.attr = 2

                def forward(self, x):
                    out = x + self.attr

                    @comptime
                    def _(ctx):
                        ctx.print_guards(file=GUARDS_FILE)

                    return out

            def get_model_with_int_attr(device):
                m = ToyModelWithIntAttr().to(device)
                inputs = torch.rand(10).to(device)
                outputs = m(inputs)
                return m, inputs, outputs

            m, inputs, correct_outputs = get_model_with_int_attr(f"cuda:{self.rank}")
            fsdp_m = FSDP(m, use_orig_params=True)
            compiled_fsdp_m = torch.compile(
                fsdp_m, backend="eager", dynamic=True, fullgraph=True
            )
            outputs = compiled_fsdp_m(inputs)
            self.assertTrue(same(correct_outputs, outputs))

            # No presence of EQUALS_MATCH because the guard will be dynamic
            FileCheck().check(
                """local_fsdp_module "L['fn']._modules['_fsdp_wrapped_module'].attr" TYPE_MATCH"""
            ).run(GUARDS_FILE.getvalue())

    @skip_if_lt_x_gpu(2)
    @unittest.skipIf(not HAS_GPU, "Inductor+gpu needs triton and recent GPU arch")
    def test_ddp_optimizer_cudagraph(self):
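
Both removed tests rely on Dynamo's comptime hook to dump the guards installed while tracing. A minimal standalone sketch of that pattern, with no FSDP or GPU involved (the free function fn and the GUARDS buffer are illustrative, not part of this change):

from io import StringIO

import torch
from torch._dynamo.comptime import comptime

GUARDS = StringIO()


def fn(x, n):
    out = x + n

    @comptime
    def _(ctx):
        # Runs at trace time and prints the guards Dynamo has accumulated so far.
        ctx.print_guards(file=GUARDS)

    return out


torch.compile(fn, backend="eager", fullgraph=True)(torch.rand(10), 2)
print(GUARDS.getvalue())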

@@ -284,13 +284,6 @@ force_unspec_int_unbacked_size_like_on_torchrec_kjt = False
# Defaults to False for BC.
allow_unspec_int_on_nn_module = False
# Mirrors `allow_unspec_int_on_nn_module`, but for FSDP: for <=2.8 versions,
# integer attributes on FSDP modules were treated as dynamic, while the same
# attributes on plain nn.Modules were static. We unified the behaviour by making
# FSDP ints static too. Set this flag to True to restore the legacy dynamic
# handling if needed.
allow_unspec_int_on_fsdp_module = False
# Specify how to optimize a compiled DDP module. The flag accepts a boolean
# value or a string. There are 3 modes.
# 1. "ddp_optimizer" (or True): with "ddp_optimizer", Dynamo will automatically

@@ -2400,15 +2400,6 @@ def is_int_specialization_case(value, source):
            source.guard_source().is_specialized_nn_module()
            and not config.allow_unspec_int_on_nn_module
        )
        # integers coming from FSDP modules are considered static. This is
        # purely empirical and perhaps we should have a better heuristic.
        or (
            source.guard_source().is_fsdp_module()
            and not (
                config.allow_unspec_int_on_nn_module
                or config.allow_unspec_int_on_fsdp_module
            )
        )
        or (
            source.guard_source().is_unspecialized_builtin_nn_module()
            and not config.allow_unspec_int_on_nn_module
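
The branch removed above only changes which modules fall under the specialize-integers rule; the rule itself is observable from user code. A minimal sketch of the default nn.Module behaviour (allow_unspec_int_on_nn_module=False), reusing the shape of the removed test but without FSDP:

import torch
import torch.nn as nn


class ToyModelWithIntAttr(nn.Module):
    def __init__(self):
        super().__init__()
        self.attr = 2  # plain Python int attribute on the module

    def forward(self, x):
        return x + self.attr


m = ToyModelWithIntAttr()
compiled = torch.compile(m, backend="eager", dynamic=True)
out = compiled(torch.rand(10))

# With the default allow_unspec_int_on_nn_module=False, self.attr is specialized:
# the traced graph hard-codes 2 and an EQUALS_MATCH guard is installed, so
# mutating the attribute should trigger a recompile on the next call.
m.attr = 3
out = compiled(torch.rand(10))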

@@ -155,6 +155,17 @@ class GuardSource(enum.Enum):
        return self in (GuardSource.GLOBAL_FSDP_MODULE, GuardSource.LOCAL_FSDP_MODULE)

    def is_specialized_nn_module(self) -> bool:
        import torch._dynamo.config as config

        if config._unsafe_skip_fsdp_module_guards:
            return (
                self
                in (
                    GuardSource.GLOBAL_SPECIALIZED_NN_MODULE,
                    GuardSource.LOCAL_SPECIALIZED_NN_MODULE,
                )
                or self.is_fsdp_module()
            )
        return self in (
            GuardSource.GLOBAL_SPECIALIZED_NN_MODULE,
            GuardSource.LOCAL_SPECIALIZED_NN_MODULE,