Update on "enable TritonFusedRMSNorm with local_map annotation"

[ghstack-poisoned]
pytorch · Jun 4, 2024 · 71659de · 71659de
1 parent aa5af1b
commit 71659de
Showing 1 changed file with 0 additions and 7 deletions.
diff --git a/torchtitan/models/norms.py b/torchtitan/models/norms.py
@@ -14,7 +14,6 @@
 import triton
 import triton.language as tl
 
-from torch.distributed._functional_collectives import AsyncCollectiveTensor
 from torch.distributed._tensor.experimental import local_map
 from torch.distributed._tensor.placement_types import _Partial, Replicate, Shard
 
@@ -227,9 +226,6 @@ class TritonFusedRMSNorm(torch.autograd.Function):
     )
     @staticmethod
     def forward(ctx, x, weight, eps):
-        if isinstance(x, AsyncCollectiveTensor):
-            x = x.wait()
-
         x_shape_start = x.shape
 
         # Flatten input
@@ -277,9 +273,6 @@ def forward(ctx, x, weight, eps):
     )
     @staticmethod
     def backward(ctx, dy):
-        if isinstance(dy, AsyncCollectiveTensor):
-            dy = dy.wait()
-
         x, weight, rstd = ctx.saved_tensors
         eps = ctx.eps
         x_shape_start = ctx.x_shape_start