Use `torch.amp` rather than deprecated `torch.cuda.amp`
torch-ext/triton_layer_norm/layer_norm.py (CHANGED)

@@ -10,7 +10,7 @@ import math
 
 import torch
 import torch.nn.functional as F
-from torch.cuda.amp import custom_fwd, custom_bwd
+from torch.amp import custom_fwd, custom_bwd
 
 import triton
 import triton.language as tl
@@ -981,7 +981,7 @@ class RMSNorm(torch.nn.Module):
 
 class LayerNormLinearFn(torch.autograd.Function):
     @staticmethod
-    @custom_fwd
+    @custom_fwd(device_type="cuda")
     def forward(
         ctx,
         x,
@@ -1040,7 +1040,7 @@ class LayerNormLinearFn(torch.autograd.Function):
         return out if not prenorm else (out, residual_out.reshape(x_shape_og))
 
     @staticmethod
-    @custom_bwd
+    @custom_bwd(device_type="cuda")
     def backward(ctx, dout, *args):
        x, norm_weight, norm_bias, linear_weight, mean, rstd = ctx.saved_tensors
        dout = dout.reshape(-1, dout.shape[-1])
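For context, a minimal sketch of the migrated API (not taken from `layer_norm.py`; `ScaleFn` is a hypothetical example): the `torch.amp` versions of `custom_fwd`/`custom_bwd` require an explicit `device_type` argument (available in PyTorch ≥ 2.4), whereas the deprecated `torch.cuda.amp` versions were CUDA-only and took no arguments.

```python
import torch
from torch.amp import custom_fwd, custom_bwd


class ScaleFn(torch.autograd.Function):
    """Hypothetical example: y = x * scale, made autocast-aware."""

    @staticmethod
    @custom_fwd(device_type="cuda")  # replaces the deprecated torch.cuda.amp.custom_fwd
    def forward(ctx, x, scale):
        ctx.scale = scale
        return x * scale

    @staticmethod
    @custom_bwd(device_type="cuda")  # replaces the deprecated torch.cuda.amp.custom_bwd
    def backward(ctx, grad_out):
        # Gradient w.r.t. x only; scale is a non-tensor argument, so return None for it.
        return grad_out * ctx.scale, None


if torch.cuda.is_available():
    x = torch.randn(4, 4, device="cuda", requires_grad=True)
    with torch.autocast(device_type="cuda", dtype=torch.float16):
        y = ScaleFn.apply(x, 2.0)
    y.sum().backward()
```

The decorator bodies behave the same as before on CUDA; the only change needed at call sites is the import path and the `device_type="cuda"` argument, which is exactly what this commit applies to `LayerNormLinearFn`.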