
Commit fcc3d96

Author: John Welsh
Commit message: added layer_norm converter
1 parent 6df2e1f

File tree: 4 files changed, +117 −1 lines

CHANGELOG.md
torch2trt/converters/__init__.py
torch2trt/converters/layer_norm.py
torch2trt/torch2trt.py


CHANGELOG.md

Lines changed: 1 addition & 0 deletions
@@ -2,6 +2,7 @@
 
 ## [Master]
 
+- Added converter for ``torch.nn.functional.layer_norm``
 - Added converter for ``torch.nn.functional.gelu``
 - Added converter for ``torch.nn.functional.linear``
 - Added converter for ``torch.nn.functional.silu``
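For context, a minimal sketch of how the new converter gets exercised end to end, assuming the standard torch2trt conversion entry point (this snippet is not part of the commit):

import torch
from torch2trt import torch2trt

# module whose forward dispatches to torch.nn.functional.layer_norm
model = torch.nn.LayerNorm(3).cuda().eval()
x = torch.randn(1, 5, 3).cuda()

# torch2trt traces the module; the call to layer_norm is intercepted
# by the @tensorrt_converter registered in this commit
model_trt = torch2trt(model, [x])

# compare TensorRT output against the PyTorch reference
print(torch.max(torch.abs(model(x) - model_trt(x))))  # should be ~0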

torch2trt/converters/__init__.py

Lines changed: 2 additions & 1 deletion
@@ -30,10 +30,11 @@
 from .floordiv import *
 from .gelu import *
 from .getitem import *
+from .group_norm import *
 from .identity import *
 from .instance_norm import *
 from .interpolate import *
-from .group_norm import *
+from .layer_norm import *
 from .max import *
 from .max_pool2d import *
 from .mean import *

torch2trt/converters/layer_norm.py

Lines changed: 103 additions & 0 deletions
@@ -0,0 +1,103 @@
from torch2trt.torch2trt import *
from torch2trt.module_test import add_module_test


@tensorrt_converter('torch.nn.functional.layer_norm')
def convert_layernorm(ctx):
    input = get_arg(ctx, 'input', 0, None)
    shape = get_arg(ctx, 'normalized_shape', 1, None)
    weight = get_arg(ctx, 'weight', 2, None)
    bias = get_arg(ctx, 'bias', 3, None)
    eps = get_arg(ctx, 'eps', 4, 1e-05)
    output = ctx.method_return

    input_trt, eps_trt = add_missing_trt_tensors(
        ctx.network,
        [input, eps]
    )

    input_trt, eps_trt = broadcast_trt_tensors(
        ctx.network,
        [input_trt, eps_trt],
        len(output.shape) - 1
    )

    if weight is not None:
        _, weight_trt = add_missing_trt_tensors(
            ctx.network,
            [input, weight]
        )
        _, weight_trt = broadcast_trt_tensors(
            ctx.network,
            [input_trt, weight_trt],
            len(output.shape) - 1
        )

    if bias is not None:
        _, bias_trt = add_missing_trt_tensors(
            ctx.network,
            [input, bias]
        )
        _, bias_trt = broadcast_trt_tensors(
            ctx.network,
            [input_trt, bias_trt],
            len(output.shape) - 1
        )

    # normalized_shape names the trailing dims of the input; build the
    # corresponding negative dim tuple, resolve it to positive dims, and
    # convert to a TensorRT reduction axes bitmask
    if isinstance(shape, int):
        shape = (shape,)
    dim = tuple([-i - 1 for i in range(len(shape))])
    dim = torch_dim_resolve_negative(dim, len(input.shape))
    axes = torch_dim_to_trt_axes(dim)

    # y = (x - E[x]) / sqrt(Var[x] + eps), with Var[x] the biased variance
    ux = ctx.network.add_reduce(input_trt, trt.ReduceOperation.AVG, axes, keep_dims=True).get_output(0)
    numerator = ctx.network.add_elementwise(input_trt, ux, trt.ElementWiseOperation.SUB).get_output(0)
    varx = ctx.network.add_elementwise(numerator, numerator, trt.ElementWiseOperation.PROD).get_output(0)
    varx = ctx.network.add_reduce(varx, trt.ReduceOperation.AVG, axes, keep_dims=True).get_output(0)
    denom = ctx.network.add_elementwise(varx, eps_trt, trt.ElementWiseOperation.SUM).get_output(0)
    denom = ctx.network.add_unary(denom, trt.UnaryOperation.SQRT).get_output(0)
    y = ctx.network.add_elementwise(numerator, denom, trt.ElementWiseOperation.DIV).get_output(0)

    # optional elementwise affine transform: y * weight + bias
    if weight is not None:
        y = ctx.network.add_elementwise(y, weight_trt, trt.ElementWiseOperation.PROD).get_output(0)

    if bias is not None:
        y = ctx.network.add_elementwise(y, bias_trt, trt.ElementWiseOperation.SUM).get_output(0)

    output._trt = y


@add_module_test(torch.float32, torch.device('cuda'), [(1, 3)])
@add_module_test(torch.float32, torch.device('cuda'), [(1, 5, 3)])
@add_module_test(torch.float32, torch.device('cuda'), [(1, 5, 5, 3)])
def test_layer_norm_1d():
    return torch.nn.LayerNorm(3)


@add_module_test(torch.float32, torch.device('cuda'), [(1, 5, 3)])
@add_module_test(torch.float32, torch.device('cuda'), [(1, 5, 5, 3)])
def test_layer_norm_2d():
    return torch.nn.LayerNorm((5, 3))


@add_module_test(torch.float32, torch.device('cuda'), [(1, 5, 5, 3)])
def test_layer_norm_3d():
    return torch.nn.LayerNorm((5, 5, 3))


@add_module_test(torch.float32, torch.device('cuda'), [(1, 3)])
@add_module_test(torch.float32, torch.device('cuda'), [(1, 5, 3)])
@add_module_test(torch.float32, torch.device('cuda'), [(1, 5, 5, 3)])
def test_layer_norm_1d_nonaffine():
    return torch.nn.LayerNorm(3, elementwise_affine=False)


@add_module_test(torch.float32, torch.device('cuda'), [(1, 5, 3)])
@add_module_test(torch.float32, torch.device('cuda'), [(1, 5, 5, 3)])
def test_layer_norm_2d_nonaffine():
    return torch.nn.LayerNorm((5, 3), elementwise_affine=False)


@add_module_test(torch.float32, torch.device('cuda'), [(1, 5, 5, 3)])
def test_layer_norm_3d_nonaffine():
    return torch.nn.LayerNorm((5, 5, 3), elementwise_affine=False)
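As a quick sanity check on the arithmetic the converter builds (a standalone sketch, not part of the commit): the reduce/elementwise graph above computes the biased variance as the mean of squared deviations, which is what torch.nn.functional.layer_norm uses:

import torch
import torch.nn.functional as F

x = torch.randn(1, 5, 3)
normalized_shape = (3,)
eps = 1e-5

# reduce over the trailing dims named by normalized_shape
dims = tuple(-i - 1 for i in range(len(normalized_shape)))

ux = x.mean(dim=dims, keepdim=True)              # E[x]
num = x - ux                                     # x - E[x]
varx = (num * num).mean(dim=dims, keepdim=True)  # biased Var[x]
y = num / torch.sqrt(varx + eps)                 # normalized output

ref = F.layer_norm(x, normalized_shape, eps=eps)
print(torch.allclose(y, ref, atol=1e-6))  # True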

torch2trt/torch2trt.py

Lines changed: 11 additions & 0 deletions
@@ -87,6 +87,17 @@ def trt_num_outputs(engine):
     return count
 
 
+def torch_dim_resolve_negative(dim, ndim):
+    if not isinstance(dim, tuple):
+        dim = (dim,)
+    pos = []
+    for d in dim:
+        if d < 0:
+            d = ndim + d
+        pos.append(d)
+    return tuple(pos)
+
+
 def torch_dim_to_trt_axes(dim):
     """Converts torch dim, or tuple of dims to a tensorrt axes bitmask"""
     if not isinstance(dim, tuple):
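A quick illustration of the new helper's behavior (the function is copied verbatim below so the snippet runs without the package installed):

def torch_dim_resolve_negative(dim, ndim):
    if not isinstance(dim, tuple):
        dim = (dim,)
    pos = []
    for d in dim:
        if d < 0:
            d = ndim + d
        pos.append(d)
    return tuple(pos)

# layer_norm over the last two dims of a 4D input:
# (-1, -2) resolves to positive dims (3, 2), which
# torch_dim_to_trt_axes then folds into a bitmask
print(torch_dim_resolve_negative((-1, -2), 4))  # (3, 2)

# a bare int is promoted to a 1-tuple
print(torch_dim_resolve_negative(-1, 3))        # (2,)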
