added gelu converter

John Welsh · John Welsh · commit 6df2e1f14f78 · 2021-06-15T21:07:39.000Z
diff --git a/CHANGELOG.md b/CHANGELOG.md
@@ -2,6 +2,10 @@
 
 ## [Master]
 
+- Added converter for ``torch.nn.functional.gelu``
+- Added converter for ``torch.nn.functional.linear``
+- Added converter for ``torch.nn.functional.silu``
+
 ## [0.2.0] - 03/02/2021
 
 - Added converter for ``torch.Tensor.flatten``
diff --git a/torch2trt/converters/__init__.py b/torch2trt/converters/__init__.py
@@ -28,6 +28,7 @@
 from .div import *
 from .expand import *
 from .floordiv import *
+from .gelu import *
 from .getitem import *
 from .identity import *
 from .instance_norm import *
diff --git a/torch2trt/converters/gelu.py b/torch2trt/converters/gelu.py
@@ -0,0 +1,63 @@
+from torch2trt.torch2trt import *
+from torch2trt.module_test import add_module_test
+import math
+
+
+@tensorrt_converter('torch.nn.functional.gelu')
+def convert_gelu_v1(ctx):
+    # approximate equation 1 from paper
+    input = get_arg(ctx, 'input', 0, None)
+    output = ctx.method_return
+    
+    x, c05, c1, cs2pi, c044, c3 = add_missing_trt_tensors(
+        ctx.network,
+        [input, 0.5, 1.0, math.sqrt(2.0 / math.pi), 0.044715, 3.0]
+    )
+    
+    x, c05, c1, cs2pi, c044, c3 = broadcast_trt_tensors(
+        ctx.network, 
+        [x, c05, c1, cs2pi, c044, c3], 
+        len(output.shape) - 1
+    )
+    
+    y = ctx.network.add_elementwise(x, c3, trt.ElementWiseOperation.POW).get_output(0)
+    y = ctx.network.add_elementwise(y, c044, trt.ElementWiseOperation.PROD).get_output(0)
+    y = ctx.network.add_elementwise(x, y, trt.ElementWiseOperation.SUM).get_output(0)
+    y = ctx.network.add_elementwise(y, cs2pi, trt.ElementWiseOperation.PROD).get_output(0)
+    y = ctx.network.add_activation(y, trt.ActivationType.TANH).get_output(0)
+    y = ctx.network.add_elementwise(y, c1, trt.ElementWiseOperation.SUM).get_output(0)
+    y = ctx.network.add_elementwise(x, y, trt.ElementWiseOperation.PROD).get_output(0)
+    y = ctx.network.add_elementwise(y, c05, trt.ElementWiseOperation.PROD).get_output(0)
+    
+    output._trt = y
+    
+    
+# @tensorrt_converter('torch.nn.functional.gelu')
+# def convert_gelu_v2(ctx):
+#     # sigmoid approximation from paper: x * sigmoid(1.702 * x)
+#     input = get_arg(ctx, 'input', 0, None)
+#     output = ctx.method_return
+    
+#     x, c1702 = add_missing_trt_tensors(
+#         ctx.network,
+#         [input, 1.702]
+#     )
+    
+#     x, c1702 = broadcast_trt_tensors(
+#         ctx.network, 
+#         [x, c1702], 
+#         len(output.shape) - 1
+#     )
+    
+#     y = ctx.network.add_elementwise(x, c1702, trt.ElementWiseOperation.PROD).get_output(0)
+#     y = ctx.network.add_activation(y, trt.ActivationType.SIGMOID).get_output(0)
+#     y = ctx.network.add_elementwise(x, y, trt.ElementWiseOperation.PROD).get_output(0)
+    
+#     output._trt = y
+
+
+@add_module_test(torch.float32, torch.device('cuda'), [(1, 5)])  # presumably one float32 CUDA input of shape (1, 5) -- confirm
+@add_module_test(torch.float32, torch.device('cuda'), [(1, 5, 3)])
+@add_module_test(torch.float32, torch.device('cuda'), [(1, 5, 3, 3)])
+def test_silu():  # NOTE(review): name looks copy-pasted from the SiLU test; consider renaming to test_gelu
+    return torch.nn.GELU()  # module under test is GELU, not SiLU