diff --git a/onn/activation.py b/onn/activation.py
index 23d5fcd..f06c2ec 100644
--- a/onn/activation.py
+++ b/onn/activation.py
@@ -120,7 +120,7 @@ class GeluApprox(Swish):
     # plot: https://www.desmos.com/calculator/ydzgtccsld
 
     def __init__(self):
-        super().__init__(_f(1.704))
+        super().__init__(_f(1.702))
 
 
 class Gelu(Activation):