
Commit b3aedf3

remove gelu custom impl and use pytorch impl
1 parent: cbc38bb

1 file changed (+1, -15 lines)

docs/transformers/LoRA/GPT2.py

Lines changed: 1 addition & 15 deletions
@@ -44,9 +44,6 @@
     "vocab_size": 50257
 }
 
-import math
-from torch import Tensor
-
 
 # from transformers
 class Conv1D(nn.Module):
@@ -74,23 +71,12 @@ def forward(self, x):
         return x
 
 
-# from transformers
-class NewGELUActivation(nn.Module):
-    """
-    Implementation of the GELU activation function currently in Google BERT repo (identical to OpenAI GPT). Also see
-    the Gaussian Error Linear Units paper: https://arxiv.org/abs/1606.08415
-    """
-
-    def forward(self, input: Tensor) -> Tensor:
-        return 0.5 * input * (1.0 + torch.tanh(math.sqrt(2.0 / math.pi) * (input + 0.044715 * torch.pow(input, 3.0))))
-
-
 class HeadFFN(nn.Module):  # todo rename
     def __init__(self, dim):
         super().__init__()
         self.c_fc = Conv1D(dim, config['n_embd'])
         self.c_proj = Conv1D(config['n_embd'], dim)
-        self.act = NewGELUActivation()
+        self.act = nn.functional.gelu
         self.dropout = nn.Dropout(config['resid_pdrop'])
 
     def forward(self, hidden_states):
