Add an explanatory comment on the gelu function
This commit is contained in:
@@ -28,8 +28,8 @@ from torch.nn import CrossEntropyLoss
|
|||||||
|
|
||||||
def gelu(x):
|
def gelu(x):
|
||||||
return x * 0.5 * (1.0 + torch.erf(x / math.sqrt(2.0)))
|
return x * 0.5 * (1.0 + torch.erf(x / math.sqrt(2.0)))
|
||||||
# OpenAI GPT gelu version :
|
# For information: OpenAI GPT's gelu uses a tanh approximation instead of erf, so it gives slightly different results:
|
||||||
# return 0.5 * x * (1 + torch.tanh(math.sqrt(2 / math.pi) * (x + 0.044715 * torch.pow(x, 3))))
|
# 0.5 * x * (1 + torch.tanh(math.sqrt(2 / math.pi) * (x + 0.044715 * torch.pow(x, 3))))
|
||||||
|
|
||||||
|
|
||||||
class BertConfig(object):
|
class BertConfig(object):
|
||||||
|
|||||||
Reference in New Issue
Block a user