This commit is contained in:
Varuna Jayasiri
2022-06-03 17:23:39 +05:30
parent 321339eeb0
commit 09d2210aac
2 changed files with 2 additions and 2 deletions

View File

@@ -201,7 +201,7 @@ class RotaryPEMultiHeadAttention(MultiHeadAttention):
"""
def __init__(self, heads: int, d_model: int, rope_percentage: float = 0.5, dropout_prob: float = 0.0):
-super().__init__(heads, d_model, dropout_prob, bias=False)
+super().__init__(heads, d_model, dropout_prob)
# Rotary positional embedding layers
d_rope = int(self.d_k * rope_percentage)

View File

@@ -174,7 +174,7 @@ class RotaryValuePEMultiHeadAttention(MultiHeadAttention):
def __init__(self, heads: int, d_model: int,
rope_percentage: float = 0.5, rope_value_percentage: float = 0.5,
dropout_prob: float = 0.0):
-super().__init__(heads, d_model, dropout_prob, bias=False)
+super().__init__(heads, d_model, dropout_prob)
# Rotary positional embedding layers
d_rope = int(self.d_k * rope_percentage)