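fix: correct the super().__init__() call in UnpaddedRotaryEmbedding.__init__ (it now passes device=None and interleaved=False)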
Browse files- modeling_gptbert.py +1 -1
modeling_gptbert.py
CHANGED
@@ -260,7 +260,7 @@ def apply_rotary_unpadded(qkv, cos, sin, cu_seqlens: Optional[torch.Tensor] = No
|
|
260 |
# from https://github.com/huggingface/transformers/blob/main/src/transformers/models/modernbert/modeling_modernbert.py
|
261 |
class UnpaddedRotaryEmbedding(RotaryEmbedding):
|
262 |
def __init__(self, dim: int, base: float = 10000.0, max_seqlen: Optional[int] = None):
|
263 |
-
super().__init__(dim=dim, base=base,
|
264 |
self.max_seqlen = max_seqlen
|
265 |
|
266 |
def forward(self, qkv: torch.Tensor, cu_seqlens: torch.Tensor, max_seqlen: Optional[int] = None) -> Union[torch.Tensor, Tuple[torch.Tensor, torch.Tensor]]:
|
|
|
260 |
# from https://github.com/huggingface/transformers/blob/main/src/transformers/models/modernbert/modeling_modernbert.py
|
261 |
class UnpaddedRotaryEmbedding(RotaryEmbedding):
|
262 |
def __init__(self, dim: int, base: float = 10000.0, max_seqlen: Optional[int] = None):
|
263 |
+
super().__init__(dim=dim, base=base, device=None, interleaved=False)
|
264 |
self.max_seqlen = max_seqlen
|
265 |
|
266 |
def forward(self, qkv: torch.Tensor, cu_seqlens: torch.Tensor, max_seqlen: Optional[int] = None) -> Union[torch.Tensor, Tuple[torch.Tensor, torch.Tensor]]:
|