davda54 committed on
Commit
7450871
·
verified ·
1 Parent(s): 366305d
Files changed (1) hide show
  1. modeling_gptbert.py +1 -1
modeling_gptbert.py CHANGED
@@ -260,7 +260,7 @@ def apply_rotary_unpadded(qkv, cos, sin, cu_seqlens: Optional[torch.Tensor] = No
260
  # from https://github.com/huggingface/transformers/blob/main/src/transformers/models/modernbert/modeling_modernbert.py
261
  class UnpaddedRotaryEmbedding(RotaryEmbedding):
262
  def __init__(self, dim: int, base: float = 10000.0, max_seqlen: Optional[int] = None):
263
- super().__init__(dim=dim, base=base, pos_idx_in_fp32=True, device=None, interleaved=False)
264
  self.max_seqlen = max_seqlen
265
 
266
  def forward(self, qkv: torch.Tensor, cu_seqlens: torch.Tensor, max_seqlen: Optional[int] = None) -> Union[torch.Tensor, Tuple[torch.Tensor, torch.Tensor]]:
 
260
  # from https://github.com/huggingface/transformers/blob/main/src/transformers/models/modernbert/modeling_modernbert.py
261
  class UnpaddedRotaryEmbedding(RotaryEmbedding):
262
  def __init__(self, dim: int, base: float = 10000.0, max_seqlen: Optional[int] = None):
263
+ super().__init__(dim=dim, base=base, device=None, interleaved=False)
264
  self.max_seqlen = max_seqlen
265
 
266
  def forward(self, qkv: torch.Tensor, cu_seqlens: torch.Tensor, max_seqlen: Optional[int] = None) -> Union[torch.Tensor, Tuple[torch.Tensor, torch.Tensor]]: