Update modeling_imp.py
modeling_imp.py (+11 -0)
@@ -63,6 +63,17 @@ except:
 
 logger = logging.get_logger(__name__)
 
+def _get_unpad_data(attention_mask):
+    seqlens_in_batch = attention_mask.sum(dim=-1, dtype=torch.int32)
+    indices = torch.nonzero(attention_mask.flatten(), as_tuple=False).flatten()
+    max_seqlen_in_batch = seqlens_in_batch.max().item()
+    cu_seqlens = F.pad(torch.cumsum(seqlens_in_batch, dim=0, dtype=torch.int32), (1, 0))  # pylint: disable=E1102
+    return (
+        indices,
+        cu_seqlens,
+        max_seqlen_in_batch,
+    )
+
 # Copied from transformers.models.llama.modeling_llama.LlamaRotaryEmbedding with Llama->Phi
 class PhiRotaryEmbedding(nn.Module):
     def __init__(self, dim, max_position_embeddings=2048, base=10000, device=None):
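For context, _get_unpad_data is the helper that Flash Attention 2 code paths in transformers use to turn a padded attention mask into the flattened token indices, cumulative sequence lengths (cu_seqlens), and maximum sequence length expected by variable-length attention kernels. Below is a minimal, self-contained sketch of how the new helper behaves on a toy mask; it reproduces the function from the patch above (minus the pylint pragma) and assumes only that torch is installed, with the same import aliases the module already relies on.

import torch
import torch.nn.functional as F

def _get_unpad_data(attention_mask):
    # Per-sequence count of real (non-padding) tokens.
    seqlens_in_batch = attention_mask.sum(dim=-1, dtype=torch.int32)
    # Positions of real tokens in the flattened (batch * seq_len) view.
    indices = torch.nonzero(attention_mask.flatten(), as_tuple=False).flatten()
    max_seqlen_in_batch = seqlens_in_batch.max().item()
    # Cumulative sequence lengths with a leading 0, as expected by varlen attention kernels.
    cu_seqlens = F.pad(torch.cumsum(seqlens_in_batch, dim=0, dtype=torch.int32), (1, 0))
    return indices, cu_seqlens, max_seqlen_in_batch

# Two sequences of lengths 3 and 1, right-padded to length 4.
mask = torch.tensor([[1, 1, 1, 0],
                     [1, 0, 0, 0]])
indices, cu_seqlens, max_len = _get_unpad_data(mask)
print(indices)     # tensor([0, 1, 2, 4])
print(cu_seqlens)  # tensor([0, 3, 4], dtype=torch.int32)
print(max_len)     # 3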