Using dict as input
Files changed: modeling_flexbert.py (+27 −9). Its compiled __pycache__/modeling_flexbert.cpython-311.pyc binary also differs; all other files in the commit are unchanged.
modeling_flexbert.py
CHANGED
@@ -50,7 +50,7 @@ import os
 import sys
 import warnings
 from dataclasses import dataclass
-from typing import List, Optional, Tuple, Union
+from typing import List, Optional, Tuple, Union, Dict

 # Add folder root to path to allow us to use relative imports regardless of what directory the script is run from
 sys.path.append(os.path.dirname(os.path.realpath(__file__)))
@@ -944,18 +944,37 @@ class FlexBertModel(FlexBertPreTrainedModel):

     def forward(
         self,
-        input_ids: torch.Tensor,
-        attention_mask: Optional[torch.Tensor] = None,
-        position_ids: Optional[torch.Tensor] = None,
-        indices: Optional[torch.Tensor] = None,
-        cu_seqlens: Optional[torch.Tensor] = None,
-        max_seqlen: Optional[int] = None,
+        features: Dict[str, torch.Tensor],
+        # input_ids: torch.Tensor,
+        # attention_mask: Optional[torch.Tensor] = None,
+        # position_ids: Optional[torch.Tensor] = None,
+        # indices: Optional[torch.Tensor] = None,
+        # cu_seqlens: Optional[torch.Tensor] = None,
+        # max_seqlen: Optional[int] = None,
         **kwargs,
     ) -> Tuple[Union[List[torch.Tensor], torch.Tensor], Optional[torch.Tensor]]:
-        if attention_mask is None:
+        input_ids = features["input_ids"]
+        if features["attention_mask"] is None:
             attention_mask = torch.ones_like(input_ids)
-
+        else:
+            attention_mask = features["attention_mask"]
+        if "position_ids" not in features:
+            position_ids = None
+        else:
+            position_ids = features["position_ids"]
         embedding_output = self.embeddings(input_ids, position_ids)
+        if "indices" not in features:
+            indices = None
+        else:
+            indices = features["indices"]
+        if "cu_seqlens" not in features:
+            cu_seqlens = None
+        else:
+            cu_seqlens = features["cu_seqlens"]
+        if "max_seqlen" not in features:
+            max_seqlen = None
+        else:
+            max_seqlen = features["max_seqlen"]

         encoder_outputs = self.encoder(
             hidden_states=embedding_output,
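The commit replaces the separate tensor arguments of FlexBertModel.forward with a single features dict. For reference, here is a minimal calling sketch, assuming an already-initialized FlexBertModel instance named model (the batch shape and vocabulary size below are illustrative, not from the commit):

```python
import torch

# Hypothetical batch: 2 sequences of length 8 with arbitrary token ids.
input_ids = torch.randint(0, 30522, (2, 8))

features = {
    "input_ids": input_ids,                        # always read, so the key must be present
    "attention_mask": torch.ones_like(input_ids),  # key must exist; a None value triggers the all-ones fallback
    # "position_ids", "indices", "cu_seqlens", and "max_seqlen" are optional keys;
    # forward() falls back to None for any of them that are missing.
}

# Returns the tuple described by the forward() annotation:
# (hidden states, or a list of them, plus an optional tensor).
outputs = model(features)
```

Note the asymmetry the diff introduces: "attention_mask" is indexed directly, so that key has to exist even when its value is None, while the other optional inputs are probed with `in` and default to None when absent.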