Pop `block_cls` from the block config, since it's not an actual kwarg of `ParallelBlock`
Browse files
src/axolotl/models/phi/modeling_mixformer_sequential.py
CHANGED
@@ -870,7 +870,7 @@ class MixFormerSequentialForCausalLM(MixFormerSequentialPreTrainedModel):
|
|
870 |
# `block_cls` with `legacy` value is for backward compatibility
|
871 |
# `path` key is for backward compatibility
|
872 |
block = copy.deepcopy(block) or {"block_cls": "parallel"}
|
873 |
-
|
874 |
|
875 |
block["block_idx"] = block_idx
|
876 |
modules.append(ParallelBlock(config, **block))
|
|
|
870 |
# `block_cls` with `legacy` value is for backward compatibility
|
871 |
# `path` key is for backward compatibility
|
872 |
block = copy.deepcopy(block) or {"block_cls": "parallel"}
|
873 |
+
block.pop("path", None) or block.pop("block_cls", None)
|
874 |
|
875 |
block["block_idx"] = block_idx
|
876 |
modules.append(ParallelBlock(config, **block))
|