From 7e925ddfdf2d1bb29fc26db755aafd77fb8f565e Mon Sep 17 00:00:00 2001 From: wing lian Date: Fri, 15 Sep 2023 17:21:11 +0000 Subject: [PATCH] add _no_split_modules property --- modeling_mixformer_sequential.py | 1 + 1 file changed, 1 insertion(+) diff --git a/modeling_mixformer_sequential.py b/modeling_mixformer_sequential.py index 7c10e73..5e3db86 100644 --- a/modeling_mixformer_sequential.py +++ b/modeling_mixformer_sequential.py @@ -717,6 +717,7 @@ class MixFormerSequentialForCausalLM(MixFormerSequentialPreTrainedModel): _keys_to_ignore_on_load_missing = [""] _keys_to_ignore_on_load_unexpected = [r"layers\.\d+\.mlp.(fc_in|fc_out)\.(weight|bias)"] + _no_split_modules = ["ParallelBlock"] def __init__(self, config: MixFormerSequentialConfig) -> None: super().__init__(config)