From 4a426d8015bef5a0cb3acff8d4474ee9ab4071d5 Mon Sep 17 00:00:00 2001 From: Gustavo de Rosa Date: Fri, 15 Sep 2023 22:57:07 +0000 Subject: [PATCH] add _no_split_modules property (#17) - add _no_split_modules property (7e925ddfdf2d1bb29fc26db755aafd77fb8f565e) Co-authored-by: wing lian --- modeling_mixformer_sequential.py | 1 + 1 file changed, 1 insertion(+) diff --git a/modeling_mixformer_sequential.py b/modeling_mixformer_sequential.py index 7c10e73..5e3db86 100644 --- a/modeling_mixformer_sequential.py +++ b/modeling_mixformer_sequential.py @@ -717,6 +717,7 @@ class MixFormerSequentialForCausalLM(MixFormerSequentialPreTrainedModel): _keys_to_ignore_on_load_missing = [""] _keys_to_ignore_on_load_unexpected = [r"layers\.\d+\.mlp.(fc_in|fc_out)\.(weight|bias)"] + _no_split_modules = ["ParallelBlock"] def __init__(self, config: MixFormerSequentialConfig) -> None: super().__init__(config)