diff --git a/modeling_stablelm_epoch.py b/modeling_stablelm_epoch.py index e7fde9f..b179cfb 100755 --- a/modeling_stablelm_epoch.py +++ b/modeling_stablelm_epoch.py @@ -545,7 +545,7 @@ class StableLMEpochPreTrainedModel(PreTrainedModel): """ config_class = StableLMEpochConfig - base_model_prefix = "transformer" + base_model_prefix = "model" supports_gradient_checkpointing = True _no_split_modules = ["DecoderLayer"] _skip_keys_device_placement = "past_key_values"