diff --git a/config.json b/config.json index 90ea1e0..b51379b 100644 --- a/config.json +++ b/config.json @@ -16,7 +16,7 @@ "model_type": "phi", "num_attention_heads": 32, "num_hidden_layers": 24, - "num_key_value_heads": 32, + "num_key_value_heads": null, "partial_rotary_factor": 0.5, "qk_layernorm": false, "resid_pdrop": 0.0,