From dcf8c316997f97c79650e38236b6b93934068416 Mon Sep 17 00:00:00 2001 From: Elliot Stein Date: Thu, 31 Oct 2024 12:44:50 +0000 Subject: [PATCH] missing param in gpt2 config --- mergekit/_data/architectures/gpt2.json | 3 +++ 1 file changed, 3 insertions(+) diff --git a/mergekit/_data/architectures/gpt2.json b/mergekit/_data/architectures/gpt2.json index 64a04e9d..0a119721 100644 --- a/mergekit/_data/architectures/gpt2.json +++ b/mergekit/_data/architectures/gpt2.json @@ -23,6 +23,9 @@ "num_layers_config_key": "n_layer", "layer_templates": { "weights": [ + { + "name": "h.${layer_index}.attn.bias" + }, { "name": "h.${layer_index}.attn.c_attn.weight" },