From 852291726650c8dd6ac78721c2c4d0fbdafc8e3d Mon Sep 17 00:00:00 2001
From: "Charles O. Goddard"
Date: Fri, 4 Oct 2024 16:43:03 -0700
Subject: [PATCH] Update Llama architecture to handle 3b/1b (#429)

---
 mergekit/_data/architectures/llama.json | 6 ++----
 1 file changed, 2 insertions(+), 4 deletions(-)

diff --git a/mergekit/_data/architectures/llama.json b/mergekit/_data/architectures/llama.json
index 3095b207..7106806b 100644
--- a/mergekit/_data/architectures/llama.json
+++ b/mergekit/_data/architectures/llama.json
@@ -73,10 +73,8 @@
         {
             "name": "lm_head.weight",
             "input_space": "running_residual",
-            "is_embed":true,
-            "aliases": [
-                "model.lm_head.weight"
-            ]
+            "is_embed": true,
+            "optional": true
         }
     ]
 }