From 0e947948134359f9b0281e1f3b95f1c59300b126 Mon Sep 17 00:00:00 2001 From: xuhaifeng Date: Thu, 29 Feb 2024 15:50:49 +0800 Subject: [PATCH] fix minicpm --- src/models/minicpm.cpp | 8 ++++---- 1 file changed, 4 insertions(+), 4 deletions(-) diff --git a/src/models/minicpm.cpp b/src/models/minicpm.cpp index b9f89200..7085b7a6 100644 --- a/src/models/minicpm.cpp +++ b/src/models/minicpm.cpp @@ -53,13 +53,13 @@ namespace fastllm { this->user_role = "### Instruction:\n"; this->bot_role = "\n\n### Response:"; */ - this->history_sep = ""; + this->history_sep = ""; this->pre_prompt = ""; this->user_role = ""; this->bot_role = ""; - block_cnt = 32; - rotary_dim = 128; + block_cnt = 40; + rotary_dim = 64; sin.resize(max_positions); cos.resize(max_positions); @@ -1074,7 +1074,7 @@ namespace fastllm { context->Init(this->block_cnt); context->currentTokens = inputTokens; - //context->currentTokens.insert(context->currentTokens.begin(), this->bos_token_id); + context->currentTokens.insert(context->currentTokens.begin(), this->bos_token_id); context->generationConfig = generationConfig; context->tokens = LastTokensUnit(generationConfig.last_n); dictLocker.unlock();