From 3a64932e1ff46a56eebc206b9b0c1d27c9d9e1e1 Mon Sep 17 00:00:00 2001 From: Xuan Son Nguyen Date: Mon, 23 Sep 2024 14:26:00 +0200 Subject: [PATCH] small fix --- examples/server/server.cpp | 6 ++---- 1 file changed, 2 insertions(+), 4 deletions(-) diff --git a/examples/server/server.cpp b/examples/server/server.cpp index 771bde19112a7..3693cf747a72c 100644 --- a/examples/server/server.cpp +++ b/examples/server/server.cpp @@ -1837,10 +1837,8 @@ struct server_context { if (slot.ga_n == 1) { if (slot.is_processing() && (int) system_tokens.size() + slot.n_past >= slot.n_ctx - 1) { if (!params.ctx_shift) { - // this check is redundant (for good) - // we should never get here, since n_predict is already limited - slot.release(); - send_error(slot, "context shift is disabled", ERROR_TYPE_SERVER); + // we should never get here, because generation should have already stopped in process_token() + GGML_ASSERT(false && "context shifting is disabled"); continue; }