From 8324c4b5b94101f1f61790d5b50e21922376eee8 Mon Sep 17 00:00:00 2001 From: Kofi <74067324+kofi-bhr@users.noreply.github.com> Date: Wed, 23 Oct 2024 14:02:20 -0500 Subject: [PATCH] Obey general token limits - Changed max tokens from 8192 -> 8000 - Works with some models (e.g., Grok) with limits like this - No effect otherwise, single-response limit only --- app/lib/.server/llm/constants.ts | 2 +- 1 file changed, 1 insertion(+), 1 deletion(-) diff --git a/app/lib/.server/llm/constants.ts b/app/lib/.server/llm/constants.ts index b24acdf27..7b3a0f245 100644 --- a/app/lib/.server/llm/constants.ts +++ b/app/lib/.server/llm/constants.ts @@ -1,5 +1,5 @@ // see https://docs.anthropic.com/en/docs/about-claude/models -export const MAX_TOKENS = 8192; +export const MAX_TOKENS = 8000; // limits the number of model responses that can be returned in a single request export const MAX_RESPONSE_SEGMENTS = 2;