diff --git a/samples/cpp/speculative_decoding_lm/speculative_decoding_lm.cpp b/samples/cpp/speculative_decoding_lm/speculative_decoding_lm.cpp index 6c1a8eea9b..487296566b 100644 --- a/samples/cpp/speculative_decoding_lm/speculative_decoding_lm.cpp +++ b/samples/cpp/speculative_decoding_lm/speculative_decoding_lm.cpp @@ -27,7 +27,7 @@ int main(int argc, char* argv[]) try { std::string main_device = "CPU", draft_device = "CPU"; ov::genai::SchedulerConfig scheduler_config; - scheduler_config.cache_size = 1; + scheduler_config.cache_size = 5; ov::genai::LLMPipeline pipe( main_model_path,