diff --git a/vllm/v1/executor/multiproc_executor.py b/vllm/v1/executor/multiproc_executor.py index ed64e7741390d..9333997d5a29b 100644 --- a/vllm/v1/executor/multiproc_executor.py +++ b/vllm/v1/executor/multiproc_executor.py @@ -81,6 +81,7 @@ def initialize(self, num_gpu_blocks: int) -> None: Initialize the KV caches and begin the model execution loop of the underlying workers. """ + logger.info("# GPU blocks: %d", num_gpu_blocks) self.collective_rpc("initialize_cache", args=(num_gpu_blocks, )) self.collective_rpc("compile_or_warm_up_model")