From 403a105f85f3b6ab4ec13467944805178694a055 Mon Sep 17 00:00:00 2001
From: WangErXiao <863579016@qq.com>
Date: Tue, 31 Dec 2024 17:20:16 +0800
Subject: [PATCH] log GPU blocks num for MultiprocExecutor

---
 vllm/v1/executor/multiproc_executor.py | 1 +
 1 file changed, 1 insertion(+)

diff --git a/vllm/v1/executor/multiproc_executor.py b/vllm/v1/executor/multiproc_executor.py
index ed64e7741390d..9333997d5a29b 100644
--- a/vllm/v1/executor/multiproc_executor.py
+++ b/vllm/v1/executor/multiproc_executor.py
@@ -81,6 +81,7 @@ def initialize(self, num_gpu_blocks: int) -> None:
         Initialize the KV caches and begin the model execution loop of the
         underlying workers.
         """
+        logger.info("# GPU blocks: %d", num_gpu_blocks)
         self.collective_rpc("initialize_cache", args=(num_gpu_blocks, ))
         self.collective_rpc("compile_or_warm_up_model")