Skip to content

Commit 57d5777

Browse files
hfansierraisland
authored and committed
[Misc] Report TPU usage (#925)
Signed-off-by: Hongmin Fan <[email protected]>
1 parent a6666ca commit 57d5777

File tree

1 file changed

+2
-0
lines changed

1 file changed

+2
-0
lines changed

tpu_inference/worker/tpu_worker_jax.py

Lines changed: 2 additions & 0 deletions
Original file line number | Diff line number | Diff line change
@@ -16,6 +16,7 @@
1616
init_distributed_environment)
1717
from vllm.lora.request import LoRARequest
1818
from vllm.tasks import SupportedTask
19+
from vllm.v1 import utils as vllm_utils
1920
from vllm.v1.core.kv_cache_utils import get_num_blocks, get_uniform_page_size
2021
from vllm.v1.core.sched.output import SchedulerOutput
2122
from vllm.v1.kv_cache_interface import KVCacheConfig, KVCacheSpec
@@ -166,6 +167,7 @@ def init_device(self):
166167
f"node_id={get_node_id()} | "
167168
f"is_driver_worker={self.is_driver_worker} | "
168169
f"hbm={utils.hbm_usage_gb(self.devices)}GiB")
170+
vllm_utils.report_usage_stats(self.vllm_config)
169171

170172
def determine_available_memory(self) -> int:
171173
gpu_memory_utilization = self.cache_config.gpu_memory_utilization

0 commit comments

Comments
 (0)