Skip to content

Commit b529717

Browse files
authored
Print KV Cache available memory and block memory usage in GB format (#4148)
1 parent 2adca04 commit b529717

File tree

1 file changed

+1
-1
lines changed

1 file changed

+1
-1
lines changed

fastdeploy/worker/worker_process.py

Lines changed: 1 addition & 1 deletion
Original file line number | Diff line number | Diff line change
@@ -382,7 +382,7 @@ def initialize_kv_cache(self) -> None:
382 | 382 |   | if num_blocks_local > 40000:
383 | 383 |   | logger.info(f"------- Reset num_blocks_local {num_blocks_local} to 40000")
384 | 384 |   | num_blocks_local = min(40000, num_blocks_local)
385 |     | - | logger.info(f"------- model_block_memory_used:{model_block_memory_used} --------")
    | 385 | + | logger.info(f"------- model_block_memory_used:{model_block_memory_used / 1024**3} GB --------")
386 | 386 |   | logger.info(f"------- num_blocks_local:{num_blocks_local} --------")
387 | 387 |   |
388 | 388 |   | if num_blocks_local <= 0:

0 commit comments

Comments
 (0)