We read every piece of feedback, and take your input very seriously.
To see all available qualifiers, see our documentation.
There was an error while loading. Please reload this page.
1 parent cd528d1, commit 39ba79c. Copy full SHA for 39ba79c
vllm/v1/core/kv_cache_utils.py
@@ -819,9 +819,7 @@ def get_num_blocks(
819
available_memory: Memory available for KV cache in bytes.
820
page_size: The page size of the KV cache.
821
"""
822
-
823
num_blocks = int(available_memory // page_size // num_layers)
824
825
num_blocks = max(num_blocks, 0)
826
num_blocks = may_override_num_blocks(vllm_config, num_blocks)
827
return num_blocks
0 commit comments