We read every piece of feedback, and take your input very seriously.
To see all available qualifiers, see our documentation.
There was an error while loading. Please reload this page.
1 parent c312468 commit 0b018d8 (Copy full SHA for 0b018d8)
vllm/v1/attention/backends/rocm_attn.py
@@ -175,6 +175,7 @@ def get_kv_cache_shape(
175
block_size: int,
176
num_kv_heads: int,
177
head_size: int,
178
+ cache_dtype_str: str = "auto",
179
) -> tuple[int, ...]:
180
if block_size % 16 != 0:
181
raise ValueError("Block size must be a multiple of 16.")
0 commit comments