We read every piece of feedback, and take your input very seriously.
To see all available qualifiers, see our documentation.
There was an error while loading. Please reload this page.
1 parent 723bf67 commit 1c69959Copy full SHA for 1c69959
vllm/v1/attention/backends/rocm_aiter_unified_attn.py
@@ -176,7 +176,10 @@ def forward(
176
max_seqlen_k = attn_metadata.max_seq_len
177
block_table = attn_metadata.block_table
178
179
- descale_shape = (cu_seqlens_q.shape[0] - 1, key.shape[1] if key is not None else self.num_kv_heads)
+ descale_shape = (
180
+ cu_seqlens_q.shape[0] - 1,
181
+ key.shape[1] if key is not None else self.num_kv_heads,
182
+ )
183
184
self.unified_attention(
185
q=query[:num_actual_tokens],
0 commit comments