We read every piece of feedback, and take your input very seriously.
To see all available qualifiers, see our documentation.
There was an error while loading. Please reload this page.
1 parent bf3ffb6, commit e0c910b (Copy full SHA for e0c910b)
vllm/model_executor/layers/mamba/ops/ssd_chunk_scan.py
@@ -245,7 +245,7 @@ def _chunk_scan_fwd_kernel(
245         )
246     if not HAS_INITSTATES and (seq_idx != seq_idx_prev):
247         prev_states = tl.zeros(
248 -           (BLOCK_SIZE_DSTATE, BLOCK_SIZE_K), dtype=C_ptr.dtype.element_ty
248 +           (BLOCK_SIZE_K, BLOCK_SIZE_N), dtype=C_ptr.dtype.element_ty
249         )
250     else:
251         prev_states = tl.load(
0 commit comments