mirror of
https://github.com/NVIDIA/TensorRT-LLM.git
synced 2026-01-14 06:27:45 +08:00
[None][ci] waive test_mamba2_chunk_scan_combined_prefill_chunking[seqlens1-8] (#7194)
Signed-off-by: junq <22017000+QiJune@users.noreply.github.com>
This commit is contained in:
parent
9c5b464fe0
commit
630e67b845
@@ -369,6 +369,8 @@ def test_mamba2_chunk_scan_selective_state_update(dim, headdim, ngroups, dstate,
     (16, 20),
 ])
 def test_mamba2_chunk_scan_combined_prefill_chunking(mamba_chunk_size, seqlens):
+    if mamba_chunk_size == 8 and seqlens == (270, 88, 212, 203):
+        pytest.skip("https://nvbugspro.nvidia.com/bug/5477332")
     dim = 1024
     headdim = 64
     ngroups = 1
Loading…
Reference in New Issue
Block a user