[https://nvbugs/5477332][fix] Relax atol in test_mamba2_chunk_scan_combined_prefill_chunking (#7215)

Signed-off-by: Amit Zuker <203509407+amitz-nv@users.noreply.github.com>
This commit is contained in:
amitz-nv 2025-08-26 10:48:58 +03:00 committed by GitHub
parent bf377d0b8e
commit 23ed0c892d
No known key found for this signature in database
GPG Key ID: B5690EEEBB952194

View File

@ -369,8 +369,6 @@ def test_mamba2_chunk_scan_selective_state_update(dim, headdim, ngroups, dstate,
(16, 20),
])
def test_mamba2_chunk_scan_combined_prefill_chunking(mamba_chunk_size, seqlens):
if mamba_chunk_size == 8 and seqlens == (270, 88, 212, 203):
pytest.skip("https://nvbugspro.nvidia.com/bug/5477332")
dim = 1024
headdim = 64
ngroups = 1
@ -566,7 +564,7 @@ def test_mamba2_chunk_scan_combined_prefill_chunking(mamba_chunk_size, seqlens):
# kernel chunked is same as kernel overall
# tight tolerance to find subtle correctness issues
rtol = 1e-2
atol = 2e-3
atol = 5e-3
for i in range(num_sequences):
out_seq = out[:, cu_seqlens[i]:cu_seqlens[i + 1], ...]
out_seq_ref = out_ref[:, cu_seqlens[i]:cu_seqlens[i + 1], ...]