mirror of
https://github.com/NVIDIA/TensorRT-LLM.git
synced 2026-01-14 06:27:45 +08:00
[https://nvbugs/5575841] [test] Move test_moe.py to serial tests to improve stability + unwaive FP4 MoE torch unit tests (#8422)
Signed-off-by: Dom Brown <3886319+DomBrown@users.noreply.github.com>
This commit is contained in:
parent
0dac57f2bc
commit
9410ce3bea
@@ -991,7 +991,6 @@ class TestMoeFp4:
|
||||
the default tactic selection works. This reduces unnecessary test runs for CI
|
||||
"""
|
||||
|
||||
@pytest.mark.skip(reason="https://nvbugs/5575841")
|
||||
@pytest.mark.parametrize("num_tokens", [1, 1024])
|
||||
@pytest.mark.parametrize("hidden_size", [1024])
|
||||
@pytest.mark.parametrize("intermediate_size", [1024, 768, 384, 192])
|
||||
@@ -1078,7 +1077,6 @@ class TestMoeFp4:
|
||||
use_autotune=True,
|
||||
use_topk_as_input=False)
|
||||
|
||||
@pytest.mark.skip(reason="https://nvbugs/5575841")
|
||||
@pytest.mark.parametrize("num_tokens", [1, 150])
|
||||
@pytest.mark.parametrize("hidden_size", [1024])
|
||||
@pytest.mark.parametrize("intermediate_size", [1024])
|
||||
Loading…
Reference in New Issue
Block a user