Mirror of https://github.com/NVIDIA/TensorRT-LLM.git (synced 2026-01-14 06:27:45 +08:00)
waive test_moe.py::test_moe_fp8[autotune] (#5455)
Signed-off-by: QI JUN <22017000+QiJune@users.noreply.github.com>
This commit is contained in:
parent 699520082b
commit 241f921800
@ -579,7 +579,8 @@ def quant_dequant_per_tensor_fp8(a):
|
||||
ids=["autotune", "no_autotune"])
|
||||
def test_moe_fp8(num_tokens, expert_info, hidden_size, intermediate_size,
|
||||
use_autotune):
|
||||
|
||||
if use_autotune:
|
||||
pytest.skip("https://nvbugs/5356427")
|
||||
torch.random.manual_seed(0)
|
||||
|
||||
#
|
||||
|
||||
Loading…
Reference in New Issue
Block a user