mirror of
https://github.com/NVIDIA/TensorRT-LLM.git
synced 2026-02-01 00:31:24 +08:00
fix cutlass moe not falling back
Signed-off-by: Xiwen Yu <13230610+VALLIS-NERIA@users.noreply.github.com>
This commit is contained in:
parent
c425c1214d
commit
0fb835d7c2
2
3rdparty/cutlass
vendored
2
3rdparty/cutlass
vendored
@@ -1 +1 @@
|
||||
Subproject commit a49a78ffefc86a87160dfe0ccc3a3a2d1622c918
|
||||
Subproject commit b2dd65dc864e09688245b316ac46c4a6cd07e15c
|
||||
@@ -113,6 +113,9 @@ void dispatchMoeGemmSelectBiasTmaWarpSpecialized(TmaWarpSpecializedGroupedGemmIn
|
||||
"passing 103-real as an arch to build_wheel.py.");
|
||||
first_time = false;
|
||||
}
|
||||
return dispatchMoeGemmSelectBiasTmaWarpSpecialized<cutlass::arch::Sm100, T, WeightType, OutputType, EpilogueTag,
|
||||
FUSION, TileShape, ClusterShape>(
|
||||
hopper_input, num_experts, multi_processor_count, stream, occupancy, workspace_size);
|
||||
}
|
||||
#endif
|
||||
#ifndef COMPILE_BLACKWELL_TMA_GROUPED_GEMMS
|
||||
|
||||
Loading…
Reference in New Issue
Block a user