mirror of
https://github.com/NVIDIA/TensorRT-LLM.git
synced 2026-01-14 06:27:45 +08:00
[TRTLLM-6342][bug] Patched incorrect starcoder tp config (#8118)
Signed-off-by: greg-kwasniewski1 <213329731+greg-kwasniewski1@users.noreply.github.com>
This commit is contained in:
parent
4136942436
commit
a5b59fd31d
@ -0,0 +1,4 @@
|
||||
from transformers.models.starcoder2.configuration_starcoder2 import Starcoder2Config
|
||||
|
||||
# Workaround for the incorrect Starcoder2 TP plan entry for `layers.*.mlp.c_proj`.
# TODO: remove this patch once TRT-LLM upgrades to HF transformers >= 4.57.
|
||||
# Override the `layers.*.mlp.c_proj` entry of Starcoder2's base-model TP plan
# with "rowwise". The mapping is modified in place on the config class itself,
# so the change takes effect as soon as this module is imported.
Starcoder2Config.base_model_tp_plan.update({"layers.*.mlp.c_proj": "rowwise"})
|
||||
Loading…
Reference in New Issue
Block a user