mirror of
https://github.com/NVIDIA/TensorRT-LLM.git
synced 2026-01-14 06:27:45 +08:00
fix: reshape token_ids for lp in torch backend (#4239)
reshape token_ids
Signed-off-by: Erin Ho <14718778+hchings@users.noreply.github.com>
This commit is contained in:
parent
035d915fea
commit
4becf32360
@@ -2035,6 +2035,7 @@ class PyTorchModelEngine(ModelEngine):
|
||||
# Reshape to align w/ the shape used in the TRT backend,
|
||||
# so the same logit processors can be used across both backends.
|
||||
logits_row = logits_row.view(1, 1, -1)
|
||||
token_ids = [token_ids]
|
||||
for lp in logits_processors:
|
||||
lp_params = inspect.signature(lp).parameters
|
||||
|
||||
|
||||
Loading…
Reference in New Issue
Block a user