mirror of
https://github.com/NVIDIA/TensorRT-LLM.git
synced 2026-01-14 06:27:45 +08:00
* support lp in pytorch backend Signed-off-by: Erin Ho <14718778+hchings@users.noreply.github.com> * fix tp Signed-off-by: Erin Ho <14718778+hchings@users.noreply.github.com> --------- Signed-off-by: Erin Ho <14718778+hchings@users.noreply.github.com>
21 lines
481 B
YAML
21 lines
481 B
YAML
# Signature snapshot for a callable: each parameter of `__call__` is listed
# with its type annotation and default value, followed by the return annotation.
# NOTE(review): presumably compared against the live signature by an
# API-compatibility check - confirm against the consumer of this file.
methods:
  __call__:
    parameters:
      # `inspect._empty` is Python's "no value" sentinel (inspect.Parameter.empty),
      # so every parameter below is recorded as having no default.
      client_id:
        annotation: Optional[int]
        default: inspect._empty
      logits:
        annotation: torch.Tensor
        default: inspect._empty
      req_id:
        annotation: int
        default: inspect._empty
      stream_ptr:
        annotation: Optional[int]
        default: inspect._empty
      token_ids:
        annotation: List[List[int]]
        default: inspect._empty
    return_annotation: None
# No properties are recorded for this type.
properties: {}