mirror of
https://github.com/NVIDIA/TensorRT-LLM.git
synced 2026-01-22 19:52:38 +08:00
Signed-off-by: Chang Liu <9713593+chang-l@users.noreply.github.com> Signed-off-by: Chang Liu (Enterprise Products) <9713593+chang-l@users.noreply.github.com>
33 lines
837 B
YAML
33 lines
837 B
YAML
# Signature reference for an API surface.
# - `methods`: one entry per method, giving its `parameters` (each with an
#   `annotation` and a `default`) and its `return_annotation`.
# - `properties`: one entry per property, giving its `annotation` and `default`.
# NOTE(review): `inspect._empty` presumably is Python's "no default value"
# sentinel from the `inspect` module — confirm against the tool that reads
# this file.
methods:
  aresult:
    parameters: {}
    return_annotation: tensorrt_llm.executor.result.GenerationResult
  result:
    parameters:
      timeout:
        annotation: Optional[float]
        default: None
    return_annotation: tensorrt_llm.executor.result.GenerationResult
properties:
  request_id:
    annotation: int
    default: inspect._empty
  prompt:
    annotation: Optional[str]
    default: inspect._empty
  prompt_token_ids:
    annotation: List[int]
    default: inspect._empty
  outputs:
    annotation: List[tensorrt_llm.executor.result.CompletionOutput]
    default: inspect._empty
  context_logits:
    annotation: Optional[torch.Tensor]
    default: inspect._empty
  finished:
    annotation: bool
    default: inspect._empty
  mm_embedding_handle:
    annotation: Optional[Dict[str, Any]]
    default: inspect._empty