mirror of
https://github.com/NVIDIA/TensorRT-LLM.git
synced 2026-01-29 23:23:48 +08:00
35 lines
1020 B
YAML
35 lines
1020 B
YAML
methods:
|
|
__init__:
|
|
parameters:
|
|
cumulative_logprob:
|
|
annotation: Optional[float]
|
|
default: null
|
|
disaggregated_params:
|
|
annotation: Optional[tensorrt_llm.disaggregated_params.DisaggregatedParams]
|
|
default: null
|
|
request_perf_metrics:
|
|
annotation: Optional[tensorrt_llm.bindings.executor.RequestPerfMetrics]
|
|
default: null
|
|
additional_context_outputs:
|
|
annotation: Optional[Dict[str, torch.Tensor]]
|
|
default: null
|
|
status: prototype
|
|
additional_generation_outputs:
|
|
annotation: Optional[Dict[str, torch.Tensor]]
|
|
default: null
|
|
status: prototype
|
|
return_annotation: None
|
|
properties:
|
|
length:
|
|
annotation: int
|
|
default: inspect._empty
|
|
logprobs_diff:
|
|
annotation: list[dict[int, tensorrt_llm.executor.result.Logprob]] | List[float]
|
|
default: inspect._empty
|
|
text_diff:
|
|
annotation: str
|
|
default: inspect._empty
|
|
token_ids_diff:
|
|
annotation: List[int]
|
|
default: inspect._empty
|