mirror of
https://github.com/NVIDIA/TensorRT-LLM.git
synced 2026-01-23 20:23:08 +08:00
* feat: Variable-Beam-Width-Search Part2 Signed-off-by: wili-65535 <wili-65535@user.noreply.github.com> * feat: Variable-Beam-Width-Search Part2 Signed-off-by: wili-65535 <wili-65535@user.noreply.github.com> * feat: Variable-Beam-Width-Search Part2, fix CPP tests Signed-off-by: wili-65535 <wili-65535@user.noreply.github.com> * feat: Variable-Beam-Width-Search Part3, simplify CPP tests Signed-off-by: wili-65535 <wili-65535@user.noreply.github.com> * feat: Variable-Beam-Width-Search Part4, move beam_width_array param Signed-off-by: wili-65535 <wili-65535@user.noreply.github.com> * feat: Variable-Beam-Width-Search, fix CI error Signed-off-by: wili-65535 <wili-65535@user.noreply.github.com> * feat: Variable-Beam-Width-Search part2 Signed-off-by: wili-65535 <wili-65535@user.noreply.github.com> * feat: Variable-Beam-Width-Search part2 Signed-off-by: wili-65535 <wili-65535@user.noreply.github.com> * feat: Variable-Beam-Width-Search part2, fix pre-commit Signed-off-by: wili-65535 <wili-65535@user.noreply.github.com> * feat: Variable-Beam-Width-Search part2, fix review Signed-off-by: wili-65535 <wili-65535@user.noreply.github.com> --------- Signed-off-by: wili-65535 <wili-65535@user.noreply.github.com> Co-authored-by: wili-65535 <wili-65535@user.noreply.github.com>
32 lines
833 B
YAML
32 lines
833 B
YAML
methods:
|
|
__init__:
|
|
parameters:
|
|
# Experimental features
|
|
additional_model_outputs:
|
|
annotation: Optional[List[tensorrt_llm.sampling_params.AdditionalModelOutput]]
|
|
default: null
|
|
return_perf_metrics:
|
|
annotation: bool
|
|
default: false
|
|
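# TODO [TRTLLM-3716]: Deprecated arguments
# NOTE(review): beam_width_array, listed after random_seed below, looks newly added for variable-beam-width search rather than deprecated; confirm, and give it its own section if so.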
|
|
beam_width:
|
|
annotation: int
|
|
default: 1
|
|
max_new_tokens:
|
|
annotation: Optional[int]
|
|
default: null
|
|
min_length:
|
|
annotation: Optional[int]
|
|
default: null
|
|
num_return_sequences:
|
|
annotation: Optional[int]
|
|
default: null
|
|
random_seed:
|
|
annotation: Optional[int]
|
|
default: null
|
|
beam_width_array:
|
|
annotation: Optional[List[int]]
|
|
default: null
|
|
return_annotation: None
|
|
properties: {}
|