mirror of
https://github.com/NVIDIA/TensorRT-LLM.git
synced 2026-01-14 06:27:45 +08:00
* feat: Variable-Beam-Width-Search Part2 Signed-off-by: wili-65535 <wili-65535@user.noreply.github.com> * feat: Variable-Beam-Width-Search Part2 Signed-off-by: wili-65535 <wili-65535@user.noreply.github.com> * feat: Variable-Beam-Width-Search Part2, fix CPP tests Signed-off-by: wili-65535 <wili-65535@user.noreply.github.com> * feat: Variable-Beam-Width-Search Part3, simplify CPP tests Signed-off-by: wili-65535 <wili-65535@user.noreply.github.com> * feat: Variable-Beam-Width-Search Part4, move beam_width_array param Signed-off-by: wili-65535 <wili-65535@user.noreply.github.com> * feat: Variable-Beam-Width-Search, fix CI error Signed-off-by: wili-65535 <wili-65535@user.noreply.github.com> * feat: Variable-Beam-Width-Search part2 Signed-off-by: wili-65535 <wili-65535@user.noreply.github.com> * feat: Variable-Beam-Width-Search part2 Signed-off-by: wili-65535 <wili-65535@user.noreply.github.com> * feat: Variable-Beam-Width-Search part2, fix pre-commit Signed-off-by: wili-65535 <wili-65535@user.noreply.github.com> * feat: Variable-Beam-Width-Search part2, fix review Signed-off-by: wili-65535 <wili-65535@user.noreply.github.com> --------- Signed-off-by: wili-65535 <wili-65535@user.noreply.github.com> Co-authored-by: wili-65535 <wili-65535@user.noreply.github.com> |
| | | |
|---|---|---|
| .. | ||
| banWordsLayer.cpp | ||
| banWordsLayer.h | ||
| baseLayer.h | ||
| beamSearchLayer.cu | ||
| beamSearchLayer.h | ||
| CMakeLists.txt | ||
| decodingLayer.cpp | ||
| decodingLayer.h | ||
| decodingParams.h | ||
| dynamicDecodeLayer.cpp | ||
| dynamicDecodeLayer.h | ||
| eagleDecodingLayer.cpp | ||
| eagleDecodingLayer.h | ||
| explicitDraftTokensLayer.cpp | ||
| explicitDraftTokensLayer.h | ||
| externalDraftTokensLayer.cpp | ||
| externalDraftTokensLayer.h | ||
| layersFactory.h | ||
| layerUtils.h | ||
| lookaheadAlgorithm.cpp | ||
| lookaheadAlgorithm.h | ||
| lookaheadDecodingLayer.cpp | ||
| lookaheadDecodingLayer.h | ||
| lookaheadDecodingUtils.h | ||
| lookaheadPoolManager.cpp | ||
| lookaheadPoolManager.h | ||
| medusaDecodingLayer.cpp | ||
| medusaDecodingLayer.h | ||
| penaltyLayer.cpp | ||
| penaltyLayer.h | ||
| samplingLayer.cpp | ||
| samplingLayer.h | ||
| stopCriteriaLayer.cpp | ||
| stopCriteriaLayer.h | ||
| topKSamplingLayer.cpp | ||
| topKSamplingLayer.h | ||
| topPSamplingLayer.cpp | ||
| topPSamplingLayer.h | ||