mirror of
https://github.com/NVIDIA/TensorRT-LLM.git
synced 2026-02-05 02:31:33 +08:00
Signed-off-by: Stefan Niebler <82932102+stnie@users.noreply.github.com> Signed-off-by: Yuan Tong <13075180+tongyuantongyu@users.noreply.github.com> Signed-off-by: Erin Ho <14718778+hchings@users.noreply.github.com> Co-authored-by: Yuan Tong <13075180+tongyuantongyu@users.noreply.github.com> Co-authored-by: Erin Ho <14718778+hchings@users.noreply.github.com> |
||
|---|---|---|
| .. | ||
| __init__.py | ||
| auto_heuristic.py | ||
| drafter.py | ||
| drafting_loops.py | ||
| eagle3.py | ||
| interface.py | ||
| model_drafter.py | ||
| mtp.py | ||
| ngram.py | ||
| one_model_sampler.py | ||
| save_hidden_state.py | ||
| spec_tree_manager.py | ||
| speculation_gate.py | ||
| utils.py | ||