| .. |
|
_torch
|
TensorRT-LLM v0.18 release (#3231)
|
2025-04-02 17:01:16 +08:00 |
|
auto_parallel
|
open source 09df54c0cc99354a60bbc0303e3e8ea33a96bef0 (#2725)
|
2025-02-11 02:21:51 +00:00 |
|
bench
|
open source 09df54c0cc99354a60bbc0303e3e8ea33a96bef0 (#2725)
|
2025-02-11 02:21:51 +00:00 |
|
commands
|
open source 09df54c0cc99354a60bbc0303e3e8ea33a96bef0 (#2725)
|
2025-02-11 02:21:51 +00:00 |
|
inputs
|
open source 09df54c0cc99354a60bbc0303e3e8ea33a96bef0 (#2725)
|
2025-02-11 02:21:51 +00:00 |
|
layers
|
open source 09df54c0cc99354a60bbc0303e3e8ea33a96bef0 (#2725)
|
2025-02-11 02:21:51 +00:00 |
|
llmapi
|
TensorRT-LLM v0.18 release (#3231)
|
2025-04-02 17:01:16 +08:00 |
|
models
|
TensorRT-LLM v0.18.1 release (#3389)
|
2025-04-09 09:06:37 +08:00 |
|
plugin
|
open source 09df54c0cc99354a60bbc0303e3e8ea33a96bef0 (#2725)
|
2025-02-11 02:21:51 +00:00 |
|
quantization
|
open source 09df54c0cc99354a60bbc0303e3e8ea33a96bef0 (#2725)
|
2025-02-11 02:21:51 +00:00 |
|
runtime
|
TensorRT-LLM v0.18 release (#3231)
|
2025-04-02 17:01:16 +08:00 |
|
serve
|
open source 09df54c0cc99354a60bbc0303e3e8ea33a96bef0 (#2725)
|
2025-02-11 02:21:51 +00:00 |
|
tools
|
open source 09df54c0cc99354a60bbc0303e3e8ea33a96bef0 (#2725)
|
2025-02-11 02:21:51 +00:00 |
|
__init__.py
|
TensorRT-LLM v0.16 Release
|
2024-12-24 15:58:43 +08:00 |
|
_common.py
|
open source 09df54c0cc99354a60bbc0303e3e8ea33a96bef0 (#2725)
|
2025-02-11 02:21:51 +00:00 |
|
_ipc_utils.py
|
TensorRT-LLM v0.13 Update (#2269)
|
2024-09-30 16:20:23 +08:00 |
|
_utils.py
|
open source 09df54c0cc99354a60bbc0303e3e8ea33a96bef0 (#2725)
|
2025-02-11 02:21:51 +00:00 |
|
builder.py
|
open source 09df54c0cc99354a60bbc0303e3e8ea33a96bef0 (#2725)
|
2025-02-11 02:21:51 +00:00 |
|
executor.py
|
TensorRT-LLM v0.18.2 release (#3611)
|
2025-04-16 14:42:50 +08:00 |
|
functional.py
|
open source 09df54c0cc99354a60bbc0303e3e8ea33a96bef0 (#2725)
|
2025-02-11 02:21:51 +00:00 |
|
graph_rewriting.py
|
open source 09df54c0cc99354a60bbc0303e3e8ea33a96bef0 (#2725)
|
2025-02-11 02:21:51 +00:00 |
|
logger.py
|
TensorRT-LLM v0.16 Release
|
2024-12-24 15:58:43 +08:00 |
|
lora_manager.py
|
TensorRT-LLM Release 0.15.0 (#2529)
|
2024-12-04 13:44:56 +08:00 |
|
mapping.py
|
open source 09df54c0cc99354a60bbc0303e3e8ea33a96bef0 (#2725)
|
2025-02-11 02:21:51 +00:00 |
|
module.py
|
Update TensorRT-LLM v0.14.0 (#2401)
|
2024-11-01 19:48:44 +08:00 |
|
network.py
|
open source 09df54c0cc99354a60bbc0303e3e8ea33a96bef0 (#2725)
|
2025-02-11 02:21:51 +00:00 |
|
parameter.py
|
open source 09df54c0cc99354a60bbc0303e3e8ea33a96bef0 (#2725)
|
2025-02-11 02:21:51 +00:00 |
|
profiler.py
|
TensorRT-LLM v0.16 Release
|
2024-12-24 15:58:43 +08:00 |
|
prompt_adapter_manager.py
|
TensorRT-LLM Release 0.15.0 (#2529)
|
2024-12-04 13:44:56 +08:00 |
|
python_plugin.py
|
open source 09df54c0cc99354a60bbc0303e3e8ea33a96bef0 (#2725)
|
2025-02-11 02:21:51 +00:00 |
|
sampling_params.py
|
open source 09df54c0cc99354a60bbc0303e3e8ea33a96bef0 (#2725)
|
2025-02-11 02:21:51 +00:00 |
|
top_model_mixin.py
|
TensorRT-LLM v0.12 Update (#2164)
|
2024-08-29 17:25:07 +08:00 |
|
version.py
|
TensorRT-LLM v0.18.2 release (#3611)
|
2025-04-16 14:42:50 +08:00 |