| .. |
|
__init__.py
|
Update TensorRT-LLM (#2873)
|
2025-03-11 21:13:42 +08:00 |
|
activation.py
|
Update TensorRT-LLM (#787)
|
2024-01-02 17:54:32 +08:00 |
|
attention.py
|
[TRTLLM-2795] feat: Add yarn support for other models in trt-flow (#3840)
|
2025-05-15 11:03:57 +08:00 |
|
cast.py
|
Update TensorRT-LLM (#787)
|
2024-01-02 17:54:32 +08:00 |
|
conv.py
|
Update TensorRT-LLM (#2873)
|
2025-03-11 21:13:42 +08:00 |
|
embedding.py
|
fix: #3137 speculative decoding and multimodal input support (#3276)
|
2025-04-09 23:40:19 +08:00 |
|
language_adapter.py
|
Update TensorRT-LLM (#2849)
|
2025-03-04 18:44:00 +08:00 |
|
linear.py
|
Update TensorRT-LLM (#2873)
|
2025-03-11 21:13:42 +08:00 |
|
lora.py
|
Update TensorRT-LLM (#2755)
|
2025-02-11 03:01:00 +00:00 |
|
mlp.py
|
Update TensorRT-LLM (#2936)
|
2025-03-18 21:25:19 +08:00 |
|
moe.py
|
[TRTLLM-3330][feat] Support DeepSeek-R1 W4A8 on Hopper (#4123)
|
2025-05-14 15:48:07 +08:00 |
|
normalization.py
|
Update TensorRT-LLM (#2849)
|
2025-03-04 18:44:00 +08:00 |
|
pooling.py
|
Update TensorRT-LLM (#787)
|
2024-01-02 17:54:32 +08:00 |
|
recurrent.py
|
Update TensorRT-LLM (#1954)
|
2024-07-16 15:30:25 +08:00 |
|
ssm.py
|
Update TensorRT-LLM (#2562)
|
2024-12-11 00:31:05 -08:00 |