| .. |
|
sm90
|
Update TensorRT-LLM (#1098)
|
2024-02-18 15:48:08 +08:00 |
|
common.h
|
Update TensorRT-LLM (#1098)
|
2024-02-18 15:48:08 +08:00 |
|
enabled.h
|
Update TensorRT-LLM (#1098)
|
2024-02-18 15:48:08 +08:00 |
|
kernel.h
|
Update TensorRT-LLM (#787)
|
2024-01-02 17:54:32 +08:00 |
|
kernelLauncher.cu
|
Update TensorRT-LLM (#787)
|
2024-01-02 17:54:32 +08:00 |
|
kernelLauncher.h
|
Update TensorRT-LLM (#787)
|
2024-01-02 17:54:32 +08:00 |
|
utility.h
|
Update TensorRT-LLM (#787)
|
2024-01-02 17:54:32 +08:00 |
|
weightOnlyBatchedGemvBs1Int4b.cu
|
Update TensorRT-LLM (#787)
|
2024-01-02 17:54:32 +08:00 |
|
weightOnlyBatchedGemvBs1Int8b.cu
|
Update TensorRT-LLM (#787)
|
2024-01-02 17:54:32 +08:00 |
|
weightOnlyBatchedGemvBs2Int4b.cu
|
Update TensorRT-LLM (#787)
|
2024-01-02 17:54:32 +08:00 |
|
weightOnlyBatchedGemvBs2Int8b.cu
|
Update TensorRT-LLM (#787)
|
2024-01-02 17:54:32 +08:00 |
|
weightOnlyBatchedGemvBs3Int4b.cu
|
Update TensorRT-LLM (#787)
|
2024-01-02 17:54:32 +08:00 |
|
weightOnlyBatchedGemvBs3Int8b.cu
|
Update TensorRT-LLM (#787)
|
2024-01-02 17:54:32 +08:00 |
|
weightOnlyBatchedGemvBs4Int4b.cu
|
Update TensorRT-LLM (#787)
|
2024-01-02 17:54:32 +08:00 |
|
weightOnlyBatchedGemvBs4Int8b.cu
|
Update TensorRT-LLM (#787)
|
2024-01-02 17:54:32 +08:00 |