|
common.h
|
Update TensorRT-LLM (#708)
|
2023-12-20 16:38:28 +08:00 |
|
enabled.h
|
Updates for release/0.5.0
|
2023-10-15 21:26:20 +08:00 |
|
kernel.h
|
Update TensorRT-LLM (#708)
|
2023-12-20 16:38:28 +08:00 |
|
kernelLauncher.cu
|
Update TensorRT-LLM (#506)
|
2023-11-30 16:46:22 +08:00 |
|
kernelLauncher.h
|
Update TensorRT-LLM (#506)
|
2023-11-30 16:46:22 +08:00 |
|
utility.h
|
Update code
|
2023-09-28 09:00:05 -07:00 |
|
weightOnlyBatchedGemvBs1Int4b.cu
|
Update TensorRT-LLM (#506)
|
2023-11-30 16:46:22 +08:00 |
|
weightOnlyBatchedGemvBs1Int8b.cu
|
Update TensorRT-LLM (#506)
|
2023-11-30 16:46:22 +08:00 |
|
weightOnlyBatchedGemvBs2Int4b.cu
|
Update TensorRT-LLM (#506)
|
2023-11-30 16:46:22 +08:00 |
|
weightOnlyBatchedGemvBs2Int8b.cu
|
Update TensorRT-LLM (#506)
|
2023-11-30 16:46:22 +08:00 |
|
weightOnlyBatchedGemvBs3Int4b.cu
|
Update TensorRT-LLM (#506)
|
2023-11-30 16:46:22 +08:00 |
|
weightOnlyBatchedGemvBs3Int8b.cu
|
Update TensorRT-LLM (#506)
|
2023-11-30 16:46:22 +08:00 |
|
weightOnlyBatchedGemvBs4Int4b.cu
|
Update TensorRT-LLM (#506)
|
2023-11-30 16:46:22 +08:00 |
|
weightOnlyBatchedGemvBs4Int8b.cu
|
Update TensorRT-LLM (#506)
|
2023-11-30 16:46:22 +08:00 |