mirror of
https://github.com/NVIDIA/TensorRT-LLM.git
synced 2026-01-14 06:27:45 +08:00
| .. | ||
| xqa_kernel_cubin.h | ||
| xqa_kernel_dt_fp16_d_128_beam_1_kvt_fp16_nqpkv_8_sm_80.cubin.cpp | ||
| xqa_kernel_dt_fp16_d_128_beam_1_kvt_fp16_nqpkv_8_sm_86.cubin.cpp | ||
| xqa_kernel_dt_fp16_d_128_beam_1_kvt_fp16_nqpkv_8_sm_89.cubin.cpp | ||
| xqa_kernel_dt_fp16_d_128_beam_1_kvt_fp16_nqpkv_8_sm_90.cubin.cpp | ||