| .. |
|
auto_deploy
|
test: reorganize tests folder hierarchy (#2996)
|
2025-03-27 12:07:53 +08:00 |
|
compilation
|
Update (#2978)
|
2025-03-23 16:39:35 +08:00 |
|
modeling
|
test: reorganize tests folder hierarchy (#2996)
|
2025-03-27 12:07:53 +08:00 |
|
multi_gpu
|
None - Add one-shot version for UB AR NORM FP16/BF16 (#2995)
|
2025-03-31 11:16:03 +08:00 |
|
multi_gpu_modeling
|
move BuildConfig functional args to llmargs (#3036)
|
2025-03-29 02:20:18 +08:00 |
|
speculative
|
Add initial EAGLE-3 implementation (#3035)
|
2025-03-29 22:31:24 +08:00 |
|
thop
|
test: reorganize tests folder hierarchy (#2996)
|
2025-03-27 12:07:53 +08:00 |
|
helpers.py
|
Update TensorRT-LLM (#2936)
|
2025-03-18 21:25:19 +08:00 |
|
pattern_watcher.py
|
Update TensorRT-LLM (#2936)
|
2025-03-18 21:25:19 +08:00 |
|
test_attention.py
|
test: reorganize tests folder hierarchy (#2996)
|
2025-03-27 12:07:53 +08:00 |
|
test_autotuner.py
|
Update (#2978)
|
2025-03-23 16:39:35 +08:00 |
|
test_flashinfer_attention.py
|
Update (#2978)
|
2025-03-23 16:39:35 +08:00 |
|
test_flashinfer_star_attn.py
|
Update (#2978)
|
2025-03-23 16:39:35 +08:00 |
|
test_fp4_bmm_quantize.py
|
test: reorganize tests folder hierarchy (#2996)
|
2025-03-27 12:07:53 +08:00 |
|
test_fp4_gemm_quantize.py
|
test: reorganize tests folder hierarchy (#2996)
|
2025-03-27 12:07:53 +08:00 |
|
test_fp4_linear.py
|
test: reorganize tests folder hierarchy (#2996)
|
2025-03-27 12:07:53 +08:00 |
|
test_fp8_block_scale_gemm.py
|
test: reorganize tests folder hierarchy (#2996)
|
2025-03-27 12:07:53 +08:00 |
|
test_fp8_linear.py
|
test: reorganize tests folder hierarchy (#2996)
|
2025-03-27 12:07:53 +08:00 |
|
test_fp8_quantize.py
|
test: reorganize tests folder hierarchy (#2996)
|
2025-03-27 12:07:53 +08:00 |
|
test_fused_moe.py
|
test: reorganize tests folder hierarchy (#2996)
|
2025-03-27 12:07:53 +08:00 |
|
test_moe_routing.py
|
Update TensorRT-LLM (#2936)
|
2025-03-18 21:25:19 +08:00 |
|
test_moe.py
|
test: reorganize tests folder hierarchy (#2996)
|
2025-03-27 12:07:53 +08:00 |
|
test_overlap_scheduler_input.json
|
Update TensorRT-LLM (#2936)
|
2025-03-18 21:25:19 +08:00 |
|
test_overlap_scheduler.py
|
Update TensorRT-LLM (#2936)
|
2025-03-18 21:25:19 +08:00 |
|
test_pytorch_model_engine.py
|
Update (#2978)
|
2025-03-23 16:39:35 +08:00 |
|
test_vanilla_attention.py
|
Update (#2978)
|
2025-03-23 16:39:35 +08:00 |