mirror of
https://github.com/NVIDIA/TensorRT-LLM.git
synced 2026-01-14 06:27:45 +08:00
Signed-off-by: Jatin Gangani <jgangani@dc2-container-xterm-014.prd.it.nvidia.com> Co-authored-by: Jatin Gangani <jgangani@dc2-container-xterm-014.prd.it.nvidia.com> |
||
|---|---|---|
| .. | ||
| deepseek-r1-deepgemm.yaml | ||
| deepseek-r1-latency.yaml | ||
| deepseek-r1-throughput.yaml | ||
| gpt-oss-120b-latency.yaml | ||
| gpt-oss-120b-throughput.yaml | ||
| llama-3.3-70b.yaml | ||
| llama-4-scout.yaml | ||
| qwen3-disagg-prefill.yaml | ||
| qwen3-next.yaml | ||
| qwen3.yaml | ||