mirror of
https://github.com/NVIDIA/TensorRT-LLM.git
synced 2026-01-14 06:27:45 +08:00
Refine attention backend interface. Signed-off-by: Yuxian Qiu <142763828+yuxianq@users.noreply.github.com>
19 lines
375 B
INI
19 lines
375 B
INI
# pytest configuration for this test directory.
# Relative paths below are written relative to this file's location.
[pytest]
# Thread-leak checking switched on for every test
# (presumably consumed by the pytest-threadleak plugin; confirm it is installed).
threadleak = True
# Regular expression of thread names that the thread-leak check ignores.
threadleak_exclude = asyncio_\d+
# Extra command-line options: report the duration of every test and
# silence DeprecationWarning.
addopts = --durations=0 -W ignore::DeprecationWarning
# Directories added to the import path for the test session, one per line.
pythonpath =
    _torch/auto_deploy/_utils_test
    ../../examples/auto_deploy
    ../../examples
# Environment variables set for the test run, one per line.
# NOTE(review): the "D:" prefix looks like pytest-env's "default" flag
# (apply only when the variable is not already set); confirm against the plugin.
env =
    D:AUTO_DEPLOY_LOG_LEVEL=INFO
# Custom markers registered with pytest, one per line ("name" or "name: description").
markers =
    part0
    part1
    part2
    part3
    part4
    gpu2: this test uses 2 GPUs
    gpu4: this test uses 4 GPUs