mirror of
https://github.com/NVIDIA/TensorRT-LLM.git
synced 2026-01-14 06:27:45 +08:00
* refactoring the multimodal input prep
  Signed-off-by: Rakib Hasan <rhasan@nvidia.com>
* adding out-of-tree override option
  Signed-off-by: Rakib Hasan <rhasan@nvidia.com>
* adding exceptional case for llava-next
  Signed-off-by: Rakib Hasan <rhasan@nvidia.com>
* fixing typo
  Signed-off-by: Rakib Hasan <rhasan@nvidia.com>
* addressing review comments, adding placement option, handling tokenizer variations
  Signed-off-by: Rakib Hasan <rhasan@nvidia.com>
* addressing pytest-asyncio behavior change
  Signed-off-by: Rakib Hasan <rhasan@nvidia.com>
---------
Signed-off-by: Rakib Hasan <rhasan@nvidia.com>
21 lines
450 B
INI
21 lines
450 B
INI
# pytest configuration for this test directory.
# Multi-line values (pythonpath, env, markers) must stay indented: an
# unindented line is parsed as a new key, not as a continuation.
[pytest]
# Event-loop scope used for async fixtures that do not declare one
# (option name suggests pytest-asyncio -- confirm the plugin is installed).
asyncio_default_fixture_loop_scope = module

# Thread-leak detection; looks like the pytest-threadleak plugin -- confirm.
threadleak = True
# Regular expression; presumably thread names matching it are not reported.
threadleak_exclude = asyncio_\d+

# --durations=0 reports the duration of every test; -W ignore::... silences
# DeprecationWarning.
addopts = --durations=0 -W ignore::DeprecationWarning

# Extra directories added to sys.path, one per line, relative to this file's
# directory.
pythonpath =
    _torch/auto_deploy/_utils_test
    ../../examples/auto_deploy
    ../../examples/models/core
    ../../examples

# Environment variables for the test session (presumably pytest-env; there the
# "D:" prefix means "set only if not already defined" -- confirm).
env =
    D:AUTO_DEPLOY_LOG_LEVEL=INFO

# Registered custom markers, one per line; text after ':' is the description.
markers =
    part0
    part1
    part2
    part3
    part4
    gpu2: this test uses 2 GPUs
    gpu4: this test uses 4 GPUs