TensorRT-LLMs/examples/serve/aiperf_client_for_multimodal.sh
Yechan Kim 36cb5f8c93
[https://nvbugs/5747920][fix] Fix multimodal serve test (#11296)
Signed-off-by: yechank <161688079+yechank-nvidia@users.noreply.github.com>
2026-02-05 15:12:53 +09:00

20 lines
559 B
Bash

#!/usr/bin/env bash
#
# Runs a single `aiperf profile` session against the chat endpoint at
# localhost:8000 for the model name Qwen2.5-VL-3B-Instruct, using the
# synthetic-input and image options listed in the command below.
#
# Environment:
#   AIPERF_TOKENIZER_PATH  Optional. Value passed to --tokenizer; falls back to
#                          Qwen/Qwen2.5-VL-3B-Instruct when unset or empty.
#
# Output:
#   aiperf is given --profile-export-file my_profile_export.json (a relative
#   path, so it is resolved by aiperf from wherever this script is run).
#
# Exit status: that of the aiperf command.
set -euo pipefail

# The tokenizer expansion is quoted so that a path containing spaces or glob
# characters reaches aiperf as one argument instead of being word-split.
aiperf profile \
  -m Qwen2.5-VL-3B-Instruct \
  --tokenizer "${AIPERF_TOKENIZER_PATH:-Qwen/Qwen2.5-VL-3B-Instruct}" \
  --endpoint-type chat \
  --random-seed 123 \
  --image-width-mean 64 \
  --image-height-mean 64 \
  --image-format png \
  --synthetic-input-tokens-mean 128 \
  --synthetic-input-tokens-stddev 0 \
  --output-tokens-mean 128 \
  --output-tokens-stddev 0 \
  --request-count 5 \
  --request-rate 1 \
  --profile-export-file my_profile_export.json \
  --url localhost:8000 \
  --streaming