# Mirror of https://github.com/vllm-project/vllm.git
# Synced: 2026-06-06 00:16:14 +00:00
# Revision: 3e77036768
# Signed-off-by: Andreas Karatzas <akaratza@amd.com>
# Original blob: 7 lines, 211 B, YAML
# Evaluation settings for a single quantized model.
# NOTE(review): 1319 questions with few-shot prompting looks like a GSM8K
# run -- confirm against the code that loads this file.
model_name: "nm-testing/Qwen1.5-MoE-A2.7B-Chat-quantized.w4a16"
# Presumably the minimum score the run must reach to pass -- confirm.
accuracy_threshold: 0.45
num_questions: 1319
num_fewshot: 5
# Presumably applied only on ROCm runs (1800 s = 30 min) -- verify.
rocm_request_timeout_seconds: 1800
# Presumably extra command-line flags handed to the server -- confirm.
server_args: "--enforce-eager --max-model-len 4096"