# Mirror of https://github.com/NVIDIA/TensorRT-LLM.git
# Synced 2026-01-26 21:53:30 +08:00
# 22 lines, 604 B, YAML
# Evaluation configuration with two top-level sections: `model` (the endpoint
# under test) and `evaluations` (the list of evaluation runs to perform).
# NOTE(review): the nesting below was reconstructed from a flattened copy of
# this file — confirm against the consumer's schema.

# Settings describing the model to evaluate.
model:
  model_type: llm
  llm_type: openai-apicompatible
  # Angle-bracket values are presumably placeholders to fill in before use.
  llm_name: <llm-name>
  container: null
  use_cache: false
  use_chat_endpoint: false
  is_hf_model: false
  tokenizer_path: <tokenizer-path>
  # Local endpoint on port 12478 under the /v1 path.
  base_url: http://localhost:12478/v1

# Evaluation runs; this file defines a single entry.
evaluations:
  - eval_type: automatic
    eval_subtype: bigcode_latest
    native_args: ""
    # Only the humaneval task is listed; the other per-task argument strings
    # below are left empty.
    standard_tasks: [humaneval]
    mbpp_task_args: ""
    humaneval_task_args: "--max_length_generation=768 --batch_size=1 --top_k=1 --top_p=0.00001 --temperature=0.00001 --n_samples=1 --num_chunks=1"
    transcoder_cpp_task_args: ""
    transcoder_java_task_args: ""