TensorRT-LLMs/tests/unittest/llmapi/fake.sh
Kaiyu Xie dfbcb543ce
doc: fix path after examples migration (#3814)
Signed-off-by: Kaiyu Xie <26294424+kaiyux@users.noreply.github.com>
2025-04-24 02:36:45 +08:00

19 lines
387 B
Bash

#!/bin/bash
# Fake a 1-layer LLaMA model for CI: run the LLaMA build.py example with
# --n_layer 1, then copy the tokenizer files next to the build output.
#
# Usage: fake.sh <hf_model_dir> <engine_dir>
#   hf_model_dir  directory whose tokenizer* files are copied into engine_dir
#   engine_dir    passed to build.py as --output_dir; also the destination
#                 of the copied tokenizer files
#
# NOTE: the build.py path below is relative to the caller's current working
# directory, not to the location of this script.
# NOTE(review): presumably build.py creates engine_dir itself; this script
# does not create it -- confirm against build.py.
set -ex

# Abort early with a usage message when an argument is missing or empty;
# otherwise --output_dir would receive no value and the cp glob would
# degrade to "/tokenizer*".
hf_model_dir=${1:?"usage: $0 <hf_model_dir> <engine_dir>"}
engine_dir=${2:?"usage: $0 <hf_model_dir> <engine_dir>"}

python3 ../../examples/models/core/llama/build.py \
  --use_gemm_plugin \
  --enable_context_fmha \
  --use_gpt_attention_plugin \
  --paged_kv_cache \
  --remove_input_padding \
  --n_layer 1 \
  --dtype float16 \
  --output_dir "$engine_dir"

# Quote the directory parts so paths containing spaces or glob characters
# survive; only the trailing tokenizer* is left unquoted to glob.
# "--" stops option parsing in case a path starts with "-".
cp -- "$hf_model_dir"/tokenizer* "$engine_dir"