TensorRT-LLMs/tests/hlapi/test_llm_download.py
Kaiyu Xie bca9a33b02
Update TensorRT-LLM (#2008)
* Update TensorRT-LLM

---------

Co-authored-by: Timur Abishev <abishev.timur@gmail.com>
Co-authored-by: MahmoudAshraf97 <hassouna97.ma@gmail.com>
Co-authored-by: Saeyoon Oh <saeyoon.oh@furiosa.ai>
Co-authored-by: hattizai <hattizai@gmail.com>
2024-07-23 23:05:09 +08:00

38 lines
998 B
Python

from tensorrt_llm.hlapi import LLM
from tensorrt_llm.hlapi.utils import (download_hf_model,
download_hf_pretrained_config)
try:
from .test_llm import llama_model_path
except ImportError:
from .test_llm import llama_model_path
prompts = ["A B C"]
model_name = "TinyLlama/TinyLlama-1.1B-Chat-v1.0"
def test_llm_with_model_downloaded():
llm = LLM(model=model_name, enable_build_cache=True)
for output in llm.generate(prompts):
print(output)
def test_llm_with_tokenizer_downloaded():
llm = LLM(model=llama_model_path, tokenizer=model_name)
for output in llm.generate(prompts):
print(output)
def test_download_config():
path0 = download_hf_pretrained_config(model_name)
print(f"download config to {path0}")
path1 = download_hf_model(model_name)
print(f"download model to {path1}")
assert path0 == path1
if __name__ == "__main__":
test_download_config()
test_llm_with_model_downloaded()