mirror of
https://github.com/NVIDIA/TensorRT-LLM.git
synced 2026-01-14 06:27:45 +08:00
[None][chore] remove out-of-date comment in star attention test (#6773)
Signed-off-by: Superjomn <328693+Superjomn@users.noreply.github.com>
This commit is contained in:
parent
864ddb3289
commit
0326ea3698
@@ -53,7 +53,6 @@ def similarity_score(a, b):
|
||||
return SequenceMatcher(None, a, b).ratio()
|
||||
|
||||
|
||||
# Generate the outputs using either TRT or PyTorch (based on the use_pytorch argument). It’s the same function for both workflows.
|
||||
def generate_llm_outputs(args, data, fp8=False, fp8_kv_cache=False):
|
||||
kv_cache_config = KvCacheConfig(dtype="fp8" if fp8_kv_cache else "auto")
|
||||
cp_config = {
|
||||
|
||||
Loading…
Reference in New Issue
Block a user