mirror of
https://github.com/NVIDIA/TensorRT-LLM.git
synced 2026-01-13 22:18:36 +08:00
Signed-off-by: yifei.w <yifei.w@bytedance.com>
This commit is contained in:
parent
fded6c393d
commit
9d1f2a9925
@@ -473,6 +473,7 @@ class ModelRunnerMixin:
|
||||
prompt_table,
|
||||
torch.Tensor), "Prompt table should be str or torch.Tensor"
|
||||
prompt_table_data = prompt_table.to(dtype=self.dtype)
|
||||
torch.cuda.current_stream().synchronize()
|
||||
|
||||
return prompt_table_data
|
||||
|
||||
|
||||
Loading…
Reference in New Issue
Block a user