mirror of
https://github.com/NVIDIA/TensorRT-LLM.git
synced 2026-01-13 22:18:36 +08:00
Signed-off-by: Ye Zhang <zhysishu@gmail.com> Signed-off-by: Shunkang <182541032+Shunkangz@users.noreply.github.co>
16 lines
377 B
Python
16 lines
377 B
Python
from enum import Enum
|
|
|
|
|
|
class MetricNames(Enum):
|
|
TTFT = "ttft"
|
|
TPOT = "tpot"
|
|
E2E = "e2e"
|
|
REQUEST_QUEUE_TIME = "request_queue_time"
|
|
|
|
|
|
class RequestEventTiming(Enum):
|
|
ARRIVAL_TIME = "arrival_time"
|
|
FIRST_TOKEN_TIME = "first_token_time" # nosec: B105
|
|
FIRST_SCHEDULED_TIME = "first_scheduled_time"
|
|
LAST_TOKEN_TIME = "last_token_time" # nosec: B105
|