mirror of
https://github.com/vllm-project/vllm.git
synced 2026-06-06 00:16:14 +00:00
[Metrics] Exclude KV transfer tokens from iteration_tokens_total (#43346)
Signed-off-by: Tyler Michael Smith <tlrmchlsmth@gmail.com>
Co-authored-by: Claude Opus 4.6 (1M context) <noreply@anthropic.com>
This commit is contained in:
committed by
GitHub
parent
5dbf1605a0
commit
38b864d81d
@@ -1161,7 +1161,8 @@ class PrometheusStatLogger(AggregateStatLoggerBase):
             iteration_stats.num_generation_tokens
         )
         self.histogram_iteration_tokens[engine_idx].observe(
-            iteration_stats.num_prompt_tokens + iteration_stats.num_generation_tokens
+            iteration_stats.prompt_token_stats.computed
+            + iteration_stats.num_generation_tokens
         )
 
         for max_gen_tokens in iteration_stats.max_num_generation_tokens_iter:
Reference in New Issue
Block a user