[Bugfix] Guard for negative counter metrics to prevent crash (#10430)
Signed-off-by: Travis Johnson <tsjohnso@us.ibm.com>
This commit is contained in:
parent
74f8c2cf5f
commit
272e31c0bd
@ -1716,7 +1716,7 @@ class LLMEngine:
|
||||
# not counted (to avoid double counting)
|
||||
actual_num_batched_tokens = scheduler_outputs.num_batched_tokens # type: ignore
|
||||
|
||||
num_generation_tokens_from_prefill_groups = 0.
|
||||
num_generation_tokens_from_prefill_groups = 0
|
||||
# NOTE: if scheduler_outputs.num_prefill_groups > 0 and
|
||||
# the len of scheduler_outputs.scheduled_seq_groups is !=
|
||||
# scheduler_outputs.num_prefill_groups, this means that
|
||||
|
@ -512,6 +512,11 @@ class PrometheusStatLogger(StatLoggerBase):
|
||||
|
||||
def _log_counter(self, counter, data: Union[int, float]) -> None:
    """Add ``data`` to ``counter`` under this logger's labels.

    A negative ``data`` is never applied: a warning is logged and the
    counter is left untouched.

    Args:
        counter: Metric object exposing ``labels(**kwargs)``; the labelled
            child it returns must expose ``inc(amount)``.
        data: Amount to add to the counter.
    """
    is_negative = data < 0
    if is_negative:
        # The guard exists to prevent a ValueError from a negative
        # increment, so report the value and skip the update instead.
        logger.warning("Skipping negative increment of %g to %s", data,
                       counter)
    else:
        labelled_counter = counter.labels(**self.labels)
        labelled_counter.inc(data)
|
||||
|
||||
def _log_counter_labels(self, counter, data: CollectionsCounter,
|
||||
|
Loading…
x
Reference in New Issue
Block a user