Unverified commit 1c304aa9, authored by Nicolas Castet, committed by GitHub
Browse files

Log iteration # for prefill and decode (#9366)

parent 770529a7
...@@ -123,7 +123,7 @@ class SchedulerMetricsMixin: ...@@ -123,7 +123,7 @@ class SchedulerMetricsMixin:
token_usage_msg = f"token usage: {token_usage:.2f}, " token_usage_msg = f"token usage: {token_usage:.2f}, "
f = ( f = (
f"Prefill batch. " f"Prefill batch [{self.forward_ct + 1}], "
f"#new-seq: {len(can_run_list)}, " f"#new-seq: {len(can_run_list)}, "
f"#new-token: {adder.log_input_tokens}, " f"#new-token: {adder.log_input_tokens}, "
f"#cached-token: {adder.log_hit_tokens}, " f"#cached-token: {adder.log_hit_tokens}, "
...@@ -246,7 +246,7 @@ class SchedulerMetricsMixin: ...@@ -246,7 +246,7 @@ class SchedulerMetricsMixin:
gap_latency / self.server_args.decode_log_interval gap_latency / self.server_args.decode_log_interval
) )
msg = f"Decode batch. #running-req: {num_running_reqs}, {token_usage_msg}" msg = f"Decode batch [{self.forward_ct}], #running-req: {num_running_reqs}, {token_usage_msg}"
if self.spec_algorithm.is_none(): if self.spec_algorithm.is_none():
spec_accept_length = 0 spec_accept_length = 0
......
Markdown is supported
0% Try again or attach a new file.
You are about to add 0 people to the discussion. Proceed with caution.
Finish editing this message first!
Please register or sign in to comment