Unverified commit 8442f1ac, authored by Daniël de Kok and committed by GitHub
Browse files

benchmark: fix prefill throughput (#2741)

parent ca4f46dd
...
@@ -180,7 +180,7 @@ async fn prefill(
     let latency = start_time.elapsed();
     // Compute throughput from latency and batch size
-    let throughput = batch_size as f64 / latency.as_secs_f64();
+    let throughput = (batch_size * sequence_length) as f64 / latency.as_secs_f64();
     // Decode batch cannot be empty
     let decode_batch = decode_batch.expect("decode_batch is None. This is a bug.");
......
Markdown is supported
0% or .
You are about to add 0 people to the discussion. Proceed with caution.
Finish editing this message first!
Please register or sign in to comment