"googlemock/git@developer.sourcefind.cn:yangql/googletest.git" did not exist on "44da2b9ac5dff919966d7bf488c7058bc8563023"
Commit 8b6fb721 authored by wangpengcheng's avatar wangpengcheng
Browse files

issue/199 fix evaluation metric

parent 571e0ba0
...@@ -223,11 +223,11 @@ class InferEngine(_infinilm.InferEngine): ...@@ -223,11 +223,11 @@ class InferEngine(_infinilm.InferEngine):
f" Batchsize={initial_batch_size} Per_Batch_Input_Len={initial_seqlen} Per_Batch_New_Tokens={len(time_measurements)}\n" f" Batchsize={initial_batch_size} Per_Batch_Input_Len={initial_seqlen} Per_Batch_New_Tokens={len(time_measurements)}\n"
) )
print( print(
f" Prefill TTFT: {round(time_measurements[0], 2)}ms Throughput: {round((initial_batch_size * initial_seqlen) / time_measurements[0], 2)}tok/s\n", f" Prefill TTFT: {round(time_measurements[0] * 1000, 2)} ms Throughput: {round((initial_batch_size * initial_seqlen) / time_measurements[0], 2)} tok/s\n",
) )
if len(time_measurements) > 1: if len(time_measurements) > 1:
print( print(
f" Decode Avg ITL: {round(sum(time_measurements[1:]) * 1000 / (len(time_measurements) - 1), 2)}ms Throughput: {round((initial_batch_size * (len(time_measurements) - 1)) / sum(time_measurements[1:]), 2)}tok/s\n", f" Decode Avg ITL: {round(sum(time_measurements[1:]) * 1000 / (len(time_measurements) - 1), 2)} ms Throughput: {round((initial_batch_size * (len(time_measurements) - 1)) / sum(time_measurements[1:]), 2)} tok/s\n",
) )
return output_ids return output_ids
......
Markdown is supported
0% or .
You are about to add 0 people to the discussion. Proceed with caution.
Finish editing this message first!
Please register or to comment