Unverified commit 09c624ce, authored by del-zhenwu and committed by GitHub
Browse files

Fix typo in profile_serving.py (#183)

parent 7e0b75bb
...@@ -169,7 +169,7 @@ def main(tritonserver_addr: str, ...@@ -169,7 +169,7 @@ def main(tritonserver_addr: str,
first_token_latency_max = np.max(stats[:, 0], axis=0) first_token_latency_max = np.max(stats[:, 0], axis=0)
first_token_latency_ave = np.mean(stats[:, 0], axis=0) first_token_latency_ave = np.mean(stats[:, 0], axis=0)
throughput = np.sum(stats[:, 1], axis=0) / elapsed_time throughput = np.sum(stats[:, 1], axis=0) / elapsed_time
print(f'\n{"-" * 50}\ncocurrency: {concurrency}\n' print(f'\n{"-" * 50}\nconcurrency: {concurrency}\n'
f'elapsed_time: {elapsed_time:.2f}s\n' f'elapsed_time: {elapsed_time:.2f}s\n'
f'first_token latency(min, max, ave): ' f'first_token latency(min, max, ave): '
f'{first_token_latency_min:.2f}s, {first_token_latency_max:.2f}s, ' f'{first_token_latency_min:.2f}s, {first_token_latency_max:.2f}s, '
......
Markdown is supported
0% Try again or attach a new file.
You are about to add 0 people to the discussion. Proceed with caution.
Finish editing this message first!
Please register or sign in to comment