Commit d5a0fda9 authored by zhuwenwen
Browse files

remove performance output

parent fed04a1c
......@@ -505,9 +505,9 @@ void llama_example(const INIReader reader)
vocab_size,
((end.tv_sec - start.tv_sec) * 1000 + (end.tv_usec - start.tv_usec) * 0.001) / ite);
float total_time;
total_time = ((end.tv_sec - start.tv_sec) * 1000 + (end.tv_usec - start.tv_usec) * 0.001) / ite / 1000;
printf("[INFO] performance: %.2f tokens/sec \n", (request_batch_size * request_output_len) / total_time);
// float total_time;
// total_time = ((end.tv_sec - start.tv_sec) * 1000 + (end.tv_usec - start.tv_usec) * 0.001) / ite / 1000;
// printf("[INFO] performance: %.2f tokens/sec \n", (request_batch_size * request_output_len) / total_time);
ftNcclParamDestroy(tensor_para);
ftNcclParamDestroy(pipeline_para);
......
Markdown is supported
0% or .
You are about to add 0 people to the discussion. Proceed with caution.
Finish editing this message first!
Please register or sign in to comment