// Copyright 2019-2020 Yan Yan
//
// Licensed under the Apache License, Version 2.0 (the "License");
// you may not use this file except in compliance with the License.
// You may obtain a copy of the License at
//
//     http://www.apache.org/licenses/LICENSE-2.0
//
// Unless required by applicable law or agreed to in writing, software
// distributed under the License is distributed on an "AS IS" BASIS,
// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
// See the License for the specific language governing permissions and
// limitations under the License.

#pragma once

// NOTE(review): this file arrived collapsed onto one line with every
// angle-bracketed token removed. The include targets and the template
// parameter lists below (including the std::chrono::microseconds default)
// were restored from how the names are used in the code -- confirm them
// against the upstream header before merging.
#include <chrono>
#include <cstddef>
#ifdef TV_CUDA
#include <cuda_runtime_api.h>
#endif
#include <iostream>

namespace tv {

#ifdef TV_CUDA
/// Wall-clock interval timer that calls cudaDeviceSynchronize() before every
/// clock reading, so an interval ends only after the device has been
/// synchronized.
///
/// @tparam TimeT std::chrono duration type the intervals are reported in.
template <typename TimeT = std::chrono::microseconds>
struct CudaContextTimer {
  /// Synchronizes the device, then starts the first interval.
  CudaContextTimer() {
    cudaDeviceSynchronize();
    mCurTime = std::chrono::steady_clock::now();
  }

  /// Synchronizes the device, then ends the current interval and starts the
  /// next one.
  ///
  /// @return Time since construction or the previous report(), as a TimeT
  ///         tick count.
  typename TimeT::rep report() {
    cudaDeviceSynchronize();
    // A single clock reading is both the end of this interval and the start
    // of the next, so nothing falls between two consecutive intervals.
    const auto now = std::chrono::steady_clock::now();
    const auto elapsed = std::chrono::duration_cast<TimeT>(now - mCurTime);
    mCurTime = now;
    return elapsed.count();
  }

  /// Calls f() Count times and averages the per-call time of the iterations
  /// whose index is >= start; earlier iterations are treated as warm-up.
  ///
  /// @tparam Count Number of times f is invoked.
  /// @param f      Callable taking no arguments.
  /// @param start  Index of the first iteration included in the average
  ///               (defaults to 30% of Count).
  /// @return Mean duration in TimeT ticks. The result is NaN when no
  ///         iteration is counted (start >= Count), because the sum is then
  ///         divided by zero.
  template <std::size_t Count, typename F>
  double benchmark(F &&f, int start = static_cast<int>(Count * 0.3)) {
    auto total = typename TimeT::rep();
    int measured = 0;
    // Reset the reference point (this also synchronizes the device) so the
    // first sample does not include time spent before benchmark() was called.
    report();
    for (int i = 0; i < static_cast<int>(Count); ++i) {
      // Invoke as an lvalue: f runs many times, so it must not be forwarded
      // as an rvalue on each iteration.
      f();
      const auto elapsed = report();
      if (i >= start) {
        total += elapsed;
        ++measured;
      }
    }
    return total / double(measured);
  }

private:
  // Start of the interval currently being measured.
  std::chrono::steady_clock::time_point mCurTime;
};
#endif

/// Wall-clock interval timer based on std::chrono::steady_clock.
///
/// @tparam TimeT std::chrono duration type the intervals are reported in.
template <typename TimeT = std::chrono::microseconds>
struct CPUTimer {
  /// Starts the first interval.
  CPUTimer() : mCurTime(std::chrono::steady_clock::now()) {}

  /// Ends the current interval and starts the next one.
  ///
  /// @return Time since construction or the previous report(), as a TimeT
  ///         tick count.
  typename TimeT::rep report() {
    // A single clock reading is both the end of this interval and the start
    // of the next, so nothing falls between two consecutive intervals.
    const auto now = std::chrono::steady_clock::now();
    const auto elapsed = std::chrono::duration_cast<TimeT>(now - mCurTime);
    mCurTime = now;
    return elapsed.count();
  }

private:
  // Start of the interval currently being measured.
  std::chrono::steady_clock::time_point mCurTime;
};

} // namespace tv