100 lines
2.6 KiB
C++
100 lines
2.6 KiB
C++
/******************************************************************************
|
|
* Copyright (c) 2011-2017, NVIDIA CORPORATION. All rights reserved.
|
|
*
|
|
* Redistribution and use in source and binary forms, with or without
|
|
* modification, are not permitted.
|
|
*
|
|
* THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS "AS IS" AND
|
|
* ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE IMPLIED
|
|
* WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE ARE
|
|
* DISCLAIMED. IN NO EVENT SHALL NVIDIA CORPORATION BE LIABLE FOR ANY
|
|
* DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL DAMAGES
|
|
* (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES;
|
|
* LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION) HOWEVER CAUSED AND
|
|
* ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT
|
|
* (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE OF THIS
|
|
* SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
|
|
*
|
|
******************************************************************************/
|
|
|
|
#pragma once
|
|
|
|
/**
|
|
* \file
|
|
* GPU kernel timer
|
|
*/
|
|
|
|
#include <cuda_runtime.h>
|
|
|
|
#include <cutlass/util/debug.h>
|
|
|
|
namespace cutlass {
|
|
|
|
|
|
/******************************************************************************
|
|
* gpu_timer
|
|
******************************************************************************/
|
|
|
|
/**
|
|
* GPU event-based timer
|
|
*/
|
|
struct gpu_timer
|
|
{
|
|
cudaEvent_t _start;
|
|
cudaEvent_t _stop;
|
|
|
|
gpu_timer()
|
|
{
|
|
CUDA_PERROR_EXIT(cudaEventCreate(&_start));
|
|
CUDA_PERROR_EXIT(cudaEventCreate(&_stop));
|
|
}
|
|
|
|
~gpu_timer()
|
|
{
|
|
CUDA_PERROR_EXIT(cudaEventDestroy(_start));
|
|
CUDA_PERROR_EXIT(cudaEventDestroy(_stop));
|
|
}
|
|
|
|
void start()
|
|
{
|
|
CUDA_PERROR_EXIT(cudaEventRecord(_start, 0));
|
|
}
|
|
|
|
void stop()
|
|
{
|
|
CUDA_PERROR_EXIT(cudaEventRecord(_stop, 0));
|
|
}
|
|
|
|
float elapsed_millis()
|
|
{
|
|
float elapsed = 0.0;
|
|
CUDA_PERROR_EXIT(cudaEventSynchronize(_stop));
|
|
CUDA_PERROR_EXIT(cudaEventElapsedTime(&elapsed, _start, _stop));
|
|
return elapsed;
|
|
}
|
|
};
|
|
|
|
|
|
/******************************************************************************
|
|
* sleep_millis
|
|
******************************************************************************/
|
|
|
|
#ifdef _WIN32
|
|
#include <windows.h>
|
|
|
|
void sleep_millis(unsigned milliseconds)
|
|
{
|
|
Sleep(milliseconds);
|
|
}
|
|
#else
|
|
#include <unistd.h>
|
|
|
|
void sleep_millis(unsigned milliseconds)
|
|
{
|
|
usleep(milliseconds * 1000); // takes microseconds
|
|
}
|
|
#endif
|
|
|
|
|
|
} // namespace cutlass
|