|
|
@ -2,8 +2,32 @@ |
|
|
|
#include "OpenCLHandler.h" |
|
|
|
#include <iostream> |
|
|
|
|
|
|
|
void OpenCLHandler::printTimeStats(cl::Event& event) |
|
|
|
{ |
|
|
|
cl_int err = CL_SUCCESS; |
|
|
|
event.wait(); |
|
|
|
cl_ulong execStart, execEnd; |
|
|
|
execStart = event.getProfilingInfo<CL_PROFILING_COMMAND_START>(&err); |
|
|
|
if (err != CL_SUCCESS) |
|
|
|
{ |
|
|
|
std::cerr << "Error during profile query: CL_PROFILING_COMMAND_START [" |
|
|
|
<< err << "]." << std::endl; |
|
|
|
} |
|
|
|
execEnd = event.getProfilingInfo<CL_PROFILING_COMMAND_END>(&err); |
|
|
|
if (err != CL_SUCCESS) |
|
|
|
{ |
|
|
|
std::cerr << "Error during profile query: CL_PROFILING_COMMAND_END [" |
|
|
|
<< err << "]." << std::endl; |
|
|
|
} |
|
|
|
//std::cout << "[start] " << execStart << " [end] " << execEnd
|
|
|
|
// << " [time] " << (execEnd - execStart) / 1e+06 << "ms." << std::endl;
|
|
|
|
std::cout << "GPU [time] " << (execEnd - execStart) / 1e+06 << " ms" << |
|
|
|
std::endl; |
|
|
|
} |
|
|
|
|
|
|
|
OpenCLHandler::OpenCLHandler() |
|
|
|
{ |
|
|
|
|
|
|
|
cl_int err = CL_SUCCESS; |
|
|
|
|
|
|
|
// Get a platform ID
|
|
|
@ -15,7 +39,7 @@ OpenCLHandler::OpenCLHandler() |
|
|
|
exit(-1); |
|
|
|
} |
|
|
|
|
|
|
|
std::cout << platforms[0].getInfo<CL_PLATFORM_NAME>() << std::endl; |
|
|
|
std::cout << "Running on: " << platforms[0].getInfo<CL_PLATFORM_NAME>() << std::endl; |
|
|
|
|
|
|
|
// Create a context
|
|
|
|
cl_context_properties properties[] = |
|
|
@ -24,13 +48,14 @@ OpenCLHandler::OpenCLHandler() |
|
|
|
|
|
|
|
// Enumerate the devices
|
|
|
|
std::vector<cl::Device> devices = context.getInfo<CL_CONTEXT_DEVICES>(); |
|
|
|
std::cout << devices[0].getInfo<CL_DEVICE_GLOBAL_MEM_SIZE>() << std::endl; |
|
|
|
std::cout << "Global memory: " << devices[0].getInfo<CL_DEVICE_GLOBAL_MEM_SIZE>() << std::endl; |
|
|
|
|
|
|
|
max_workgroup_size = devices[0].getInfo<CL_DEVICE_MAX_WORK_GROUP_SIZE>(); |
|
|
|
std::cout << "Max workgroup: " << max_workgroup_size << std::endl << std::endl; |
|
|
|
|
|
|
|
// Create the command queue
|
|
|
|
cl::Event event; |
|
|
|
queue = cl::CommandQueue(context, devices[0], 0, &err); |
|
|
|
queue = cl::CommandQueue(context, devices[0], CL_QUEUE_PROFILING_ENABLE, &err); |
|
|
|
// Create the OpenCL program
|
|
|
|
std::string programSource = FileToString("../kernels/programs.cl"); |
|
|
|
program = cl::Program(context, programSource); |
|
|
@ -39,13 +64,15 @@ OpenCLHandler::OpenCLHandler() |
|
|
|
|
|
|
|
bool OpenCLHandler::run_test(TestCase* test) |
|
|
|
{ |
|
|
|
cl::Event event; |
|
|
|
cl::Event gpuEvent; |
|
|
|
|
|
|
|
test->gpu_compute(&context, &queue, &program, &event); |
|
|
|
test->gpu_compute(&context, &queue, &program, &gpuEvent); |
|
|
|
|
|
|
|
Timer::measure([&]() { |
|
|
|
test->cpu_compute(); |
|
|
|
}, 5); |
|
|
|
|
|
|
|
event.wait(); |
|
|
|
printTimeStats(gpuEvent); |
|
|
|
|
|
|
|
test->collect_results(&queue); |
|
|
|
|
|
|
|