Browse Source

Measurements

master
Daniel Gyulai 3 years ago
parent
commit
2cc11eff4a
  1. 21
      Common/OpenCLHandler.cpp
  2. 11
      Linear/Jacobi.cpp
  3. 7
      Linear/Large.cpp
  4. 20
      Linear/Linear.cpp
  5. 16
      Linear/LinearTests.h
  6. 7
      Linear/Reduce.cpp
  7. 8
      Linear/Simple.cpp

21
Common/OpenCLHandler.cpp

@ -7,22 +7,31 @@ void OpenCLHandler::printTimeStats(cl::Event& event)
cl_int err = CL_SUCCESS; cl_int err = CL_SUCCESS;
event.wait(); event.wait();
cl_ulong execStart, execEnd; cl_ulong execStart, execEnd;
bool success = true;
execStart = event.getProfilingInfo<CL_PROFILING_COMMAND_START>(&err); execStart = event.getProfilingInfo<CL_PROFILING_COMMAND_START>(&err);
if (err != CL_SUCCESS) if (err != CL_SUCCESS)
{ {
std::cerr << "Error during profile query: CL_PROFILING_COMMAND_START [" //std::cerr << "Error during profile query: CL_PROFILING_COMMAND_START ["
<< err << "]." << std::endl; //<< err << "]." << std::endl;
success = false;
} }
execEnd = event.getProfilingInfo<CL_PROFILING_COMMAND_END>(&err); execEnd = event.getProfilingInfo<CL_PROFILING_COMMAND_END>(&err);
if (err != CL_SUCCESS) if (err != CL_SUCCESS)
{ {
std::cerr << "Error during profile query: CL_PROFILING_COMMAND_END [" //std::cerr << "Error during profile query: CL_PROFILING_COMMAND_END ["
<< err << "]." << std::endl; //<< err << "]." << std::endl;
success = false;
} }
//std::cout << "[start] " << execStart << " [end] " << execEnd //std::cout << "[start] " << execStart << " [end] " << execEnd
// << " [time] " << (execEnd - execStart) / 1e+06 << "ms." << std::endl; // << " [time] " << (execEnd - execStart) / 1e+06 << "ms." << std::endl;
std::cout << "GPU [time] " << (execEnd - execStart) / 1e+06 << " ms" << if (success){
std::endl; std::cout << "GPU [time] " << (execEnd - execStart) / 1e+06 << " ms" <<
std::endl;
}
else {
std::cout << "GPU [time] Unavailable" << std::endl;
}
} }
OpenCLHandler::OpenCLHandler(std::string kernelcode) OpenCLHandler::OpenCLHandler(std::string kernelcode)

11
Linear/Jacobi.cpp

@ -74,9 +74,10 @@ MatrixVectorMultiplier* Jacobi::MethodFactory(MVType type, cl::Context* context,
} }
} }
Jacobi::Jacobi(MVType _type) Jacobi::Jacobi(int n, MVType _type)
{ {
type = _type; type = _type;
Jn = n;
generateLinEq(); generateLinEq();
} }
@ -88,22 +89,22 @@ void Jacobi::gpu_compute(cl::Context* context, cl::CommandQueue* queue, cl::Prog
{ {
MatrixVectorMultiplier* MVMultiplier = MethodFactory(type, context, queue, program); MatrixVectorMultiplier* MVMultiplier = MethodFactory(type, context, queue, program);
cl_ulong time = 0;
if (MVMultiplier != NULL) { if (MVMultiplier != NULL) {
int inputBuffer = 0; int inputBuffer = 0;
const int iterations = 20; const int iterations = 20;
for (int i = 0; i < iterations; ++i) { for (int i = 0; i < iterations; ++i) {
MVMultiplier->dewIt(Jn, Jn, Jx_g[(inputBuffer + 1) % 2], JA_g, Jx_g[inputBuffer], Jb_g); time += MVMultiplier->dewIt(Jn, Jn, Jx_g[(inputBuffer + 1) % 2], JA_g, Jx_g[inputBuffer], Jb_g);
printMatrix(1, Jn, Jx_g[inputBuffer]);
inputBuffer = (inputBuffer + 1) % 2; inputBuffer = (inputBuffer + 1) % 2;
//printMatrix(1, Jn, Jx_g[inputBuffer]);
} }
} }
else { else {
std::cout << "Invalid factory parameter" << std::endl; std::cout << "Invalid factory parameter" << std::endl;
exit(-1); exit(-1);
} }
std::cout << "Jacobi>" << MVMultiplier->getName() << "@" << Jn << ": " << time / 1e+06 << " ms" << std::endl;
} }

7
Linear/Large.cpp

@ -6,9 +6,10 @@ Large::Large(cl::Context* _context, cl::CommandQueue* _queue, cl::Program* _prog
context = _context; context = _context;
queue = _queue; queue = _queue;
program = _program; program = _program;
name = "Large";
} }
void Large::dewIt(int n, int m, float* y, const float* A, const float* x, const float* b) cl_ulong Large::dewIt(int n, int m, float* y, const float* A, const float* x, const float* b)
{ {
cl_int err = CL_SUCCESS; cl_int err = CL_SUCCESS;
cl::Event _event; cl::Event _event;
@ -49,6 +50,10 @@ void Large::dewIt(int n, int m, float* y, const float* A, const float* x, const
queue->enqueueNDRangeKernel(kernel, cl::NullRange, cl::NDRange(Z*T, 1), cl::NDRange(T * Z, 1), NULL, &_event); queue->enqueueNDRangeKernel(kernel, cl::NullRange, cl::NDRange(Z*T, 1), cl::NDRange(T * Z, 1), NULL, &_event);
_event.wait(); _event.wait();
cl_ulong execStart, execEnd;
execStart = _event.getProfilingInfo<CL_PROFILING_COMMAND_START>(&err);
execEnd = _event.getProfilingInfo<CL_PROFILING_COMMAND_END>(&err);
queue->enqueueReadBuffer(YBuffer, true, 0, sizeof(float) * n, y); queue->enqueueReadBuffer(YBuffer, true, 0, sizeof(float) * n, y);
return (execEnd - execStart);
} }

20
Linear/Linear.cpp

@ -60,10 +60,15 @@ int main()
capi(); capi();
//cppapi(); //cppapi();
OpenCLHandler handler("../kernels/linear.cl"); OpenCLHandler handler("../kernels/linear.cl");
//Jacobi j(MVType::ReduceMV);
//Jacobi j(MVType::SimpleMV); handler.run_test(new Jacobi(64, MVType::SimpleMV));
//Jacobi j(MVType::LargeMV); //handler.run_test(new Jacobi(64, MVType::ReduceMV));
//handler.run_test(&j); //handler.run_test(new Jacobi(64, MVType::LargeMV));
//for (int n = 256; n <= 1024; n = n * 2) {
// handler.run_test(new Jacobi(n, MVType::SimpleMV));
// handler.run_test(new Jacobi(n, MVType::LargeMV));
//}
int GAn = 4; int GAn = 4;
int GAm = 3; int GAm = 3;
@ -77,10 +82,11 @@ int main()
float GB[] = { 2, -1, 0, 1, 0, 0, float GB[] = { 2, -1, 0, 1, 0, 0,
-1, 2, -1, 0, 1, 0, -1, 2, -1, 0, 1, 0,
0, -1, 2, 0, 0, 1 }; 0, -1, 2, 0, 0, 1 };
Gauss g1(GAn, GAm, GA);
Gauss g2(GBn, GBm, GB);
Gauss g(GBn, GBm, GB); //handler.run_test(&g1);
//handler.run_test(&g2);
handler.run_test(&g);
return 0; return 0;
} }

16
Linear/LinearTests.h

@ -12,13 +12,17 @@ protected:
cl::Context* context; cl::Context* context;
cl::CommandQueue* queue; cl::CommandQueue* queue;
cl::Program* program; cl::Program* program;
std::string name;
public: public:
virtual void dewIt(int n, int m, float* y, const float* A, const float* x, const float* b) = 0; virtual cl_ulong dewIt(int n, int m, float* y, const float* A, const float* x, const float* b) = 0;
std::string getName() {
return name;
}
}; };
class Jacobi : public TestCase { class Jacobi : public TestCase {
private: private:
const int Jn = 8; int Jn;
// CPU // CPU
float* Jx_c[2] = { NULL, NULL }; float* Jx_c[2] = { NULL, NULL };
float* JA_c = NULL; float* JA_c = NULL;
@ -35,7 +39,7 @@ private:
void printMatrix(int n, int m, float* A); void printMatrix(int n, int m, float* A);
MatrixVectorMultiplier* MethodFactory(MVType type, cl::Context* context, cl::CommandQueue* queue, cl::Program* program); MatrixVectorMultiplier* MethodFactory(MVType type, cl::Context* context, cl::CommandQueue* queue, cl::Program* program);
public: public:
Jacobi(MVType type); Jacobi(int n, MVType type);
void collect_results(cl::CommandQueue* queue); void collect_results(cl::CommandQueue* queue);
void gpu_compute(cl::Context* context, cl::CommandQueue* queue, cl::Program* program, cl::Event* Event); void gpu_compute(cl::Context* context, cl::CommandQueue* queue, cl::Program* program, cl::Event* Event);
void cpu_compute(); void cpu_compute();
@ -61,17 +65,17 @@ public:
class Simple : public MatrixVectorMultiplier { class Simple : public MatrixVectorMultiplier {
public: public:
Simple(cl::Context* context, cl::CommandQueue* queue, cl::Program* program); Simple(cl::Context* context, cl::CommandQueue* queue, cl::Program* program);
void dewIt(int n, int m, float* y, const float* A, const float* x, const float* b); cl_ulong dewIt(int n, int m, float* y, const float* A, const float* x, const float* b);
}; };
class Reduce : public MatrixVectorMultiplier { class Reduce : public MatrixVectorMultiplier {
public: public:
Reduce(cl::Context* context, cl::CommandQueue* queue, cl::Program* program); Reduce(cl::Context* context, cl::CommandQueue* queue, cl::Program* program);
void dewIt(int n, int m, float* y, const float* A, const float* x, const float* b); cl_ulong dewIt(int n, int m, float* y, const float* A, const float* x, const float* b);
}; };
class Large : public MatrixVectorMultiplier { class Large : public MatrixVectorMultiplier {
public: public:
Large(cl::Context* context, cl::CommandQueue* queue, cl::Program* program); Large(cl::Context* context, cl::CommandQueue* queue, cl::Program* program);
void dewIt(int n, int m, float* y, const float* A, const float* x, const float* b); cl_ulong dewIt(int n, int m, float* y, const float* A, const float* x, const float* b);
}; };

7
Linear/Reduce.cpp

@ -6,9 +6,10 @@ Reduce::Reduce(cl::Context* _context, cl::CommandQueue* _queue, cl::Program* _pr
context = _context; context = _context;
queue = _queue; queue = _queue;
program = _program; program = _program;
name = "Reduce";
} }
void Reduce::dewIt(int n, int m, float* y, const float* A, const float* x, const float* b) cl_ulong Reduce::dewIt(int n, int m, float* y, const float* A, const float* x, const float* b)
{ {
cl_int err = CL_SUCCESS; cl_int err = CL_SUCCESS;
cl::Event _event; cl::Event _event;
@ -51,6 +52,10 @@ void Reduce::dewIt(int n, int m, float* y, const float* A, const float* x, const
NULL, // NULL, //
&_event); &_event);
_event.wait(); _event.wait();
cl_ulong execStart, execEnd;
execStart = _event.getProfilingInfo<CL_PROFILING_COMMAND_START>(&err);
execEnd = _event.getProfilingInfo<CL_PROFILING_COMMAND_END>(&err);
queue->enqueueReadBuffer(YBuffer, true, 0, sizeof(float) * n, y); queue->enqueueReadBuffer(YBuffer, true, 0, sizeof(float) * n, y);
return (execEnd - execStart);
} }

8
Linear/Simple.cpp

@ -6,12 +6,14 @@ Simple::Simple(cl::Context* _context, cl::CommandQueue* _queue, cl::Program* _pr
context = _context; context = _context;
queue = _queue; queue = _queue;
program = _program; program = _program;
name = "Simple";
} }
void Simple::dewIt(int n, int m, float* y, const float* A, const float* x, const float* b) cl_ulong Simple::dewIt(int n, int m, float* y, const float* A, const float* x, const float* b)
{ {
cl_int err = CL_SUCCESS; cl_int err = CL_SUCCESS;
cl::Event _event; cl::Event _event;
cl::Kernel kernel = cl::Kernel(*program, "simpleMV", &err); cl::Kernel kernel = cl::Kernel(*program, "simpleMV", &err);
CheckCLError(err); CheckCLError(err);
@ -46,6 +48,10 @@ void Simple::dewIt(int n, int m, float* y, const float* A, const float* x, const
NULL, // NULL, //
&_event); &_event);
_event.wait(); _event.wait();
cl_ulong execStart, execEnd;
execStart = _event.getProfilingInfo<CL_PROFILING_COMMAND_START>(&err);
execEnd = _event.getProfilingInfo<CL_PROFILING_COMMAND_END>(&err);
queue->enqueueReadBuffer(YBuffer, true, 0, sizeof(float) * n, y); queue->enqueueReadBuffer(YBuffer, true, 0, sizeof(float) * n, y);
return (execEnd - execStart);
} }

Loading…
Cancel
Save