diff --git a/kernels/linear.cl b/kernels/linear.cl index 410b610..6d7a1c0 100644 --- a/kernels/linear.cl +++ b/kernels/linear.cl @@ -84,7 +84,7 @@ void largeMV(const int n, const int m, __global float* y, __global float* A, __g if (z == 0) { y[i + t] = 0; } - Q[id] = 0; + //Q[id] = 0; for (size_t j = 0; j < n; j += T) { // oszlop kezdete ahol a modul van //Q[t * Z + z] += A[(j + z) + (i + t) * m] * x[i + t]; @@ -92,7 +92,7 @@ void largeMV(const int n, const int m, __global float* y, __global float* A, __g barrier(CLK_LOCAL_MEM_FENCE); for (size_t s = Z / 2; s > 0; s >>= 1) { - if (t < s) { + if (z < s) { Q[t * Z + z] = Q[t * Z + z] + Q[t * Z + z + s]; } barrier(CLK_LOCAL_MEM_FENCE);