err = clSetKernelArg(kernel,10, sizeof(float), &gate6); gpuerr(clSetKernelArg);
err = clSetKernelArg(kernel,11, sizeof(float), &gate7); gpuerr(clSetKernelArg);
+ size_t q = 2; // local work size passed to clEnqueueNDRangeKernel below; NOTE(review): presumably rowsR / 2 must be a multiple of this - confirm against callers
//Run the program
- size_t q = 32;
err = clEnqueueNDRangeKernel(cpx_mtx_command_queue, kernel, 1, NULL, (size_t[]){rowsR / 2}, &q, 0, NULL, NULL);
+ // Debug print: CL_DEVICE_MAX_WORK_ITEM_SIZES is a clGetDeviceInfo query selector, so this shows the selector's numeric value, not a device limit. Cast keeps the argument in step with %lu.
+ printf("%lu\n", (unsigned long)CL_DEVICE_MAX_WORK_ITEM_SIZES);
+
gpuerr(clEnqueueNDRangeKernel);
//Wait for completion