Tests: Simplify CUDA kernels to avoid crash with NVIDIA driver 550

Avoid having two identical kernels in PTX.  We don't need a second
kernel anyway.
This commit is contained in:
Robert Maynard 2024-10-17 14:45:57 -04:00 committed by Brad King
parent cb981c3b00
commit ee9e2216ec

View File

@@ -5,10 +5,3 @@ __global__ void kernelA(float* r, float* x, float* y, float* z, int size)
r[i] = x[i] * y[i] + z[i];
}
}
// Element-wise multiply-add: stores x[i] * y[i] + z[i] into r[i] for every
// index i in [0, size).
//
// Each thread starts at its own threadIdx.x and advances by blockDim.x, so the
// threads of a single block together visit every index below `size`.
// blockIdx is not consulted, so every launched block walks the same range.
__global__ void kernelB(float* r, float* x, float* y, float* z, int size)
{
  // Number of threads in the block; this is the distance between two
  // consecutive elements handled by the same thread.
  const unsigned int step = blockDim.x;

  int idx = threadIdx.x;
  while (idx < size) {
    r[idx] = x[idx] * y[idx] + z[idx];
    idx += step;
  }
}