Tests: Simplify CUDA kernels to avoid a crash with NVIDIA driver 550
Avoid having two identical kernels in PTX. We don't need a second kernel anyway.
This commit is contained in:
parent
cb981c3b00
commit
ee9e2216ec
@ -5,10 +5,3 @@ __global__ void kernelA(float* r, float* x, float* y, float* z, int size)
|
||||
r[i] = x[i] * y[i] + z[i];
|
||||
}
|
||||
}
|
||||
|
||||
// Element-wise multiply-add: r[k] = x[k] * y[k] + z[k] for every k in [0, size).
//
// Each thread starts at its own threadIdx.x and advances by blockDim.x, so the
// threads of one block cover the whole index range between them. blockIdx is
// never consulted, so every block of a multi-block launch performs the same
// writes.
//
// Parameters:
//   r    - output array, written at indices [0, size)
//   x, y - arrays whose elements are multiplied together
//   z    - array added to the product
//   size - number of elements to process; nothing is written when size <= 0
__global__ void kernelB(float* r, float* x, float* y, float* z, int size)
{
    // Kept unsigned so the index update matches `i += blockDim.x` exactly.
    const unsigned int step = blockDim.x;
    int idx = threadIdx.x;
    while (idx < size) {
        r[idx] = x[idx] * y[idx] + z[idx];
        idx += step;
    }
}
|
||||
|
Loading…
Reference in New Issue
Block a user