blob: f4a52d42176e89712b5d7c09a3092a4572cd2fe4 (
plain)
1
2
3
4
5
6
7
8
9
10
11
12
13
14
|
// Element-wise multiply-add: r[i] = x[i] * y[i] + z[i] for each i in [0, size).
//
// Parameters:
//   r          output array; elements [0, size) are overwritten.
//   x, y, z    input arrays; elements [0, size) are read.
//   size       number of elements to process. A value <= 0 makes the kernel
//              a no-op because no index satisfies i < size.
//
// Launch layout: indexing uses only the x-dimension of the grid and block.
// Each thread starts at blockIdx.x * blockDim.x + threadIdx.x and advances by
// gridDim.x * blockDim.x, so any 1D launch configuration covers the whole
// range and the work is split across blocks instead of being repeated by
// every block. With a single block this visits exactly the indices
// threadIdx.x, threadIdx.x + blockDim.x, ...
// No shared memory is used.
__global__ void kernelA(float* r, float* x, float* y, float* z, int size)
{
    // 64-bit signed arithmetic: the index cannot wrap when size is close to
    // INT_MAX, and a negative size still compares correctly.
    const long long stride = static_cast<long long>(gridDim.x) * blockDim.x;
    const long long first  = static_cast<long long>(blockIdx.x) * blockDim.x + threadIdx.x;

    for (long long i = first; i < size; i += stride) {
        r[i] = x[i] * y[i] + z[i];
    }
}
// Element-wise multiply-add: r[i] = x[i] * y[i] + z[i] for each i in [0, size).
//
// Parameters:
//   r          output array; elements [0, size) are overwritten.
//   x, y, z    input arrays; elements [0, size) are read.
//   size       number of elements to process. A value <= 0 makes the kernel
//              a no-op because no index satisfies i < size.
//
// Launch layout: indexing uses only the x-dimension of the grid and block.
// Each thread starts at blockIdx.x * blockDim.x + threadIdx.x and advances by
// gridDim.x * blockDim.x, so any 1D launch configuration covers the whole
// range and the work is split across blocks instead of being repeated by
// every block. With a single block this visits exactly the indices
// threadIdx.x, threadIdx.x + blockDim.x, ...
// No shared memory is used.
__global__ void kernelB(float* r, float* x, float* y, float* z, int size)
{
    // 64-bit signed arithmetic: the index cannot wrap when size is close to
    // INT_MAX, and a negative size still compares correctly.
    const long long stride = static_cast<long long>(gridDim.x) * blockDim.x;
    const long long first  = static_cast<long long>(blockIdx.x) * blockDim.x + threadIdx.x;

    for (long long i = first; i < size; i += stride) {
        r[i] = x[i] * y[i] + z[i];
    }
}
|