// Mark McGranaghan 8d31ec147c move to vendor
// 2012-11-17 08:21:42 -08:00
//
// 37 lines
// 776 B
// Plaintext

#include <stdio.h>
// __device__ function
//
// Builds two reinterpreting pointer views over `array`, a symbol declared
// outside this block: a short* view of its start, and a float* view that
// begins at the 128th short (index 127) of that first view. Neither pointer
// is read through, written through, or returned.
//
// NOTE(review): with CUDA's 2-byte short and 4-byte float, the float* view
// starts 254 bytes past `array`, which is not a multiple of 4. Confirm that
// the misalignment is intentional before anything dereferences it.
__device__ void func()
{
    short* shortView = (short*)array;
    float* floatView = (float*)(shortView + 127);
}
/*
 * __global__ function
 *
 * Kernel skeleton. It declares a dynamically sized shared array, has the
 * first thread of each block issue a memory fence, and then runs a halving
 * loop in which every thread of the block hits a barrier once per step.
 *
 * The visible body never reads or writes `input`, `output`, `timer`, or the
 * shared array, so the parameters are currently unused.
 */
__global__ static void reduction(const float* __restrict__ input, float *output, clock_t *timer)
{
    // Size is supplied at launch time rather than fixed here. Earlier form,
    // kept for reference:
    // __shared__ float shared[2 * blockDim.x];
    extern __shared__ float shared[];

    const int tid = threadIdx.x;
    const int bid = blockIdx.x;  // not referenced by the code below

    // Only the thread with index 0 in each block issues the fence.
    if (tid == 0)
        __threadfence();

    // Perform reduction to find minimum.
    // NOTE(review): as written, each step only executes a block-wide barrier;
    // no values are compared or combined here.
    int d = blockDim.x;
    while (d > 0) {
        __syncthreads();
        d /= 2;
    }
}
// Reports a failed CUDA runtime call on stderr.
// Returns true when `status` is cudaSuccess, false otherwise.
static bool reportIfCudaFailed(cudaError_t status, const char *what)
{
    if (status == cudaSuccess)
        return true;
    fprintf(stderr, "CUDA error during %s: %s\n", what, cudaGetErrorString(status));
    return false;
}

// Host entry point: launches `timedReduction` once, waits for it to finish,
// and resets the device.
//
// Returns 0 when the launch, the kernel execution and the device reset all
// succeed, and 1 otherwise. `argc` and `argv` are not used.
int main(int argc, char **argv)
{
    (void)argc;
    (void)argv;

    // The first launch parameter is the grid, so this is 8 x 8 x 1 blocks.
    dim3 dimGrid(8, 8, 1);

    // 256 threads per block, 256 bytes of dynamic shared memory, stream 0.
    // NOTE(review): 256 bytes holds 64 floats; confirm that this matches what
    // the kernel indexes into its shared array.
    timedReduction<<<dimGrid, 256, 256, 0>>>(dinput, doutput, dtimer);

    // A launch does not return a status itself; configuration errors are
    // only visible through cudaGetLastError().
    bool ok = reportIfCudaFailed(cudaGetLastError(), "kernel launch");

    // Faults raised while the kernel runs surface at the next synchronizing
    // call, so wait for completion before tearing the device down.
    if (ok)
        ok = reportIfCudaFailed(cudaDeviceSynchronize(), "kernel execution");

    // Always reset, even after a failure, so device resources are released.
    if (!reportIfCudaFailed(cudaDeviceReset(), "cudaDeviceReset"))
        ok = false;

    return ok ? 0 : 1;
}