// incKernel: every thread whose global index idx is below N stores the values
// 1, 2, ..., inner_reps into g_out[idx] one after another, so the value left in
// g_out[idx] is inner_reps. When inner_reps <= 0 the loop body never runs and
// nothing is written.
//
// Parameters:
//   g_out      - output array; element idx is written by the thread with that index
//   g_in       - not read by the active code (only by the commented-out line below)
//   N          - element count used as the bounds guard; threads with idx >= N do nothing
//   inner_reps - number of times each in-range thread repeats the store
//
// Indexing uses only the x components of blockIdx, blockDim and threadIdx.
//
// NOTE(review): this listing interleaves the kernel source with x86 disassembly.
// The address-prefixed lines are disassembler output, not CUDA source; they appear
// to be the host-side entry point generated for the kernel - confirm against the
// build that produced this listing.
__global__ void incKernel(int *g_out, int *g_in, int N, int inner_reps)
{
// Prologue: save the caller's frame pointer and set up a new stack frame.
00402070 push ebp
00402071 mov ebp,esp
// Push four values (__cuda_3 down to __cuda_0) and call the device stub.
// Presumably these are the four kernel arguments pushed last-to-first - TODO confirm.
00402073 mov eax,dword ptr [__cuda_3]
00402076 push eax
00402077 mov ecx,dword ptr [__cuda_2]
0040207A push ecx
0040207B mov edx,dword ptr [__cuda_1]
0040207E push edx
0040207F mov eax,dword ptr [__cuda_0]
00402082 push eax
00402083 call __device_stub__Z9incKernelPiS_ii (401FE0h)
// Pop the four pushed dwords (0x10 bytes) back off the stack after the call.
00402088 add esp,10h
// Flat global index of this thread along x.
int idx = blockIdx.x * blockDim.x + threadIdx.x;
// Bounds guard: threads past the end of the array do no work.
if( idx < N ) {
// Repeat the store inner_reps times; each iteration overwrites the previous value.
for( int i=0; i<inner_reps; ++i ) {
// Alternative body kept for reference: it would read g_in instead of using the counter.
//g_out[idx] = g_in[idx] + 1;
g_out[idx] = i+1;
}
}
}
// Epilogue: restore the caller's frame pointer and return.
0040208B pop ebp
0040208C ret