/* -----------------------------------------------------------------------------
 *
 * Module    : Replicate
 * Copyright : (c) [2009..2010] Trevor L. McDonell
 * License   : BSD
 *
 * ---------------------------------------------------------------------------*/

/*
 * Replicate kernel.
 *
 * For every linear index `ix` in [0, size(sliceDim)), the kernel:
 *   1. converts `ix` into a SliceDim index via fromIndex(sliceDim, ix),
 *   2. maps that index to a Slice index via sliceIndex(),
 *   3. linearises the Slice index against `slice` via toIndex(), and
 *   4. stores the element read from d_in0 at that position into d_out[ix].
 *
 * Parameters:
 *   d_out    - output array, written at each linear index `ix`
 *   d_in0    - input array, read through get0()
 *   slice    - shape passed to toIndex() to linearise the source index
 *   sliceDim - shape whose size() bounds the iteration and which is passed to
 *              fromIndex() to decode `ix`
 *
 * Launch configuration: only the x dimension of the grid and block is used.
 * The loop is grid-strided, so any 1D launch configuration covers all
 * elements; threads whose starting index is already >= size(sliceDim) do
 * nothing.
 *
 * NOTE(review): size, fromIndex, sliceIndex, toIndex, get0 and set, as well as
 * the Ix / ArrOut / ArrIn0 / Slice / SliceDim types, are defined outside this
 * file; their exact semantics should be confirmed against those definitions.
 */
extern "C"
__global__ void
replicate
(
    ArrOut              d_out,
    const ArrIn0        d_in0,
    const Slice         slice,
    const SliceDim      sliceDim
)
{
    const Ix shapeSize = size(sliceDim);

    /*
     * Use ordinary 32-bit multiplication rather than __umul24: the intrinsic
     * only multiplies the low 24 bits of each operand, which silently produces
     * a wrong stride / start index once gridDim.x or blockIdx.x exceeds
     * 2^24 - 1. For operands that fit in 24 bits the result is identical.
     */
    const Ix gridSize  = blockDim.x * gridDim.x;

    for (Ix ix = blockDim.x * blockIdx.x + threadIdx.x; ix < shapeSize; ix += gridSize)
    {
        /* Decode the destination position, then find the source it maps to. */
        SliceDim dst = fromIndex(sliceDim, ix);
        Slice    src = sliceIndex(dst);

        set(d_out, ix, get0(d_in0, toIndex(slice, src)));
    }
}