Searched refs:TF_RED_WARPSIZE (Results 1 – 3 of 3) sorted by relevance
206 assert(blockDim.x % TF_RED_WARPSIZE == 0);207 int warps_per_block = blockDim.x / TF_RED_WARPSIZE;208 int warp_index = threadIdx.x / TF_RED_WARPSIZE;210 const int lane = threadIdx.x % TF_RED_WARPSIZE;223 col += TF_RED_WARPSIZE;224 for (; col < num_cols; col += TF_RED_WARPSIZE) {234 WarpReduce(temp_storage).Reduce(sum, op, min(num_cols, TF_RED_WARPSIZE));273 int rows_per_warp = TF_RED_WARPSIZE / num_cols;275 const int lane = threadIdx.x % TF_RED_WARPSIZE;295 partial_sums_raw[TF_RED_WARPSIZE * (TF_RED_WARPSIZE + 1) *[all …]
29 #define TF_RED_WARPSIZE 32 macro31 #define TF_RED_WARPSIZE 64 macro
321 TF_EXPECT_OK(GpuLaunchKernel(GpuShuffleGetSrcLaneTest, 1, TF_RED_WARPSIZE, 0, in TEST()