Home
last modified time | relevance | path

Searched refs:TF_RED_WARPSIZE (Results 1 – 3 of 3) sorted by relevance

/external/tensorflow/tensorflow/core/kernels/
reduction_gpu_kernels.cu.h
206 assert(blockDim.x % TF_RED_WARPSIZE == 0);
207 int warps_per_block = blockDim.x / TF_RED_WARPSIZE;
208 int warp_index = threadIdx.x / TF_RED_WARPSIZE;
210 const int lane = threadIdx.x % TF_RED_WARPSIZE;
223 col += TF_RED_WARPSIZE;
224 for (; col < num_cols; col += TF_RED_WARPSIZE) {
234 WarpReduce(temp_storage).Reduce(sum, op, min(num_cols, TF_RED_WARPSIZE));
273 int rows_per_warp = TF_RED_WARPSIZE / num_cols;
275 const int lane = threadIdx.x % TF_RED_WARPSIZE;
295 partial_sums_raw[TF_RED_WARPSIZE * (TF_RED_WARPSIZE + 1) *
[all …]
/external/tensorflow/tensorflow/core/util/
gpu_kernel_helper.h
29 #define TF_RED_WARPSIZE 32 (macro)
31 #define TF_RED_WARPSIZE 64 (macro)
gpu_kernel_helper_test.cu.cc
321 TF_EXPECT_OK(GpuLaunchKernel(GpuShuffleGetSrcLaneTest, 1, TF_RED_WARPSIZE, 0, … (in TEST())