Home
last modified time | relevance | path

Searched refs:virtual_thread_count (Results 1 – 25 of 25) sorted by relevance

/external/tensorflow/tensorflow/contrib/reduce_slice_ops/kernels/
Dreduce_slice_ops_gpu.cu.cc42 CUDA_AXIS_KERNEL_LOOP(x, config.virtual_thread_count.x, X) { \
43 CUDA_AXIS_KERNEL_LOOP(y, config.virtual_thread_count.y, Y) { \
44 CUDA_AXIS_KERNEL_LOOP(z, config.virtual_thread_count.z, Z) { \
45 Index outidx = x * config.virtual_thread_count.y * \
46 config.virtual_thread_count.z + \
47 y * config.virtual_thread_count.z + z; \
52 Index inidx = x * bound * config.virtual_thread_count.z + \
53 yin * config.virtual_thread_count.z + z; \
/external/tensorflow/tensorflow/core/util/
Dcuda_launch_config.h114 int virtual_thread_count = -1; member
129 const int virtual_thread_count = work_element_count; in GetCudaLaunchConfig() local
132 virtual_thread_count); in GetCudaLaunchConfig()
138 config.virtual_thread_count = virtual_thread_count; in GetCudaLaunchConfig()
166 config.virtual_thread_count = work_element_count; in GetCudaLaunchConfig()
190 config.virtual_thread_count = work_element_count; in GetCudaLaunchConfigFixedBlockSize()
197 dim3 virtual_thread_count = dim3(0, 0, 0); member
220 config.virtual_thread_count = dim3(xdim, ydim, 1); in GetCuda2DLaunchConfig()
276 config.virtual_thread_count = dim3(xdim, ydim, zdim); in GetCuda3DLaunchConfig()
Dcuda_kernel_helper_test.cu.cc44 CUDA_1D_KERNEL_LOOP(x, config.virtual_thread_count) { outbuf[x] = 0; } in SetOutbufZero()
49 CUDA_1D_KERNEL_LOOP(x, config.virtual_thread_count) { in Count1D()
57 CUDA_AXIS_KERNEL_LOOP(x, config.virtual_thread_count.x, X) { in Count2D()
61 CUDA_AXIS_KERNEL_LOOP(y, config.virtual_thread_count.y, Y) { in Count2D()
65 int idx = x * config.virtual_thread_count.y + y; in Count2D()
71 CUDA_AXIS_KERNEL_LOOP(x, config.virtual_thread_count.x, X) { in Count3D()
75 CUDA_AXIS_KERNEL_LOOP(y, config.virtual_thread_count.y, Y) { in Count3D()
79 CUDA_AXIS_KERNEL_LOOP(z, config.virtual_thread_count.z, Z) { in Count3D()
84 x * config.virtual_thread_count.y * config.virtual_thread_count.z + in Count3D()
85 y * config.virtual_thread_count.z + z; in Count3D()
/external/tensorflow/tensorflow/core/kernels/
Ddiag_op_gpu.cu.cc58 int virtual_thread_count = int(size * size); in operator ()() local
63 GetCudaLaunchConfig(virtual_thread_count, device); in operator ()()
65 device.stream()>>>(diag_config.virtual_thread_count, size, in operator ()()
105 0, device.stream()>>>(diag_config.virtual_thread_count, in operator ()()
Dinplace_ops_functor_gpu.cu.cc54 d.stream(), cfg.virtual_thread_count, nrows, ncols, loc, src, dst)); in DoParallelConcatUpdate()
122 d.stream(), cfg.virtual_thread_count, nrows, in DoInplaceOp()
128 cfg.virtual_thread_count, nrows, ncols, n, in DoInplaceOp()
134 cfg.virtual_thread_count, nrows, ncols, n, in DoInplaceOp()
156 d.stream(), cfg.virtual_thread_count, nrows, in DoInplaceOp()
Dresize_bilinear_op_gpu.cu.cc286 0, d.stream(), config.virtual_thread_count, images.data(), in operator ()()
292 config.thread_per_block, 0, d.stream(), config.virtual_thread_count, in operator ()()
324 config.virtual_thread_count, output_grad.data())); in operator ()()
332 config.thread_per_block, 0, d.stream(), config.virtual_thread_count, in operator ()()
339 config.thread_per_block, 0, d.stream(), config.virtual_thread_count, in operator ()()
Dfused_batch_norm_op.cu.cc42 d.stream()>>>(config.virtual_thread_count, in operator ()()
64 d.stream()>>>(config.virtual_thread_count, in operator ()()
Dmatrix_set_diag_op_gpu.cu.cc79 config.virtual_thread_count, m, n, minsize, in Compute()
86 config.virtual_thread_count, m, n, minsize, in Compute()
Dcrop_and_resize_op_gpu.cu.cc376 0, d.stream(), config.virtual_thread_count, image.data(), in operator ()()
411 d.stream(), config.virtual_thread_count, grads_image.data())); in operator ()()
426 config.thread_per_block, 0, d.stream(), config.virtual_thread_count, in operator ()()
461 d.stream(), config.virtual_thread_count, grads_boxes.data())); in operator ()()
470 config.thread_per_block, 0, d.stream(), config.virtual_thread_count, in operator ()()
Ddeterminant_op_gpu.cu.cc136 config.virtual_thread_count, n, lu_factor.data(), pivots, nullptr, in operator ()()
158 config.virtual_thread_count, n, lu_factor.data(), pivots, sign.data(), in operator ()()
Dsvd_op_gpu.cu.cc66 CUDA_AXIS_KERNEL_LOOP(batch, config.virtual_thread_count.x, X) { in ComputeValueOfVKernel()
67 CUDA_AXIS_KERNEL_LOOP(i, config.virtual_thread_count.y, Y) { in ComputeValueOfVKernel()
78 CUDA_1D_KERNEL_LOOP(i, config.virtual_thread_count) { in ExtractSignOfVKernel()
Ddilation_ops_gpu.cu.cc201 config.virtual_thread_count, input.data(), filter.data(), batch, in operator ()()
242 config.thread_per_block, 0, d.stream(), config.virtual_thread_count, in operator ()()
284 config.virtual_thread_count, input.data(), filter.data(), in operator ()()
Dconv_2d_gpu.h442 d.stream(), config.virtual_thread_count,
464 d.stream(), config.virtual_thread_count,
495 config.thread_per_block, 0, d.stream(), config.virtual_thread_count,
500 config.thread_per_block, 0, d.stream(), config.virtual_thread_count,
936 d.stream(), config.virtual_thread_count, input,
969 d.stream(), config.virtual_thread_count, in,
Ddepthtospace_op_gpu.cu.cc167 config.virtual_thread_count, input.data(), block_size, batch_size, in operator ()()
232 config.virtual_thread_count, input.data(), block_size, input_width, in operator ()()
Deye_functor_gpu.cu.cc56 device.stream()>>>(config.virtual_thread_count, batch_size, m, in operator ()()
Dspacetodepth_op_gpu.cu.cc163 config.virtual_thread_count, input.data(), block_size, batch_size, in operator ()()
228 config.virtual_thread_count, input.data(), block_size, output_width, in operator ()()
Dmatrix_band_part_op_gpu.cu.cc63 config.virtual_thread_count, batch_size, m, n, num_lower_diags, in operator ()()
Dresize_nearest_neighbor_op_gpu.cu.cc235 input_config.virtual_thread_count, input.data(), in_height, in_width, in operator ()()
243 d.stream(), input_config.virtual_thread_count, input.data(), in operator ()()
Dbias_op_gpu.cu.cc90 config.virtual_thread_count, input, bias, in compute()
95 config.virtual_thread_count, input, bias, in compute()
Dtile_functor_gpu.h80 d.stream(), cfg.virtual_thread_count, p, in TileSimple()
Davgpooling_op_gpu.cu.cc96 d.stream(), config.virtual_thread_count, top_diff, num, height, width, in RunAvePoolBackwardNHWC()
Dmultinomial_op_gpu.cu.cc115 d.stream()>>>(config.virtual_thread_count, num_classes, in operator ()()
Dspacetobatch_functor_gpu.cu.cc146 config.virtual_thread_count, in operator ()()
Dlu_op_gpu.cu.cc69 CUDA_1D_KERNEL_LOOP(index, config.virtual_thread_count) { in ComputePermutationFromTranspositionsKernel()
Dtranspose_functor_gpu.cu.cc85 d.stream(), cfg.virtual_thread_count, p, in TransposeSimple()