Home
last modified time | relevance | path

Searched refs:GpuDevice (Results 1 – 25 of 375) sorted by relevance

12345678910>>...15

/external/tensorflow/tensorflow/core/kernels/image/
Dmirror_pad_op_gpu.cu.cc25 using GpuDevice = Eigen::GpuDevice; typedef
28 template struct functor::MirrorPad<GpuDevice, T, int32, 1>; \
29 template struct functor::MirrorPad<GpuDevice, T, int32, 2>; \
30 template struct functor::MirrorPad<GpuDevice, T, int32, 3>; \
31 template struct functor::MirrorPad<GpuDevice, T, int32, 4>; \
32 template struct functor::MirrorPad<GpuDevice, T, int32, 5>; \
33 template struct functor::MirrorPad<GpuDevice, T, int64, 1>; \
34 template struct functor::MirrorPad<GpuDevice, T, int64, 2>; \
35 template struct functor::MirrorPad<GpuDevice, T, int64, 3>; \
36 template struct functor::MirrorPad<GpuDevice, T, int64, 4>; \
[all …]
/external/tensorflow/tensorflow/core/kernels/
Dconv_2d_gpu_float.cu.cc32 template struct TransformDepth<Eigen::GpuDevice, float, int>;
34 template struct SwapDimension1And2InTensor3<Eigen::GpuDevice, float4>;
35 template struct SwapDimension1And2InTensor3<Eigen::GpuDevice, float2,
38 template struct SwapDimension0And2InTensor3<Eigen::GpuDevice, float4>;
39 template struct SwapDimension0And2InTensor3<Eigen::GpuDevice, float2,
43 template struct TransformFilter<Eigen::GpuDevice, float, int, 4>;
44 template struct ReverseTransformFilter<Eigen::GpuDevice, float, 4>;
45 template struct NHWCToNCHW<Eigen::GpuDevice, float, 4>;
46 template struct NCHWToNHWC<Eigen::GpuDevice, float, 4>;
47 template struct PadInput<Eigen::GpuDevice, float, int, 4>;
[all …]
Dconv_2d_gpu_double.cu.cc27 template struct SwapDimension1And2InTensor3<Eigen::GpuDevice, double2,
30 template struct SwapDimension0And2InTensor3<Eigen::GpuDevice, double2,
34 template struct TransformFilter<Eigen::GpuDevice, double, int, 4>;
35 template struct ReverseTransformFilter<Eigen::GpuDevice, double, 4>;
36 template struct NHWCToNCHW<Eigen::GpuDevice, double, 4>;
37 template struct NCHWToNHWC<Eigen::GpuDevice, double, 4>;
38 template struct PadInput<Eigen::GpuDevice, double, int, 4>;
41 template struct TransformFilter<Eigen::GpuDevice, double, int, 5>;
42 template struct ReverseTransformFilter<Eigen::GpuDevice, double, 5>;
43 template struct NHWCToNCHW<Eigen::GpuDevice, double, 5>;
[all …]
Dconv_2d_gpu_half.cu.cc32 template struct SwapDimension1And2InTensor3<Eigen::GpuDevice, Eigen::half>;
35 template struct TransformFilter<Eigen::GpuDevice, Eigen::half, int, 4>;
36 template struct ReverseTransformFilter<Eigen::GpuDevice, Eigen::half, 4>;
37 template struct NHWCToNCHW<Eigen::GpuDevice, Eigen::half, 4>;
38 template struct NCHWToNHWC<Eigen::GpuDevice, Eigen::half, 4>;
39 template struct PadInput<Eigen::GpuDevice, Eigen::half, int, 4>;
42 template struct TransformFilter<Eigen::GpuDevice, Eigen::half, int, 5>;
43 template struct ReverseTransformFilter<Eigen::GpuDevice, Eigen::half, 5>;
44 template struct NHWCToNCHW<Eigen::GpuDevice, Eigen::half, 5>;
45 template struct NCHWToNHWC<Eigen::GpuDevice, Eigen::half, 5>;
[all …]
Dscan_ops_gpu_int.cu.cc24 using Eigen::GpuDevice;
25 template struct functor::Scan<GpuDevice, Eigen::internal::SumReducer<int64>,
27 template struct functor::Scan<GpuDevice, Eigen::internal::ProdReducer<int64>,
29 template struct functor::Scan<GpuDevice, Eigen::internal::SumReducer<int32>,
31 template struct functor::Scan<GpuDevice, Eigen::internal::ProdReducer<int32>,
Dconcat_lib_gpu.h34 const Eigen::GpuDevice& gpu_device,
40 void ConcatGPUImpl(const Eigen::GpuDevice& d,
49 const Eigen::GpuDevice& gpu_device, \
54 const Eigen::GpuDevice& gpu_device, \
59 const Eigen::GpuDevice& d, \
64 const Eigen::GpuDevice& d, \
Ddepthwise_conv_op_gpu_double.cu.cc23 using Eigen::GpuDevice;
25 template struct LaunchDepthwiseConvOp<GpuDevice, double>;
26 template struct LaunchDepthwiseConvBackpropInputOp<GpuDevice, double>;
27 template struct LaunchDepthwiseConvBackpropFilterOp<GpuDevice, double>;
Ddepthwise_conv_op_gpu_float.cu.cc23 using Eigen::GpuDevice;
25 template struct LaunchDepthwiseConvOp<GpuDevice, float>;
26 template struct LaunchDepthwiseConvBackpropInputOp<GpuDevice, float>;
27 template struct LaunchDepthwiseConvBackpropFilterOp<GpuDevice, float>;
Ddepthwise_conv_op_gpu_half.cu.cc23 using Eigen::GpuDevice;
25 template struct LaunchDepthwiseConvOp<GpuDevice, Eigen::half>;
26 template struct LaunchDepthwiseConvBackpropInputOp<GpuDevice, Eigen::half>;
27 template struct LaunchDepthwiseConvBackpropFilterOp<GpuDevice, Eigen::half>;
Dscan_ops_gpu_double.cu.cc24 using Eigen::GpuDevice;
25 template struct functor::Scan<GpuDevice, Eigen::internal::SumReducer<double>,
27 template struct functor::Scan<GpuDevice, Eigen::internal::ProdReducer<double>,
29 template struct functor::Scan<GpuDevice, functor::LogSumExpReducer<double>,
Dscan_ops_gpu_float.cu.cc24 using Eigen::GpuDevice;
25 template struct functor::Scan<GpuDevice, Eigen::internal::SumReducer<float>,
27 template struct functor::Scan<GpuDevice, Eigen::internal::ProdReducer<float>,
29 template struct functor::Scan<GpuDevice, functor::LogSumExpReducer<float>,
Dscan_ops_gpu_half.cu.cc24 using Eigen::GpuDevice;
26 GpuDevice, Eigen::internal::SumReducer<Eigen::half>, Eigen::half>;
28 GpuDevice, Eigen::internal::ProdReducer<Eigen::half>, Eigen::half>;
29 template struct functor::Scan<GpuDevice, functor::LogSumExpReducer<Eigen::half>,
Dmaxpooling_op_gpu.h42 const Eigen::GpuDevice& d, bool propagate_nans,
52 const Eigen::GpuDevice& d);
60 const Eigen::GpuDevice& d, const bool include_batch_in_index);
68 const Eigen::GpuDevice& d, const bool include_batch_in_index);
79 const T* top_diff, T* bottom_diff, const Eigen::GpuDevice& d);
Dtile_functor_gpu_float.cu.cc24 using Eigen::GpuDevice;
26 template struct Tile<GpuDevice, float, int32>;
27 template struct Tile<GpuDevice, float, int64>;
Dtile_functor_gpu_double.cu.cc24 using Eigen::GpuDevice;
26 template struct Tile<GpuDevice, double, int32>;
27 template struct Tile<GpuDevice, double, int64>;
Dtile_functor_gpu_bool.cu.cc24 using Eigen::GpuDevice;
26 template struct Tile<GpuDevice, bool, int32>;
27 template struct Tile<GpuDevice, bool, int64>;
Dtile_functor_gpu_int16.cu.cc24 using Eigen::GpuDevice;
26 template struct Tile<GpuDevice, int16, int32>;
27 template struct Tile<GpuDevice, int16, int64>;
Dtile_functor_gpu_int32.cu.cc24 using Eigen::GpuDevice;
26 template struct Tile<GpuDevice, int32, int32>;
27 template struct Tile<GpuDevice, int32, int64>;
Dtile_functor_gpu_complex128.cu.cc24 using Eigen::GpuDevice;
26 template struct Tile<GpuDevice, complex128, int32>;
27 template struct Tile<GpuDevice, complex128, int64>;
Dtile_functor_gpu_complex64.cu.cc24 using Eigen::GpuDevice;
26 template struct Tile<GpuDevice, complex64, int32>;
27 template struct Tile<GpuDevice, complex64, int64>;
Dtile_functor_gpu_int64.cu.cc24 using Eigen::GpuDevice;
26 template struct Tile<GpuDevice, int64, int32>;
27 template struct Tile<GpuDevice, int64, int64>;
/external/eigen/bench/tensors/
Dtensor_benchmarks_fp16_gpu.cu14 Eigen::GpuDevice device(&stream); \
15 BenchmarkSuite<Eigen::GpuDevice, Eigen::half> suite(device, N); \
44 Eigen::GpuDevice device(&stream); \
45 BenchmarkSuite<Eigen::GpuDevice, Eigen::half> suite(device, D1, D2, D3); \
63 Eigen::GpuDevice device(&stream); \
64 BenchmarkSuite<Eigen::GpuDevice, Eigen::half> suite(device, N); \
Dtensor_benchmarks_gpu.cu14 Eigen::GpuDevice device(&stream); \
15 BenchmarkSuite<Eigen::GpuDevice, float> suite(device, N); \
44 Eigen::GpuDevice device(&stream); \
45 BenchmarkSuite<Eigen::GpuDevice, float> suite(device, D1, D2, D3); \
63 Eigen::GpuDevice device(&stream); \
64 BenchmarkSuite<Eigen::GpuDevice, float> suite(device, N); \
/external/tensorflow/tensorflow/core/grappler/optimizers/
Dimplementation_selector_test.cc40 constexpr char GpuDevice[] = "/device:GPU:0"; variable
73 NDef("case", "Case", {"x"}, {{"T", DT_FLOAT}}, GpuDevice)}); in TEST_F()
97 NDef("case", "StatelessCase", {"x"}, {{"T", DT_FLOAT}}, GpuDevice)}); in TEST_F()
122 NDef("case", "Case", {"x"}, {{"T", DT_FLOAT}}, GpuDevice), in TEST_F()
124 GpuDevice), in TEST_F()
214 NDef("case", "Case", {"x"}, {{"T", DT_FLOAT}}, GpuDevice), in TEST_F()
216 GpuDevice), in TEST_F()
218 NDef("y1", "XTimesTwo", {"x"}, {{"T", DT_FLOAT}}, GpuDevice), in TEST_F()
219 NDef("z1", "Identity", {"y1"}, {{"T", DT_FLOAT}}, GpuDevice), in TEST_F()
270 NDef("case", "Case", {"x"}, {{"T", DT_FLOAT}}, GpuDevice), in TEST_F()
[all …]
/external/tensorflow/tensorflow/core/util/
Dgpu_launch_config.h128 const Eigen::GpuDevice& d) { in GetGpuLaunchConfig()
147 const Eigen::GpuDevice& d) { in GetCudaLaunchConfig()
157 const Eigen::GpuDevice& d, DeviceFunc func, in GetGpuLaunchConfig()
193 int work_element_count, const Eigen::GpuDevice& d, DeviceFunc func, in GetGpuLaunchConfigFixedBlockSize()
227 const Eigen::GpuDevice& d) { in GetGpu2DLaunchConfig()
255 const Eigen::GpuDevice& d) { in GetCuda2DLaunchConfig()
268 const Eigen::GpuDevice& d, in GetGpu3DLaunchConfig()
340 const Eigen::GpuDevice& d, in GetGpu2DLaunchConfig()
352 const Eigen::GpuDevice& d, in GetCuda2DLaunchConfig()

12345678910>>...15