/external/tensorflow/tensorflow/core/kernels/image/ |
D | mirror_pad_op_gpu.cu.cc | 25 using GpuDevice = Eigen::GpuDevice; typedef 28 template struct functor::MirrorPad<GpuDevice, T, int32, 1>; \ 29 template struct functor::MirrorPad<GpuDevice, T, int32, 2>; \ 30 template struct functor::MirrorPad<GpuDevice, T, int32, 3>; \ 31 template struct functor::MirrorPad<GpuDevice, T, int32, 4>; \ 32 template struct functor::MirrorPad<GpuDevice, T, int32, 5>; \ 33 template struct functor::MirrorPad<GpuDevice, T, int64, 1>; \ 34 template struct functor::MirrorPad<GpuDevice, T, int64, 2>; \ 35 template struct functor::MirrorPad<GpuDevice, T, int64, 3>; \ 36 template struct functor::MirrorPad<GpuDevice, T, int64, 4>; \ [all …]
|
/external/tensorflow/tensorflow/core/kernels/ |
D | conv_2d_gpu_float.cu.cc | 32 template struct TransformDepth<Eigen::GpuDevice, float, int>; 34 template struct SwapDimension1And2InTensor3<Eigen::GpuDevice, float4>; 35 template struct SwapDimension1And2InTensor3<Eigen::GpuDevice, float2, 38 template struct SwapDimension0And2InTensor3<Eigen::GpuDevice, float4>; 39 template struct SwapDimension0And2InTensor3<Eigen::GpuDevice, float2, 43 template struct TransformFilter<Eigen::GpuDevice, float, int, 4>; 44 template struct ReverseTransformFilter<Eigen::GpuDevice, float, 4>; 45 template struct NHWCToNCHW<Eigen::GpuDevice, float, 4>; 46 template struct NCHWToNHWC<Eigen::GpuDevice, float, 4>; 47 template struct PadInput<Eigen::GpuDevice, float, int, 4>; [all …]
|
D | conv_2d_gpu_double.cu.cc | 27 template struct SwapDimension1And2InTensor3<Eigen::GpuDevice, double2, 30 template struct SwapDimension0And2InTensor3<Eigen::GpuDevice, double2, 34 template struct TransformFilter<Eigen::GpuDevice, double, int, 4>; 35 template struct ReverseTransformFilter<Eigen::GpuDevice, double, 4>; 36 template struct NHWCToNCHW<Eigen::GpuDevice, double, 4>; 37 template struct NCHWToNHWC<Eigen::GpuDevice, double, 4>; 38 template struct PadInput<Eigen::GpuDevice, double, int, 4>; 41 template struct TransformFilter<Eigen::GpuDevice, double, int, 5>; 42 template struct ReverseTransformFilter<Eigen::GpuDevice, double, 5>; 43 template struct NHWCToNCHW<Eigen::GpuDevice, double, 5>; [all …]
|
D | conv_2d_gpu_half.cu.cc | 32 template struct SwapDimension1And2InTensor3<Eigen::GpuDevice, Eigen::half>; 35 template struct TransformFilter<Eigen::GpuDevice, Eigen::half, int, 4>; 36 template struct ReverseTransformFilter<Eigen::GpuDevice, Eigen::half, 4>; 37 template struct NHWCToNCHW<Eigen::GpuDevice, Eigen::half, 4>; 38 template struct NCHWToNHWC<Eigen::GpuDevice, Eigen::half, 4>; 39 template struct PadInput<Eigen::GpuDevice, Eigen::half, int, 4>; 42 template struct TransformFilter<Eigen::GpuDevice, Eigen::half, int, 5>; 43 template struct ReverseTransformFilter<Eigen::GpuDevice, Eigen::half, 5>; 44 template struct NHWCToNCHW<Eigen::GpuDevice, Eigen::half, 5>; 45 template struct NCHWToNHWC<Eigen::GpuDevice, Eigen::half, 5>; [all …]
|
D | scan_ops_gpu_int.cu.cc | 24 using Eigen::GpuDevice; 25 template struct functor::Scan<GpuDevice, Eigen::internal::SumReducer<int64_t>, 27 template struct functor::Scan<GpuDevice, Eigen::internal::ProdReducer<int64_t>, 29 template struct functor::Scan<GpuDevice, Eigen::internal::SumReducer<int32>, 31 template struct functor::Scan<GpuDevice, Eigen::internal::ProdReducer<int32>,
|
D | concat_lib_gpu.h | 34 const Eigen::GpuDevice& gpu_device, 40 void ConcatGPUImpl(const Eigen::GpuDevice& d, 49 const Eigen::GpuDevice& gpu_device, \ 54 const Eigen::GpuDevice& gpu_device, \ 59 const Eigen::GpuDevice& d, \ 64 const Eigen::GpuDevice& d, \
|
D | depthwise_conv_op_gpu_float.cu.cc | 23 using Eigen::GpuDevice; 25 template struct LaunchDepthwiseConvOp<GpuDevice, float>; 26 template struct LaunchDepthwiseConvBackpropInputOp<GpuDevice, float>; 27 template struct LaunchDepthwiseConvBackpropFilterOp<GpuDevice, float>;
|
D | depthwise_conv_op_gpu_double.cu.cc | 23 using Eigen::GpuDevice; 25 template struct LaunchDepthwiseConvOp<GpuDevice, double>; 26 template struct LaunchDepthwiseConvBackpropInputOp<GpuDevice, double>; 27 template struct LaunchDepthwiseConvBackpropFilterOp<GpuDevice, double>;
|
D | depthwise_conv_op_gpu_half.cu.cc | 23 using Eigen::GpuDevice; 25 template struct LaunchDepthwiseConvOp<GpuDevice, Eigen::half>; 26 template struct LaunchDepthwiseConvBackpropInputOp<GpuDevice, Eigen::half>; 27 template struct LaunchDepthwiseConvBackpropFilterOp<GpuDevice, Eigen::half>;
|
D | scan_ops_gpu_float.cu.cc | 24 using Eigen::GpuDevice; 25 template struct functor::Scan<GpuDevice, Eigen::internal::SumReducer<float>, 27 template struct functor::Scan<GpuDevice, Eigen::internal::ProdReducer<float>, 29 template struct functor::Scan<GpuDevice, functor::LogSumExpReducer<float>,
|
D | scan_ops_gpu_double.cu.cc | 24 using Eigen::GpuDevice; 25 template struct functor::Scan<GpuDevice, Eigen::internal::SumReducer<double>, 27 template struct functor::Scan<GpuDevice, Eigen::internal::ProdReducer<double>, 29 template struct functor::Scan<GpuDevice, functor::LogSumExpReducer<double>,
|
D | scan_ops_gpu_half.cu.cc | 24 using Eigen::GpuDevice; 26 GpuDevice, Eigen::internal::SumReducer<Eigen::half>, Eigen::half>; 28 GpuDevice, Eigen::internal::ProdReducer<Eigen::half>, Eigen::half>; 29 template struct functor::Scan<GpuDevice, functor::LogSumExpReducer<Eigen::half>,
|
D | maxpooling_op_gpu.h | 42 const Eigen::GpuDevice& d, bool propagate_nans, 52 const Eigen::GpuDevice& d); 60 const Eigen::GpuDevice& d, const bool include_batch_in_index); 68 const Eigen::GpuDevice& d, const bool include_batch_in_index); 79 const T* top_diff, T* bottom_diff, const Eigen::GpuDevice& d);
|
D | tile_functor_gpu_bool.cu.cc | 24 using Eigen::GpuDevice; 26 template struct Tile<GpuDevice, bool, int32>; 27 template struct Tile<GpuDevice, bool, int64>;
|
D | tile_functor_gpu_double.cu.cc | 24 using Eigen::GpuDevice; 26 template struct Tile<GpuDevice, double, int32>; 27 template struct Tile<GpuDevice, double, int64>;
|
D | tile_functor_gpu_float.cu.cc | 24 using Eigen::GpuDevice; 26 template struct Tile<GpuDevice, float, int32>; 27 template struct Tile<GpuDevice, float, int64>;
|
D | tile_functor_gpu_int32.cu.cc | 24 using Eigen::GpuDevice; 26 template struct Tile<GpuDevice, int32, int32>; 27 template struct Tile<GpuDevice, int32, int64>;
|
D | tile_functor_gpu_complex64.cu.cc | 24 using Eigen::GpuDevice; 26 template struct Tile<GpuDevice, complex64, int32>; 27 template struct Tile<GpuDevice, complex64, int64>;
|
D | tile_functor_gpu_complex128.cu.cc | 24 using Eigen::GpuDevice; 26 template struct Tile<GpuDevice, complex128, int32>; 27 template struct Tile<GpuDevice, complex128, int64>;
|
D | tile_functor_gpu_int64.cu.cc | 24 using Eigen::GpuDevice; 26 template struct Tile<GpuDevice, int64, int32>; 27 template struct Tile<GpuDevice, int64, int64>;
|
D | tile_functor_gpu_int16.cu.cc | 24 using Eigen::GpuDevice; 26 template struct Tile<GpuDevice, int16, int32>; 27 template struct Tile<GpuDevice, int16, int64>;
|
/external/eigen/bench/tensors/ |
D | tensor_benchmarks_fp16_gpu.cu | 14 Eigen::GpuDevice device(&stream); \ 15 BenchmarkSuite<Eigen::GpuDevice, Eigen::half> suite(device, N); \ 44 Eigen::GpuDevice device(&stream); \ 45 BenchmarkSuite<Eigen::GpuDevice, Eigen::half> suite(device, D1, D2, D3); \ 63 Eigen::GpuDevice device(&stream); \ 64 BenchmarkSuite<Eigen::GpuDevice, Eigen::half> suite(device, N); \
|
D | tensor_benchmarks_gpu.cu | 14 Eigen::GpuDevice device(&stream); \ 15 BenchmarkSuite<Eigen::GpuDevice, float> suite(device, N); \ 44 Eigen::GpuDevice device(&stream); \ 45 BenchmarkSuite<Eigen::GpuDevice, float> suite(device, D1, D2, D3); \ 63 Eigen::GpuDevice device(&stream); \ 64 BenchmarkSuite<Eigen::GpuDevice, float> suite(device, N); \
|
/external/tensorflow/tensorflow/core/grappler/optimizers/ |
D | implementation_selector_test.cc | 40 constexpr char GpuDevice[] = "/device:GPU:0"; variable 73 NDef("case", "Case", {"x"}, {{"T", DT_FLOAT}}, GpuDevice)}); in TEST_F() 97 NDef("case", "StatelessCase", {"x"}, {{"T", DT_FLOAT}}, GpuDevice)}); in TEST_F() 122 NDef("case", "Case", {"x"}, {{"T", DT_FLOAT}}, GpuDevice), in TEST_F() 124 GpuDevice), in TEST_F() 214 NDef("case", "Case", {"x"}, {{"T", DT_FLOAT}}, GpuDevice), in TEST_F() 216 GpuDevice), in TEST_F() 218 NDef("y1", "XTimesTwo", {"x"}, {{"T", DT_FLOAT}}, GpuDevice), in TEST_F() 219 NDef("z1", "Identity", {"y1"}, {{"T", DT_FLOAT}}, GpuDevice), in TEST_F() 270 NDef("case", "Case", {"x"}, {{"T", DT_FLOAT}}, GpuDevice), in TEST_F() [all …]
|
/external/tensorflow/tensorflow/core/util/ |
D | gpu_launch_config.h | 128 const Eigen::GpuDevice& d) { in GetGpuLaunchConfig() 147 const Eigen::GpuDevice& d) { in GetCudaLaunchConfig() 157 const Eigen::GpuDevice& d, DeviceFunc func, in GetGpuLaunchConfig() 193 int work_element_count, const Eigen::GpuDevice& d, DeviceFunc func, in GetGpuLaunchConfigFixedBlockSize() 227 const Eigen::GpuDevice& d) { in GetGpu2DLaunchConfig() 255 const Eigen::GpuDevice& d) { in GetCuda2DLaunchConfig() 268 const Eigen::GpuDevice& d, in GetGpu3DLaunchConfig() 344 const Eigen::GpuDevice& d, in GetGpu2DLaunchConfig() 356 const Eigen::GpuDevice& d, in GetCuda2DLaunchConfig()
|