/external/tensorflow/tensorflow/compiler/xla/service/gpu/ |
D | cudnn_conv_runner.cc | 218 BatchDescriptor output_descriptor(effective_num_dimensions); in RunCudnnConvImpl() local 219 output_descriptor.set_layout(output_dl) in RunCudnnConvImpl() 224 output_descriptor.set_spatial_dim( in RunCudnnConvImpl() 232 output_descriptor.set_spatial_dim(static_cast<DimIndex>(0), 1); in RunCudnnConvImpl() 247 convolution_descriptor, output_descriptor, &output_buf, in RunCudnnConvImpl() 257 filter_descriptor, filter_buf, output_descriptor, output_buf, in RunCudnnConvImpl() 268 input_descriptor, input_buf, output_descriptor, output_buf, in RunCudnnConvImpl() 303 output_descriptor, &output_buf, scratch_allocator, algorithm, in RunCudnnConvImpl()
|
/external/tensorflow/tensorflow/stream_executor/ |
D | dnn.h | 1124 const dnn::BatchDescriptor& output_descriptor, 1141 const dnn::BatchDescriptor& output_descriptor, 1160 const dnn::BatchDescriptor& output_descriptor, 1179 const dnn::BatchDescriptor& output_descriptor, 1193 const BatchDescriptor& output_descriptor, 1201 input_data, filter_descriptor, filter_data, output_descriptor, 1244 const BatchDescriptor& output_descriptor, DeviceMemoryBase output_data, 1255 const dnn::BatchDescriptor& output_descriptor, 1263 filter_data, output_descriptor, *output_data, 1290 const dnn::BatchDescriptor& output_descriptor, [all …]
|
D | stream.cc | 449 const dnn::BatchDescriptor &output_descriptor, DeviceMemory<double> *output, in ThenFusedConvolveWithAlgorithm() argument 457 PARAM(activation_mode), PARAM(output_descriptor), PARAM(output), in ThenFusedConvolveWithAlgorithm() 466 activation_mode, output_descriptor, output, scratch_allocator, in ThenFusedConvolveWithAlgorithm() 487 const dnn::BatchDescriptor &output_descriptor, DeviceMemory<float> *output, in ThenFusedConvolveWithAlgorithm() argument 495 PARAM(activation_mode), PARAM(output_descriptor), PARAM(output), in ThenFusedConvolveWithAlgorithm() 504 activation_mode, output_descriptor, output, scratch_allocator, in ThenFusedConvolveWithAlgorithm() 526 const dnn::BatchDescriptor &output_descriptor, in ThenFusedConvolveWithAlgorithm() argument 535 PARAM(output_descriptor), PARAM(output), PARAM(algorithm_config)); in ThenFusedConvolveWithAlgorithm() 543 activation_mode, output_descriptor, output, scratch_allocator, in ThenFusedConvolveWithAlgorithm() 564 const dnn::BatchDescriptor &output_descriptor, DeviceMemory<int8> *output, in ThenFusedConvolveWithAlgorithm() argument [all …]
|
D | stream.h | 281 const dnn::BatchDescriptor &output_descriptor, 291 const dnn::BatchDescriptor &output_descriptor, 301 const dnn::BatchDescriptor &output_descriptor, 310 const dnn::BatchDescriptor &output_descriptor, 321 const dnn::BatchDescriptor &output_descriptor, 332 const dnn::BatchDescriptor &output_descriptor, 346 const dnn::BatchDescriptor &output_descriptor, 360 const dnn::BatchDescriptor &output_descriptor, 375 const dnn::BatchDescriptor &output_descriptor, 389 const dnn::BatchDescriptor &output_descriptor, DeviceMemory<int8> *output, [all …]
|
/external/tensorflow/tensorflow/stream_executor/cuda/ |
D | cuda_dnn.h | 267 const dnn::BatchDescriptor& output_descriptor, 282 const dnn::BatchDescriptor& output_descriptor, 296 const dnn::BatchDescriptor& output_descriptor, 313 const dnn::BatchDescriptor& output_descriptor, 328 const dnn::BatchDescriptor& output_descriptor, 340 const dnn::BatchDescriptor& output_descriptor, in DoConvolveQuantized() argument 353 const dnn::BatchDescriptor& output_descriptor, in DoConvolveQuantized() argument 366 const dnn::BatchDescriptor& output_descriptor, in DoSeparableConvolve() argument 592 const dnn::BatchDescriptor& output_descriptor, 656 const dnn::BatchDescriptor& output_descriptor,
|
D | cuda_dnn.cc | 2629 DeviceMemoryBase filter_data, const dnn::BatchDescriptor& output_descriptor, in DoPrepareForConvolution() argument 2642 output_descriptor, in DoPrepareForConvolution() 2643 ToCudnnDataType(element_type, output_descriptor.layout())); in DoPrepareForConvolution() 2687 DeviceMemoryBase filter_data, const dnn::BatchDescriptor& output_descriptor, in DoConvolve() argument 2694 CudnnTensorDescriptor output_nd(output_descriptor, cudnn_type); in DoConvolve() 2745 output_descriptor.feature_map_count())); in DoConvolve() 2749 output_descriptor.feature_map_count())); in DoConvolve() 2755 output_descriptor)) { in DoConvolve() 2768 output_descriptor)) { in DoConvolve() 2782 output_descriptor.layout() == dnn::DataLayout::kBatchDepthYX && in DoConvolve() [all …]
|
/external/tensorflow/tensorflow/stream_executor/rocm/ |
D | rocm_dnn.h | 258 const dnn::BatchDescriptor& output_descriptor, 273 const dnn::BatchDescriptor& output_descriptor, 287 const dnn::BatchDescriptor& output_descriptor, 304 const dnn::BatchDescriptor& output_descriptor, 319 const dnn::BatchDescriptor& output_descriptor, 331 const dnn::BatchDescriptor& output_descriptor, in DoConvolveQuantized() argument 344 const dnn::BatchDescriptor& output_descriptor, in DoConvolveQuantized() argument 357 const dnn::BatchDescriptor& output_descriptor, in DoSeparableConvolve() argument 541 const dnn::BatchDescriptor& output_descriptor, 715 const dnn::BatchDescriptor& output_descriptor, [all …]
|
D | rocm_dnn.cc | 936 miopenTensorDescriptor_t output_descriptor, in Execute() argument 940 output_descriptor, output_data, fusion_args_); in Execute() 2595 DeviceMemoryBase filter_data, const dnn::BatchDescriptor& output_descriptor, in DoPrepareForConvolution() argument 2608 output_descriptor, in DoPrepareForConvolution() 2609 ToMIOpenDataType(element_type, output_descriptor.layout())}; in DoPrepareForConvolution() 2775 BatchDescriptor* output_descriptor, DeviceMemoryBase backward_output_data, in MaybeTransformLayout() argument 2777 if (output_descriptor->layout() == dnn::DataLayout::kBatchDepthYX) { in MaybeTransformLayout() 2780 CHECK(output_descriptor->layout() == dnn::DataLayout::kBatchYXDepth); in MaybeTransformLayout() 2785 transformed_output_descriptor.CloneFrom(*output_descriptor); in MaybeTransformLayout() 2788 *output_descriptor, static_cast<miopenDataType_t>(miopen_type)}; in MaybeTransformLayout() [all …]
|