/external/tensorflow/tensorflow/core/kernels/ |
D | matmul_op.cc | 291 AlgorithmConfig algorithm_config(kNoAlgorithm); in launch() local 300 &algorithm_config)) { in launch() 360 algorithm_config.set_algorithm(best_result.algorithm()); in launch() 363 algorithm_config); in launch() 364 if (algorithm_config.algorithm() != kNoAlgorithm && in launch() 365 algorithm_config.algorithm() != kDefaultBlasGemm && in launch() 366 algorithm_config.algorithm() != kDefaultBlasGemv) { in launch() 372 &c_ptr, n, computation_type, algorithm_config.algorithm(), in launch() 394 algorithm_config.algorithm() == kNoAlgorithm || in launch() 395 algorithm_config.algorithm() == kDefaultBlasGemm || in launch() [all …]
|
D | conv_ops_fused_impl.h | 507 se::dnn::AlgorithmConfig* algorithm_config) { 509 if (AutoTuneFusedConv::GetInstance()->Find(params, algorithm_config)) { 548 TF_RETURN_IF_ERROR(BestCudnnConvAlgorithm(results, algorithm_config)); 549 AutoTuneFusedConv::GetInstance()->Insert(params, *algorithm_config); 776 const auto launch = [&](se::dnn::AlgorithmConfig algorithm_config, 789 scratch_allocator, algorithm_config, profile_result) 793 se::dnn::AlgorithmConfig algorithm_config; 802 &algorithm_config); 807 bool cudnn_launch_status = launch(algorithm_config, &scratch_allocator,
|
D | conv_ops_3d.cc | 435 AlgorithmConfig algorithm_config; in launch() local 438 conv_parameters, &algorithm_config)) { in launch() 480 OP_REQUIRES_OK(ctx, BestCudnnConvAlgorithm(results, &algorithm_config)); in launch() 481 AutoTuneConv3d::GetInstance()->Insert(conv_parameters, algorithm_config); in launch() 490 algorithm_config, nullptr) in launch()
|
D | conv_grad_ops_3d.cc | 1357 AlgorithmConfig algorithm_config; in Compute() local 1359 conv_parameters, &algorithm_config)) { in Compute() 1398 algorithm_config.set_algorithm(best_result.algorithm()); in Compute() 1401 algorithm_config.set_algorithm_no_scratch( in Compute() 1405 algorithm_config); in Compute() 1414 algorithm_config, nullptr) in Compute() 1763 AlgorithmConfig algorithm_config; in Compute() local 1765 conv_parameters, &algorithm_config)) { in Compute() 1805 algorithm_config.set_algorithm(best_result.algorithm()); in Compute() 1808 algorithm_config.set_algorithm_no_scratch( in Compute() [all …]
|
D | conv_ops.cc | 847 AlgorithmConfig algorithm_config; in operator ()() local 849 !AutoTuneConv::GetInstance()->Find(conv_parameters, &algorithm_config)) { in operator ()() 890 OP_REQUIRES_OK(ctx, BestCudnnConvAlgorithm(results, &algorithm_config)); in operator ()() 891 AutoTuneConv::GetInstance()->Insert(conv_parameters, algorithm_config); in operator ()() 900 algorithm_config, nullptr) in operator ()()
|
D | conv_grad_filter_ops.cc | 839 AlgorithmConfig algorithm_config; in operator ()() local 841 conv_parameters, &algorithm_config)) { in operator ()() 879 OP_REQUIRES_OK(ctx, BestCudnnConvAlgorithm(results, &algorithm_config)); in operator ()() 881 algorithm_config); in operator ()() 889 algorithm_config, nullptr) in operator ()()
|
D | conv_grad_input_ops.cc | 951 AlgorithmConfig algorithm_config; in operator ()() local 953 conv_parameters, &algorithm_config)) { in operator ()() 990 OP_REQUIRES_OK(ctx, BestCudnnConvAlgorithm(results, &algorithm_config)); in operator ()() 992 algorithm_config); in operator ()() 999 algorithm_config, nullptr) in operator ()()
|
/external/tensorflow/tensorflow/stream_executor/cuda/ |
D | cuda_dnn.cc | 1010 const dnn::AlgorithmConfig& algorithm_config, in CudnnRnnDescriptor() argument 1019 rnn_algo_(ToCudnnRNNAlgo(algorithm_config.algorithm())), in CudnnRnnDescriptor() 1025 algorithm_config_(algorithm_config), in CudnnRnnDescriptor() 1037 const dnn::AlgorithmConfig& algorithm_config, float dropout, uint64 seed, in Create() argument 1044 cudnnRNNAlgo_t rnn_algo = ToCudnnRNNAlgo(algorithm_config.algorithm()); in Create() 1091 if (RnnTensorOpMathEnabled() && algorithm_config.algorithm().has_value()) { in Create() 1093 algorithm_config.algorithm()->tensor_ops_enabled() in Create() 1103 compute_type, algorithm_config, in Create() 1117 const dnn::AlgorithmConfig& algorithm_config() const { in algorithm_config() function in stream_executor::gpu::CudnnRnnDescriptor 1649 auto algo_desc = *rnn_desc.algorithm_config().algorithm(); in DoRnnForwardImpl() [all …]
|
D | cuda_dnn.h | 54 const dnn::AlgorithmConfig& algorithm_config, float dropout, uint64 seed, 284 const dnn::AlgorithmConfig& algorithm_config, 298 const dnn::AlgorithmConfig& algorithm_config, 316 const dnn::AlgorithmConfig& algorithm_config, 330 const dnn::AlgorithmConfig& algorithm_config, 595 const dnn::AlgorithmConfig& algorithm_config, 659 const dnn::AlgorithmConfig& algorithm_config,
|
/external/tensorflow/tensorflow/contrib/fused_conv/kernels/ |
D | fused_conv2d_bias_activation_op.cc | 692 dnn::AlgorithmConfig algorithm_config; in launch() local 694 fused_conv_parameters, &algorithm_config)) { in launch() 748 ctx, internal::BestCudnnConvAlgorithm(results, &algorithm_config)); in launch() 750 algorithm_config); in launch() 760 &output_ptr, &scratch_allocator, algorithm_config, in launch()
|
/external/tensorflow/tensorflow/stream_executor/rocm/ |
D | rocm_dnn.h | 52 const dnn::AlgorithmConfig& algorithm_config, float dropout, uint64 seed, 275 const dnn::AlgorithmConfig& algorithm_config, 289 const dnn::AlgorithmConfig& algorithm_config, 307 const dnn::AlgorithmConfig& algorithm_config, 321 const dnn::AlgorithmConfig& algorithm_config, 766 const dnn::AlgorithmConfig& algorithm_config,
|
D | rocm_dnn.cc | 2279 const dnn::AlgorithmConfig& algorithm_config, float dropout, uint64 seed, in createRnnDescriptor() argument 2598 const dnn::AlgorithmConfig& algorithm_config, in DoPrepareForConvolution() argument 2616 absl::optional<dnn::AlgorithmDesc> algo_desc = algorithm_config.algorithm(); in DoPrepareForConvolution() 3156 const dnn::AlgorithmConfig& algorithm_config, in DoFusedConvolve() argument 3173 const dnn::AlgorithmConfig& algorithm_config, in DoFusedConvolve() argument 3191 const dnn::AlgorithmConfig& algorithm_config, in DoFusedConvolve() argument 3208 const dnn::AlgorithmConfig& algorithm_config, in DoFusedConvolve() argument
|
/external/tensorflow/tensorflow/stream_executor/ |
D | dnn.h | 1126 const dnn::AlgorithmConfig& algorithm_config, 1143 const dnn::AlgorithmConfig& algorithm_config, 1163 const dnn::AlgorithmConfig& algorithm_config, 1181 const dnn::AlgorithmConfig& algorithm_config, 1196 const AlgorithmConfig& algorithm_config, 1202 output_data, convolution_descriptor, algorithm_config, 2046 const dnn::AlgorithmConfig& algorithm_config, 2550 const AlgorithmConfig& algorithm_config,
|
D | stream.h | 312 const dnn::AlgorithmConfig &algorithm_config, 323 const dnn::AlgorithmConfig &algorithm_config, 334 const dnn::AlgorithmConfig &algorithm_config, 348 const dnn::AlgorithmConfig &algorithm_config, 362 const dnn::AlgorithmConfig &algorithm_config, 377 const dnn::AlgorithmConfig &algorithm_config, 391 const dnn::AlgorithmConfig &algorithm_config, 413 const dnn::AlgorithmConfig &algorithm_config, 425 const dnn::AlgorithmConfig &algorithm_config, 437 const dnn::AlgorithmConfig &algorithm_config, [all …]
|
D | stream.cc | 451 const dnn::AlgorithmConfig &algorithm_config, in ThenFusedConvolveWithAlgorithm() argument 458 PARAM(algorithm_config)); in ThenFusedConvolveWithAlgorithm() 467 algorithm_config, output_profile_result); in ThenFusedConvolveWithAlgorithm() 489 const dnn::AlgorithmConfig &algorithm_config, in ThenFusedConvolveWithAlgorithm() argument 496 PARAM(algorithm_config)); in ThenFusedConvolveWithAlgorithm() 505 algorithm_config, output_profile_result); in ThenFusedConvolveWithAlgorithm() 528 const dnn::AlgorithmConfig &algorithm_config, in ThenFusedConvolveWithAlgorithm() argument 535 PARAM(output_descriptor), PARAM(output), PARAM(algorithm_config)); in ThenFusedConvolveWithAlgorithm() 544 algorithm_config, output_profile_result); in ThenFusedConvolveWithAlgorithm() 566 const dnn::AlgorithmConfig &algorithm_config, in ThenFusedConvolveWithAlgorithm() argument [all …]
|
D | stream_executor_pimpl.cc | 385 const dnn::AlgorithmConfig &algorithm_config, float dropout, uint64 seed, in createRnnDescriptor() argument 394 direction_mode, rnn_mode, data_type, algorithm_config, dropout, seed, in createRnnDescriptor()
|
D | stream_executor_pimpl.h | 411 const dnn::AlgorithmConfig &algorithm_config, float dropout, uint64 seed,
|