Home
last modified time | relevance | path

Searched defs:compute_capability (Results 1 – 12 of 12) sorted by relevance

/external/tensorflow/tensorflow/compiler/xla/service/gpu/
Dcudnn_pad_for_convolutions.h34 explicit CudnnPadForConvolutions(se::CudaComputeCapability compute_capability) in CudnnPadForConvolutions()
Dcudnn_vectorize_convolutions.h49 se::CudaComputeCapability compute_capability) in CudnnVectorizeConvolutions()
Dcudnn_support_utils.cc28 const se::CudaComputeCapability& compute_capability, in CudnnSupportsOptimizedIntegerConvolution()
Dcudnn_vectorize_convolutions.cc261 const se::CudaComputeCapability& compute_capability, in TryRevectorizeConv()
399 const se::CudaComputeCapability& compute_capability, in TryVectorizeConv()
Dcudnn_vectorize_convolutions_test.cc37 StatusOr<bool> Run(std::pair<int, int> compute_capability, in Run() argument
Dcudnn_pad_for_convolutions.cc295 int pad_to, const se::CudaComputeCapability& compute_capability, in TryResolvePaddedShapesForIntegerConvolution()
Dcudnn_simplify_padding_test.cc46 StatusOr<bool> RunEndToEnd(std::pair<int, int> compute_capability, in RunEndToEnd() argument
/external/tensorflow/tensorflow/compiler/xla/service/gpu/llvm_gpu_backend/
Dgpu_backend_lib.cc89 static std::string GetSmName(se::CudaComputeCapability compute_capability) { in GetSmName()
360 llvm::Triple target_triple, se::CudaComputeCapability compute_capability, in NVPTXGetTargetMachine()
535 auto compute_capability = in CompileToPtx() local
793 auto compute_capability = in AMDGPUTargetModuleLinker() local
863 auto compute_capability = in AMDGPUGetTargetMachine() local
923 auto compute_capability = in CompileToHsaco() local
/external/tensorflow/tensorflow/core/profiler/protobuf/
Dhardware_types.proto29 GPUComputeCapability compute_capability = 5; field
/external/tensorflow/tensorflow/core/protobuf/
Dautotuning.proto98 ComputeCapability compute_capability = 4; field
/external/tensorflow/tensorflow/core/grappler/optimizers/
Dgeneric_layout_optimizer.cc63 double compute_capability = 0.0; in GetNumGPUs() local
Dremapper.cc423 double compute_capability = 0.0; in RuntimeFusionEnabled() local