/external/tensorflow/tensorflow/compiler/xla/service/gpu/llvm_gpu_backend/ |
D | gpu_backend_lib.cc | 145 const HloModuleConfig& hlo_module_config, absl::string_view feature_str) { in GetTargetMachine() argument 164 switch (hlo_module_config.debug_options().xla_backend_optimization_level()) { in GetTargetMachine() 339 const HloModuleConfig& hlo_module_config, in NVPTXTargetModuleLinker() argument 353 hlo_module_config.debug_options().xla_gpu_ftz()); in NVPTXTargetModuleLinker() 356 if (hlo_module_config.debug_options().xla_gpu_ftz()) { in NVPTXTargetModuleLinker() 367 const HloModuleConfig& hlo_module_config) { in NVPTXGetTargetMachine() argument 371 hlo_module_config, "+ptx60"); in NVPTXGetTargetMachine() 378 const HloModuleConfig& hlo_module_config, in LinkAndOptimizeModule() argument 384 TF_RETURN_IF_ERROR(module_linker(module, gpu_version, hlo_module_config, in LinkAndOptimizeModule() 416 hlo_module_config.debug_options().xla_backend_optimization_level(); in LinkAndOptimizeModule() [all …]
|
D | gpu_backend_lib.h | 44 const HloModuleConfig& hlo_module_config, const string& libdevice_dir_path, 54 const HloModuleConfig& hlo_module_config, const string& rocdl_dir_path);
|
D | BUILD | 55 "//tensorflow/compiler/xla/service:hlo_module_config",
|
/external/tensorflow/tensorflow/compiler/xla/service/gpu/ |
D | nvptx_compiler.cc | 70 const HloModuleConfig& hlo_module_config) { in PrintCantFindCudaMessage() argument 74 for (const auto& dir : CandidateCudaRoots(hlo_module_config)) { in PrintCantFindCudaMessage() 84 string GetLibdeviceDir(const HloModuleConfig& hlo_module_config) { in GetLibdeviceDir() argument 85 for (const string& cuda_root : CandidateCudaRoots(hlo_module_config)) { in GetLibdeviceDir() 98 hlo_module_config); in GetLibdeviceDir() 343 int cc_minor, const HloModuleConfig& hlo_module_config, bool relocatable) { in CompileGpuAsmOrGetCachedResult() argument 372 auto ptxas_config = PtxOptsFromConfig(hlo_module_config); in CompileGpuAsmOrGetCachedResult() 386 if (!hlo_module_config.debug_options() in CompileGpuAsmOrGetCachedResult() 391 hlo_module_config); in CompileGpuAsmOrGetCachedResult() 414 hlo_module_config); in CompileGpuAsmOrGetCachedResult()
|
D | ir_emitter_nested.cc | 38 IrEmitterNested::IrEmitterNested(const HloModuleConfig& hlo_module_config, in IrEmitterNested() argument 41 : IrEmitter(hlo_module_config, ir_emitter_context, /*is_nested=*/true), in IrEmitterNested() 45 const HloModuleConfig& hlo_module_config, in Create() argument 49 hlo_module_config, nested_computation, ir_emitter_context)); in Create()
|
D | ir_emitter_nested.h | 43 const HloModuleConfig& hlo_module_config, 67 IrEmitterNested(const HloModuleConfig& hlo_module_config,
|
D | gemm_algorithm_picker.cc | 67 const HloModuleConfig& hlo_module_config = gemm->GetModule()->config(); in DoUncachedGemmAutotune() local 69 hlo_module_config.debug_options().xla_gpu_autotune_level() > 1; in DoUncachedGemmAutotune() 71 stream, allocator, PtxOptsFromConfig(hlo_module_config), in DoUncachedGemmAutotune() 74 BufferComparator comparator(gemm->shape(), hlo_module_config); in DoUncachedGemmAutotune()
|
D | stream_executor_util.cc | 226 se::GpuAsmOpts PtxOptsFromConfig(const HloModuleConfig& hlo_module_config) { in PtxOptsFromConfig() argument 228 hlo_module_config.debug_options().xla_gpu_asm_extra_flags(); in PtxOptsFromConfig() 232 hlo_module_config.debug_options().xla_gpu_disable_gpuasm_optimizations(), in PtxOptsFromConfig() 233 hlo_module_config.debug_options().xla_gpu_cuda_data_dir(), extra_flags); in PtxOptsFromConfig()
|
D | gpu_conv_algorithm_picker.cc | 389 const HloModuleConfig& hlo_module_config = instr->GetModule()->config(); in PickBestAlgorithmNoCacheCuda() local 391 hlo_module_config.debug_options().xla_gpu_autotune_level(); in PickBestAlgorithmNoCacheCuda() 404 stream, allocator, PtxOptsFromConfig(hlo_module_config)); in PickBestAlgorithmNoCacheCuda() 464 stream, allocator, PtxOptsFromConfig(hlo_module_config)); in PickBestAlgorithmNoCacheCuda() 565 comparator.emplace(result_shape, hlo_module_config); in PickBestAlgorithmNoCacheCuda() 640 !hlo_module_config.debug_options().xla_gpu_deterministic_ops()) { in PickBestAlgorithmNoCacheCuda()
|
D | stream_executor_util.h | 79 se::GpuAsmOpts PtxOptsFromConfig(const HloModuleConfig& hlo_module_config);
|
D | nvptx_compiler.h | 79 int cc_minor, const HloModuleConfig& hlo_module_config, bool relocatable);
|
D | elemental_ir_emitter.cc | 73 const HloModuleConfig& hlo_module_config, llvm::Module* module, in GpuElementalIrEmitter() argument 76 hlo_module_config_(hlo_module_config), in GpuElementalIrEmitter()
|
D | elemental_ir_emitter.h | 46 GpuElementalIrEmitter(const HloModuleConfig& hlo_module_config,
|
D | ir_emitter.h | 116 explicit IrEmitter(const HloModuleConfig& hlo_module_config,
|
D | ir_emitter_unnested.h | 150 const HloModuleConfig& hlo_module_config, 240 IrEmitterUnnested(const HloModuleConfig& hlo_module_config,
|
D | ir_emitter.cc | 79 IrEmitter::IrEmitter(const HloModuleConfig& hlo_module_config, in IrEmitter() argument 87 hlo_module_config_(hlo_module_config) { in IrEmitter()
|
/external/tensorflow/tensorflow/compiler/xla/service/gpu/tests/ |
D | BUILD | 117 "//tensorflow/compiler/xla/service:hlo_module_config", 144 "//tensorflow/compiler/xla/service:hlo_module_config", 171 "//tensorflow/compiler/xla/service:hlo_module_config", 198 "//tensorflow/compiler/xla/service:hlo_module_config", 225 "//tensorflow/compiler/xla/service:hlo_module_config", 252 "//tensorflow/compiler/xla/service:hlo_module_config", 277 "//tensorflow/compiler/xla/service:hlo_module_config", 315 "//tensorflow/compiler/xla/service:hlo_module_config", 327 "//tensorflow/compiler/xla/service:hlo_module_config", 358 "//tensorflow/compiler/xla/service:hlo_module_config", [all …]
|
/external/tensorflow/tensorflow/compiler/xla/service/cpu/ |
D | dot_op_emitter.cc | 131 const HloModuleConfig& hlo_module_config, 240 mlir::MLIRContext* mlir_context, const HloModuleConfig& hlo_module_config, in DotOpEmitter() argument 251 hlo_module_config_(hlo_module_config), in DotOpEmitter() 1044 mlir::MLIRContext* mlir_context, const HloModuleConfig& hlo_module_config, in EmitNonBatchDotOperation() argument 1054 hlo_module_config, target_machine_features); in EmitNonBatchDotOperation() 1128 mlir::MLIRContext* mlir_context, const HloModuleConfig& hlo_module_config, in EmitBatchDotOperation() argument 1186 executable_run_options_value, b, mlir_context, hlo_module_config, in EmitBatchDotOperation() 1237 const HloModuleConfig& hlo_module_config, in EmitDotOperation() argument 1247 hlo_module_config, target_machine_features); in EmitDotOperation() 1253 hlo_module_config, target_machine_features); in EmitDotOperation()
|
D | dot_op_emitter.h | 68 const HloModuleConfig& hlo_module_config,
|
D | BUILD | 394 "//tensorflow/compiler/xla/service:hlo_module_config", 461 "//tensorflow/compiler/xla/service:hlo_module_config", 493 "//tensorflow/compiler/xla/service:hlo_module_config", 522 "//tensorflow/compiler/xla/service:hlo_module_config", 1086 "//tensorflow/compiler/xla/service:hlo_module_config",
|
/external/tensorflow/tensorflow/compiler/mlir/tools/kernel_gen/transforms/ |
D | gpu_kernel_to_blob_pass.cc | 235 const xla::HloModuleConfig& hlo_module_config) { in GetLibdeviceDir() argument 237 hlo_module_config.debug_options().xla_gpu_cuda_data_dir())) { in GetLibdeviceDir()
|
D | BUILD | 141 "//tensorflow/compiler/xla/service:hlo_module_config",
|
/external/tensorflow/tensorflow/compiler/xla/service/interpreter/ |
D | BUILD | 50 "//tensorflow/compiler/xla/service:hlo_module_config", 119 "//tensorflow/compiler/xla/service:hlo_module_config",
|
/external/tensorflow/tensorflow/compiler/xla/service/llvm_ir/ |
D | BUILD | 77 "//tensorflow/compiler/xla/service:hlo_module_config",
|
/external/tensorflow/tensorflow/stream_executor/tpu/ |
D | BUILD | 55 "//tensorflow/compiler/xla/service:hlo_module_config",
|