Home
last modified time | relevance | path

Searched defs:stream_exec (Results 1 – 25 of 28) sorted by relevance

12

/external/tensorflow/tensorflow/compiler/xla/service/gpu/
Damdgpu_compiler.cc74 HloModule* hlo_module, se::StreamExecutor* stream_exec, in OptimizeHloConvolutionCanonicalization()
95 GpuVersion AMDGPUCompiler::GetGpuVersion(se::StreamExecutor* stream_exec) { in GetGpuVersion()
117 se::StreamExecutor* stream_exec, in CompileTargetBinary()
Dnvptx_compiler.cc108 HloModule* hlo_module, se::StreamExecutor* stream_exec, in OptimizeHloConvolutionCanonicalization()
161 HloModule* hlo_module, se::StreamExecutor* stream_exec, in OptimizeHloPostLayoutAssignment()
287 GpuVersion NVPTXCompiler::GetGpuVersion(se::StreamExecutor* stream_exec) { in GetGpuVersion()
304 se::StreamExecutor* stream_exec, in CompileTargetBinary()
342 se::StreamExecutor* stream_exec, const string& ptx, int cc_major, in CompileGpuAsmOrGetCachedResult()
447 se::StreamExecutor* stream_exec, std::vector<std::vector<uint8>> modules) { in LinkModules()
Dgemm_algorithm_picker.h32 GemmAlgorithmPicker(se::StreamExecutor* stream_exec, in GemmAlgorithmPicker()
Dgpu_conv_algorithm_picker.h40 GpuConvAlgorithmPicker(se::StreamExecutor* stream_exec, in GpuConvAlgorithmPicker()
Dgpu_compiler.cc150 HloModule* hlo_module, se::StreamExecutor* stream_exec, in OptimizeHloModule()
403 HloModule* hlo_module, se::StreamExecutor* stream_exec, in OptimizeHloPostLayoutAssignment()
490 std::unique_ptr<HloModule> module, se::StreamExecutor* stream_exec, in RunHloPasses()
678 se::StreamExecutor* stream_exec, in CompileToTargetBinary()
856 std::unique_ptr<HloModule> module, se::StreamExecutor* stream_exec, in RunBackend()
963 GpuDeviceInfo GetGpuDeviceInfo(se::StreamExecutor* stream_exec) { in GetGpuDeviceInfo()
1100 absl::string_view entry_function_name, se::StreamExecutor* stream_exec, in CompileLmhloToExecutable()
Dgpu_compiler.h130 se::StreamExecutor* stream_exec, in LinkModules()
Dstream_executor_util.cc177 tensorflow::mutex_lock LockGpu(const se::StreamExecutor* stream_exec) { in LockGpu()
196 absl::Span<const uint8> cubin_data, se::StreamExecutor* stream_exec) { in CreateKernel()
Dgpu_conv_algorithm_picker.cc103 se::StreamExecutor* stream_exec) { in GetAlgorithms()
127 se::DeviceMemoryBase result_buffer, se::StreamExecutor* stream_exec, in GetMIOpenAlgorithms()
/external/tensorflow/tensorflow/core/common_runtime/gpu/
Dgpu_debug_allocator_test.cc49 auto stream_exec = ExecutorForPlatformGpuId(platform_gpu_id); in TEST() local
145 auto stream_exec = ExecutorForPlatformGpuId(platform_gpu_id); in TEST() local
187 auto stream_exec = ExecutorForPlatformGpuId(platform_gpu_id); in TEST() local
/external/tensorflow/tensorflow/compiler/xla/
Ddevice_util.h32 string DeviceIdentifier(se::StreamExecutor* stream_exec) { in DeviceIdentifier()
/external/tensorflow/tensorflow/compiler/xla/service/interpreter/
Dcompiler.cc105 std::unique_ptr<HloModule> hlo_module, se::StreamExecutor* stream_exec, in RunBackend()
130 std::vector<std::vector<se::StreamExecutor*>> stream_exec, in Compile()
/external/tensorflow/tensorflow/compiler/xla/tests/
Dllvm_compiler_test.cc45 HloModule* hlo_module, se::StreamExecutor* stream_exec, in OptimizeHloConvolutionCanonicalization()
51 HloModule* hlo_module, se::StreamExecutor* stream_exec, in OptimizeHloPostLayoutAssignment()
62 GpuVersion gpu_version, se::StreamExecutor* stream_exec, bool relocatable, in CompileTargetBinary()
/external/tensorflow/tensorflow/stream_executor/cuda/
Dredzone_allocator_test.cc55 StreamExecutor* stream_exec = platform->ExecutorForDevice(0).ValueOrDie(); in TEST() local
130 StreamExecutor* stream_exec = platform->ExecutorForDevice(0).ValueOrDie(); in TEST() local
/external/tensorflow/tensorflow/stream_executor/
Devent.cc24 Event::Event(StreamExecutor* stream_exec) in Event()
Dstream_executor_pimpl.cc75 ScopedTracer(StreamExecutor *stream_exec, BeginCallT begin_call, in ScopedTracer()
116 MakeScopedTracer(StreamExecutor *stream_exec, BeginCallT begin_call, in MakeScopedTracer()
/external/tensorflow/tensorflow/stream_executor/gpu/
Dgpu_activation.cc34 StreamExecutor* stream_exec) in ScopedActivateExecutorContext()
/external/tensorflow/tensorflow/core/kernels/
Dconv_ops_gpu.h34 inline bool IsVoltaOrLater(const se::StreamExecutor& stream_exec) { in IsVoltaOrLater()
164 se::StreamExecutor* stream_exec) const { in ShouldIncludeWinogradNonfusedAlgo()
Dgpu_utils.cc135 se::StreamExecutor* stream_exec, in LogConvAutotuneResults()
179 se::StreamExecutor* stream_exec, absl::Span<const AutotuneResult> results) { in LogFusedConvForwardAutotuneResults()
/external/tensorflow/tensorflow/core/common_runtime/device/
Ddevice_host_allocator.h29 explicit DeviceHostAllocator(se::StreamExecutor* stream_exec, int numa_node, in DeviceHostAllocator()
Ddevice_mem_allocator.h31 explicit DeviceMemAllocator(se::StreamExecutor* stream_exec, in DeviceMemAllocator()
Ddevice_event_mgr_test.cc112 auto stream_exec = GPUMachineManager()->ExecutorForDevice(0).ValueOrDie(); in TEST() local
121 auto stream_exec = GPUMachineManager()->ExecutorForDevice(0).ValueOrDie(); in TEST() local
443 auto stream_exec = GPUMachineManager()->ExecutorForDevice(0).ValueOrDie(); in BM_no_ops() local
/external/tensorflow/tensorflow/stream_executor/tpu/
Dtpu_executable_interface.cc59 auto stream_exec = stream->parent(); in AllocateOutputMemoryWithInputReuse() local
/external/tensorflow/tensorflow/compiler/xla/service/gpu/tests/
Dmlir_gpu_test_base.cc53 se::StreamExecutor* stream_exec = stream->parent(); in CompileMlirModule() local
/external/tensorflow/tensorflow/compiler/xla/service/
Dcompiler.h233 std::vector<std::vector<se::StreamExecutor*>> stream_exec, in Compile()
/external/tensorflow/tensorflow/core/tpu/
Dtpu_on_demand_compiler.cc277 std::vector<std::vector<stream_executor::StreamExecutor*>> stream_exec, in Compile()

12