Home
last modified time | relevance | path

Searched refs:gpu_stream (Results 1 – 25 of 30) sorted by relevance

12

/external/tensorflow/tensorflow/compiler/xla/service/gpu/
Dnccl_all_to_all_thunk.cc87 se::gpu::GpuStreamHandle gpu_stream = se::gpu::AsGpuStreamValue(&stream); in RunAllToAll() local
120 gpu_stream)); in RunAllToAll()
123 gpu_stream)); in RunAllToAll()
144 /*rank=*/i, comm, gpu_stream)); in RunAllToAll()
146 /*rank=*/i, comm, gpu_stream)); in RunAllToAll()
Dnccl_collective_permute_thunk.cc206 se::gpu::GpuStreamHandle gpu_stream = se::gpu::AsGpuStreamValue(&stream); in RunCollectivePermute() local
214 static_cast<const void*>(comm), gpu_stream); in RunCollectivePermute()
216 *target_id, comm, gpu_stream)); in RunCollectivePermute()
225 static_cast<const void*>(comm), gpu_stream); in RunCollectivePermute()
227 *source_id, comm, gpu_stream)); in RunCollectivePermute()
Dnccl_all_gather_thunk.cc71 se::gpu::GpuStreamHandle gpu_stream = se::gpu::AsGpuStreamValue(&stream); in RunAllGather() local
89 gpu_stream); in RunAllGather()
92 send_buffer, recv_buffer, element_count, dtype, comm, gpu_stream)); in RunAllGather()
Dcustom_call_thunk.cc59 auto gpu_stream = se::gpu::AsGpuStreamValue(params.stream); in ExecuteOnStream() local
61 call_target_(gpu_stream, buffers.data(), opaque_.data(), opaque_.size(), in ExecuteOnStream()
Dnccl_all_reduce_thunk.cc51 se::gpu::GpuStreamHandle gpu_stream = se::gpu::AsGpuStreamValue(&stream); in RunAllReduce() local
68 gpu_stream); in RunAllReduce()
72 comm, gpu_stream)); in RunAllReduce()
379 se::gpu::GpuStreamHandle gpu_stream = se::gpu::AsGpuStreamValue(&stream); in RunReduceScatter() local
407 gpu_stream); in RunReduceScatter()
410 comm, gpu_stream)); in RunReduceScatter()
Druntime_intrinsics.cc41 config.gpu_stream = stream_handle; in AssertOnGpu()
Dcusolver_context.cc302 const gpuStream_t* gpu_stream = in Create() local
305 TF_RETURN_IF_ERROR(ConvertStatus(GpuSolverSetStream(handle, *gpu_stream))); in Create()
Dbef_thunk.cc246 tfrt::gpu::wrapper::Stream(se_gpu_stream->gpu_stream())); in CreateGpuStream()
/external/tensorflow/tensorflow/compiler/xla/stream_executor/
Dexecutor_cache.cc75 if (config.gpu_stream) { in Get()
80 if (executor->FindAllocatedStream(config.gpu_stream)) { in Get()
87 absl::StrFormat("No executors own stream %p", config.gpu_stream)); in Get()
Dplatform.h83 void* gpu_stream = nullptr; member
Dstream_executor_pimpl.h545 Stream* FindAllocatedStream(void* gpu_stream) { in FindAllocatedStream() argument
546 return implementation()->FindAllocatedStream(gpu_stream); in FindAllocatedStream()
/external/tensorflow/tensorflow/compiler/xla/stream_executor/gpu/
DBUILD98 ":gpu_stream",
156 hdrs = if_gpu_is_configured(["gpu_stream.h"]),
165 name = "gpu_stream",
166 srcs = if_gpu_is_configured(["gpu_stream.cc"]),
167 hdrs = if_gpu_is_configured(["gpu_stream.h"]),
194 ":gpu_stream",
Dgpu_stream.h70 GpuStreamHandle gpu_stream() const { in gpu_stream() function
76 GpuStreamHandle cuda_stream() const { return gpu_stream(); } in cuda_stream()
Dgpu_timer.cc76 parent_->gpu_context(), start_event_, stream->gpu_stream()); in Start()
85 parent_->gpu_context(), stop_event_, stream->gpu_stream()); in Stop()
Dgpu_event.cc41 stream->gpu_stream()); in Record()
Dgpu_stream.cc58 return AsGpuStream(stream)->gpu_stream(); in AsGpuStreamValue()
Dgpu_executor.h302 Stream* FindAllocatedStream(void* gpu_stream) override { in FindAllocatedStream() argument
304 auto it = alive_gpu_streams_.find(gpu_stream); in FindAllocatedStream()
/external/tensorflow/tensorflow/stream_executor/gpu/
DBUILD104 hdrs = if_gpu_is_configured(["gpu_stream.h"]),
109 name = "gpu_stream",
110 hdrs = if_gpu_is_configured(["gpu_stream.h"]),
111 deps = ["//tensorflow/compiler/xla/stream_executor/gpu:gpu_stream"],
/external/tensorflow/tensorflow/compiler/xla/stream_executor/cuda/
Dstream_search_test.cc35 config.gpu_stream = bad_ptr; in TEST_F()
59 c.gpu_stream = gpu_ptr; in TEST_F()
Dcuda_platform.cc162 if (config.gpu_stream) { in GetExecutor()
/external/tensorflow/tensorflow/core/profiler/utils/
Dgroup_events_test.cc235 auto gpu_stream = device_plane_builder.GetOrCreateLine(0); in TEST() local
244 CreateXEvent(&device_plane_builder, &gpu_stream, kTF1GpuEvent, 200, 300, in TEST()
257 CreateXEvent(&device_plane_builder, &gpu_stream, kLegacyGpuEvent, 300, 400, in TEST()
269 CreateXEvent(&device_plane_builder, &gpu_stream, kEagerOpGpuEvent, 400, 500, in TEST()
281 CreateXEvent(&device_plane_builder, &gpu_stream, kEagerFuncGpuEvent, 500, 600, in TEST()
/external/tensorflow/tensorflow/compiler/tf2xla/kernels/
Dlight_outside_compilation.cc325 const void* gpu_stream = reinterpret_cast<const void*>( in ReinitializeGpuDevice() local
328 context, gpu_stream, in ReinitializeGpuDevice()
413 config.gpu_stream = stream_handle; in CallTfKernel()
/external/tensorflow/tensorflow/core/common_runtime/gpu/
Dgpu_device.h61 void Reinitialize(OpKernelContext* context, const void* gpu_stream,
65 void Reinitialize(OpKernelContext* context, const void* gpu_stream,
Dgpu_device.cc128 void Reinitialize(OpKernelContext* context, const gpuStream_t* gpu_stream, in Reinitialize() argument
139 stream_ = gpu_stream; in Reinitialize()
903 const void* gpu_stream, in Reinitialize() argument
911 ->Reinitialize(context, static_cast<const gpuStream_t*>(gpu_stream), in Reinitialize()
916 const void* gpu_stream, in Reinitialize() argument
921 ->Reinitialize(context, static_cast<const gpuStream_t*>(gpu_stream), in Reinitialize()
1165 const gpuStream_t* gpu_stream = reinterpret_cast<const gpuStream_t*>( in ReinitializeDevice() local
1167 concrete_device->Reinitialize(context, gpu_stream, tf_device_id_, allocator, in ReinitializeDevice()
/external/tensorflow/tensorflow/stream_executor/rocm/
Drocm_platform.cc132 if (config.gpu_stream) { in GetExecutor()

12