Home
last modified time | relevance | path

Searched refs:gpu_dst (Results 1 – 12 of 12) sorted by relevance

/external/tensorflow/tensorflow/stream_executor/host/
Dhost_gpu_executor.cc76 bool HostExecutor::Memcpy(Stream *stream, DeviceMemoryBase *gpu_dst, in Memcpy() argument
78 void *dst_mem = gpu_dst->opaque(); in Memcpy()
87 DeviceMemoryBase *gpu_dst, in MemcpyDeviceToDevice() argument
90 void *dst_mem = gpu_dst->opaque(); in MemcpyDeviceToDevice()
130 port::Status HostExecutor::SynchronousMemcpy(DeviceMemoryBase *gpu_dst, in SynchronousMemcpy() argument
133 memcpy(gpu_dst->opaque(), host_src, size); in SynchronousMemcpy()
145 DeviceMemoryBase *gpu_dst, const DeviceMemoryBase &gpu_src, uint64 size) { in SynchronousMemcpyDeviceToDevice() argument
146 memcpy(gpu_dst->opaque(), gpu_src.opaque(), size); in SynchronousMemcpyDeviceToDevice()
Dhost_gpu_executor.h77 bool Memcpy(Stream *stream, DeviceMemoryBase *gpu_dst, const void *host_src,
79 bool MemcpyDeviceToDevice(Stream *stream, DeviceMemoryBase *gpu_dst,
97 port::Status SynchronousMemcpy(DeviceMemoryBase *gpu_dst,
102 port::Status SynchronousMemcpyDeviceToDevice(DeviceMemoryBase *gpu_dst,
/external/tensorflow/tensorflow/stream_executor/cuda/
Dcuda_driver.cc1103 CUdeviceptr gpu_dst, in SynchronousMemcpyH2D() argument
1110 CHECK(PointerIsValid(gpu_dst)) in SynchronousMemcpyH2D()
1111 << "Destination pointer is not actually on GPU: " << gpu_dst; in SynchronousMemcpyH2D()
1113 CUresult res = cuMemcpyHtoD(gpu_dst, host_src, size); in SynchronousMemcpyH2D()
1118 ToString(res).c_str(), absl::bit_cast<void*>(gpu_dst), host_src, size, in SynchronousMemcpyH2D()
1126 CUdeviceptr gpu_dst, in SynchronousMemcpyD2D() argument
1133 CHECK(PointerIsValid(gpu_dst)) in SynchronousMemcpyD2D()
1134 << "Destination pointer is not actually on GPU: " << gpu_dst; in SynchronousMemcpyD2D()
1136 CUresult res = cuMemcpyDtoD(gpu_dst, gpu_src, size); in SynchronousMemcpyD2D()
1141 ToString(res).c_str(), absl::bit_cast<void*>(gpu_dst), in SynchronousMemcpyD2D()
[all …]
Dcuda_gpu_executor.cc604 port::Status GpuExecutor::SynchronousMemcpy(DeviceMemoryBase* gpu_dst, in SynchronousMemcpy() argument
606 return GpuDriver::SynchronousMemcpyH2D(context_, AsCudaDevicePtr(gpu_dst), in SynchronousMemcpy()
618 DeviceMemoryBase* gpu_dst, const DeviceMemoryBase& gpu_src, uint64 size) { in SynchronousMemcpyDeviceToDevice() argument
619 return GpuDriver::SynchronousMemcpyD2D(context_, AsCudaDevicePtr(gpu_dst), in SynchronousMemcpyDeviceToDevice()
662 bool GpuExecutor::Memcpy(Stream* stream, DeviceMemoryBase* gpu_dst, in Memcpy() argument
664 return GpuDriver::AsynchronousMemcpyH2D(context_, AsCudaDevicePtr(gpu_dst), in Memcpy()
670 DeviceMemoryBase* gpu_dst, in MemcpyDeviceToDevice() argument
673 return GpuDriver::AsynchronousMemcpyD2D(context_, AsCudaDevicePtr(gpu_dst), in MemcpyDeviceToDevice()
/external/tensorflow/tensorflow/stream_executor/rocm/
Drocm_driver.cc908 GpuContext* context, hipDeviceptr_t gpu_dst, const void* host_src, in SynchronousMemcpyH2D() argument
912 gpu_dst, const_cast<void*>(host_src), size); in SynchronousMemcpyH2D()
917 ToString(res).c_str(), absl::bit_cast<void*>(gpu_dst), host_src, size, in SynchronousMemcpyH2D()
925 GpuContext* context, hipDeviceptr_t gpu_dst, hipDeviceptr_t gpu_src, in SynchronousMemcpyD2D() argument
928 hipError_t res = tensorflow::wrap::hipMemcpyDtoD(gpu_dst, gpu_src, size); in SynchronousMemcpyD2D()
933 ToString(res).c_str(), absl::bit_cast<void*>(gpu_dst), in SynchronousMemcpyD2D()
963 hipDeviceptr_t gpu_dst, in AsynchronousMemcpyH2D() argument
969 gpu_dst, const_cast<void*>(host_src), size, stream); in AsynchronousMemcpyH2D()
974 ToString(res).c_str(), absl::bit_cast<void*>(gpu_dst), host_src, size, in AsynchronousMemcpyH2D()
984 hipDeviceptr_t gpu_dst, in AsynchronousMemcpyD2D() argument
[all …]
Drocm_gpu_executor.cc485 port::Status GpuExecutor::SynchronousMemcpy(DeviceMemoryBase* gpu_dst, in SynchronousMemcpy() argument
487 return GpuDriver::SynchronousMemcpyH2D(context_, AsROCmDevicePtr(gpu_dst), in SynchronousMemcpy()
499 DeviceMemoryBase* gpu_dst, const DeviceMemoryBase& gpu_src, uint64 size) { in SynchronousMemcpyDeviceToDevice() argument
500 return GpuDriver::SynchronousMemcpyD2D(context_, AsROCmDevicePtr(gpu_dst), in SynchronousMemcpyDeviceToDevice()
543 bool GpuExecutor::Memcpy(Stream* stream, DeviceMemoryBase* gpu_dst, in Memcpy() argument
545 return GpuDriver::AsynchronousMemcpyH2D(context_, AsROCmDevicePtr(gpu_dst), in Memcpy()
551 DeviceMemoryBase* gpu_dst, in MemcpyDeviceToDevice() argument
554 return GpuDriver::AsynchronousMemcpyD2D(context_, AsROCmDevicePtr(gpu_dst), in MemcpyDeviceToDevice()
/external/tensorflow/tensorflow/stream_executor/
Dstream_executor_internal.h219 virtual port::Status SynchronousMemcpy(DeviceMemoryBase *gpu_dst,
225 DeviceMemoryBase *gpu_dst, const DeviceMemoryBase &gpu_src,
237 virtual bool Memcpy(Stream *stream, DeviceMemoryBase *gpu_dst,
239 virtual bool MemcpyDeviceToDevice(Stream *stream, DeviceMemoryBase *gpu_dst,
Dtrace_listener.h56 DeviceMemoryBase* gpu_dst) {} in SynchronousMemcpyH2DBegin() argument
Dstream.h1687 Stream &ThenMemcpy(DeviceMemoryBase *gpu_dst, const void *host_src,
1706 DeviceMemory<T> *gpu_dst) { in ThenMemcpyH2D() argument
1708 CHECK(gpu_dst->size() == 0 || gpu_dst->size() >= host_size); in ThenMemcpyH2D()
1709 return ThenMemcpy(gpu_dst, host_src.begin(), host_size); in ThenMemcpyH2D()
1715 Stream &ThenMemcpy(DeviceMemoryBase *gpu_dst, const DeviceMemoryBase &gpu_src,
1721 Stream &ThenMemcpyD2D(DeviceMemoryBase *gpu_dst, in ThenMemcpyD2D() argument
1723 return ThenMemcpy(gpu_dst, gpu_src, size); in ThenMemcpyD2D()
Dstream.cc4793 Stream &Stream::ThenMemcpy(DeviceMemoryBase *gpu_dst, const void *host_src, in ThenMemcpy() argument
4795 VLOG_CALL(PARAM(gpu_dst), PARAM(host_src), PARAM(size)); in ThenMemcpy()
4798 CheckError(parent_->Memcpy(this, gpu_dst, host_src, size)); in ThenMemcpy()
4806 Stream &Stream::ThenMemcpy(DeviceMemoryBase *gpu_dst, in ThenMemcpy() argument
4808 VLOG_CALL(PARAM(gpu_dst), PARAM(gpu_src), PARAM(size)); in ThenMemcpy()
4811 CheckError(parent_->MemcpyDeviceToDevice(this, gpu_dst, gpu_src, size)); in ThenMemcpy()
/external/tensorflow/tensorflow/stream_executor/gpu/
Dgpu_executor.h127 port::Status SynchronousMemcpy(DeviceMemoryBase* gpu_dst,
134 port::Status SynchronousMemcpyDeviceToDevice(DeviceMemoryBase* gpu_dst,
148 bool Memcpy(Stream* stream, DeviceMemoryBase* gpu_dst, const void* host_src,
151 bool MemcpyDeviceToDevice(Stream* stream, DeviceMemoryBase* gpu_dst,
Dgpu_driver.h283 GpuDevicePtr gpu_dst,
286 GpuDevicePtr gpu_dst,
295 static bool AsynchronousMemcpyH2D(GpuContext* context, GpuDevicePtr gpu_dst,
298 static bool AsynchronousMemcpyD2D(GpuContext* context, GpuDevicePtr gpu_dst,