Home
last modified time | relevance | path

Searched refs:host_dst (Results 1 – 21 of 21) sorted by relevance

/external/tensorflow/tensorflow/compiler/xla/service/interpreter/
Dexecutor.cc50 bool XlaInterpreterExecutor::Memcpy(Stream *stream, void *host_dst, in Memcpy() argument
53 AsExecutorStream(stream)->EnqueueTask([this, host_dst, dev_src, size]() { in Memcpy()
54 port::Status ok = SynchronousMemcpy(host_dst, dev_src, size); in Memcpy()
76 void *host_dst, const DeviceMemoryBase &dev_src, uint64 size) { in SynchronousMemcpy() argument
77 memcpy(host_dst, dev_src.opaque(), size); in SynchronousMemcpy()
Dexecutor.h83 bool Memcpy(Stream *stream, void *host_dst, const DeviceMemoryBase &pop_src,
119 port::Status SynchronousMemcpy(void *host_dst,
/external/tensorflow/tensorflow/stream_executor/host/
Dhost_gpu_executor.cc66 bool HostExecutor::Memcpy(Stream *stream, void *host_dst, in Memcpy() argument
72 [host_dst, src_mem, size]() { memcpy(host_dst, src_mem, size); }); in Memcpy()
137 port::Status HostExecutor::SynchronousMemcpy(void *host_dst, in SynchronousMemcpy() argument
140 memcpy(host_dst, gpu_src.opaque(), size); in SynchronousMemcpy()
Dhost_gpu_executor.h75 bool Memcpy(Stream *stream, void *host_dst, const DeviceMemoryBase &gpu_src,
99 port::Status SynchronousMemcpy(void *host_dst,
/external/tensorflow/tensorflow/stream_executor/
Dstream_executor_pimpl.cc638 bool StreamExecutor::SynchronousMemcpy(void *host_dst, in SynchronousMemcpy() argument
641 VLOG(1) << "Called StreamExecutor::SynchronousMemcpy(host_dst=" << host_dst in SynchronousMemcpy()
646 implementation_->SynchronousMemcpy(host_dst, device_src, size); in SynchronousMemcpy()
669 const DeviceMemoryBase &device_src, int64 size, void *host_dst) { in SynchronousMemcpyD2H() argument
672 << ", host_dst=" << host_dst << ")" << StackTraceIfVLOG10(); in SynchronousMemcpyD2H()
676 host_dst); in SynchronousMemcpyD2H()
678 result = implementation_->SynchronousMemcpy(host_dst, device_src, size); in SynchronousMemcpyD2H()
684 device_src.opaque(), host_dst, size, in SynchronousMemcpyD2H()
714 bool StreamExecutor::Memcpy(Stream *stream, void *host_dst, in Memcpy() argument
716 return implementation_->Memcpy(stream, host_dst, device_src, size); in Memcpy()
Dstream_executor_pimpl.h268 bool SynchronousMemcpy(void *host_dst, const DeviceMemoryBase &device_src,
288 int64 size, void *host_dst);
295 port::MutableArraySlice<T> host_dst) { in SynchronousMemcpyD2H() argument
296 auto host_size = host_dst.size() * sizeof(T); in SynchronousMemcpyD2H()
298 return SynchronousMemcpyD2H(device_src, host_size, host_dst.begin()); in SynchronousMemcpyD2H()
546 bool Memcpy(Stream *stream, void *host_dst,
Dtrace_listener.h62 int64 size, void* host_dst) {} in SynchronousMemcpyD2HBegin() argument
Dstream_executor_internal.h221 virtual port::Status SynchronousMemcpy(void *host_dst,
235 virtual bool Memcpy(Stream *stream, void *host_dst,
Dstream.h678 void *host_dst, uint64 size);
686 port::MutableArraySlice<ElementType> host_dst) { in ThenMemcpyD2HQuantized() argument
689 host_dst.data(), host_dst.size() * sizeof(ElementType)); in ThenMemcpyD2HQuantized()
1680 Stream &ThenMemcpy(void *host_dst, const DeviceMemoryBase &gpu_src,
1695 port::MutableArraySlice<T> host_dst) { in ThenMemcpyD2H() argument
1696 auto host_size = host_dst.size() * sizeof(T); in ThenMemcpyD2H()
1698 return ThenMemcpy(host_dst.begin(), gpu_src, host_size); in ThenMemcpyD2H()
Dstream.cc1706 dnn::QuantizedActivationMode mode, void *host_dst, uint64 size) { in ThenMemcpyD2HQuantized() argument
1707 VLOG_CALL(PARAM(gpu_unquantized_src), PARAM(mode), PARAM(host_dst), in ThenMemcpyD2HQuantized()
1713 host_dst, size)); in ThenMemcpyD2HQuantized()
4780 Stream &Stream::ThenMemcpy(void *host_dst, const DeviceMemoryBase &gpu_src, in ThenMemcpy() argument
4782 VLOG_CALL(PARAM(host_dst), PARAM(gpu_src), PARAM(size)); in ThenMemcpy()
4785 CheckError(parent_->Memcpy(this, host_dst, gpu_src, size)); in ThenMemcpy()
Ddnn.h1997 QuantizedActivationMode mode, void* host_dst, int64 size) = 0;
/external/tensorflow/tensorflow/stream_executor/cuda/
Dcuda_driver.cc1079 void* host_dst, in SynchronousMemcpyD2H() argument
1086 CHECK(PointerIsValid(host_dst)) in SynchronousMemcpyD2H()
1087 << "Destination pointer is not actually on CPU: " << host_dst; in SynchronousMemcpyD2H()
1089 CUresult res = cuMemcpyDtoH(host_dst, gpu_src, size); in SynchronousMemcpyD2H()
1094 ToString(res).c_str(), host_dst, in SynchronousMemcpyD2H()
1098 << host_dst; in SynchronousMemcpyD2H()
1149 void* host_dst, in AsynchronousMemcpyD2H() argument
1157 CHECK(PointerIsValid(host_dst)) in AsynchronousMemcpyD2H()
1158 << "Destination pointer is not actually on CPU: " << host_dst; in AsynchronousMemcpyD2H()
1160 CUresult res = cuMemcpyDtoHAsync(host_dst, gpu_src, size, stream); in AsynchronousMemcpyD2H()
[all …]
Dcuda_gpu_executor.cc610 port::Status GpuExecutor::SynchronousMemcpy(void* host_dst, in SynchronousMemcpy() argument
613 return GpuDriver::SynchronousMemcpyD2H(context_, host_dst, in SynchronousMemcpy()
655 bool GpuExecutor::Memcpy(Stream* stream, void* host_dst, in Memcpy() argument
657 return GpuDriver::AsynchronousMemcpyD2H(context_, host_dst, in Memcpy()
Dcuda_dnn.h527 dnn::QuantizedActivationMode mode, void* host_dst,
Dcuda_dnn.cc4076 dnn::QuantizedActivationMode mode, void* host_dst, int64 size) { in DoMemcpyD2HQuantized() argument
/external/tensorflow/tensorflow/stream_executor/rocm/
Drocm_driver.cc892 GpuContext* context, void* host_dst, hipDeviceptr_t gpu_src, uint64 size) { in SynchronousMemcpyD2H() argument
894 hipError_t res = tensorflow::wrap::hipMemcpyDtoH(host_dst, gpu_src, size); in SynchronousMemcpyD2H()
899 ToString(res).c_str(), host_dst, in SynchronousMemcpyD2H()
903 << host_dst; in SynchronousMemcpyD2H()
941 void* host_dst, in AsynchronousMemcpyD2H() argument
947 tensorflow::wrap::hipMemcpyDtoHAsync(host_dst, gpu_src, size, stream); in AsynchronousMemcpyD2H()
952 ToString(res).c_str(), host_dst, absl::bit_cast<void*>(gpu_src), size, in AsynchronousMemcpyD2H()
958 << host_dst << " on stream " << stream; in AsynchronousMemcpyD2H()
Drocm_gpu_executor.cc491 port::Status GpuExecutor::SynchronousMemcpy(void* host_dst, in SynchronousMemcpy() argument
494 return GpuDriver::SynchronousMemcpyD2H(context_, host_dst, in SynchronousMemcpy()
536 bool GpuExecutor::Memcpy(Stream* stream, void* host_dst, in Memcpy() argument
538 return GpuDriver::AsynchronousMemcpyD2H(context_, host_dst, in Memcpy()
Drocm_dnn.h510 dnn::QuantizedActivationMode mode, void* host_dst,
Drocm_dnn.cc3973 dnn::QuantizedActivationMode mode, void* host_dst, int64 size) { in DoMemcpyD2HQuantized() argument
/external/tensorflow/tensorflow/stream_executor/gpu/
Dgpu_executor.h130 port::Status SynchronousMemcpy(void* host_dst,
145 bool Memcpy(Stream* stream, void* host_dst, const DeviceMemoryBase& gpu_src,
Dgpu_driver.h280 static port::Status SynchronousMemcpyD2H(GpuContext* context, void* host_dst,
292 static bool AsynchronousMemcpyD2H(GpuContext* context, void* host_dst,