Searched refs:ar_input_addr_ (Results 1 – 3 of 3) sorted by relevance
/third_party/mindspore/mindspore/ccsrc/runtime/device/gpu/ |
D | gpu_bucket.cc | 71 …ar_input_addr_ = static_cast<uint8_t *>(GPUMemoryAllocator::GetInstance().AllocTensorMem(total_siz… in AllocateAllReduceAddr() 74 uint8_t *memcpy_output = ar_input_addr_; in AllocateAllReduceAddr() 86 if (ar_input_addr_ != nullptr) { in FreeAllDeviceMem() 87 FreeDeviceMem(ar_input_addr_); in FreeAllDeviceMem() 88 ar_input_addr_ = nullptr; in FreeAllDeviceMem() 106 cudaMemsetAsync(ar_input_addr_, 0, total_size_, static_cast<cudaStream_t>(compute_stream_)), in CopyTensorToContiguousMemory() 150 …(*all_reduce_funcptr)(ar_input_addr_, ar_output_addr_, total_size_ / type_size, nccl_data_type_ite… in LaunchAllReduce()
|
/third_party/mindspore/mindspore/ccsrc/runtime/device/ascend/ |
D | ascend_bucket.cc | 60 ar_input_addr_ = runtime_instance->MallocCommunicationMemFromMemPool(total_size); in AllocateAllReduceAddr() 64 uint8_t *memcpy_output = ar_input_addr_; in AllocateAllReduceAddr() 78 if (ar_input_addr_ != nullptr) { in FreeAllDeviceMem() 79 uint8_t *origin_dev_addr = ar_input_addr_ - kMemAlignSize; in FreeAllDeviceMem() 81 ar_input_addr_ = nullptr; in FreeAllDeviceMem() 151 …auto hccl_result = hccl::HcclAdapter::GetInstance().HcclAllReduce(ar_input_addr_, ar_output_addr_,… in LaunchAllReduce() 164 launch_atomic_clean_->SetInputAddr(ar_input_addr_); in CleanAllReduceInputAddr()
|
/third_party/mindspore/mindspore/ccsrc/runtime/device/ |
D | bucket.h | 44 ar_input_addr_(nullptr), in Bucket() 68 uint8_t *ar_input_addr_; variable
|