/third_party/mindspore/mindspore/ccsrc/runtime/device/gpu/distribution/ |
D | mpi_wrapper.cc | 26 MPIWrapper::MPIWrapper() : rank_id_(0), rank_size_(0), local_rank_id_(0) { Init(); } in MPIWrapper() 61 if (rank_id_ == ranks[0]) { in CreateCommGroup() 67 int global_rank[1] = {rank_id_}; in CreateCommGroup() 114 CHECK_RET(MPI_Comm_rank(MPI_COMM_WORLD, &rank_id_), MPI_SUCCESS, "Failed to init mpi rank id."); in Init() 122 if (rank_id_ == 0) { in Init() 132 NcclGroupInfo world_group = {rank_size_, rank_id_, unique_id, nullptr, world_group_ranks}; in Init() 144 CHECK_RET((rank_id_ < kRankSize), true, "The rank id is not less than rank size."); in AssignLocalRankID() 145 all_host_hashs[rank_id_] = host_hash; in AssignLocalRankID() 149 if (global_rank == rank_id_) { in AssignLocalRankID() 152 if (all_host_hashs[global_rank] == all_host_hashs[rank_id_]) { in AssignLocalRankID()
|
D | mpi_wrapper.h | 51 int rank_id_; variable
|
/third_party/mindspore/mindspore/ccsrc/runtime/device/cpu/mpi/ |
D | mpi_adapter.cc | 122 auto ret = MPI_Comm_rank(MPI_COMM_WORLD, &rank_id_); in Init() 129 RAISE_EXCEPTION_WITH_PARAM("Failed to init mpi rank size!rankid:", rank_id_); in Init() 139 if (std::find(ranks.begin(), ranks.end(), rank_id_) == ranks.end()) { in AddGroup() 140 …ISE_EXCEPTION_WITH_PARAM("local rankid does not in the input rank group!local rank id:", rank_id_); in AddGroup() 156 RAISE_EXCEPTION_WITH_PARAM("create mpi group fail!rankid:", rank_id_); in AddGroup() 172 RAISE_EXCEPTION_WITH_PARAM("Get mpi group fail!rankid:", rank_id_); in ReduceScatter() 177 RAISE_EXCEPTION_WITH_PARAM("create mpi comm fail!rankid:", rank_id_); in ReduceScatter() 201 int scatter_index = GetScatterIndex(rank_id_, ranks_group); in ReduceScatterOverwriteInput() 204 RAISE_EXCEPTION_WITH_PARAM("Get mpi group fail!rankid:", rank_id_); in ReduceScatterOverwriteInput() 209 RAISE_EXCEPTION_WITH_PARAM("create mpi comm fail!rankid:", rank_id_); in ReduceScatterOverwriteInput() [all …]
|
D | mpi_adapter.h | 35 FUNC_EXPORT int GetRankId() const { return rank_id_; } in GetRankId() 53 int rank_id_{-1};
|
/third_party/mindspore/mindspore/ccsrc/runtime/device/ascend/distribute/ |
D | mpi_collective_group.cc | 24 MPICollective::MPICollective() : mpi_inited_(false), rank_id_(0), local_rank_id_(0), rank_size_(0) … in MPICollective() 65 CHECK_RET(MPI_Comm_rank(MPI_COMM_WORLD, &rank_id_), MPI_SUCCESS, "Failed to init mpi rank id!"); in Init() 69 group_info_["hccl_world_group"] = {rank_id_, rank_size_}; in Init() 81 if (static_cast<unsigned int>(rank_id_) == ranks[0]) { in CreateCommGroup() 96 int global_rank[1] = {rank_id_}; in CreateCommGroup() 117 all_host_hashs[rank_id_] = host_hash; in AssignLocalRankID() 121 if (global_rank == rank_id_) { in AssignLocalRankID() 124 if (all_host_hashs[global_rank] == all_host_hashs[rank_id_]) { in AssignLocalRankID()
|
D | mpi_collective_group.h | 54 int rank_id_; variable
|
/third_party/mindspore/mindspore/ccsrc/ps/core/ |
D | node_manager.cc | 41 rank_id = registered_nodes_info_[node_id].rank_id_; in NextRankId() 56 …MS_LOG(INFO) << "The server node id:" << item.first << " rank id:" << item.second.rank_id_ << " is… in NextRankId() 57 rank_id = item.second.rank_id_; in NextRankId() 80 node_info.rank_id_ = rank_id; in NextRankId() 96 rank_id = item.second.rank_id_; in NextRankId() 119 node_info.rank_id_ = rank_id; in NextRankId() 141 servers_meta.set_rank_id(it->second.rank_id_); in FetchServersMeta() 154 servers_meta.set_rank_id(it->second.rank_id_); in FetchAllNodesMeta() 266 server_rank_ids.push_back(registered_nodes_info_[item].rank_id_); in ResetMetadata() 283 …ond.node_role_ == NodeRole::SERVER && item.second.is_alive == false && item.second.rank_id_ == 0) { in IsWorkerOrServer0()
|
D | instance_manager.cc | 30 message_meta->set_rank_id(node_info.rank_id_); in NewInstanceAsync() 49 message_meta->set_rank_id(node_info.rank_id_); in QueryInstanceAsync() 69 message_meta->set_rank_id(node_info.rank_id_); in EnableFLSAsync() 89 message_meta->set_rank_id(node_info.rank_id_); in DisableFLSAsync()
|
D | node_info.h | 39 …NodeInfo() : ip_(""), port_(0), node_role_(NodeRole::SCHEDULER), rank_id_(UINT32_MAX), is_alive(fa… in NodeInfo() 49 uint32_t rank_id_; member
|
D | abstract_node.cc | 30 message_meta->set_rank_id(node_info_.rank_id_); in Register() 79 message_meta->set_rank_id(node_info_.rank_id_); in Broadcast() 192 message_meta->set_rank_id(node_info_.rank_id_); in Send() 223 message_meta->set_rank_id(node_info_.rank_id_); in Send() 266 message_meta->set_rank_id(node_info_.rank_id_); in Send() 316 message_meta->set_rank_id(node_info_.rank_id_); in Send() 345 message_meta->set_rank_id(node_info_.rank_id_); in CollectiveSendAsync() 457 meta->set_rank_id(node_info_.rank_id_); in Response() 507 … << ", the node id:" << node_info_.node_id_ << ", the node rank id:" << node_info_.rank_id_ in StartHeartbeatTimer() 585 info.rank_id_ = it.rank_id(); in ProcessHeartbeatResp() [all …]
|
/third_party/mindspore/mindspore/ccsrc/backend/kernel_compiler/cpu/fl/ |
D | start_fl_job_kernel.h | 75 rank_id_ = fl::worker::FLWorker::GetInstance().rank_id(); in Init() 76 if (rank_id_ == UINT32_MAX) { in Init() 80 target_server_rank_ = rank_id_ % server_num_; in Init() 114 uint32_t rank_id_; variable
|
D | get_model_kernel.h | 105 rank_id_ = fl::worker::FLWorker::GetInstance().rank_id(); in Init() 106 if (rank_id_ == UINT32_MAX) { in Init() 110 target_server_rank_ = rank_id_ % server_num_; in Init() 152 uint32_t rank_id_; variable
|
D | update_model_kernel.h | 87 rank_id_ = fl::worker::FLWorker::GetInstance().rank_id(); in Init() 88 if (rank_id_ == UINT32_MAX) { in Init() 92 target_server_rank_ = rank_id_ % server_num_; in Init() 160 uint32_t rank_id_; variable
|
/third_party/mindspore/mindspore/ccsrc/minddata/dataset/core/ |
D | config_manager.cc | 40 rank_id_(kCfgDefaultRankId), in ConfigManager() 144 if (rank_id_ == kCfgDefaultRankId) rank_id_ = rank_id; in set_rank_id()
|
D | config_manager.h | 163 int32_t rank_id() const { return rank_id_; } in rank_id() 249 int32_t rank_id_; variable
|
/third_party/mindspore/mindspore/ccsrc/backend/kernel_compiler/cpu/ps/ |
D | pserver_kernel.h | 31 : rank_id_(rank_id), pserver_num_(pserver_num), worker_num_(worker_num) {} in PServerKernel() 51 size_t rank_id_; variable
|
D | pserver_kernel.cc | 28 …LongToSize(Util::LocalShard(SizeToLong((*shape)[IntToSize(axis)]), SizeToLong(rank_id_), SizeToLon… in Shard()
|
/third_party/mindspore/mindspore/ccsrc/fl/worker/ |
D | fl_worker.h | 102 rank_id_(UINT32_MAX), in FLWorker() 134 uint32_t rank_id_; variable
|
D | fl_worker.cc | 76 rank_id_ = worker_node_->rank_id(); in Run() 154 uint32_t FLWorker::rank_id() const { return rank_id_; } in rank_id() 180 std::string FLWorker::fl_id() const { return std::to_string(rank_id_); } in fl_id()
|
/third_party/mindspore/mindspore/ccsrc/minddata/dataset/engine/ |
D | execution_tree.cc | 43 rank_id_ = cfg->rank_id(); in ExecutionTree() 163 if (numa_enable_ && rank_id_ >= 0) { in Launch() 170 RETURN_IF_NOT_OK(NumaBind(handle_, rank_id_)); in Launch()
|
/third_party/mindspore/mindspore/ccsrc/ps/ |
D | ps_context.h | 195 rank_id_(0), in PSContext() 234 uint32_t rank_id_; variable
|
D | util.h | 67 static int64_t rank_id_; variable
|
/third_party/mindspore/mindspore/ccsrc/ps/ps_cache/ |
D | ps_cache_manager.h | 129 void set_rank_id(uint32_t rank_id) { rank_id_ = rank_id; } in set_rank_id() 206 uint32_t rank_id_{0};
|
/third_party/mindspore/mindspore/ccsrc/backend/session/ |
D | gpu_session.cc | 123 rank_id_ = GetRankId(); in Init() 129 json_parser.CopyDumpJsonToDir(rank_id_); in Init() 130 json_parser.CopyMSCfgJsonToDir(rank_id_); in Init() 472 std::string root_dir = json_parser.path() + "/rank_" + std::to_string(rank_id_); in CompileGraphImpl() 715 E2eDump::DumpData(kernel_graph.get(), rank_id_, debugger_.get()); in Dump()
|
/third_party/mindspore/mindspore/ccsrc/minddata/dataset/engine/datasetops/ |
D | device_queue_op.cc | 50 rank_id_ = cfg->rank_id(); // Get the current rank_id in DeviceQueueOp() 52 rank_id_ = rank_id_ % device_count; in DeviceQueueOp() 369 auto ret = cudaSetDevice(rank_id_); in SetThreadDevice()
|