Home
last modified time | relevance | path

Searched refs:rank_id_ (Results 1 – 25 of 35) sorted by relevance

12

/third_party/mindspore/mindspore/ccsrc/runtime/device/gpu/distribution/
Dmpi_wrapper.cc26 MPIWrapper::MPIWrapper() : rank_id_(0), rank_size_(0), local_rank_id_(0) { Init(); } in MPIWrapper()
61 if (rank_id_ == ranks[0]) { in CreateCommGroup()
67 int global_rank[1] = {rank_id_}; in CreateCommGroup()
114 CHECK_RET(MPI_Comm_rank(MPI_COMM_WORLD, &rank_id_), MPI_SUCCESS, "Failed to init mpi rank id."); in Init()
122 if (rank_id_ == 0) { in Init()
132 NcclGroupInfo world_group = {rank_size_, rank_id_, unique_id, nullptr, world_group_ranks}; in Init()
144 CHECK_RET((rank_id_ < kRankSize), true, "The rank id is not less than rank size."); in AssignLocalRankID()
145 all_host_hashs[rank_id_] = host_hash; in AssignLocalRankID()
149 if (global_rank == rank_id_) { in AssignLocalRankID()
152 if (all_host_hashs[global_rank] == all_host_hashs[rank_id_]) { in AssignLocalRankID()
Dmpi_wrapper.h51 int rank_id_; variable
/third_party/mindspore/mindspore/ccsrc/runtime/device/cpu/mpi/
Dmpi_adapter.cc122 auto ret = MPI_Comm_rank(MPI_COMM_WORLD, &rank_id_); in Init()
129 RAISE_EXCEPTION_WITH_PARAM("Failed to init mpi rank size!rankid:", rank_id_); in Init()
139 if (std::find(ranks.begin(), ranks.end(), rank_id_) == ranks.end()) { in AddGroup()
140 …ISE_EXCEPTION_WITH_PARAM("local rankid does not in the input rank group!local rank id:", rank_id_); in AddGroup()
156 RAISE_EXCEPTION_WITH_PARAM("create mpi group fail!rankid:", rank_id_); in AddGroup()
172 RAISE_EXCEPTION_WITH_PARAM("Get mpi group fail!rankid:", rank_id_); in ReduceScatter()
177 RAISE_EXCEPTION_WITH_PARAM("create mpi comm fail!rankid:", rank_id_); in ReduceScatter()
201 int scatter_index = GetScatterIndex(rank_id_, ranks_group); in ReduceScatterOverwriteInput()
204 RAISE_EXCEPTION_WITH_PARAM("Get mpi group fail!rankid:", rank_id_); in ReduceScatterOverwriteInput()
209 RAISE_EXCEPTION_WITH_PARAM("create mpi comm fail!rankid:", rank_id_); in ReduceScatterOverwriteInput()
[all …]
Dmpi_adapter.h35 FUNC_EXPORT int GetRankId() const { return rank_id_; } in GetRankId()
53 int rank_id_{-1};
/third_party/mindspore/mindspore/ccsrc/runtime/device/ascend/distribute/
Dmpi_collective_group.cc24 MPICollective::MPICollective() : mpi_inited_(false), rank_id_(0), local_rank_id_(0), rank_size_(0) … in MPICollective()
65 CHECK_RET(MPI_Comm_rank(MPI_COMM_WORLD, &rank_id_), MPI_SUCCESS, "Failed to init mpi rank id!"); in Init()
69 group_info_["hccl_world_group"] = {rank_id_, rank_size_}; in Init()
81 if (static_cast<unsigned int>(rank_id_) == ranks[0]) { in CreateCommGroup()
96 int global_rank[1] = {rank_id_}; in CreateCommGroup()
117 all_host_hashs[rank_id_] = host_hash; in AssignLocalRankID()
121 if (global_rank == rank_id_) { in AssignLocalRankID()
124 if (all_host_hashs[global_rank] == all_host_hashs[rank_id_]) { in AssignLocalRankID()
Dmpi_collective_group.h54 int rank_id_; variable
/third_party/mindspore/mindspore/ccsrc/ps/core/
Dnode_manager.cc41 rank_id = registered_nodes_info_[node_id].rank_id_; in NextRankId()
56 …MS_LOG(INFO) << "The server node id:" << item.first << " rank id:" << item.second.rank_id_ << " is… in NextRankId()
57 rank_id = item.second.rank_id_; in NextRankId()
80 node_info.rank_id_ = rank_id; in NextRankId()
96 rank_id = item.second.rank_id_; in NextRankId()
119 node_info.rank_id_ = rank_id; in NextRankId()
141 servers_meta.set_rank_id(it->second.rank_id_); in FetchServersMeta()
154 servers_meta.set_rank_id(it->second.rank_id_); in FetchAllNodesMeta()
266 server_rank_ids.push_back(registered_nodes_info_[item].rank_id_); in ResetMetadata()
283 …ond.node_role_ == NodeRole::SERVER && item.second.is_alive == false && item.second.rank_id_ == 0) { in IsWorkerOrServer0()
Dinstance_manager.cc30 message_meta->set_rank_id(node_info.rank_id_); in NewInstanceAsync()
49 message_meta->set_rank_id(node_info.rank_id_); in QueryInstanceAsync()
69 message_meta->set_rank_id(node_info.rank_id_); in EnableFLSAsync()
89 message_meta->set_rank_id(node_info.rank_id_); in DisableFLSAsync()
Dnode_info.h39 …NodeInfo() : ip_(""), port_(0), node_role_(NodeRole::SCHEDULER), rank_id_(UINT32_MAX), is_alive(fa… in NodeInfo()
49 uint32_t rank_id_; member
Dabstract_node.cc30 message_meta->set_rank_id(node_info_.rank_id_); in Register()
79 message_meta->set_rank_id(node_info_.rank_id_); in Broadcast()
192 message_meta->set_rank_id(node_info_.rank_id_); in Send()
223 message_meta->set_rank_id(node_info_.rank_id_); in Send()
266 message_meta->set_rank_id(node_info_.rank_id_); in Send()
316 message_meta->set_rank_id(node_info_.rank_id_); in Send()
345 message_meta->set_rank_id(node_info_.rank_id_); in CollectiveSendAsync()
457 meta->set_rank_id(node_info_.rank_id_); in Response()
507 … << ", the node id:" << node_info_.node_id_ << ", the node rank id:" << node_info_.rank_id_ in StartHeartbeatTimer()
585 info.rank_id_ = it.rank_id(); in ProcessHeartbeatResp()
[all …]
/third_party/mindspore/mindspore/ccsrc/backend/kernel_compiler/cpu/fl/
Dstart_fl_job_kernel.h75 rank_id_ = fl::worker::FLWorker::GetInstance().rank_id(); in Init()
76 if (rank_id_ == UINT32_MAX) { in Init()
80 target_server_rank_ = rank_id_ % server_num_; in Init()
114 uint32_t rank_id_; variable
Dget_model_kernel.h105 rank_id_ = fl::worker::FLWorker::GetInstance().rank_id(); in Init()
106 if (rank_id_ == UINT32_MAX) { in Init()
110 target_server_rank_ = rank_id_ % server_num_; in Init()
152 uint32_t rank_id_; variable
Dupdate_model_kernel.h87 rank_id_ = fl::worker::FLWorker::GetInstance().rank_id(); in Init()
88 if (rank_id_ == UINT32_MAX) { in Init()
92 target_server_rank_ = rank_id_ % server_num_; in Init()
160 uint32_t rank_id_; variable
/third_party/mindspore/mindspore/ccsrc/minddata/dataset/core/
Dconfig_manager.cc40 rank_id_(kCfgDefaultRankId), in ConfigManager()
144 if (rank_id_ == kCfgDefaultRankId) rank_id_ = rank_id; in set_rank_id()
Dconfig_manager.h163 int32_t rank_id() const { return rank_id_; } in rank_id()
249 int32_t rank_id_; variable
/third_party/mindspore/mindspore/ccsrc/backend/kernel_compiler/cpu/ps/
Dpserver_kernel.h31 : rank_id_(rank_id), pserver_num_(pserver_num), worker_num_(worker_num) {} in PServerKernel()
51 size_t rank_id_; variable
Dpserver_kernel.cc28 …LongToSize(Util::LocalShard(SizeToLong((*shape)[IntToSize(axis)]), SizeToLong(rank_id_), SizeToLon… in Shard()
/third_party/mindspore/mindspore/ccsrc/fl/worker/
Dfl_worker.h102 rank_id_(UINT32_MAX), in FLWorker()
134 uint32_t rank_id_; variable
Dfl_worker.cc76 rank_id_ = worker_node_->rank_id(); in Run()
154 uint32_t FLWorker::rank_id() const { return rank_id_; } in rank_id()
180 std::string FLWorker::fl_id() const { return std::to_string(rank_id_); } in fl_id()
/third_party/mindspore/mindspore/ccsrc/minddata/dataset/engine/
Dexecution_tree.cc43 rank_id_ = cfg->rank_id(); in ExecutionTree()
163 if (numa_enable_ && rank_id_ >= 0) { in Launch()
170 RETURN_IF_NOT_OK(NumaBind(handle_, rank_id_)); in Launch()
/third_party/mindspore/mindspore/ccsrc/ps/
Dps_context.h195 rank_id_(0), in PSContext()
234 uint32_t rank_id_; variable
Dutil.h67 static int64_t rank_id_; variable
/third_party/mindspore/mindspore/ccsrc/ps/ps_cache/
Dps_cache_manager.h129 void set_rank_id(uint32_t rank_id) { rank_id_ = rank_id; } in set_rank_id()
206 uint32_t rank_id_{0};
/third_party/mindspore/mindspore/ccsrc/backend/session/
Dgpu_session.cc123 rank_id_ = GetRankId(); in Init()
129 json_parser.CopyDumpJsonToDir(rank_id_); in Init()
130 json_parser.CopyMSCfgJsonToDir(rank_id_); in Init()
472 std::string root_dir = json_parser.path() + "/rank_" + std::to_string(rank_id_); in CompileGraphImpl()
715 E2eDump::DumpData(kernel_graph.get(), rank_id_, debugger_.get()); in Dump()
/third_party/mindspore/mindspore/ccsrc/minddata/dataset/engine/datasetops/
Ddevice_queue_op.cc50 rank_id_ = cfg->rank_id(); // Get the current rank_id in DeviceQueueOp()
52 rank_id_ = rank_id_ % device_count; in DeviceQueueOp()
369 auto ret = cudaSetDevice(rank_id_); in SetThreadDevice()

12