Searched refs:num_subdivs (Results 1 – 6 of 6) sorted by relevance
/external/tensorflow/tensorflow/core/common_runtime/ |
D | ring_alg.cc | 140 int num_subdivs = 0; in GenerateSubdivsInCollectiveParams() local 145 ++num_subdivs; in GenerateSubdivsInCollectiveParams() 146 int num_chunks = col_params->group.group_size * num_subdivs; in GenerateSubdivsInCollectiveParams() 148 VLOG(2) << "num_subdivs " << num_subdivs << " num_chunks " << num_chunks in GenerateSubdivsInCollectiveParams() 150 } while (chunk_size > kMaxChunkSizeBytes && num_subdivs < kMaxNumSubdivs); in GenerateSubdivsInCollectiveParams() 151 if (num_subdivs <= 0) { in GenerateSubdivsInCollectiveParams() 152 return errors::Internal("Unexpected num_subdivs ", num_subdivs, " in ", in GenerateSubdivsInCollectiveParams() 156 int subdiv_stride = kAvgDevPerTask / num_subdivs; in GenerateSubdivsInCollectiveParams() 158 col_params->instance.impl_details.subdiv_offsets.reserve(num_subdivs); in GenerateSubdivsInCollectiveParams() 159 for (int sdi = 0; sdi < num_subdivs; ++sdi) { in GenerateSubdivsInCollectiveParams() [all …]
|
D | ring_gatherer_test.cc | 49 int num_subdivs, int fail_after) { in Init() argument 56 rank, num_subdivs, dtype, shape, test_env_.get())); in Init() 80 int num_devices, int num_subdivs, int tensor_len, in RunTest() argument 83 device_type, num_subdivs, fail_after); in RunTest() 124 DeviceInstance(int rank, int num_subdivs, DataType dtype, in DeviceInstance() argument 129 if (num_subdivs > 0) { in DeviceInstance() 132 num_subdivs); in DeviceInstance()
|
D | ring_reducer_test.cc | 86 int num_subdivs, int fail_after) { in Init() argument 93 rank, num_subdivs, dtype, shape, test_env_.get())); in Init() 117 int num_devices, int num_subdivs, int tensor_len, in RunTest() argument 120 device_type, num_subdivs, fail_after); in RunTest() 159 DeviceInstance(int rank, int num_subdivs, DataType dtype, in DeviceInstance() argument 164 if (num_subdivs > 0) { in DeviceInstance() 167 num_subdivs); in DeviceInstance() 283 int num_subdivs = 2; in TEST_F() local 284 int num_chunks = kNumDevs * num_subdivs; in TEST_F()
|
D | hierarchical_tree_broadcaster.cc | 114 int num_subdivs = num_tasks + (num_tasks > 1 ? 1 : 0); in InitializeCollectiveParams() local 118 col_params->instance.impl_details.subdiv_permutations.resize(num_subdivs); in InitializeCollectiveParams() 119 col_params->subdiv_rank.reserve(num_subdivs); in InitializeCollectiveParams() 120 col_params->instance.impl_details.subdiv_source_rank.reserve(num_subdivs); in InitializeCollectiveParams() 180 for (int sri = 0; sri < num_subdivs; sri++) { in InitializeCollectiveParams() 292 int num_subdivs = static_cast<int>(col_params_->subdiv_rank.size()); in RunTree() local 298 for (int si = 0; si < num_subdivs; si++) { in RunTree() 367 if (status_.ok() && is_source_ && (1 == num_subdivs || 0 != si)) { in RunTree()
|
D | collective_test_util.cc | 252 int num_subdivs) { in GenerateEvenSubdivOffsets() argument 254 offsets.reserve(num_subdivs); in GenerateEvenSubdivOffsets() 255 int subdiv_stride = num_devices_per_worker / num_subdivs; in GenerateEvenSubdivOffsets() 256 for (int sdi = 0; sdi < num_subdivs; ++sdi) { in GenerateEvenSubdivOffsets()
|
D | collective_test_util.h | 98 int num_subdivs);
|