1 /* Copyright 2018 The TensorFlow Authors. All Rights Reserved. 2 3 Licensed under the Apache License, Version 2.0 (the "License"); 4 you may not use this file except in compliance with the License. 5 You may obtain a copy of the License at 6 7 http://www.apache.org/licenses/LICENSE-2.0 8 9 Unless required by applicable law or agreed to in writing, software 10 distributed under the License is distributed on an "AS IS" BASIS, 11 WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. 12 See the License for the specific language governing permissions and 13 limitations under the License. 14 ==============================================================================*/ 15 #ifndef TENSORFLOW_CORE_DISTRIBUTED_RUNTIME_DEVICE_RESOLVER_DISTRIBUTED_H_ 16 #define TENSORFLOW_CORE_DISTRIBUTED_RUNTIME_DEVICE_RESOLVER_DISTRIBUTED_H_ 17 18 #include <string> 19 #include <vector> 20 21 #include "tensorflow/core/framework/collective.h" 22 #include "tensorflow/core/framework/device_attributes.pb.h" 23 #include "tensorflow/core/lib/gtl/flatmap.h" 24 25 namespace tensorflow { 26 class DeviceMgr; 27 class WorkerCacheInterface; 28 29 class DeviceResolverDistributed : public DeviceResolverInterface { 30 public: 31 DeviceResolverDistributed(const DeviceMgr* dev_mgr, 32 WorkerCacheInterface* worker_cache, 33 const string& task_name); 34 ~DeviceResolverDistributed()35 virtual ~DeviceResolverDistributed() {} 36 37 void GetDeviceLocalitiesAsync(const CollInstanceParams& inst_params, 38 std::vector<DeviceLocality>* localities, 39 const StatusCallback& done) override; 40 41 void GetLocalityAsync(const string& device, const string& task, 42 DeviceLocality* locality, 43 const StatusCallback& done) override; 44 45 void ClearTask(const string& task) override; 46 47 protected: 48 // Loads attr_table_ with device attributes retrieved from remote task. 49 void RefreshRemoteAttributes(const string& device, const string& task, 50 const StatusCallback& done) LOCKS_EXCLUDED(mu_); 51 52 // Subroutine used by GetDeviceLocalitiesAsync. Recursively extends 53 // *localities with DeviceLocality of the corresponding device named 54 // by inst_params.instance.device_names. 55 void GetDeviceLocalitiesRecursive(const CollInstanceParams& inst_params, 56 std::vector<DeviceLocality>* localities, 57 const StatusCallback& done); 58 59 const DeviceMgr* dev_mgr_; // Not owned 60 WorkerCacheInterface* worker_cache_; // Not owned 61 const string task_name_; 62 mutex mu_; 63 gtl::FlatMap<string, DeviceAttributes> attr_table_ GUARDED_BY(mu_); 64 }; 65 66 } // namespace tensorflow 67 #endif // TENSORFLOW_CORE_DISTRIBUTED_RUNTIME_DEVICE_RESOLVER_DISTRIBUTED_H_ 68