/**
 * Copyright 2020-2021 Huawei Technologies Co., Ltd
 *
 * Licensed under the Apache License, Version 2.0 (the "License");
 * you may not use this file except in compliance with the License.
 * You may obtain a copy of the License at
 *
 * http://www.apache.org/licenses/LICENSE-2.0
 *
 * Unless required by applicable law or agreed to in writing, software
 * distributed under the License is distributed on an "AS IS" BASIS,
 * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
 * See the License for the specific language governing permissions and
 * limitations under the License.
 */
#ifndef MINDSPORE_CCSRC_MINDDATA_DATASET_ENGINE_CACHE_CLIENT_H_
#define MINDSPORE_CCSRC_MINDDATA_DATASET_ENGINE_CACHE_CLIENT_H_

#include <atomic>
#include <iostream>
#include <limits>
#include <memory>
#include <map>
#include <mutex>
#include <set>
#include <string>
#include <unordered_map>
#include <utility>
#include <vector>

#include "minddata/dataset/core/config_manager.h"
#ifdef ENABLE_CACHE
#include "minddata/dataset/engine/cache/cache_grpc_client.h"
#else
#include "minddata/dataset/engine/cache/stub/cache_grpc_client.h"
#endif

#include "minddata/dataset/util/lock.h"
#include "minddata/dataset/util/cond_var.h"
#include "minddata/dataset/util/queue_map.h"
#include "minddata/dataset/util/task_manager.h"
#include "minddata/dataset/util/wait_post.h"

namespace mindspore {
namespace dataset {
/// \brief A CacheClient is a bridge between a DatasetOp and a CacheServer. All communications are through
/// a CacheClient. Typical tasks include creating a cache service, caching a data buffer, restoring
/// previously cached rows, etc.
class CacheClient {
 public:
  friend class CacheMergeOp;
  friend class CreateCacheRequest;
  friend class CacheRowRequest;
  friend class BatchFetchRequest;
  friend class BatchCacheRowsRequest;

  /// \brief A builder to help creating a CacheClient object
  class Builder {
   public:
    Builder();

    ~Builder() = default;

    /// Setter function to set the session id
    /// \param session_id
    /// \return Builder object itself.
    Builder &SetSessionId(session_id_type session_id) {
      session_id_ = session_id;
      return *this;
    }

    /// Setter function to set the cache memory size
    /// \param cache_mem_sz
    /// \return Builder object itself
    Builder &SetCacheMemSz(uint64_t cache_mem_sz) {
      cache_mem_sz_ = cache_mem_sz;
      return *this;
    }

    /// Setter function to set the spill attribute
    /// \param spill
    /// \return Builder object itself
    Builder &SetSpill(bool spill) {
      spill_ = spill;
      return *this;
    }

    /// Setter function to set rpc hostname
    /// \param host
    /// \return Builder object itself
    Builder &SetHostname(std::string host) {
      hostname_ = std::move(host);
      return *this;
    }

    /// Setter function to set tcpip port
    /// \param port
    /// \return Builder object itself.
    Builder &SetPort(int32_t port) {
      port_ = port;
      return *this;
    }

    /// Setter function to set number of async rpc workers
    /// \param num_connections
    /// \return Builder object itself
    Builder &SetNumConnections(int32_t num_connections) {
      num_connections_ = num_connections;
      return *this;
    }

    /// Setter function to set prefetch amount for fetching rows from cache server
    /// \param prefetch_sz
    /// \return Builder object itself
    Builder &SetPrefetchSize(int32_t prefetch_sz) {
      prefetch_size_ = prefetch_sz;
      return *this;
    }

    /// Getter functions
    session_id_type GetSessionId() const { return session_id_; }
    uint64_t GetCacheMemSz() const { return cache_mem_sz_; }
    bool isSpill() const { return spill_; }
    const std::string &GetHostname() const { return hostname_; }
    int32_t GetPort() const { return port_; }
    int32_t GetNumConnections() const { return num_connections_; }
    int32_t GetPrefetchSize() const { return prefetch_size_; }

    /// \brief Validate the builder parameters before construction
    /// \return Status object
    Status SanityCheck();

    /// \brief Construct the CacheClient from the accumulated settings
    /// \param[out] out The constructed CacheClient
    /// \return Status object
    Status Build(std::shared_ptr<CacheClient> *out);

   private:
    session_id_type session_id_;
    uint64_t cache_mem_sz_;
    bool spill_;
    std::string hostname_;
    int32_t port_;
    int32_t num_connections_;
    int32_t prefetch_size_;
  };

  /// \brief Constructor
  /// \param session_id A user assigned session id for the current pipeline
  /// \param cache_mem_sz Size of the memory set aside for the row caching. 0 for unlimited
  /// \param spill Spill to disk if out of memory
  /// \param hostname rpc hostname of the cache server
  /// \param port tcpip port of the cache server
  /// \param num_connections Number of async rpc workers
  /// \param prefetch_size Prefetch amount for fetching rows from cache server
  CacheClient(session_id_type session_id, uint64_t cache_mem_sz, bool spill, std::string hostname, int32_t port,
              int32_t num_connections, int32_t prefetch_size);

  /// \brief Destructor
  ~CacheClient();

  /// \brief Send a TensorRow to the cache server
  /// \param[in] row
  /// \param[out] row_id_from_server Optional. The row id assigned by the server for non-mappable dataset
  /// \return return code
  Status WriteRow(const TensorRow &row, row_id_type *row_id_from_server = nullptr) const;

  /// \brief Fetch a list of rows from the cache server. An empty TensorRow will be returned if there is
  /// any cache miss
  /// \param row_id A vector of row id's
  /// \param out A TensorTable of TensorRows.
  /// \return return code
  Status GetRows(const std::vector<row_id_type> &row_id, TensorTable *out) const;

  /// \brief Create a cache.
  /// \param tree_crc A crc that was generated during tree prepare phase
  /// \param generate_id Let the cache service generate row id
  /// \return Status object
  Status CreateCache(uint32_t tree_crc, bool generate_id);

  /// \brief Destroy a cache. Like Purge but the cache is deleted and can't be reused.
  /// \return Status object
  Status DestroyCache();

  /// \brief Get the statistics from a cache.
  /// \param[in/out] Pointer to a pre-allocated ServiceStat object
  /// \return Status object
  Status GetStat(CacheServiceStat *);

  /// \brief Get the state of a cache server
  /// \param[in/out] Pointer to a int8_t
  /// \return Status object
  Status GetState(int8_t *);

  /// \brief Cache the schema at the cache server
  /// \param map The unordered map of the schema
  /// \return Status object
  Status CacheSchema(const std::unordered_map<std::string, int32_t> &map);

  /// \brief Fetch the schema from the cache server
  /// \param map Pointer to pre-allocated map object
  /// \return Status object.
  Status FetchSchema(std::unordered_map<std::string, int32_t> *map);

  /// \brief Change the state from build phase to read phase. Applicable to non-mappable dataset only. Only the cache
  /// client that holds cookie can be allowed to make this request
  /// \return Status object
  Status BuildPhaseDone() const;

  /// \brief A print method typically used for debugging
  /// \param out The output stream to write output to
  void Print(std::ostream &out) const;

  /// \brief Stream output operator overload
  /// \return the output stream must be returned
  friend std::ostream &operator<<(std::ostream &out, const CacheClient &cc) {
    cc.Print(out);
    return out;
  }

  /// \brief Every cache server has a cookie which uniquely identifies the CacheClient that creates it.
  /// \return Cookie
  std::string cookie() const { return cookie_; }

  /// \brief Send a request async to the server
  /// \param rq BaseRequest
  /// \return Status object
  Status PushRequest(std::shared_ptr<BaseRequest> rq) const;

  /// \brief If the remote server supports local bypass using shared memory
  /// \return boolean value
  bool SupportLocalClient() const { return local_bypass_; }

  /// \brief Return the base memory address if we attach to any shared memory.
  auto SharedMemoryBaseAddr() const { return comm_->SharedMemoryBaseAddr(); }

  /// Getter functions
  session_id_type session_id() const { return cinfo_.session_id(); }
  uint64_t GetCacheMemSz() const { return cache_mem_sz_; }
  bool isSpill() const { return spill_; }
  int32_t GetNumConnections() const { return num_connections_; }
  int32_t GetPrefetchSize() const { return prefetch_size_; }
  int32_t GetClientId() const { return client_id_; }
  std::string GetHostname() const;
  int32_t GetPort() const;

  /// MergeOp will notify us when the server can't cache any more rows.
  /// We will stop any attempt to fetch any rows that are most likely
  /// not present at the server.
  void ServerRunningOutOfResources();

  /// \brief Check if a row is 100% cache miss at the server by checking the local information
  /// \param key row id to be tested
  /// \return true if not at the server
  bool KeyIsCacheMiss(row_id_type key) {
    if (cache_miss_keys_) {
      // Make sure it is fully built even though the pointer is not null
      Status rc = cache_miss_keys_wp_.Wait();
      if (rc.IsOk()) {
        return cache_miss_keys_->KeyIsCacheMiss(key);
      }
    }
    // Default to "not a miss" when the miss-key table isn't available (or the wait failed),
    // so callers will still attempt the fetch from the server.
    return false;
  }

  /// \brief Serialize a Tensor into the async buffer.
  /// \param row The TensorRow to be written asynchronously
  /// \return Status object
  Status AsyncWriteRow(const TensorRow &row);

  // Default size of the async write buffer
  constexpr static int64_t kAsyncBufferSize = 16 * 1048576L;  // 16M
  constexpr static int32_t kNumAsyncBuffer = 3;

  /// Force a final flush to the cache server. Must be called when receiving eoe.
  /// \return Status object (OK if async write was never enabled)
  Status FlushAsyncWriteBuffer() {
    if (async_buffer_stream_) {
      return async_buffer_stream_->SyncFlush(AsyncBufferStream::AsyncFlushFlag::kFlushBlocking);
    }
    return Status::OK();
  }

 private:
  mutable RWLock mux_;
  uint64_t cache_mem_sz_;
  bool spill_;
  // The session_id_ and cache_crc_ work together to uniquely identify this particular cache and allow
  // sharing of the cache.
  CacheClientInfo cinfo_;
  // The server_connection_id_ is the actual id we use for operations after the cache is built
  connection_id_type server_connection_id_;
  // Some magic cookie/id returned from the cache server.
  std::string cookie_;
  int32_t client_id_;
  std::vector<int32_t> cpu_list_;
  // Comm layer
  bool local_bypass_;
  int32_t num_connections_;
  int32_t prefetch_size_;
  mutable std::shared_ptr<CacheClientGreeter> comm_;
  std::atomic<bool> fetch_all_keys_;
  // Posted once cache_miss_keys_ below is fully constructed; KeyIsCacheMiss waits on it.
  WaitPost cache_miss_keys_wp_;
  /// A structure shared by all the prefetchers to know what keys are missing at the server.
  class CacheMissKeys {
   public:
    explicit CacheMissKeys(const std::vector<row_id_type> &v);
    ~CacheMissKeys() = default;
    /// This checks if a key is missing.
    /// \param key
    /// \return true if definitely a key miss
    bool KeyIsCacheMiss(row_id_type key);

   private:
    // Miss keys are represented compactly as a [min_, max_] range plus the set of
    // gaps inside it (presumably the keys NOT in that representation are cached).
    row_id_type min_;
    row_id_type max_;
    std::set<row_id_type> gap_;
  };
  std::unique_ptr<CacheMissKeys> cache_miss_keys_;

  /// A data stream of back-to-back serialized tensor rows.
  class AsyncBufferStream {
   public:
    AsyncBufferStream();
    ~AsyncBufferStream();

    /// \brief Initialize an async write buffer
    /// \param cc The owning CacheClient (non-owning back pointer)
    /// \return Status object
    Status Init(CacheClient *cc);

    /// A worker will call the API AsyncWrite to put a TensorRow into the data stream.
    /// A background thread will stream the data to the cache server.
    /// The result of calling AsyncWrite is not immediately known or it can be the last
    /// result of some previous flush.
    /// \note Need to call SyncFlush to do the final flush.
    Status AsyncWrite(const TensorRow &row);
    // NOTE(review): values are bit-flag style (1 and 1u << 2, skipping bit 1) — presumably
    // kCallerHasXLock can be OR'ed with a flush mode; confirm against SyncFlush call sites.
    enum class AsyncFlushFlag : int8_t { kFlushNone = 0, kFlushBlocking = 1, kCallerHasXLock = 1u << 2 };
    Status SyncFlush(AsyncFlushFlag flag);

    /// This maps a physical shared memory to the data stream.
    class AsyncWriter {
     public:
      friend class AsyncBufferStream;
      Status Write(int64_t sz, const std::vector<ReadableSlice> &v);

     private:
      std::shared_ptr<BatchCacheRowsRequest> rq;
      void *buffer_;
      int32_t num_ele_;      // How many tensor rows in this buffer
      int64_t bytes_avail_;  // Number of bytes remaining
    };

    /// \brief Release the shared memory during shutdown
    /// \note but needs comm layer to be alive.
    Status ReleaseBuffer();
    /// \brief Reset the AsyncBufferStream into its initial state
    /// \return Status object
    Status Reset();

   private:
    Status flush_rc_;
    std::mutex mux_;
    TaskGroup vg_;
    CacheClient *cc_;
    int64_t offset_addr_;
    AsyncWriter buf_arr_[kNumAsyncBuffer];  // Rotating pool of write buffers
    int32_t cur_;                           // Index of the buffer currently being filled
  };
  std::shared_ptr<AsyncBufferStream> async_buffer_stream_;
};
}  // namespace dataset
}  // namespace mindspore

#endif  // MINDSPORE_CCSRC_MINDDATA_DATASET_ENGINE_CACHE_CLIENT_H_