OpenHarmony-v5.1.0-Release/s

/**
 * Copyright 2022 Huawei Technologies Co., Ltd
 *
 * Licensed under the Apache License, Version 2.0 (the "License");
 * you may not use this file except in compliance with the License.
 * You may obtain a copy of the License at
 *
 * http://www.apache.org/licenses/LICENSE-2.0
 *
 * Unless required by applicable law or agreed to in writing, software
 * distributed under the License is distributed on an "AS IS" BASIS,
 * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
 * See the License for the specific language governing permissions and
 * limitations under the License.
 */

#ifndef MINDSPORE_LITE_SRC_LITERT_DELEGATE_NNAPI_NNAPI_DELEGATE_H_
#define MINDSPORE_LITE_SRC_LITERT_DELEGATE_NNAPI_NNAPI_DELEGATE_H_

#include <string>
#include <memory>
#include <vector>
#include <queue>
#include <unordered_map>
#include <utility>
#include "include/api/delegate.h"
#include "src/litert/delegate/nnapi/nnapi_subgraph.h"
#include "src/litert/delegate/nnapi/op/nnapi_op.h"

namespace mindspore {
namespace lite {
class NNAPIDelegate : public Delegate {
 public:
  NNAPIDelegate() : Delegate() {}
  explicit NNAPIDelegate(bool relax_fp32_to_fp16, bool only_use_acc_device, bool disable_cpu_device,
                         const std::vector<std::string> &specified_devices)
      : Delegate(),
        relax_fp32_to_fp16_(relax_fp32_to_fp16),
        only_use_acc_device_(only_use_acc_device),
        disable_cpu_device_(disable_cpu_device),
        specified_devices_(std::move(specified_devices)) {}

  ~NNAPIDelegate() override{};

  Status Init() override;

  Status Build(DelegateModel<schema::Primitive> *model) override;

  void ReplaceNodes(const std::shared_ptr<LiteDelegateGraph> &graph) override;

 private:
  template <typename T>
  STATUS FindReadyKernels(std::vector<T *> *kernels, std::vector<T *> *ready_kernels) {
    MS_ASSERT(kernels != nullptr && ready_kernels != nullptr);
    std::queue<T *> tmp_kernels;
    std::vector<mindspore::MSTensor> visited_tensor;

    std::function<bool(T *)> is_kernel_ready = [&visited_tensor](T *kernel) {
      return std::all_of(kernel->inputs().begin(), kernel->inputs().end(), [&visited_tensor](MSTensor input) {
        return input.IsConst() ||
               std::find(visited_tensor.begin(), visited_tensor.end(), input) != visited_tensor.end();
      });
    };

    // initialize the visited_tensor map.
    for (const auto &input : inputs_) {
      visited_tensor.push_back(input);
    }
    for (auto ready_kernel : sorted_kernels_) {
      for (const auto &output : ready_kernel->outputs()) {
        visited_tensor.push_back(output);
      }
    }
    for (auto kernel : *kernels) {
      MS_CHECK_TRUE_RET(kernel != nullptr, RET_ERROR);
      if (is_kernel_ready(kernel)) {
        tmp_kernels.push(kernel);
        ready_kernels->push_back(kernel);
        kernels->erase(std::find(kernels->begin(), kernels->end(), kernel));
        break;
      }
    }

    while (!tmp_kernels.empty()) {
      auto tmp_kernel = tmp_kernels.front();
      tmp_kernels.pop();
      for (const auto &output : tmp_kernel->outputs()) {
        visited_tensor.push_back(output);
      }
      for (auto itr = kernels->begin(); itr != kernels->end();) {
        if (is_kernel_ready(*itr)) {
          tmp_kernels.push(*itr);
          ready_kernels->push_back(*itr);
          kernels->erase(itr);
        } else {
          itr++;
        }
      }
    }
    return RET_OK;
  }

  NNAPISubGraph *CreateNNAPISubGraph(DelegateModel<schema::Primitive> *model, std::vector<NNAPIOp *> *condidate_ops);

 private:
  bool relax_fp32_to_fp16_ = true;
  bool only_use_acc_device_ = false;
  bool disable_cpu_device_ = false;
  std::vector<std::string> specified_devices_;

  std::vector<mindspore::MSTensor> inputs_;
  std::vector<kernel::Kernel *> sorted_kernels_;
  std::vector<kernel::Kernel *> remained_kernels_;
  std::vector<NNAPISubGraph *> nnapi_kernels_;
  std::unordered_map<schema::PrimitiveType, NNAPIGetOp> op_func_lists_;
  std::vector<ANeuralNetworksDevice *> devices_;
};
}  // namespace lite
}  // namespace mindspore

#endif  // MINDSPORE_LITE_SRC_LITERT_DELEGATE_NNAPI_NNAPI_DELEGATE_H_