/**
 * Copyright (c) Huawei Technologies Co., Ltd. 2020-2021. All rights reserved.
 *
 * Licensed under the Apache License, Version 2.0 (the "License");
 * you may not use this file except in compliance with the License.
 * You may obtain a copy of the License at
 *
 * http://www.apache.org/licenses/LICENSE-2.0
 *
 * Unless required by applicable law or agreed to in writing, software
 * distributed under the License is distributed on an "AS IS" BASIS,
 * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
 * See the License for the specific language governing permissions and
 * limitations under the License.
 */

#include "utils/kernel_util.h"

#include <algorithm>
#include <map>
#include <string>
#include <vector>

#include "inc/cust_cpu_utils.h"

namespace aicpu {
namespace {
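// Maps each Format enum value to its human-readable name.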
const std::map<Format, std::string> kFormatToStringMap = {
  {FORMAT_NCHW, "NCHW"},
  {FORMAT_NHWC, "NHWC"},
  {FORMAT_ND, "ND"},
  {FORMAT_NC1HWC0, "NC1HWC0"},
  {FORMAT_FRACTAL_Z, "FRACTAL_Z"},
  {FORMAT_NC1C0HWPAD, "NC1C0HWPAD"},
  {FORMAT_NHWC1C0, "NHWC1C0"},
  {FORMAT_FSR_NCHW, "FSR_NCHW"},
  {FORMAT_FRACTAL_DECONV, "FRACTAL_DECONV"},
  {FORMAT_C1HWNC0, "C1HWNC0"},
  {FORMAT_FRACTAL_DECONV_TRANSPOSE, "FRACTAL_DECONV_TRANSPOSE"},
  {FORMAT_FRACTAL_DECONV_SP_STRIDE_TRANS, "FRACTAL_DECONV_SP_STRIDE_TRANS"},
  {FORMAT_NC1HWC0_C04, "NC1HWC0_C04"},
  {FORMAT_FRACTAL_Z_C04, "FRACTAL_Z_C04"},
  {FORMAT_CHWN, "CHWN"},
  {FORMAT_FRACTAL_DECONV_SP_STRIDE8_TRANS, "DECONV_SP_STRIDE8_TRANS"},
  {FORMAT_NC1KHKWHWC0, "NC1KHKWHWC0"},
  {FORMAT_BN_WEIGHT, "BN_WEIGHT"},
  {FORMAT_FILTER_HWCK, "FILTER_HWCK"},
  {FORMAT_HWCN, "HWCN"},
  {FORMAT_HASHTABLE_LOOKUP_LOOKUPS, "LOOKUP_LOOKUPS"},
  {FORMAT_HASHTABLE_LOOKUP_KEYS, "LOOKUP_KEYS"},
  {FORMAT_HASHTABLE_LOOKUP_VALUE, "LOOKUP_VALUE"},
  {FORMAT_HASHTABLE_LOOKUP_OUTPUT, "LOOKUP_OUTPUT"},
  {FORMAT_HASHTABLE_LOOKUP_HITS, "LOOKUP_HITS"},
  {FORMAT_MD, "MD"},
  {FORMAT_NDHWC, "NDHWC"},
  {FORMAT_NCDHW, "NCDHW"},
  {FORMAT_DHWCN, "DHWCN"},
  {FORMAT_DHWNC, "DHWNC"},
  {FORMAT_NDC1HWC0, "NDC1HWC0"},
  {FORMAT_FRACTAL_Z_3D, "FRACTAL_Z_3D"},
  {FORMAT_FRACTAL_Z_3D_TRANSPOSE, "FRACTAL_Z_3D_TRANSPOSE"},
  {FORMAT_C1HWNCoC0, "C1HWNCoC0"},
  {FORMAT_FRACTAL_NZ, "FRACTAL_NZ"},
  {FORMAT_CN, "CN"},
  {FORMAT_NC, "NC"},
  {FORMAT_FRACTAL_ZN_LSTM, "FRACTAL_ZN_LSTM"},
  {FORMAT_FRACTAL_Z_G, "FRACTAL_Z_G"},
  {FORMAT_RESERVED, "FORMAT_RESERVED"},
  {FORMAT_ALL, "ALL"},
  {FORMAT_NULL, "NULL"}};
} // namespace

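// Converts a Format enum value to its string name; when the format encodes a sub-format,
// the result is "<primary>:<sub>". Unknown formats are logged and reported as "UNDEFINED".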
std::string FormatToSerialString(CpuKernelContext &ctx, Format format) {
  auto it = kFormatToStringMap.find(static_cast<Format>(GetPrimaryFormat(static_cast<int32_t>(format))));
  if (it != kFormatToStringMap.end()) {
    if (HasSubFormat(static_cast<int32_t>(format))) {
      return it->second + ":" + std::to_string(GetSubFormat(static_cast<int32_t>(format)));
    }
    return it->second;
  } else {
    CUST_KERNEL_LOG_ERROR(ctx, "Format [%u] is not supported", format);
    return "UNDEFINED";
  }
}

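// Maps data type names (e.g. "DT_FLOAT") to DataType enum values; used by DType() and DTypeStr().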
const std::map<std::string, DataType> dtype_maps{{"DT_FLOAT", DT_FLOAT},
                                                 {"DT_FLOAT16", DT_FLOAT16},
                                                 {"DT_INT8", DT_INT8},
                                                 {"DT_INT16", DT_INT16},
                                                 {"DT_UINT16", DT_UINT16},
                                                 {"DT_UINT8", DT_UINT8},
                                                 {"DT_INT32", DT_INT32},
                                                 {"DT_INT64", DT_INT64},
                                                 {"DT_UINT32", DT_UINT32},
                                                 {"DT_UINT64", DT_UINT64},
                                                 {"DT_BOOL", DT_BOOL},
                                                 {"DT_DOUBLE", DT_DOUBLE},
                                                 {"DT_STRING", DT_STRING},
                                                 {"DT_DUAL_SUB_INT8", DT_DUAL_SUB_INT8},
                                                 {"DT_DUAL_SUB_UINT8", DT_DUAL_SUB_UINT8},
                                                 {"DT_COMPLEX64", DT_COMPLEX64},
                                                 {"DT_COMPLEX128", DT_COMPLEX128},
                                                 {"DT_QINT8", DT_QINT8},
                                                 {"DT_QINT16", DT_QINT16},
                                                 {"DT_QINT32", DT_QINT32},
                                                 {"DT_QUINT8", DT_QUINT8},
                                                 {"DT_QUINT16", DT_QUINT16},
                                                 {"DT_RESOURCE", DT_RESOURCE},
                                                 {"DT_STRING_REF", DT_STRING_REF},
                                                 {"DT_DUAL", DT_DUAL},
                                                 {"DT_UNDEFINED", DT_UNDEFINED}};

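// A tensor is considered empty when its data pointer is null and at least one dimension is 0.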
bool IsEmptyTensor(Tensor *tensor) {
  auto dims = tensor->GetTensorShape()->GetDimSizes();
  if (tensor->GetData() == nullptr) {
    for (uint32_t i = 0; i < dims.size(); i++) {
      if (dims[i] == 0) {
        return true;
      }
    }
  }
  return false;
}

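// Validates a binary elementwise math op: exactly two inputs of the same data type and one output.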
uint32_t NormalMathCheck(CpuKernelContext &ctx) {
  const uint32_t kInputNum = 2;
  const uint32_t kOutputNum = 1;

  if ((ctx.GetInputsSize() != kInputNum) || (ctx.GetOutputsSize() != kOutputNum)) {
    CUST_KERNEL_LOG_ERROR(ctx,
                          "[%s] Input size or output size is unexpected, "
                          "expected input size [%u], real input size [%u], "
                          "expected output size [%u], real output size [%u]",
                          ctx.GetOpType().c_str(), kInputNum, ctx.GetInputsSize(), kOutputNum, ctx.GetOutputsSize());
    return KERNEL_STATUS_PARAM_INVALID;
  }

  Tensor *input_0 = ctx.Input(kFirstInputIndex);
  CUST_KERNEL_CHECK_NULLPTR(ctx, input_0, KERNEL_STATUS_PARAM_INVALID, "[%s] Get input[0] failed",
                            ctx.GetOpType().c_str());
  Tensor *input_1 = ctx.Input(kSecondInputIndex);
  CUST_KERNEL_CHECK_NULLPTR(ctx, input_1, KERNEL_STATUS_PARAM_INVALID, "[%s] Get input[1] failed",
                            ctx.GetOpType().c_str());

  if (input_0->GetDataType() != input_1->GetDataType()) {
    CUST_KERNEL_LOG_ERROR(ctx,
                          "[%s] data types of inputs do not match, input[0] data type is [%d], "
                          "input[1] data type is [%d]",
                          ctx.GetOpType().c_str(), input_0->GetDataType(), input_1->GetDataType());
    return KERNEL_STATUS_PARAM_INVALID;
  }

  Tensor *output = ctx.Output(kFirstOutputIndex);
  CUST_KERNEL_CHECK_NULLPTR(ctx, output, KERNEL_STATUS_PARAM_INVALID, "[%s] Get output[0] failed",
                            ctx.GetOpType().c_str());
  return KERNEL_STATUS_OK;
}

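// Validates that the context holds the expected numbers of inputs and outputs and that each
// non-empty tensor has both a shape and a data pointer. Passing kDynamicInput or kDynamicOutput
// skips the corresponding check.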
uint32_t NormalCheck(CpuKernelContext &ctx, const uint32_t inputs_num, const uint32_t outputs_num) {
  if (inputs_num != kDynamicInput) {
    CUST_KERNEL_CHECK_FALSE(ctx, (ctx.GetInputsSize() >= inputs_num), KERNEL_STATUS_PARAM_INVALID,
                            "[%s] need [%u] inputs, but got [%u].", ctx.GetOpType().c_str(), inputs_num,
                            ctx.GetInputsSize());
    for (uint32_t i = 0; i < inputs_num; ++i) {
      Tensor *input = ctx.Input(i);
      CUST_KERNEL_CHECK_NULLPTR(ctx, input, KERNEL_STATUS_INNER_ERROR, "[%s] get input[%u] failed.",
                                ctx.GetOpType().c_str(), i);
      auto input_shape = input->GetTensorShape();
      CUST_KERNEL_CHECK_NULLPTR(ctx, input_shape, KERNEL_STATUS_PARAM_INVALID, "%s input[%u] tensor shape is nullptr.",
                                ctx.GetOpType().c_str(), i);
      if (!IsEmptyTensor(input)) {
        auto input_data = input->GetData();
        CUST_KERNEL_CHECK_NULLPTR(ctx, input_data, KERNEL_STATUS_PARAM_INVALID, "%s input[%u] tensor data is nullptr.",
                                  ctx.GetOpType().c_str(), i);
      }
    }
  }

  if (outputs_num != kDynamicOutput) {
    CUST_KERNEL_CHECK_FALSE(ctx, (ctx.GetOutputsSize() == outputs_num), KERNEL_STATUS_PARAM_INVALID,
                            "[%s] need [%u] outputs, but got [%u].", ctx.GetOpType().c_str(), outputs_num,
                            ctx.GetOutputsSize());
    for (uint32_t i = 0; i < outputs_num; ++i) {
      Tensor *output = ctx.Output(i);
      CUST_KERNEL_CHECK_NULLPTR(ctx, output, KERNEL_STATUS_INNER_ERROR, "[%s] get output[%u] failed.",
                                ctx.GetOpType().c_str(), i);
      auto output_shape = output->GetTensorShape();
      CUST_KERNEL_CHECK_NULLPTR(ctx, output_shape, KERNEL_STATUS_PARAM_INVALID,
                                "%s output[%u] tensor shape is nullptr.", ctx.GetOpType().c_str(), i);
      if (!IsEmptyTensor(output)) {
        auto output_data = output->GetData();
        CUST_KERNEL_CHECK_NULLPTR(ctx, output_data, KERNEL_STATUS_PARAM_INVALID,
                                  "%s output[%u] tensor data is nullptr.", ctx.GetOpType().c_str(), i);
      }
    }
  }
  return KERNEL_STATUS_OK;
}

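// Same as NormalCheck above, and additionally requires every attribute named in attr_names to be set.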
uint32_t NormalCheck(CpuKernelContext &ctx, const uint32_t inputs_num, const uint32_t outputs_num,
                     const std::vector<std::string> &attr_names) {
  CUST_KERNEL_HANDLE_ERROR(ctx, NormalCheck(ctx, inputs_num, outputs_num), "Check params failed.");
  for (auto const &attr_name : attr_names) {
    auto attr = ctx.GetAttr(attr_name);
    CUST_KERNEL_CHECK_NULLPTR(ctx, attr, KERNEL_STATUS_PARAM_INVALID, "[%s] attr[%s] is nullptr.",
                              ctx.GetOpType().c_str(), attr_name.c_str());
  }
  return KERNEL_STATUS_OK;
}

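// Shape rank predicates: scalar (rank 0), vector (rank 1), matrix (rank 2), square matrix.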
bool IsScalar(const std::vector<int64_t> &shape) { return (shape.size() == 0); }

bool IsVector(const std::vector<int64_t> &shape) { return (shape.size() == 1); }

bool IsMatrix(const std::vector<int64_t> &shape) { return (shape.size() == 2); }

bool IsSquareMatrix(const std::vector<int64_t> &shape) { return ((shape.size() == 2) && (shape[0] == shape[1])); }

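// Checks whether an address is aligned to the given byte alignment.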
bool AddrAlignedCheck(const void *addr, uint64_t alignment) {
  return reinterpret_cast<uintptr_t>(addr) % alignment == 0;
}

bool IsVectorOrHigher(const std::vector<int64_t> &shape) { return (shape.size() >= 1); }

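// Looks up a data type by its name, e.g. DType("DT_FLOAT") returns DT_FLOAT;
// unknown names return DT_UNDEFINED.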
DataType DType(std::string dtype_str) {
  auto iter = dtype_maps.find(dtype_str);
  if (iter != dtype_maps.end()) {
    return iter->second;
  } else {
    return DT_UNDEFINED;
  }
}

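// Returns the name of a data type, e.g. DTypeStr(DT_FLOAT) returns "DT_FLOAT";
// unknown values return "DT_UNDEFINED".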
std::string DTypeStr(DataType dtype) {
  auto iter =
    std::find_if(dtype_maps.begin(), dtype_maps.end(),
                 [dtype](const std::map<std::string, DataType>::value_type &kv) { return (kv.second == dtype); });
  if (iter != dtype_maps.end()) {
    return iter->first;
  } else {
    return std::string("DT_UNDEFINED");
  }
}

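// Checks that every tensor type in `types` equals `check_type`; on mismatch, logs an error
// naming the offending argument and the primitive `prim_name`.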
uint32_t CheckTensorTypeSame(CpuKernelContext &ctx, const std::map<std::string, DataType> &types,
                             const DataType &check_type, const std::string &prim_name) {
  if (types.empty()) {
    CUST_KERNEL_LOG_ERROR(ctx, "Trying to use the function to check an empty types map!");
    return KERNEL_STATUS_PARAM_INVALID;
  }
  for (const auto &type : types) {
    auto _type_ = type.second;
    if (_type_ != check_type) {
      CUST_KERNEL_LOG_ERROR(ctx,
                            "For primitive[%s]'s input argument [%s], the type should be equal to [%s], "
                            "but the real type is [%s].",
                            prim_name.c_str(), type.first.c_str(), DTypeStr(check_type).c_str(),
                            DTypeStr(_type_).c_str());
      return KERNEL_STATUS_PARAM_INVALID;
    }
  }
  return KERNEL_STATUS_OK;
}

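// Checks that every tensor shape in `shapes` equals `check_shape`; shape pointers must not be null.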
uint32_t CheckTensorShapeSame(CpuKernelContext &ctx, const std::map<std::string, TensorShapePtr> &shapes,
                              const std::vector<int64_t> &check_shape, const std::string &prim_name) {
  if (shapes.empty()) {
    CUST_KERNEL_LOG_ERROR(ctx, "Trying to use the function to check an empty shapes map!");
    return KERNEL_STATUS_PARAM_INVALID;
  }
  for (const auto &shape : shapes) {
    auto _shape_ptr_ = shape.second;
    CUST_KERNEL_CHECK_NULLPTR(ctx, _shape_ptr_, KERNEL_STATUS_PARAM_INVALID,
                              "For primitive[%s]'s input argument [%s], the TensorShapePtr "
                              "should not be nullptr.",
                              prim_name.c_str(), shape.first.c_str());
    auto _shape_ = _shape_ptr_->GetDimSizes();
    if (!ShapeVectorIsSame(_shape_, check_shape)) {
      CUST_KERNEL_LOG_ERROR(ctx,
                            "For primitive[%s]'s input argument [%s], the shape should be equal to (%s), "
                            "but the real shape is (%s).",
                            prim_name.c_str(), shape.first.c_str(), VectorToString(check_shape).c_str(),
                            VectorToString(_shape_).c_str());
      return KERNEL_STATUS_PARAM_INVALID;
    }
  }
  return KERNEL_STATUS_OK;
}

} // namespace aicpu