OpenHarmony-v6.0-Release/s

/**
 * Copyright 2022 Huawei Technologies Co., Ltd
 *
 * Licensed under the Apache License, Version 2.0 (the "License");
 * you may not use this file except in compliance with the License.
 * You may obtain a copy of the License at
 *
 * http://www.apache.org/licenses/LICENSE-2.0
 *
 * Unless required by applicable law or agreed to in writing, software
 * distributed under the License is distributed on an "AS IS" BASIS,
 * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
 * See the License for the specific language governing permissions and
 * limitations under the License.
 */

#include "plugin/device/cpu/kernel/set_size_cpu_kernel.h"
#include <algorithm>
#include <unordered_set>
#include "plugin/device/cpu/hal/device/cpu_device_address.h"
#include "mindspore/core/ops/set_size.h"

namespace mindspore {
namespace kernel {
/**
 * One-time kernel setup: checks the number of input/output tensors, caches the validate-indices attribute of the
 * primitive and asks MatchKernelFunc to pick the launch function for the given tensors.
 *
 * @param inputs Kernel input tensors (three are expected).
 * @param outputs Kernel output tensors (one is expected).
 * @return The result of MatchKernelFunc.
 */
bool SetSizeCpuKernelMod::Init(const std::vector<KernelTensor *> &inputs, const std::vector<KernelTensor *> &outputs) {
  constexpr size_t kExpectedInputCount = 3;
  constexpr size_t kExpectedOutputCount = 1;
  CHECK_KERNEL_INPUTS_NUM(inputs.size(), kExpectedInputCount, kernel_name_);
  CHECK_KERNEL_OUTPUTS_NUM(outputs.size(), kExpectedOutputCount, kernel_name_);

  // Remember whether Launch has to run the per-index validation pass.
  const auto validate_attr = primitive_->GetAttr(ops::kValidateIndices);
  validate_indices_ = GetValue<bool>(validate_attr);

  const bool matched = MatchKernelFunc(kernel_name_, inputs, outputs);
  return matched;
}

/**
 * Refreshes the cached shape information after the base-class resize succeeded.
 *
 * Caches the shape vectors of inputs[kIndex2] and outputs[kIndex0], takes the number of values from the first
 * dimension of inputs[kIndex1] and takes dims_ from the first dimension of inputs[kIndex2].
 *
 * @param inputs Kernel input tensors.
 * @param outputs Kernel output tensors.
 * @return The base-class status if it is not KRET_OK, otherwise KRET_OK.
 */
int SetSizeCpuKernelMod::Resize(const std::vector<KernelTensor *> &inputs, const std::vector<KernelTensor *> &outputs) {
  const auto base_status = KernelMod::Resize(inputs, outputs);
  if (base_status != KRET_OK) {
    return base_status;
  }

  shape_ = inputs[kIndex2]->GetShapeVector();
  output_shape_ = outputs[kIndex0]->GetShapeVector();

  const auto values_shape = inputs[kIndex1]->GetShapeVector();
  values_size_ = static_cast<size_t>(values_shape.front());
  dims_ = shape_.front();
  return KRET_OK;
}

/**
 * Validates the n-th index row (dims_ consecutive int64 values in inputs[kIndex0]).
 *
 * Every component must lie in [0, bound) where the bounds are read from inputs[kIndex2]. For n != 0 the row is
 * also compared component by component with row n - 1: it must not be lexicographically smaller ("out of order")
 * and must not be identical ("repeated").
 *
 * @param n Position of the row to check.
 * @param inputs Kernel inputs; index 0 holds the indices, index 2 the bounds.
 * @return true when the row passes every check; each failure is reported through MS_EXCEPTION(ValueError).
 */
bool SetSizeCpuKernelMod::IndicesValid(int64_t n, const std::vector<kernel::KernelTensor *> &inputs) const {
  const auto *index_data = static_cast<int64_t *>(inputs[kIndex0]->device_ptr());
  const auto *bound_data = static_cast<int64_t *>(inputs[kIndex2]->device_ptr());

  const bool has_predecessor = (n != 0);
  // The first row has nothing to be compared with, so it counts as distinct from the start.
  bool strictly_after = !has_predecessor;

  for (int64_t axis = 0; axis < dims_; ++axis) {
    const int64_t current = index_data[(n * dims_) + axis];
    if (current < 0 || current >= bound_data[axis]) {
      MS_EXCEPTION(ValueError) << "For '" << kernel_name_ << "', indices is out of bounds, index=" << n << ".";
      return false;
    }
    if (!has_predecessor) {
      continue;
    }
    const int64_t delta = current - index_data[((n - 1) * dims_) + axis];
    if (delta > 0) {
      // A larger leading component settles the ordering; later components may be anything within bounds.
      strictly_after = true;
    } else if (delta < 0 && !strictly_after) {
      MS_EXCEPTION(ValueError) << "For '" << kernel_name_ << "', indices is out of order, index=" << n << ".";
      return false;
    }
  }

  if (!strictly_after) {
    MS_EXCEPTION(ValueError) << "For '" << kernel_name_ << "', indices is repeated, index=" << n << ".";
    return false;
  }
  return true;
}

/**
 * Counts the distinct values of every group of a sparse set.
 *
 * inputs[0] is read as int64 indices stored row by row with dims_ components per value, inputs[1] as values_size_
 * values of type T and inputs[2] as the int64 shape. All components of an index row except the last one select
 * the group (flattened row-major over the leading dims_ - 1 shape entries); outputs[0] receives one int32 count
 * of distinct values per group. Groups without any value keep the count 0.
 *
 * When validate_indices_ is set, every index row is first checked with IndicesValid. Independently of that flag,
 * the group-selecting components are range-checked before they are used, so malformed indices can never address
 * memory outside the per-group table or the output buffer.
 *
 * @tparam T Element type of the set values.
 * @param inputs Kernel inputs: indices, values, shape.
 * @param outputs Kernel outputs: per-group set sizes.
 * @return true on success (also when the output is empty); false if IndicesValid reports a failure.
 * @note Raises through MS_LOG(EXCEPTION) when dims_ is smaller than 1, when the shape data is negative or
 *       describes more groups than the output buffer can hold, or when an index component is out of range.
 */
template <typename T>
bool SetSizeCpuKernelMod::LaunchKernel(const std::vector<kernel::KernelTensor *> &inputs,
                                       const std::vector<kernel::KernelTensor *> &,
                                       const std::vector<kernel::KernelTensor *> &outputs) {
  const auto output_bytes = outputs[0]->size();
  if (output_bytes == 0) {
    MS_LOG(WARNING) << "For '" << kernel_name_ << "', output memory size should be greater than 0, but got 0.";
    return true;
  }
  // Groups that never receive a value must report size 0, so clear the whole output up front.
  auto ret = memset_s(outputs[0]->device_ptr(), output_bytes, 0, output_bytes);
  if (ret != EOK) {
    MS_LOG(EXCEPTION) << "For '" << kernel_name_ << "', memset output failed. Error no: " << ret << ".";
  }

  // A set needs at least one dimension; without this guard `rank - 1` below would wrap around.
  const int64_t rank = static_cast<int64_t>(dims_);
  if (rank < 1) {
    MS_LOG(EXCEPTION) << "For '" << kernel_name_ << "', the rank of the set should be at least 1, but got " << rank
                      << ".";
  }

  for (size_t i = 0; validate_indices_ && i < values_size_; ++i) {
    if (!IndicesValid(SizeToLong(i), inputs)) {
      return false;
    }
  }

  auto *output_t = static_cast<int32_t *>(outputs[0]->device_ptr());
  const auto *indices_t = static_cast<int64_t *>(inputs[0]->device_ptr());
  const auto *vals_t = static_cast<T *>(inputs[1]->device_ptr());
  const auto *shape_t = static_cast<int64_t *>(inputs[2]->device_ptr());

  // Row-major strides over the leading (rank - 1) dimensions and the total number of groups, built in one
  // backwards pass: strides[d] is the product of all group extents to the right of d.
  const size_t group_rank = static_cast<size_t>(rank - 1);
  std::vector<int64_t> strides(group_rank, 1);
  size_t group_count = 1;
  for (size_t d = group_rank; d-- > 0;) {
    const int64_t extent = shape_t[d];
    if (extent < 0) {
      MS_LOG(EXCEPTION) << "For '" << kernel_name_ << "', shape should not be negative, but got " << extent
                        << " at dimension " << d << ".";
    }
    strides[d] = static_cast<int64_t>(group_count);
    const size_t widened = group_count * static_cast<size_t>(extent);
    // Unsigned multiplication wraps on overflow; dividing back detects it.
    if (extent != 0 && widened / static_cast<size_t>(extent) != group_count) {
      MS_LOG(EXCEPTION) << "For '" << kernel_name_ << "', the number of groups described by shape overflows.";
    }
    group_count = widened;
  }
  // The group count comes from runtime shape data, the buffer size from the allocated output: never write past it.
  if (group_count > output_bytes / sizeof(int32_t)) {
    MS_LOG(EXCEPTION) << "For '" << kernel_name_ << "', shape describes " << group_count
                      << " groups, but the output only has room for " << (output_bytes / sizeof(int32_t)) << ".";
  }

  std::vector<std::unordered_set<T>> all_values(group_count);
  for (size_t n = 0; n < values_size_; ++n) {
    const int64_t *row = indices_t + SizeToLong(n) * rank;
    int64_t ix = 0;
    for (size_t d = 0; d < group_rank; ++d) {
      const int64_t ix_n_d = row[d];
      // Needed even when validation is disabled: an out-of-range component would index outside all_values.
      if (ix_n_d < 0 || ix_n_d >= shape_t[d]) {
        MS_LOG(EXCEPTION) << "For '" << kernel_name_ << "', indices is out of bounds of shape, index=" << n
                          << ", dimension=" << d << ".";
      }
      ix += strides[d] * ix_n_d;
    }
    all_values[static_cast<size_t>(ix)].insert(vals_t[n]);
  }
  for (size_t i = 0; i < group_count; ++i) {
    output_t[i] = static_cast<int32_t>(all_values[i].size());
  }
  return true;
}

/**
 * Returns the table that pairs each supported kernel signature with its typed launch function.
 *
 * Every entry uses int64 for the first and third input and int32 for the output; only the type of the second
 * input varies (int8, int16, int32, int64, uint8, uint16) and selects the LaunchKernel instantiation.
 */
const std::vector<std::pair<KernelAttr, SetSizeCpuKernelMod::KernelRunFunc>> &SetSizeCpuKernelMod::GetFuncList() const {
  using FuncEntry = std::pair<KernelAttr, SetSizeCpuKernelMod::KernelRunFunc>;
  // Builds the signature shared by all entries; only the type of the second input differs.
  const auto signature_for = [](auto values_type) {
    return KernelAttr()
      .AddInputAttr(kNumberTypeInt64)
      .AddInputAttr(values_type)
      .AddInputAttr(kNumberTypeInt64)
      .AddOutputAttr(kNumberTypeInt32);
  };
  static const std::vector<FuncEntry> func_list = {
    {signature_for(kNumberTypeInt8), &SetSizeCpuKernelMod::LaunchKernel<int8_t>},
    {signature_for(kNumberTypeInt16), &SetSizeCpuKernelMod::LaunchKernel<int16_t>},
    {signature_for(kNumberTypeInt32), &SetSizeCpuKernelMod::LaunchKernel<int32_t>},
    {signature_for(kNumberTypeInt64), &SetSizeCpuKernelMod::LaunchKernel<int64_t>},
    {signature_for(kNumberTypeUInt8), &SetSizeCpuKernelMod::LaunchKernel<uint8_t>},
    {signature_for(kNumberTypeUInt16), &SetSizeCpuKernelMod::LaunchKernel<uint16_t>},
  };
  return func_list;
}

// Factory registration of SetSizeCpuKernelMod under the name SetSize for NativeCpuKernelMod.
// NOTE(review): presumably this is what makes the kernel selectable for the SetSize op on CPU; the macro is
// defined elsewhere, confirm against its definition.
MS_KERNEL_FACTORY_REG(NativeCpuKernelMod, SetSize, SetSizeCpuKernelMod);
}  // namespace kernel
}  // namespace mindspore