OpenHarmony-v3.2-Release/s

/**
 * Copyright 2021 Huawei Technologies Co., Ltd
 *
 * Licensed under the Apache License, Version 2.0 (the "License");
 * you may not use this file except in compliance with the License.
 * You may obtain a copy of the License at
 *
 * http://www.apache.org/licenses/LICENSE-2.0
 *
 * Unless required by applicable law or agreed to in writing, software
 * distributed under the License is distributed on an "AS IS" BASIS,
 * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
 * See the License for the specific language governing permissions and
 * limitations under the License.
 */

#include "coder/generator/component/const_blocks/benchmark.h"

namespace mindspore::lite::micro {
const char benchmark_source[] = R"RAW(
/**
 * Copyright 2021 Huawei Technologies Co., Ltd
 *
 * Licensed under the Apache License, Version 2.0 (the "License");
 * you may not use this file except in compliance with the License.
 * You may obtain a copy of the License at
 *
 * http://www.apache.org/licenses/LICENSE-2.0
 *
 * Unless required by applicable law or agreed to in writing, software
 * distributed under the License is distributed on an "AS IS" BASIS,
 * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
 * See the License for the specific language governing permissions and
 * limitations under the License.
 */

#include <iostream>
#include <string>
#include <cstring>

#include "include/lite_session.h"
#include "include/ms_tensor.h"
#include "include/errorcode.h"

#include "load_input.h"
#include "calib_output.h"

using namespace mindspore;

void usage() {
  printf(
    "-- mindspore benchmark params usage:\n"
    "args[0]: executable file\n"
    "args[1]: inputs binary file\n"
    "args[2]: model weight binary file\n"
    "args[3]: loop count for performance test\n"
    "args[4]: calibration file\n"
    "args[5]: runtime thread num\n"
    "args[6]: runtime thread bind mode\n\n");
}

uint64_t GetTimeUs() {
  const int USEC = 1000000;
  const int MSEC = 1000;
  struct timespec ts = {0, 0};
  if (clock_gettime(CLOCK_MONOTONIC, &ts) != 0) {
    return 0;
  }
  uint64_t retval = (uint64_t)((ts.tv_sec * USEC) + (ts.tv_nsec / MSEC));
  return retval;
}

template <typename T>
void PrintData(void *data, size_t data_number) {
  if (data == nullptr) {
    return;
  }
  auto casted_data = static_cast<T *>(data);
  for (size_t i = 0; i < 10 && i < data_number; i++) {
    printf("%s, ", std::to_string(casted_data[i]).c_str());
  }
  printf("\n");
}

void TensorToString(tensor::MSTensor *tensor) {
  printf("name: %s, ", tensor->tensor_name().c_str());
  printf("DataType: %d, ", tensor->data_type());
  printf("Elements: %d, ", tensor->ElementsNum());
  printf("Shape: [");
  for (auto &dim : tensor->shape()) {
    printf("%d ", dim);
  }
  printf("], Data: \n");
  switch (tensor->data_type()) {
    case kNumberTypeFloat32: {
      PrintData<float>(tensor->MutableData(), tensor->ElementsNum());
    } break;
    case kNumberTypeFloat16: {
      PrintData<int16_t>(tensor->MutableData(), tensor->ElementsNum());
    } break;
    case kNumberTypeInt32: {
      PrintData<int32_t>(tensor->MutableData(), tensor->ElementsNum());
    } break;
    case kNumberTypeInt16: {
      PrintData<int16_t>(tensor->MutableData(), tensor->ElementsNum());
    } break;
    case kNumberTypeInt8: {
      PrintData<int8_t>(tensor->MutableData(), tensor->ElementsNum());
    } break;
    case kNumberTypeUInt8: {
      PrintData<uint8_t>(tensor->MutableData(), tensor->ElementsNum());
    } break;
    default:
      std::cout << "Unsupported data type to print" << std::endl;
      break;
  }
}

int main(int argc, const char **argv) {
  if (argc < 2) {
    printf("input command is invalid\n");
    usage();
    return lite::RET_ERROR;
  }
  printf("=======run benchmark======\n");

  const char *model_buffer = nullptr;
  int model_size = 0;
  // read .bin file by ReadBinaryFile;
  if (argc >= 3) {
    model_buffer = static_cast<const char *>(ReadInputData(argv[2], &model_size));
  }

  lite::Context *context = nullptr;
  if (argc >= 7) {
    // config benchmark context
    context = new (std::nothrow) lite::Context();
    if (context == nullptr) {
      return lite::RET_ERROR;
    }
    context->thread_num_ = atoi(argv[5]);
    if (context->thread_num_ < 1) {
      printf("Thread number error! It should be greater than 0\n");
      return lite::RET_ERROR;
    }
    context->device_list_.resize(1);
    context->device_list_[0].device_type_ = lite::DT_CPU;
    context->device_list_[0].device_info_.cpu_device_info_.enable_float16_ = false;
    lite::CpuBindMode bind_mode = static_cast<lite::CpuBindMode>(atoi(argv[6]));
    if (bind_mode < lite::NO_BIND || bind_mode > lite::MID_CPU) {
      printf("Thread bind mode error! 0: No bind, 1: Bind hign cpu, 2: Bind mid cpu.\n");
      return lite::RET_ERROR;
    }
    context->device_list_[0].device_info_.cpu_device_info_.cpu_bind_mode_ = bind_mode;
    printf("context: ThreadNum: %d, BindMode: %d\n", context->thread_num_,
           context->device_list_[0].device_info_.cpu_device_info_.cpu_bind_mode_);
  }

  session::LiteSession *session = mindspore::session::LiteSession::CreateSession(model_buffer, model_size, context);
  if (session == nullptr) {
    printf("create lite session failed\n");
    return lite::RET_ERROR;
  }
  delete[] model_buffer;

  // set model inputs tensor data
  Vector<tensor::MSTensor *> inputs = session->GetInputs();
  size_t inputs_num = inputs.size();
  void *inputs_binbuf[inputs_num];
  int inputs_size[inputs_num];
  for (size_t i = 0; i < inputs_num; ++i) {
    inputs_size[i] = inputs[i]->Size();
  }
  int ret = ReadInputsFile(const_cast<char *>(argv[1]), inputs_binbuf, inputs_size, inputs_num);
  if (ret != lite::RET_OK) {
    delete session;
    return lite::RET_ERROR;
  }
  for (size_t i = 0; i < inputs_num; ++i) {
    void *input_data = inputs[i]->MutableData();
    memcpy(input_data, inputs_binbuf[i], inputs_size[i]);
  }

  if (argc >= 4) {
    int loop_count = atoi(argv[3]);
    printf("\nloop count: %d\n", loop_count);
    uint64_t start_time = GetTimeUs();
    for (int i = 0; i < loop_count; ++i) {
      ret = session->RunGraph();
      if (ret != lite::RET_OK) {
        delete session;
        return lite::RET_ERROR;
      }
    }
    uint64_t end_time = GetTimeUs();
    float total_time = (float)(end_time - start_time) / 1000.0f;
    printf("total time: %.5fms, per time: %.5fms\n", total_time, total_time / loop_count);
  }
  ret = session->RunGraph();
  if (ret != lite::RET_OK) {
    delete session;
    return lite::RET_ERROR;
  }

  printf("\noutputs: \n");
  Vector<String> outputs_name = session->GetOutputTensorNames();
  Vector<tensor::MSTensor *> outputs;
  for (const auto &name : outputs_name) {
    auto output = session->GetOutputByTensorName(name);
    outputs.push_back(output);
    TensorToString(output);
  }
  if (argc >= 5) {
    lite::Calibrator *calibrator = new (std::nothrow) lite::Calibrator();
    if (calibrator == nullptr) {
      delete session;
      return lite::RET_NULL_PTR;
    }
    ret = calibrator->ReadCalibData(argv[4]);
    if (ret != lite::RET_OK) {
      delete session;
      delete calibrator;
      return lite::RET_ERROR;
    }
    ret = calibrator->CompareOutputs(outputs);
    if (ret != lite::RET_OK) {
      delete session;
      delete calibrator;
      return lite::RET_ERROR;
    }
    delete calibrator;
  }
  printf("========run success=======\n");
  delete session;
  session = nullptr;
  if (context != nullptr) {
    delete context;
    context = nullptr;
  }
  for (size_t i = 0; i < inputs_num; ++i) {
    free(inputs_binbuf[i]);
    inputs_binbuf[i] = nullptr;
  }
  return lite::RET_OK;
}

)RAW";
}  // namespace mindspore::lite::micro