1From 6576d2861ab7e95c7e7b6a284ebc5f3159f4398d Mon Sep 17 00:00:00 2001 2From: z00574805 <z00574805@notesmail.huawei.com/> 3Date: Wed, 24 May 2023 11:04:47 +0800 4Subject: [PATCH 2/5] xiaoyi-0002 5 6--- 7 mindspore/lite/tools/converter/converter.cc | 2 +- 8 .../converter/micro/cmake/file_list.cmake | 13 + 9 .../micro/coder/allocator/allocator.cc | 19 +- 10 .../micro/coder/allocator/allocator.h | 9 +- 11 .../lite/tools/converter/micro/coder/coder.cc | 8 +- 12 .../lite/tools/converter/micro/coder/coder.h | 4 +- 13 .../lite/tools/converter/micro/coder/graph.cc | 30 +- 14 .../lite/tools/converter/micro/coder/graph.h | 2 +- 15 .../nnacl/fp16/activation_fp16_coder.cc | 84 +++++ 16 .../nnacl/fp16/activation_fp16_coder.h | 37 +++ 17 .../nnacl/fp16/arithmetic_fp16_coder.cc | 175 +++++++++++ 18 .../nnacl/fp16/arithmetic_fp16_coder.h | 47 +++ 19 .../nnacl/fp16/avg_pooling_fp16_coder.cc | 87 ++++++ 20 .../nnacl/fp16/avg_pooling_fp16_coder.h | 36 +++ 21 .../opcoders/nnacl/fp16/concat_fp16_coder.cc | 88 ++++++ 22 .../opcoders/nnacl/fp16/concat_fp16_coder.h | 42 +++ 23 .../nnacl/fp16/layernorm_fp16_coder.cc | 56 ++++ 24 .../nnacl/fp16/layernorm_fp16_coder.h | 37 +++ 25 .../nnacl/fp16/matmul_fp16_base_coder.cc | 286 ++++++++++++++++++ 26 .../nnacl/fp16/matmul_fp16_base_coder.h | 58 ++++ 27 .../opcoders/nnacl/fp16/matmul_fp16_coder.cc | 79 +++++ 28 .../opcoders/nnacl/fp16/matmul_fp16_coder.h | 44 +++ 29 .../opcoders/nnacl/fp16/reduce_fp16_coder.cc | 75 +++++ 30 .../opcoders/nnacl/fp16/reduce_fp16_coder.h | 40 +++ 31 .../opcoders/nnacl/fp16/resize_fp16_coder.cc | 108 +++++++ 32 .../opcoders/nnacl/fp16/resize_fp16_coder.h | 41 +++ 33 .../nnacl/fp16/transpose_fp16_coder.cc | 140 +++++++++ 34 .../nnacl/fp16/transpose_fp16_coder.h | 43 +++ 35 .../nnacl/fp32/activation_fp32_coder.cc | 8 +- 36 .../nnacl/fp32/activation_fp32_coder.h | 2 +- 37 .../nnacl/fp32/arithmetic_fp32_coder.cc | 38 ++- 38 .../nnacl/fp32/arithmetic_fp32_coder.h | 34 ++- 39 .../opcoders/nnacl/fp32/concat_fp32_coder.h | 
2 +- 40 .../opcoders/nnacl/fp32/exp_fp32_coder.cc | 2 +- 41 .../opcoders/nnacl/fp32/gather_fp32_coder.cc | 2 + 42 .../nnacl/fp32/layernorm_fp32_coder.cc | 81 +++++ 43 .../nnacl/fp32/layernorm_fp32_coder.h | 40 +++ 44 .../opcoders/nnacl/fp32/lstm_fp32_coder.cc | 18 +- 45 .../nnacl/fp32/matmul_fp32_base_coder.cc | 104 ++++--- 46 .../nnacl/fp32/matmul_fp32_base_coder.h | 29 +- 47 .../opcoders/nnacl/fp32/pooling_fp32_coder.h | 2 +- 48 .../opcoders/nnacl/fp32/reduce_fp32_coder.cc | 40 +-- 49 .../opcoders/nnacl/fp32/reduce_fp32_coder.h | 14 +- 50 .../opcoders/nnacl/fp32/resize_fp32_coder.cc | 31 +- 51 .../opcoders/nnacl/fp32/resize_fp32_coder.h | 11 +- 52 .../opcoders/nnacl/fp32/scale_fp32_coder.cc | 38 +-- 53 .../opcoders/nnacl/fp32/scale_fp32_coder.h | 2 - 54 .../opcoders/nnacl/fp32/split_fp32_coder.cc | 77 +++++ 55 .../opcoders/nnacl/fp32/split_fp32_coder.h | 37 +++ 56 .../nnacl/fp32/transpose_fp32_coder.cc | 14 +- 57 .../nnacl/fp32/transpose_fp32_coder.h | 12 +- 58 .../nnacl_serializer/nnacl_fp32_serializer.cc | 19 ++ 59 .../nnacl_serializer/nnacl_fp32_serializer.h | 6 + 60 .../tools/converter/micro/coder/session.cc | 5 +- 61 .../tools/converter/micro/coder/session.h | 3 +- 62 55 files changed, 2140 insertions(+), 221 deletions(-) 63 create mode 100644 mindspore/lite/tools/converter/micro/coder/opcoders/nnacl/fp16/activation_fp16_coder.cc 64 create mode 100644 mindspore/lite/tools/converter/micro/coder/opcoders/nnacl/fp16/activation_fp16_coder.h 65 create mode 100644 mindspore/lite/tools/converter/micro/coder/opcoders/nnacl/fp16/arithmetic_fp16_coder.cc 66 create mode 100644 mindspore/lite/tools/converter/micro/coder/opcoders/nnacl/fp16/arithmetic_fp16_coder.h 67 create mode 100644 mindspore/lite/tools/converter/micro/coder/opcoders/nnacl/fp16/avg_pooling_fp16_coder.cc 68 create mode 100644 mindspore/lite/tools/converter/micro/coder/opcoders/nnacl/fp16/avg_pooling_fp16_coder.h 69 create mode 100644 
mindspore/lite/tools/converter/micro/coder/opcoders/nnacl/fp16/concat_fp16_coder.cc 70 create mode 100644 mindspore/lite/tools/converter/micro/coder/opcoders/nnacl/fp16/concat_fp16_coder.h 71 create mode 100644 mindspore/lite/tools/converter/micro/coder/opcoders/nnacl/fp16/layernorm_fp16_coder.cc 72 create mode 100644 mindspore/lite/tools/converter/micro/coder/opcoders/nnacl/fp16/layernorm_fp16_coder.h 73 create mode 100644 mindspore/lite/tools/converter/micro/coder/opcoders/nnacl/fp16/matmul_fp16_base_coder.cc 74 create mode 100644 mindspore/lite/tools/converter/micro/coder/opcoders/nnacl/fp16/matmul_fp16_base_coder.h 75 create mode 100644 mindspore/lite/tools/converter/micro/coder/opcoders/nnacl/fp16/matmul_fp16_coder.cc 76 create mode 100644 mindspore/lite/tools/converter/micro/coder/opcoders/nnacl/fp16/matmul_fp16_coder.h 77 create mode 100644 mindspore/lite/tools/converter/micro/coder/opcoders/nnacl/fp16/reduce_fp16_coder.cc 78 create mode 100644 mindspore/lite/tools/converter/micro/coder/opcoders/nnacl/fp16/reduce_fp16_coder.h 79 create mode 100644 mindspore/lite/tools/converter/micro/coder/opcoders/nnacl/fp16/resize_fp16_coder.cc 80 create mode 100644 mindspore/lite/tools/converter/micro/coder/opcoders/nnacl/fp16/resize_fp16_coder.h 81 create mode 100644 mindspore/lite/tools/converter/micro/coder/opcoders/nnacl/fp16/transpose_fp16_coder.cc 82 create mode 100644 mindspore/lite/tools/converter/micro/coder/opcoders/nnacl/fp16/transpose_fp16_coder.h 83 create mode 100644 mindspore/lite/tools/converter/micro/coder/opcoders/nnacl/fp32/layernorm_fp32_coder.cc 84 create mode 100644 mindspore/lite/tools/converter/micro/coder/opcoders/nnacl/fp32/layernorm_fp32_coder.h 85 create mode 100644 mindspore/lite/tools/converter/micro/coder/opcoders/nnacl/fp32/split_fp32_coder.cc 86 create mode 100644 mindspore/lite/tools/converter/micro/coder/opcoders/nnacl/fp32/split_fp32_coder.h 87 88diff --git a/mindspore/lite/tools/converter/converter.cc 
b/mindspore/lite/tools/converter/converter.cc 89index eaa18d6b..944ed29c 100644 90--- a/mindspore/lite/tools/converter/converter.cc 91+++ b/mindspore/lite/tools/converter/converter.cc 92@@ -799,7 +799,7 @@ int RunConverter(const std::shared_ptr<ConverterPara> ¶m, void **model_data, 93 if (param->microParam.enable_micro) { 94 status = micro::Coder::MicroSourceCodeGeneration(*meta_graph, param->output_file, param->microParam.codegen_mode, 95 param->microParam.target, param->microParam.support_parallel, 96- param->microParam.debug_mode); 97+ param->microParam.debug_mode, param->weight_fp16); 98 if (status != RET_OK) { 99 delete meta_graph; 100 CONVERTER_LOG_ERROR("MICRO CODEGEN FAILED:" << status << " " << GetErrorInfo(status)); 101diff --git a/mindspore/lite/tools/converter/micro/cmake/file_list.cmake b/mindspore/lite/tools/converter/micro/cmake/file_list.cmake 102index 843b523e..9ae54538 100644 103--- a/mindspore/lite/tools/converter/micro/cmake/file_list.cmake 104+++ b/mindspore/lite/tools/converter/micro/cmake/file_list.cmake 105@@ -66,6 +66,17 @@ set(CODER_OPCODERS_SRC 106 ${MICRO_DIR}/coder/opcoders/cmsis-nn/int8/pooling_int8_coder.cc 107 ${MICRO_DIR}/coder/opcoders/cmsis-nn/int8/reshape_int8_coder.cc 108 ${MICRO_DIR}/coder/opcoders/cmsis-nn/int8/softmax_int8_coder.cc 109+ #### nnacl fp16 coder 110+ ${MICRO_DIR}/coder/opcoders/nnacl/fp16/activation_fp16_coder.cc 111+ ${MICRO_DIR}/coder/opcoders/nnacl/fp16/arithmetic_fp16_coder.cc 112+ ${MICRO_DIR}/coder/opcoders/nnacl/fp16/avg_pooling_fp16_coder.cc 113+ ${MICRO_DIR}/coder/opcoders/nnacl/fp16/concat_fp16_coder.cc 114+ ${MICRO_DIR}/coder/opcoders/nnacl/fp16/transpose_fp16_coder.cc 115+ ${MICRO_DIR}/coder/opcoders/nnacl/fp16/matmul_fp16_coder.cc 116+ ${MICRO_DIR}/coder/opcoders/nnacl/fp16/matmul_fp16_base_coder.cc 117+ ${MICRO_DIR}/coder/opcoders/nnacl/fp16/layernorm_fp16_coder.cc 118+ ${MICRO_DIR}/coder/opcoders/nnacl/fp16/reduce_fp16_coder.cc 119+ ${MICRO_DIR}/coder/opcoders/nnacl/fp16/resize_fp16_coder.cc 120 
#### nnacl fp32 coder 121 ${MICRO_DIR}/coder/opcoders/nnacl/fp32/activation_fp32_coder.cc 122 ${MICRO_DIR}/coder/opcoders/nnacl/fp32/addn_fp32_coder.cc 123@@ -99,6 +110,8 @@ set(CODER_OPCODERS_SRC 124 ${MICRO_DIR}/coder/opcoders/nnacl/fp32/exp_fp32_coder.cc 125 ${MICRO_DIR}/coder/opcoders/nnacl/fp32/deconv2d_fp32_coder.cc 126 ${MICRO_DIR}/coder/opcoders/nnacl/fp32/prelu_fp32_coder.cc 127+ ${MICRO_DIR}/coder/opcoders/nnacl/fp32/layernorm_fp32_coder.cc 128+ ${MICRO_DIR}/coder/opcoders/nnacl/fp32/split_fp32_coder.cc 129 #### nnacl int8 coder 130 ${MICRO_DIR}/coder/opcoders/nnacl/int8/activation_int8_coder.cc 131 ${MICRO_DIR}/coder/opcoders/nnacl/int8/affine_int8_coder.cc 132diff --git a/mindspore/lite/tools/converter/micro/coder/allocator/allocator.cc b/mindspore/lite/tools/converter/micro/coder/allocator/allocator.cc 133index 99ef06de..9c5839b4 100644 134--- a/mindspore/lite/tools/converter/micro/coder/allocator/allocator.cc 135+++ b/mindspore/lite/tools/converter/micro/coder/allocator/allocator.cc 136@@ -22,11 +22,13 @@ 137 138 namespace mindspore::lite::micro { 139 namespace { 140-const std::map<TypeId, size_t> size_map = {{kNumberTypeFloat, sizeof(float)}, {kNumberTypeFloat32, sizeof(float)}, 141- {kNumberTypeInt32, sizeof(int32_t)}, {kNumberTypeInt16, sizeof(int16_t)}, 142- {kNumberTypeInt8, sizeof(int8_t)}, {kNumberTypeUInt8, sizeof(uint8_t)}}; 143+const std::map<TypeId, size_t> size_map = {{kNumberTypeFloat, sizeof(float)}, {kNumberTypeFloat32, sizeof(float)}, 144+ {kNumberTypeInt32, sizeof(int32_t)}, {kNumberTypeInt16, sizeof(int16_t)}, 145+ {kNumberTypeFloat16, sizeof(uint16_t)}, {kNumberTypeInt8, sizeof(int8_t)}, 146+ {kNumberTypeUInt8, sizeof(uint8_t)}}; 147 } 148-void *MemoryAllocator::MallocWeightTensor(TypeId type_id, size_t size, MallocType type) { 149+void *MemoryAllocator::MallocWeightTensor(TypeId type_id, size_t size, MallocType type, 150+ const std::string &tensor_name) { 151 auto item = size_map.find(type_id); 152 MS_CHECK_TRUE_RET_NULL(item != 
size_map.end(), "unsupported type idnex"); 153 154@@ -36,6 +38,7 @@ void *MemoryAllocator::MallocWeightTensor(TypeId type_id, size_t size, MallocTyp 155 auto cate = type == kOfflinePackWeight ? lite::Category::CONST_TENSOR : lite::Category::VAR; 156 Tensor *weight = new (std::nothrow) lite::Tensor(type_id, shape, mindspore::NHWC, cate); 157 MS_CHECK_PTR_RET_NULL(weight); 158+ weight->set_tensor_name(tensor_name); 159 std::string runtime_addr = kWeightPrefixName + std::to_string(weight_index_++); 160 malloc_weights_addr_.insert(std::make_pair(weight, runtime_addr)); 161 if (type == kOfflinePackWeight) { 162@@ -152,4 +155,12 @@ int MemoryAllocator::Assign(const std::vector<Tensor *> &inputs, 163 RecordOriginWeightsAddr(nodes); 164 return AssignTensors(nodes); 165 } 166+ 167+void MemoryAllocator::MarkSharedWeight(const Tensor *src, void *pack_weight) { 168+ shared_pack_weights_[src] = pack_weight; 169+} 170+ 171+void *MemoryAllocator::GetSharedWeightAddr(const Tensor *src) { 172+ return shared_pack_weights_.find(src) == shared_pack_weights_.end() ? 
nullptr : shared_pack_weights_[src]; 173+} 174 } // namespace mindspore::lite::micro 175diff --git a/mindspore/lite/tools/converter/micro/coder/allocator/allocator.h b/mindspore/lite/tools/converter/micro/coder/allocator/allocator.h 176index f8decca1..8a1331fb 100644 177--- a/mindspore/lite/tools/converter/micro/coder/allocator/allocator.h 178+++ b/mindspore/lite/tools/converter/micro/coder/allocator/allocator.h 179@@ -65,9 +65,9 @@ class MemoryAllocator { 180 * in view of weight, bias and workspace 181 */ 182 183- void *Malloc(TypeId type_id, size_t size, MallocType type) { 184+ void *Malloc(TypeId type_id, size_t size, MallocType type, const std::string &tensor_name = "") { 185 if (type != kWorkspace) { 186- return MallocWeightTensor(type_id, size, type); 187+ return MallocWeightTensor(type_id, size, type, tensor_name); 188 } 189 if (size == 0 || size >= UINT_MAX) { 190 return nullptr; 191@@ -138,7 +138,9 @@ class MemoryAllocator { 192 std::map<std::string, Tensor *> saved_weights() const { return saved_weights_addr_; } 193 size_t total_buffer_size() const { return tensors_size_ + workspace_size_; } 194 void enable_is_next() { is_next_ = true; } 195- void *MallocWeightTensor(TypeId type_id, size_t size, MallocType type); 196+ void *MallocWeightTensor(TypeId type_id, size_t size, MallocType type, const std::string &tensor_name = ""); 197+ void MarkSharedWeight(const Tensor *src, void *pack_weight); 198+ void *GetSharedWeightAddr(const Tensor *src); 199 200 private: 201 int AssignTensors(const std::vector<std::unique_ptr<OperatorCoder>> &nodes); 202@@ -162,6 +164,7 @@ class MemoryAllocator { 203 std::map<Tensor *, std::string> origin_weights_addr_; 204 std::map<Tensor *, std::string> malloc_weights_addr_; 205 std::map<Tensor *, std::string> tensors_addr_; 206+ std::map<const Tensor *, void *> shared_pack_weights_; 207 }; 208 } // namespace mindspore::lite::micro 209 #endif // MINDSPORE_LITE_TOOLS_CONVERTER_MICRO_CODER_ALLOCATOR_ALLOCATOR_H_ 210diff --git 
a/mindspore/lite/tools/converter/micro/coder/coder.cc b/mindspore/lite/tools/converter/micro/coder/coder.cc 211index 9711d4b9..cca4687e 100644 212--- a/mindspore/lite/tools/converter/micro/coder/coder.cc 213+++ b/mindspore/lite/tools/converter/micro/coder/coder.cc 214@@ -29,13 +29,13 @@ 215 #include "tools/converter/micro/coder/generator/component/component.h" 216 217 namespace mindspore::lite::micro { 218-int Coder::Run(const void *model_buff, size_t size) { 219+int Coder::Run(const void *model_buff, size_t size, bool enableFp16) { 220 session_ = CreateCoderSession(); 221 if (session_ == nullptr) { 222 MS_LOG(ERROR) << "new session failed while running!"; 223 return RET_ERROR; 224 } 225- STATUS status = session_->Init(model_buff, size); 226+ STATUS status = session_->Init(model_buff, size, enableFp16); 227 if (status != RET_OK) { 228 MS_LOG(ERROR) << "Init session failed!"; 229 return RET_ERROR; 230@@ -94,7 +94,7 @@ bool Coder::InitPath(const std::string &output_path) { 231 232 int Coder::MicroSourceCodeGeneration(const schema::MetaGraphT &graph, const std::string &output_path, 233 const std::string &codegen_mode, const std::string &device, bool support_parallel, 234- bool debug_mode) { 235+ bool debug_mode, bool enableFp16) { 236 flatbuffers::FlatBufferBuilder builder(kFlatbuffersBuilderInitSize); 237 auto offset = schema::MetaGraph::Pack(builder, &graph); 238 builder.Finish(offset); 239@@ -111,7 +111,7 @@ int Coder::MicroSourceCodeGeneration(const schema::MetaGraphT &graph, const std: 240 MS_LOG(ERROR) << "Codegen init Error"; 241 return RET_ERROR; 242 } 243- status = code_gen.Run(builder.GetBufferPointer(), size); 244+ status = code_gen.Run(builder.GetBufferPointer(), size, enableFp16); 245 if (status != RET_OK) { 246 MS_LOG(ERROR) << "Codegen Run Error"; 247 return RET_ERROR; 248diff --git a/mindspore/lite/tools/converter/micro/coder/coder.h b/mindspore/lite/tools/converter/micro/coder/coder.h 249index 42ba153f..96531e6f 100644 250--- 
a/mindspore/lite/tools/converter/micro/coder/coder.h 251+++ b/mindspore/lite/tools/converter/micro/coder/coder.h 252@@ -32,11 +32,11 @@ class Coder final { 253 ~Coder() = default; 254 static int MicroSourceCodeGeneration(const schema::MetaGraphT &graph, const std::string &output_path, 255 const std::string &codegen_mode, const std::string &device, 256- bool support_parallel, bool debug_mode); 257+ bool support_parallel, bool debug_mode, bool enableFp16); 258 259 private: 260 int Init(const std::string code_mode, const std::string target, bool support_parallel, bool debug_mode_) const; 261- int Run(const void *model_buff, size_t size); 262+ int Run(const void *model_buff, size_t size, bool enableFp16); 263 bool InitPath(const std::string &output_path); 264 std::shared_ptr<CoderSession> session_{nullptr}; 265 266diff --git a/mindspore/lite/tools/converter/micro/coder/graph.cc b/mindspore/lite/tools/converter/micro/coder/graph.cc 267index b9fa5f2f..ee45d042 100644 268--- a/mindspore/lite/tools/converter/micro/coder/graph.cc 269+++ b/mindspore/lite/tools/converter/micro/coder/graph.cc 270@@ -28,6 +28,7 @@ 271 #include "securec/include/securec.h" 272 #include "src/common/prim_util.h" 273 #include "src/runtime/lite_model.h" 274+#include "base/float16.h" 275 276 namespace mindspore::lite::micro { 277 CoderGraph::~CoderGraph() { 278@@ -41,7 +42,7 @@ CoderGraph::~CoderGraph() { 279 } 280 } 281 282-int CoderGraph::ConvertTensors() { 283+int CoderGraph::ConvertTensors(bool enableFp16) { 284 if (model_ == nullptr) { 285 MS_LOG(ERROR) << "Graph model is nullptr"; 286 return RET_ERROR; 287@@ -86,14 +87,27 @@ int CoderGraph::ConvertTensors() { 288 if (origin_tensor->nodeType() == NodeType_ValueNode && origin_tensor->data() != nullptr && 289 origin_tensor->data()->size() > 0) { 290 // copy data, this is weight && bias 291- MS_CHECK_TRUE_WITH_EXE(origin_tensor->data()->size() > 0, "invalid meta_tensor data size.", delete dstTensor); 292- auto data_size = 
static_cast<size_t>(origin_tensor->data()->size()); 293- MS_CHECK_RET_CODE_WITH_EXE(dstTensor->MallocData(), "dst tensor malloc data failed!", delete dstTensor); 294- void *dst_data = dstTensor->data(); 295- MS_CHECK_RET_CODE_WITH_EXE(memcpy_s(dst_data, dstTensor->Size(), origin_tensor->data()->data(), data_size), 296- "memcpy_s copy data failed!", delete dstTensor); 297- dstTensor->set_data(dst_data); 298+ if (enableFp16 && origin_data_type == kNumberTypeFloat32) { 299+ dstTensor->set_data_type(kNumberTypeFloat16); 300+ auto data = dstTensor->MutableData(); 301+ MS_CHECK_TRUE_WITH_EXE(data != nullptr, "dst tensor malloc data failed!", delete dstTensor); 302+ auto fp32_data = reinterpret_cast<const float *>(origin_tensor->data()->data()); 303+ auto fp16_data = reinterpret_cast<float16 *>(data); 304+ CHECK_NULL_RETURN(fp32_data); 305+ CHECK_NULL_RETURN(fp16_data); 306+ for (int64_t j = 0; j < dstTensor->ElementsNum(); ++j) { 307+ fp16_data[j] = float16(fp32_data[j]); 308+ } 309+ 310+ } else { 311+ MS_CHECK_RET_CODE_WITH_EXE(memcpy_s(dstTensor->MutableData(), dstTensor->Size(), origin_tensor->data()->data(), 312+ origin_tensor->data()->size()), 313+ "memcpy_s copy data failed!", delete dstTensor); 314+ } 315+ } else if (enableFp16 && origin_data_type == kNumberTypeFloat32) { 316+ dstTensor->set_data_type(kNumberTypeFloat16); 317 } 318+ 319 if (origin_tensor->name() != nullptr) { 320 dstTensor->set_tensor_name(origin_tensor->name()->str()); 321 } 322diff --git a/mindspore/lite/tools/converter/micro/coder/graph.h b/mindspore/lite/tools/converter/micro/coder/graph.h 323index 5fb22f15..35d3cb2b 100644 324--- a/mindspore/lite/tools/converter/micro/coder/graph.h 325+++ b/mindspore/lite/tools/converter/micro/coder/graph.h 326@@ -35,7 +35,7 @@ class CoderGraph { 327 explicit CoderGraph(Model *model) : model_(model) {} 328 ~CoderGraph(); 329 330- int ConvertTensors(); 331+ int ConvertTensors(bool enableFp16); 332 int InitGraphInOutTensors(); 333 334 void SetAllTensors(const 
std::vector<Tensor *> &all_tensors); 335diff --git a/mindspore/lite/tools/converter/micro/coder/opcoders/nnacl/fp16/activation_fp16_coder.cc b/mindspore/lite/tools/converter/micro/coder/opcoders/nnacl/fp16/activation_fp16_coder.cc 336new file mode 100644 337index 00000000..0fdf0a7f 338--- /dev/null 339+++ b/mindspore/lite/tools/converter/micro/coder/opcoders/nnacl/fp16/activation_fp16_coder.cc 340@@ -0,0 +1,84 @@ 341+/** 342+ * Copyright 2023 Huawei Technologies Co., Ltd 343+ * 344+ * Licensed under the Apache License, Version 2.0 (the "License"); 345+ * you may not use this file except in compliance with the License. 346+ * You may obtain a copy of the License at 347+ * 348+ * http://www.apache.org/licenses/LICENSE-2.0 349+ * 350+ * Unless required by applicable law or agreed to in writing, software 351+ * distributed under the License is distributed on an "AS IS" BASIS, 352+ * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. 353+ * See the License for the specific language governing permissions and 354+ * limitations under the License. 
355+ */ 356+#include "coder/opcoders/nnacl/fp16/activation_fp16_coder.h" 357+#include "coder/opcoders/serializers/nnacl_serializer/nnacl_fp32_serializer.h" 358+#include "coder/opcoders/file_collector.h" 359+ 360+using mindspore::schema::PrimitiveType_Activation; 361+ 362+namespace mindspore::lite::micro::nnacl { 363+int ActivationFP16Coder::Prepare(CoderContext *const context) { 364+ if (input_tensor_->data_type() != kNumberTypeFloat16) { 365+ MS_LOG(INFO) << "Input tensor data type is invalid"; 366+ return RET_INPUT_PARAM_INVALID; 367+ } 368+ return RET_OK; 369+} 370+ 371+int ActivationFP16Coder::DoCode(CoderContext *const context) { 372+ // attribute 373+ auto *activation_parameter = reinterpret_cast<ActivationParameter *>(parameter_); 374+ MS_CHECK_PTR(activation_parameter); 375+ int count = input_tensor_->ElementsNum(); 376+ Collect(context, 377+ { 378+ "nnacl/fp16/activation_fp16.h", 379+ }, 380+ { 381+ "activation_fp16.c", 382+ }); 383+ NNaclFp32Serializer code; 384+ 385+ switch (activation_parameter->type_) { 386+ case schema::ActivationType_RELU: 387+ code.CodeFunction("ReluFp16", input_tensor_, output_tensor_, count); 388+ break; 389+ case schema::ActivationType_RELU6: 390+ code.CodeFunction("Relu6Fp16", input_tensor_, output_tensor_, count); 391+ break; 392+ case schema::ActivationType_LEAKY_RELU: 393+ code.CodeFunction("LReluFp16", input_tensor_, output_tensor_, count, activation_parameter->alpha_); 394+ break; 395+ case schema::ActivationType_SIGMOID: 396+ code.CodeFunction("SigmoidFp16", input_tensor_, output_tensor_, count); 397+ break; 398+ case schema::ActivationType_TANH: 399+ code.CodeFunction("TanhFp16", input_tensor_, output_tensor_, count); 400+ break; 401+ case schema::ActivationType_HSWISH: 402+ code.CodeFunction("HSwishFp16", input_tensor_, output_tensor_, count); 403+ break; 404+ case schema::ActivationType_SWISH: 405+ code.CodeFunction("SwishFp16", input_tensor_, output_tensor_, count); 406+ break; 407+ case 
schema::ActivationType_HSIGMOID: 408+ code.CodeFunction("HSigmoidFp16", input_tensor_, output_tensor_, count); 409+ break; 410+ case schema::ActivationType_ELU: 411+ code.CodeFunction("EluFp16", input_tensor_, output_tensor_, count, activation_parameter->alpha_); 412+ break; 413+ default: 414+ MS_LOG(ERROR) << "Activation type error"; 415+ return RET_ERROR; 416+ } 417+ MS_LOG(DEBUG) << "ActivationFP16Code has been called"; 418+ context->AppendCode(code.str()); 419+ return lite::RET_OK; 420+} 421+ 422+REG_OPERATOR_CODER(kARM32, kNumberTypeFloat16, PrimitiveType_Activation, CPUOpCoderCreator<ActivationFP16Coder>) 423+REG_OPERATOR_CODER(kARM64, kNumberTypeFloat16, PrimitiveType_Activation, CPUOpCoderCreator<ActivationFP16Coder>) 424+} // namespace mindspore::lite::micro::nnacl 425diff --git a/mindspore/lite/tools/converter/micro/coder/opcoders/nnacl/fp16/activation_fp16_coder.h b/mindspore/lite/tools/converter/micro/coder/opcoders/nnacl/fp16/activation_fp16_coder.h 426new file mode 100644 427index 00000000..0390991f 428--- /dev/null 429+++ b/mindspore/lite/tools/converter/micro/coder/opcoders/nnacl/fp16/activation_fp16_coder.h 430@@ -0,0 +1,37 @@ 431+/** 432+ * Copyright 2023 Huawei Technologies Co., Ltd 433+ * 434+ * Licensed under the Apache License, Version 2.0 (the "License"); 435+ * you may not use this file except in compliance with the License. 436+ * You may obtain a copy of the License at 437+ * 438+ * http://www.apache.org/licenses/LICENSE-2.0 439+ * 440+ * Unless required by applicable law or agreed to in writing, software 441+ * distributed under the License is distributed on an "AS IS" BASIS, 442+ * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. 443+ * See the License for the specific language governing permissions and 444+ * limitations under the License. 
445+ */ 446+ 447+#ifndef MINDSPORE_LITE_TOOLS_CONVERTER_MICRO_CODER_OPCODERS_NNACL_FP16_ACTIVATION_FP16_CODER_H_ 448+#define MINDSPORE_LITE_TOOLS_CONVERTER_MICRO_CODER_OPCODERS_NNACL_FP16_ACTIVATION_FP16_CODER_H_ 449+ 450+#include <vector> 451+#include "coder/opcoders/nnacl/fp32/activation_fp32_coder.h" 452+ 453+namespace mindspore::lite::micro::nnacl { 454+class ActivationFP16Coder final : public ActivationFP32Coder { 455+ public: 456+ ActivationFP16Coder(const std::vector<Tensor *> &in_tensors, const std::vector<Tensor *> &out_tensors, 457+ const LiteGraph::Node *node, size_t node_index, Target target) 458+ : ActivationFP32Coder(in_tensors, out_tensors, node, node_index, target) {} 459+ 460+ ~ActivationFP16Coder() override = default; 461+ 462+ int Prepare(CoderContext *const context) override; 463+ 464+ int DoCode(CoderContext *const context) override; 465+}; 466+} // namespace mindspore::lite::micro::nnacl 467+#endif // MICRO_CODER_OPCODERS_FP16__CODER_H_ 468diff --git a/mindspore/lite/tools/converter/micro/coder/opcoders/nnacl/fp16/arithmetic_fp16_coder.cc b/mindspore/lite/tools/converter/micro/coder/opcoders/nnacl/fp16/arithmetic_fp16_coder.cc 469new file mode 100644 470index 00000000..a9cdde78 471--- /dev/null 472+++ b/mindspore/lite/tools/converter/micro/coder/opcoders/nnacl/fp16/arithmetic_fp16_coder.cc 473@@ -0,0 +1,175 @@ 474+/** 475+ * Copyright 2023 Huawei Technologies Co., Ltd 476+ * 477+ * Licensed under the Apache License, Version 2.0 (the "License"); 478+ * you may not use this file except in compliance with the License. 479+ * You may obtain a copy of the License at 480+ * 481+ * http://www.apache.org/licenses/LICENSE-2.0 482+ * 483+ * Unless required by applicable law or agreed to in writing, software 484+ * distributed under the License is distributed on an "AS IS" BASIS, 485+ * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. 
486+ * See the License for the specific language governing permissions and 487+ * limitations under the License. 488+ */ 489+#include "coder/opcoders/nnacl/fp16/arithmetic_fp16_coder.h" 490+#include "coder/opcoders/file_collector.h" 491+#include "coder/opcoders/parallel.h" 492+#include "coder/log.h" 493+#include "nnacl/broadcast_to_parameter.h" 494+ 495+namespace mindspore::lite::micro::nnacl { 496+void ArithmeticFP16Coder::InitFunTable() { 497+ fun_table_ = { 498+ {PrimitiveType_MulFusion, schema::ActivationType_RELU, "ElementMulReluFp16", "", "", "", ""}, 499+ {PrimitiveType_MulFusion, schema::ActivationType_RELU6, "ElementMulRelu6Fp16", "", "", "", ""}, 500+ {PrimitiveType_MulFusion, schema::ActivationType_NO_ACTIVATION, "ElementMulFp16", "", "", "", ""}, 501+ {PrimitiveType_AddFusion, schema::ActivationType_RELU, "ElementAddReluFp16", "", "", "", ""}, 502+ {PrimitiveType_AddFusion, schema::ActivationType_RELU6, "ElementAddRelu6Fp16", "", "", "", ""}, 503+ {PrimitiveType_AddFusion, schema::ActivationType_NO_ACTIVATION, "ElementAddFp16", "", "", "", ""}, 504+ {PrimitiveType_SubFusion, schema::ActivationType_RELU, "ElementSubReluFp16", "", "", "", ""}, 505+ {PrimitiveType_SubFusion, schema::ActivationType_RELU6, "ElementSubRelu6Fp16", "", "", "", ""}, 506+ {PrimitiveType_SubFusion, schema::ActivationType_NO_ACTIVATION, "ElementSubFp16", "", "", "", ""}, 507+ {PrimitiveType_DivFusion, schema::ActivationType_RELU, "ElementDivReluFp16", "", "", "", ""}, 508+ {PrimitiveType_DivFusion, schema::ActivationType_RELU6, "ElementDivRelu6Fp16", "", "", "", ""}, 509+ {PrimitiveType_DivFusion, schema::ActivationType_NO_ACTIVATION, "ElementDivFp16", "", "", "", ""}, 510+ {PrimitiveType_RealDiv, schema::ActivationType_RELU, "ElementDivReluFp16", "", "", "", ""}, 511+ {PrimitiveType_RealDiv, schema::ActivationType_RELU6, "ElementDivRelu6Fp16", "", "", "", ""}, 512+ {PrimitiveType_RealDiv, schema::ActivationType_NO_ACTIVATION, "ElementDivFp16", "", "", "", ""}, 513+ 
{PrimitiveType_LogicalAnd, schema::ActivationType_NO_ACTIVATION, "ElementLogicalAndFp16", "", "", "", ""}, 514+ {PrimitiveType_LogicalOr, schema::ActivationType_NO_ACTIVATION, "ElementLogicalOrFp16", "", "", "", ""}, 515+ {PrimitiveType_Maximum, schema::ActivationType_NO_ACTIVATION, "ElementMaximumFp16", "", "", "", ""}, 516+ {PrimitiveType_Minimum, schema::ActivationType_NO_ACTIVATION, "ElementMinimumFp16", "", "", "", ""}, 517+ {PrimitiveType_FloorMod, schema::ActivationType_NO_ACTIVATION, "ElementFloorModFp16", "", "", "", ""}, 518+ {PrimitiveType_FloorDiv, schema::ActivationType_NO_ACTIVATION, "ElementFloorDivFp16", "", "", "", ""}, 519+ {PrimitiveType_SquaredDifference, schema::ActivationType_NO_ACTIVATION, "ElementSquaredDifferenceFp16", "", "", "", 520+ ""}}; 521+} 522+ 523+int ArithmeticFP16Coder::Prepare(CoderContext *const context) { 524+ if (input_tensor_->data_type() != kNumberTypeFloat16 || 525+ input_tensors_.at(kWeightIndex)->data_type() != kNumberTypeFloat16 || 526+ output_tensor_->data_type() != kNumberTypeFloat16) { 527+ MS_LOG(ERROR) << "Tensor data type is invalid"; 528+ return lite::RET_INPUT_PARAM_INVALID; 529+ } 530+ return ArithmeticFP32Coder::Prepare(context); 531+} 532+ 533+int ArithmeticFP16Coder::ReSize(CoderContext *const context) { 534+ CalcMultiplesAndStrides(arithmetic_parameter_); 535+ return RET_OK; 536+} 537+ 538+int ArithmeticFP16Coder::ExecuteCode(const std::string &input0, const std::string &input1, const std::string &output, 539+ int size, CoderContext *const context, NNaclFp32Serializer *const code) { 540+ if (arithmetic_func_str_.empty()) { 541+ return RET_ERROR; 542+ } 543+ for (size_t i = 0; i < fun_table_.size(); i++) { 544+ if (fun_table_[i].primitive_type_ == arithmetic_parameter_->op_parameter_.type_ && 545+ fun_table_[i].activation_type_ == arithmetic_parameter_->activation_type_) { 546+ code->CodeFunction(fun_table_[i].func_, input0, input1, output, size); 547+ break; 548+ } 549+ } 550+ 
context->AppendCode(code->str()); 551+ return RET_OK; 552+} 553+ 554+int ArithmeticFP16Coder::DoCode(CoderContext *const context) { 555+ int element_num = output_tensor_->ElementsNum(); 556+ input0_ptr_str_ = allocator_->GetRuntimeAddr(input_tensor_, input_tensor_->IsConst()); 557+ input1_ptr_str_ = allocator_->GetRuntimeAddr(filter_tensor_, filter_tensor_->IsConst()); 558+ output_ptr_str_ = allocator_->GetRuntimeAddr(output_tensor_); 559+ NNaclFp32Serializer code; 560+ Collect(context, 561+ { 562+ "nnacl/fp16/arithmetic_fp16.h", 563+ "nnacl/base/broadcast_to.h", 564+ }, 565+ { 566+ "arithmetic_fp16.c", 567+ "arithmetic_base.c", 568+ "broadcast_to.c", 569+ }); 570+ 571+ // all elements eltwise calculation 572+ ChooseArithmeticFunc(false); 573+ auto in0_shape = input_tensor_->shape(); 574+ auto in1_shape = filter_tensor_->shape(); 575+ auto out_shape = output_tensor_->shape(); 576+ BroadcastShapeInfo broadcast_info; 577+ auto ret = memset_s(&broadcast_info, sizeof(BroadcastShapeInfo), 0, sizeof(BroadcastShapeInfo)); 578+ MS_CHECK_TRUE_MSG(ret == EOK, RET_ERROR, "memset failed."); 579+ ret = memcpy_s(broadcast_info.output_shape_, MAX_SHAPE_SIZE * sizeof(int), out_shape.data(), 580+ out_shape.size() * sizeof(int)); 581+ MS_CHECK_TRUE_MSG(ret == EOK, RET_ERROR, "memcpy output-info failed."); 582+ broadcast_info.output_shape_size_ = static_cast<int>(out_shape.size()); 583+ if (in0_shape != out_shape) { 584+ ret = memcpy_s(broadcast_info.input_shape_, MAX_SHAPE_SIZE * sizeof(int), in0_shape.data(), 585+ in0_shape.size() * sizeof(int)); 586+ MS_CHECK_TRUE_MSG(ret == EOK, RET_ERROR, "memcpy in0-info failed."); 587+ broadcast_info.input_shape_size_ = static_cast<int>(in0_shape.size()); 588+ code.CodeStruct("in0_broadcast_info", broadcast_info); 589+ code.CodeFunction("BroadcastToSize16", input0_ptr_str_, "&in0_broadcast_info", output_ptr_str_); 590+ input0_ptr_str_ = output_ptr_str_; 591+ } 592+ if (in1_shape != out_shape) { 593+ ret = memcpy_s(broadcast_info.input_shape_, 
MAX_SHAPE_SIZE * sizeof(int), in1_shape.data(), 594+ in1_shape.size() * sizeof(int)); 595+ MS_CHECK_TRUE_MSG(ret == EOK, RET_ERROR, "memcpy in1-info failed."); 596+ broadcast_info.input_shape_size_ = static_cast<int>(in1_shape.size()); 597+ code.CodeStruct("in1_broadcast_info", broadcast_info); 598+ auto temp = output_ptr_str_; 599+ if (input0_ptr_str_ == output_ptr_str_) { 600+ auto temp_data = allocator_->Malloc(kNumberTypeFloat16, output_tensor_->Size(), kWorkspace); 601+ MS_CHECK_TRUE_MSG(temp_data != nullptr, RET_NULL_PTR, "malloc running buffer failed."); 602+ temp = allocator_->GetRuntimeAddr(temp_data); 603+ } 604+ code.CodeFunction("BroadcastToSize16", input1_ptr_str_, "&in1_broadcast_info", temp); 605+ input1_ptr_str_ = temp; 606+ } 607+ return ExecuteCode(input0_ptr_str_, input1_ptr_str_, output_ptr_str_, element_num, context, &code); 608+} 609+ 610+REG_OPERATOR_CODER(kARM32, kNumberTypeFloat16, PrimitiveType_AddFusion, CPUOpCoderCreator<ArithmeticFP16Coder>) 611+REG_OPERATOR_CODER(kARM32, kNumberTypeFloat16, PrimitiveType_MulFusion, CPUOpCoderCreator<ArithmeticFP16Coder>) 612+REG_OPERATOR_CODER(kARM32, kNumberTypeFloat16, PrimitiveType_SubFusion, CPUOpCoderCreator<ArithmeticFP16Coder>) 613+REG_OPERATOR_CODER(kARM32, kNumberTypeFloat16, PrimitiveType_DivFusion, CPUOpCoderCreator<ArithmeticFP16Coder>) 614+REG_OPERATOR_CODER(kARM32, kNumberTypeFloat16, PrimitiveType_RealDiv, CPUOpCoderCreator<ArithmeticFP16Coder>) 615+REG_OPERATOR_CODER(kARM32, kNumberTypeFloat16, PrimitiveType_LogicalAnd, CPUOpCoderCreator<ArithmeticFP16Coder>) 616+REG_OPERATOR_CODER(kARM32, kNumberTypeFloat16, PrimitiveType_LogicalOr, CPUOpCoderCreator<ArithmeticFP16Coder>) 617+REG_OPERATOR_CODER(kARM32, kNumberTypeFloat16, PrimitiveType_Maximum, CPUOpCoderCreator<ArithmeticFP16Coder>) 618+REG_OPERATOR_CODER(kARM32, kNumberTypeFloat16, PrimitiveType_Minimum, CPUOpCoderCreator<ArithmeticFP16Coder>) 619+REG_OPERATOR_CODER(kARM32, kNumberTypeFloat16, PrimitiveType_FloorDiv, 
CPUOpCoderCreator<ArithmeticFP16Coder>) 620+REG_OPERATOR_CODER(kARM32, kNumberTypeFloat16, PrimitiveType_FloorMod, CPUOpCoderCreator<ArithmeticFP16Coder>) 621+REG_OPERATOR_CODER(kARM32, kNumberTypeFloat16, PrimitiveType_SquaredDifference, CPUOpCoderCreator<ArithmeticFP16Coder>) 622+REG_OPERATOR_CODER(kARM32, kNumberTypeFloat16, PrimitiveType_Equal, CPUOpCoderCreator<ArithmeticFP16Coder>) 623+REG_OPERATOR_CODER(kARM32, kNumberTypeFloat16, PrimitiveType_NotEqual, CPUOpCoderCreator<ArithmeticFP16Coder>) 624+REG_OPERATOR_CODER(kARM32, kNumberTypeFloat16, PrimitiveType_Less, CPUOpCoderCreator<ArithmeticFP16Coder>) 625+REG_OPERATOR_CODER(kARM32, kNumberTypeFloat16, PrimitiveType_LessEqual, CPUOpCoderCreator<ArithmeticFP16Coder>) 626+REG_OPERATOR_CODER(kARM32, kNumberTypeFloat16, PrimitiveType_Greater, CPUOpCoderCreator<ArithmeticFP16Coder>) 627+REG_OPERATOR_CODER(kARM32, kNumberTypeFloat16, PrimitiveType_GreaterEqual, CPUOpCoderCreator<ArithmeticFP16Coder>) 628+REG_OPERATOR_CODER(kARM32, kNumberTypeFloat16, PrimitiveType_Eltwise, CPUOpCoderCreator<ArithmeticFP16Coder>) 629+REG_OPERATOR_CODER(kARM64, kNumberTypeFloat16, PrimitiveType_AddFusion, CPUOpCoderCreator<ArithmeticFP16Coder>) 630+REG_OPERATOR_CODER(kARM64, kNumberTypeFloat16, PrimitiveType_MulFusion, CPUOpCoderCreator<ArithmeticFP16Coder>) 631+REG_OPERATOR_CODER(kARM64, kNumberTypeFloat16, PrimitiveType_SubFusion, CPUOpCoderCreator<ArithmeticFP16Coder>) 632+REG_OPERATOR_CODER(kARM64, kNumberTypeFloat16, PrimitiveType_DivFusion, CPUOpCoderCreator<ArithmeticFP16Coder>) 633+REG_OPERATOR_CODER(kARM64, kNumberTypeFloat16, PrimitiveType_RealDiv, CPUOpCoderCreator<ArithmeticFP16Coder>) 634+REG_OPERATOR_CODER(kARM64, kNumberTypeFloat16, PrimitiveType_LogicalAnd, CPUOpCoderCreator<ArithmeticFP16Coder>) 635+REG_OPERATOR_CODER(kARM64, kNumberTypeFloat16, PrimitiveType_LogicalOr, CPUOpCoderCreator<ArithmeticFP16Coder>) 636+REG_OPERATOR_CODER(kARM64, kNumberTypeFloat16, PrimitiveType_Maximum, 
CPUOpCoderCreator<ArithmeticFP16Coder>) 637+REG_OPERATOR_CODER(kARM64, kNumberTypeFloat16, PrimitiveType_Minimum, CPUOpCoderCreator<ArithmeticFP16Coder>) 638+REG_OPERATOR_CODER(kARM64, kNumberTypeFloat16, PrimitiveType_FloorDiv, CPUOpCoderCreator<ArithmeticFP16Coder>) 639+REG_OPERATOR_CODER(kARM64, kNumberTypeFloat16, PrimitiveType_FloorMod, CPUOpCoderCreator<ArithmeticFP16Coder>) 640+REG_OPERATOR_CODER(kARM64, kNumberTypeFloat16, PrimitiveType_SquaredDifference, CPUOpCoderCreator<ArithmeticFP16Coder>) 641+REG_OPERATOR_CODER(kARM64, kNumberTypeFloat16, PrimitiveType_Equal, CPUOpCoderCreator<ArithmeticFP16Coder>) 642+REG_OPERATOR_CODER(kARM64, kNumberTypeFloat16, PrimitiveType_NotEqual, CPUOpCoderCreator<ArithmeticFP16Coder>) 643+REG_OPERATOR_CODER(kARM64, kNumberTypeFloat16, PrimitiveType_Less, CPUOpCoderCreator<ArithmeticFP16Coder>) 644+REG_OPERATOR_CODER(kARM64, kNumberTypeFloat16, PrimitiveType_LessEqual, CPUOpCoderCreator<ArithmeticFP16Coder>) 645+REG_OPERATOR_CODER(kARM64, kNumberTypeFloat16, PrimitiveType_Greater, CPUOpCoderCreator<ArithmeticFP16Coder>) 646+REG_OPERATOR_CODER(kARM64, kNumberTypeFloat16, PrimitiveType_GreaterEqual, CPUOpCoderCreator<ArithmeticFP16Coder>) 647+REG_OPERATOR_CODER(kARM64, kNumberTypeFloat16, PrimitiveType_Eltwise, CPUOpCoderCreator<ArithmeticFP16Coder>) 648+} // namespace mindspore::lite::micro::nnacl 649diff --git a/mindspore/lite/tools/converter/micro/coder/opcoders/nnacl/fp16/arithmetic_fp16_coder.h b/mindspore/lite/tools/converter/micro/coder/opcoders/nnacl/fp16/arithmetic_fp16_coder.h 650new file mode 100644 651index 00000000..60a83419 652--- /dev/null 653+++ b/mindspore/lite/tools/converter/micro/coder/opcoders/nnacl/fp16/arithmetic_fp16_coder.h 654@@ -0,0 +1,47 @@ 655+/** 656+ * Copyright 2023 Huawei Technologies Co., Ltd 657+ * 658+ * Licensed under the Apache License, Version 2.0 (the "License"); 659+ * you may not use this file except in compliance with the License. 
660+ * You may obtain a copy of the License at 661+ * 662+ * http://www.apache.org/licenses/LICENSE-2.0 663+ * 664+ * Unless required by applicable law or agreed to in writing, software 665+ * distributed under the License is distributed on an "AS IS" BASIS, 666+ * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. 667+ * See the License for the specific language governing permissions and 668+ * limitations under the License. 669+ */ 670+ 671+#ifndef MINDSPORE_LITE_TOOLS_CONVERTER_MICRO_CODER_OPCODERS_NNACL_FP16_ARITHMETIC_FP16_CODER_H_ 672+#define MINDSPORE_LITE_TOOLS_CONVERTER_MICRO_CODER_OPCODERS_NNACL_FP16_ARITHMETIC_FP16_CODER_H_ 673+ 674+#include <vector> 675+#include <string> 676+#include "coder/opcoders/nnacl/fp32/arithmetic_fp32_coder.h" 677+#include "nnacl/base/cast_base.h" 678+#include "coder/opcoders/serializers/nnacl_serializer/nnacl_fp32_serializer.h" 679+namespace mindspore::lite::micro::nnacl { 680+class ArithmeticFP16Coder final : public ArithmeticFP32Coder { 681+ public: 682+ ArithmeticFP16Coder(const std::vector<Tensor *> &in_tensors, const std::vector<Tensor *> &out_tensors, 683+ const LiteGraph::Node *node, size_t node_index, Target target) 684+ : ArithmeticFP32Coder(in_tensors, out_tensors, node, node_index, target) {} 685+ 686+ ~ArithmeticFP16Coder() override = default; 687+ 688+ int DoCode(CoderContext *const context) override; 689+ 690+ private: 691+ int Prepare(CoderContext *const context) override; 692+ 693+ int ReSize(CoderContext *const context) override; 694+ 695+ void InitFunTable() override; 696+ 697+ int ExecuteCode(const std::string &input0, const std::string &input1, const std::string &output, int size, 698+ CoderContext *const context, NNaclFp32Serializer *const code); 699+}; 700+} // namespace mindspore::lite::micro::nnacl 701+#endif // MINDSPORE_LITE_TOOLS_CONVERTER_MICRO_CODER_OPCODERS_NNACL_FP16_ARITHMETIC_FP16_CODER_H_ 702diff --git 
a/mindspore/lite/tools/converter/micro/coder/opcoders/nnacl/fp16/avg_pooling_fp16_coder.cc b/mindspore/lite/tools/converter/micro/coder/opcoders/nnacl/fp16/avg_pooling_fp16_coder.cc 703new file mode 100644 704index 00000000..97ca75a8 705--- /dev/null 706+++ b/mindspore/lite/tools/converter/micro/coder/opcoders/nnacl/fp16/avg_pooling_fp16_coder.cc 707@@ -0,0 +1,87 @@ 708+/** 709+ * Copyright 2023 Huawei Technologies Co., Ltd 710+ * 711+ * Licensed under the Apache License, Version 2.0 (the "License"); 712+ * you may not use this file except in compliance with the License. 713+ * You may obtain a copy of the License at 714+ * 715+ * http://www.apache.org/licenses/LICENSE-2.0 716+ * 717+ * Unless required by applicable law or agreed to in writing, software 718+ * distributed under the License is distributed on an "AS IS" BASIS, 719+ * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. 720+ * See the License for the specific language governing permissions and 721+ * limitations under the License. 
722+ */ 723+#include "coder/opcoders/nnacl/fp16/avg_pooling_fp16_coder.h" 724+#include <cfloat> 725+#include <string> 726+#include "coder/opcoders/serializers/nnacl_serializer/nnacl_fp32_serializer.h" 727+#include "coder/log.h" 728+#include "coder/opcoders/parallel.h" 729+#include "coder/opcoders/file_collector.h" 730+ 731+using mindspore::schema::PrimitiveType_AvgPoolFusion; 732+ 733+namespace mindspore::lite::micro::nnacl { 734+int PoolingFP16Coder::Prepare(CoderContext *const context) { 735+ if (input_tensor_->data_type() != kNumberTypeFloat16) { 736+ MS_LOG(INFO) << "Input tensor data type is invalid"; 737+ return RET_INPUT_PARAM_INVALID; 738+ } 739+ return RET_OK; 740+} 741+ 742+int PoolingFP16Coder::DoCode(CoderContext *const context) { 743+ // attribute 744+ auto pooling_parameter = reinterpret_cast<PoolingParameter *>(parameter_); 745+ MS_CHECK_PTR(pooling_parameter); 746+ // init struct PoolingParameters 747+ pooling_parameter->input_batch_ = input_tensor_->Batch(); 748+ pooling_parameter->input_channel_ = input_tensor_->Channel(); 749+ pooling_parameter->input_h_ = input_tensor_->Height(); 750+ pooling_parameter->input_w_ = input_tensor_->Width(); 751+ pooling_parameter->output_batch_ = output_tensor_->Batch(); 752+ pooling_parameter->output_channel_ = output_tensor_->Channel(); 753+ pooling_parameter->output_h_ = output_tensor_->Height(); 754+ pooling_parameter->output_w_ = output_tensor_->Width(); 755+ 756+ pooling_parameter->thread_num_ = pooling_parameter->op_parameter_.thread_num_; 757+ 758+ NNaclFp32Serializer code; 759+ std::string param_name = "pooling_parameter"; 760+ code.CodeStruct(param_name, *pooling_parameter); 761+ float minf = -FLT16_MAX; 762+ float maxf = FLT16_MAX; 763+ Collect(context, 764+ { 765+ "nnacl/fp16/pooling_fp16.h", 766+ }, 767+ { 768+ "pooling_fp16.c", 769+ }); 770+ switch (pooling_parameter->act_type_) { 771+ case ActType_Relu: { 772+ minf = 0.f; 773+ break; 774+ } 775+ case ActType_Relu6: { 776+ minf = 0.f; 777+ maxf = 6.f; 
778+ break; 779+ } 780+ default: { 781+ MS_LOG(INFO) << "no actype"; 782+ break; 783+ } 784+ } 785+ code.CodeFunction("AvgPoolingFp16", input_tensor_, output_tensor_, "&pooling_parameter", kDefaultTaskId, minf, maxf); 786+ 787+ MS_LOG(INFO) << "PoolingFp16Code has been called"; 788+ context->AppendCode(code.str()); 789+ return lite::RET_OK; 790+} 791+ 792+REG_OPERATOR_CODER(kARM32, kNumberTypeFloat16, PrimitiveType_AvgPoolFusion, CPUOpCoderCreator<PoolingFP16Coder>) 793+REG_OPERATOR_CODER(kARM64, kNumberTypeFloat16, PrimitiveType_AvgPoolFusion, CPUOpCoderCreator<PoolingFP16Coder>) 794+} // namespace mindspore::lite::micro::nnacl 795diff --git a/mindspore/lite/tools/converter/micro/coder/opcoders/nnacl/fp16/avg_pooling_fp16_coder.h b/mindspore/lite/tools/converter/micro/coder/opcoders/nnacl/fp16/avg_pooling_fp16_coder.h 796new file mode 100644 797index 00000000..65a6522d 798--- /dev/null 799+++ b/mindspore/lite/tools/converter/micro/coder/opcoders/nnacl/fp16/avg_pooling_fp16_coder.h 800@@ -0,0 +1,36 @@ 801+/** 802+ * Copyright 2023 Huawei Technologies Co., Ltd 803+ * 804+ * Licensed under the Apache License, Version 2.0 (the "License"); 805+ * you may not use this file except in compliance with the License. 806+ * You may obtain a copy of the License at 807+ * 808+ * http://www.apache.org/licenses/LICENSE-2.0 809+ * 810+ * Unless required by applicable law or agreed to in writing, software 811+ * distributed under the License is distributed on an "AS IS" BASIS, 812+ * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. 813+ * See the License for the specific language governing permissions and 814+ * limitations under the License. 
815+ */ 816+ 817+#ifndef MINDSPORE_LITE_TOOLS_CONVERTER_MICRO_CODER_OPCODERS_NNACL_FP16_POOLING_FP16_CODER_H_ 818+#define MINDSPORE_LITE_TOOLS_CONVERTER_MICRO_CODER_OPCODERS_NNACL_FP16_POOLING_FP16_CODER_H_ 819+ 820+#include <vector> 821+#include "coder/opcoders/nnacl/fp32/pooling_fp32_coder.h" 822+ 823+namespace mindspore::lite::micro::nnacl { 824+class PoolingFP16Coder final : public PoolingFP32Coder { 825+ public: 826+ PoolingFP16Coder(const std::vector<Tensor *> &in_tensors, const std::vector<Tensor *> &out_tensors, 827+ const LiteGraph::Node *node, size_t node_index, Target target) 828+ : PoolingFP32Coder(in_tensors, out_tensors, node, node_index, target) {} 829+ ~PoolingFP16Coder() override = default; 830+ 831+ int Prepare(CoderContext *const context) override; 832+ 833+ int DoCode(CoderContext *const context) override; 834+}; 835+} // namespace mindspore::lite::micro::nnacl 836+#endif  // MINDSPORE_LITE_TOOLS_CONVERTER_MICRO_CODER_OPCODERS_NNACL_FP16_POOLING_FP16_CODER_H_ 837diff --git a/mindspore/lite/tools/converter/micro/coder/opcoders/nnacl/fp16/concat_fp16_coder.cc b/mindspore/lite/tools/converter/micro/coder/opcoders/nnacl/fp16/concat_fp16_coder.cc 838new file mode 100644 839index 00000000..fd969963 840--- /dev/null 841+++ b/mindspore/lite/tools/converter/micro/coder/opcoders/nnacl/fp16/concat_fp16_coder.cc 842@@ -0,0 +1,88 @@ 843+/** 844+ * Copyright 2023 Huawei Technologies Co., Ltd 845+ * 846+ * Licensed under the Apache License, Version 2.0 (the "License"); 847+ * you may not use this file except in compliance with the License. 848+ * You may obtain a copy of the License at 849+ * 850+ * http://www.apache.org/licenses/LICENSE-2.0 851+ * 852+ * Unless required by applicable law or agreed to in writing, software 853+ * distributed under the License is distributed on an "AS IS" BASIS, 854+ * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. 855+ * See the License for the specific language governing permissions and 856+ * limitations under the License. 
857+ */ 858+#include "coder/opcoders/nnacl/fp16/concat_fp16_coder.h" 859+#include <string> 860+#include <vector> 861+#include "coder/opcoders/serializers/nnacl_serializer/nnacl_fp32_serializer.h" 862+#include "coder/opcoders/file_collector.h" 863+#include "coder/opcoders/parallel.h" 864+ 865+using mindspore::schema::PrimitiveType_Concat; 866+ 867+namespace mindspore::lite::micro::nnacl { 868+int ConcatFP16Coder::Prepare(CoderContext *const context) { 869+ if (input_tensor_->data_type() != kNumberTypeFloat16) { 870+ MS_LOG(INFO) << "Input tensor data type is invalid"; 871+ return lite::RET_INPUT_PARAM_INVALID; 872+ } 873+ concat_param_ = reinterpret_cast<ConcatParameter *>(parameter_); 874+ MS_CHECK_PTR(concat_param_); 875+ return ReSize(); 876+} 877+ 878+int ConcatFP16Coder::ReSize() { 879+ axis_ = concat_param_->axis_ >= 0 ? concat_param_->axis_ 880+ : static_cast<int>(input_tensor_->shape().size()) + concat_param_->axis_; 881+ return RET_OK; 882+} 883+ 884+int ConcatFP16Coder::DoCode(CoderContext *const context) { 885+ Collect(context, 886+ { 887+ "nnacl/base/concat_base.h", 888+ }, 889+ { 890+ "concat_base.c", 891+ }); 892+ 893+ size_t input_num = input_tensors_.size(); 894+ 895+ NNaclFp32Serializer code; 896+ code << "\t\tvoid *inputs_addr[] = {"; 897+ for (size_t i = 0; i < input_num; ++i) { 898+ code << allocator_->GetRuntimeAddr(input_tensors_.at(i)) << ", "; 899+ } 900+ code << "};\n"; 901+ 902+ size_t i; 903+ for (i = 0; i < input_num; ++i) { 904+ code << "\t\tint shape_" << i << "[] = {"; 905+ for (auto &shape : input_tensors_.at(i)->shape()) { 906+ code << shape << ", "; 907+ } 908+ code << "};\n"; 909+ } 910+ 911+ code << "\t\tint shape_" << i << "[] = {"; 912+ for (auto &shape : output_tensor_->shape()) { 913+ code << shape << ", "; 914+ } 915+ code << "};\n"; 916+ 917+ code << "\t\tint *inputs_output_shape[] = {"; 918+ for (i = 0; i <= input_num; ++i) { 919+ code << "shape_" << i << ", "; 920+ } 921+ code << "};\n"; 922+ code.CodeFunction("Concat", 
"inputs_addr", input_num, axis_, "inputs_output_shape", output_tensor_->shape().size(), 923+ output_tensor_, 0, 1, sizeof(uint16_t)); 924+ context->AppendCode(code.str()); 925+ return RET_OK; 926+} 927+ 928+REG_OPERATOR_CODER(kARM32, kNumberTypeFloat16, PrimitiveType_Concat, CPUOpCoderCreator<ConcatFP16Coder>) 929+REG_OPERATOR_CODER(kARM64, kNumberTypeFloat16, PrimitiveType_Concat, CPUOpCoderCreator<ConcatFP16Coder>) 930+} // namespace mindspore::lite::micro::nnacl 931diff --git a/mindspore/lite/tools/converter/micro/coder/opcoders/nnacl/fp16/concat_fp16_coder.h b/mindspore/lite/tools/converter/micro/coder/opcoders/nnacl/fp16/concat_fp16_coder.h 932new file mode 100644 933index 00000000..6428ac6f 934--- /dev/null 935+++ b/mindspore/lite/tools/converter/micro/coder/opcoders/nnacl/fp16/concat_fp16_coder.h 936@@ -0,0 +1,42 @@ 937+/** 938+ * Copyright 2023 Huawei Technologies Co., Ltd 939+ * 940+ * Licensed under the Apache License, Version 2.0 (the "License"); 941+ * you may not use this file except in compliance with the License. 942+ * You may obtain a copy of the License at 943+ * 944+ * http://www.apache.org/licenses/LICENSE-2.0 945+ * 946+ * Unless required by applicable law or agreed to in writing, software 947+ * distributed under the License is distributed on an "AS IS" BASIS, 948+ * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. 949+ * See the License for the specific language governing permissions and 950+ * limitations under the License. 
951+ */ 952+ 953+#ifndef MINDSPORE_LITE_TOOLS_CONVERTER_MICRO_CODER_OPCODERS_NNACL_FP16_CONCAT_FP16_CODER_H_ 954+#define MINDSPORE_LITE_TOOLS_CONVERTER_MICRO_CODER_OPCODERS_NNACL_FP16_CONCAT_FP16_CODER_H_ 955+ 956+#include <vector> 957+#include "coder/opcoders/nnacl/fp32/concat_fp32_coder.h" 958+#include "nnacl/concat_parameter.h" 959+ 960+namespace mindspore::lite::micro::nnacl { 961+class ConcatFP16Coder final : public ConcatFP32Coder { 962+ public: 963+ ConcatFP16Coder(const std::vector<Tensor *> &in_tensors, const std::vector<Tensor *> &out_tensors, 964+ const LiteGraph::Node *node, size_t node_index, Target target) 965+ : ConcatFP32Coder(in_tensors, out_tensors, node, node_index, target) {} 966+ ~ConcatFP16Coder() override = default; 967+ 968+ int Prepare(CoderContext *const context) override; 969+ int DoCode(CoderContext *const context) override; 970+ 971+ private: 972+ int ReSize(); 973+ 974+ int axis_{0}; 975+ ConcatParameter *concat_param_{nullptr}; 976+}; 977+} // namespace mindspore::lite::micro::nnacl 978+#endif // MINDSPORE_LITE_TOOLS_CONVERTER_MICRO_CODER_OPCODERS_NNACL_FP16_CONCAT_FP16_CODER_H_ 979diff --git a/mindspore/lite/tools/converter/micro/coder/opcoders/nnacl/fp16/layernorm_fp16_coder.cc b/mindspore/lite/tools/converter/micro/coder/opcoders/nnacl/fp16/layernorm_fp16_coder.cc 980new file mode 100644 981index 00000000..8140786b 982--- /dev/null 983+++ b/mindspore/lite/tools/converter/micro/coder/opcoders/nnacl/fp16/layernorm_fp16_coder.cc 984@@ -0,0 +1,56 @@ 985+/** 986+ * Copyright 2023 Huawei Technologies Co., Ltd 987+ * 988+ * Licensed under the Apache License, Version 2.0 (the "License"); 989+ * you may not use this file except in compliance with the License. 
990+ * You may obtain a copy of the License at 991+ * 992+ * http://www.apache.org/licenses/LICENSE-2.0 993+ * 994+ * Unless required by applicable law or agreed to in writing, software 995+ * distributed under the License is distributed on an "AS IS" BASIS, 996+ * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. 997+ * See the License for the specific language governing permissions and 998+ * limitations under the License. 999+ */ 1000+#include "coder/opcoders/nnacl/fp16/layernorm_fp16_coder.h" 1001+#include "coder/opcoders/serializers/nnacl_serializer/nnacl_fp32_serializer.h" 1002+#include "coder/opcoders/file_collector.h" 1003+#include "coder/opcoders/parallel.h" 1004+ 1005+using mindspore::schema::PrimitiveType_LayerNormFusion; 1006+ 1007+namespace mindspore::lite::micro::nnacl { 1008+int LayerNormFP16Coder::Prepare(CoderContext *const context) { 1009+ if ((input_tensor_->data_type() != kNumberTypeFloat16) || 1010+ (input_tensors_.at(SECOND_INPUT)->data_type() != kNumberTypeFloat16) || 1011+ (input_tensors_.at(THIRD_INPUT)->data_type() != kNumberTypeFloat16)) { 1012+ MS_LOG(INFO) << "Input tensors data type is invalid"; 1013+ return RET_INPUT_PARAM_INVALID; 1014+ } 1015+ return LayerNormFP32Coder::Prepare(context); 1016+} 1017+ 1018+int LayerNormFP16Coder::DoCode(CoderContext *const context) { 1019+ NNaclFp32Serializer code; 1020+ code.CodeStruct("layer_norm_parm", *param_); 1021+ Collect(context, {"nnacl/fp16/layer_norm_fp16.h"}, {"layer_norm_fp16.c"}); 1022+ 1023+ if (output_tensors_.size() == C3NUM) { 1024+ code.CodeFunction("LayerNormFp16", input_tensor_, input_tensors_.at(SECOND_INPUT), input_tensors_.at(THIRD_INPUT), 1025+ output_tensor_, output_tensors_.at(SECOND_INPUT), output_tensors_.at(THIRD_INPUT), 1026+ "&layer_norm_parm", 0); 1027+ } else if (output_tensors_.size() == 1) { 1028+ code.CodeFunction("LayerNormFp16", input_tensor_, input_tensors_.at(SECOND_INPUT), input_tensors_.at(THIRD_INPUT), 1029+ output_tensor_, "NULL", 
"NULL", "&layer_norm_parm", 0); 1030+ } else { 1031+ MS_LOG(ERROR) << "LayerNorm should have 1 or 3 output tensors"; 1032+ return RET_ERROR; 1033+ } 1034+ context->AppendCode(code.str()); 1035+ return RET_OK; 1036+} 1037+ 1038+REG_OPERATOR_CODER(kARM32, kNumberTypeFloat16, PrimitiveType_LayerNormFusion, CPUOpCoderCreator<LayerNormFP16Coder>) 1039+REG_OPERATOR_CODER(kARM64, kNumberTypeFloat16, PrimitiveType_LayerNormFusion, CPUOpCoderCreator<LayerNormFP16Coder>) 1040+} // namespace mindspore::lite::micro::nnacl 1041diff --git a/mindspore/lite/tools/converter/micro/coder/opcoders/nnacl/fp16/layernorm_fp16_coder.h b/mindspore/lite/tools/converter/micro/coder/opcoders/nnacl/fp16/layernorm_fp16_coder.h 1042new file mode 100644 1043index 00000000..df025e3c 1044--- /dev/null 1045+++ b/mindspore/lite/tools/converter/micro/coder/opcoders/nnacl/fp16/layernorm_fp16_coder.h 1046@@ -0,0 +1,37 @@ 1047+/** 1048+ * Copyright 2023 Huawei Technologies Co., Ltd 1049+ * 1050+ * Licensed under the Apache License, Version 2.0 (the "License"); 1051+ * you may not use this file except in compliance with the License. 1052+ * You may obtain a copy of the License at 1053+ * 1054+ * http://www.apache.org/licenses/LICENSE-2.0 1055+ * 1056+ * Unless required by applicable law or agreed to in writing, software 1057+ * distributed under the License is distributed on an "AS IS" BASIS, 1058+ * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. 1059+ * See the License for the specific language governing permissions and 1060+ * limitations under the License. 
1061+ */ 1062+ 1063+#ifndef MINDSPORE_LITE_TOOLS_CONVERTER_MICRO_CODER_OPCODERS_NNACL_FP16_LAYERNORM_FP16_CODER_H_ 1064+#define MINDSPORE_LITE_TOOLS_CONVERTER_MICRO_CODER_OPCODERS_NNACL_FP16_LAYERNORM_FP16_CODER_H_ 1065+ 1066+#include <vector> 1067+#include "coder/opcoders/nnacl/fp32/layernorm_fp32_coder.h" 1068+#include "nnacl/layer_norm_parameter.h" 1069+ 1070+namespace mindspore::lite::micro::nnacl { 1071+class LayerNormFP16Coder final : public LayerNormFP32Coder { 1072+ public: 1073+ LayerNormFP16Coder(const std::vector<Tensor *> &in_tensors, const std::vector<Tensor *> &out_tensors, 1074+ const LiteGraph::Node *node, size_t node_index, Target target) 1075+ : LayerNormFP32Coder(in_tensors, out_tensors, node, node_index, target) {} 1076+ ~LayerNormFP16Coder() override = default; 1077+ 1078+ int Prepare(CoderContext *const context) override; 1079+ 1080+ int DoCode(CoderContext *const context) override; 1081+}; 1082+} // namespace mindspore::lite::micro::nnacl 1083+#endif // MINDSPORE_LITE_TOOLS_CONVERTER_MICRO_CODER_OPCODERS_NNACL_FP16_LAYERNORM_FP16_CODER_H_ 1084diff --git a/mindspore/lite/tools/converter/micro/coder/opcoders/nnacl/fp16/matmul_fp16_base_coder.cc b/mindspore/lite/tools/converter/micro/coder/opcoders/nnacl/fp16/matmul_fp16_base_coder.cc 1085new file mode 100644 1086index 00000000..f2aec9d2 1087--- /dev/null 1088+++ b/mindspore/lite/tools/converter/micro/coder/opcoders/nnacl/fp16/matmul_fp16_base_coder.cc 1089@@ -0,0 +1,286 @@ 1090+/** 1091+ * Copyright 2023 Huawei Technologies Co., Ltd 1092+ * 1093+ * Licensed under the Apache License, Version 2.0 (the "License"); 1094+ * you may not use this file except in compliance with the License. 
1095+ * You may obtain a copy of the License at 1096+ * 1097+ * http://www.apache.org/licenses/LICENSE-2.0 1098+ * 1099+ * Unless required by applicable law or agreed to in writing, software 1100+ * distributed under the License is distributed on an "AS IS" BASIS, 1101+ * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. 1102+ * See the License for the specific language governing permissions and 1103+ * limitations under the License. 1104+ */ 1105+ 1106+#include "coder/opcoders/nnacl/fp16/matmul_fp16_base_coder.h" 1107+#include <string> 1108+#include <vector> 1109+#include "coder/log.h" 1110+#include "coder/opcoders/parallel.h" 1111+#include "coder/opcoders/file_collector.h" 1112+#include "coder/opcoders/nnacl/dequant/de_quant.h" 1113+#include "nnacl/base/cast_base.h" 1114+ 1115+using mindspore::schema::PrimitiveType_MatMulFusion; 1116+ 1117+namespace mindspore::lite::micro::nnacl { 1118+int MatMulFP16BaseCoder::InitBiasData() { 1119+ if (bias_ptr_) { 1120+ return RET_OK; 1121+ } 1122+ bias_pack_ptr_size_ = static_cast<size_t>(params_->col_align_ * data_type_size_); 1123+ if (input_tensors_.size() == C3NUM) { 1124+ bias_ptr_ = allocator_->Malloc(kNumberTypeUInt8, kOnlineSize, kOnlinePackWeight, 1125+ bias_tensor_->tensor_name() + "_online_pack"); 1126+ } else { 1127+ bias_ptr_ = 1128+ allocator_->Malloc(kNumberTypeUInt8, kOnlineSize, kOnlinePackWeight, node_->name_ + "_bias_online_pack"); 1129+ } 1130+ return RET_OK; 1131+} 1132+ 1133+int MatMulFP16BaseCoder::InitBufferA() { 1134+ if (a_pack_ptr_ != nullptr || vec_matmul_) { 1135+ return RET_OK; 1136+ } 1137+ a_pack_ptr_size_ = static_cast<size_t>(params_->batch * params_->row_align_ * params_->deep_ * sizeof(uint16_t)); 1138+ if (params_->a_const_) { 1139+ a_pack_ptr_ = allocator_->GetSharedWeightAddr(input_tensors_.at(0)); 1140+ if (a_pack_ptr_ == nullptr) { 1141+ a_pack_ptr_ = allocator_->Malloc(kNumberTypeFloat16, kOnlineSize, kOnlinePackWeight, 1142+ input_tensors_.at(0)->tensor_name() + 
"_online_pack"); 1143+ allocator_->MarkSharedWeight(input_tensors_.at(0), a_pack_ptr_); 1144+ } else { 1145+ a_packed_ = true; 1146+ } 1147+ } else { 1148+ a_pack_ptr_ = allocator_->Malloc(kNumberTypeFloat16, a_pack_ptr_size_, kWorkspace); 1149+ } 1150+ MS_CHECK_PTR(a_pack_ptr_); 1151+ return RET_OK; 1152+} 1153+ 1154+int MatMulFP16BaseCoder::InitBufferB() { 1155+ if (target_ != kARM64) { 1156+ if (vec_matmul_ && params_->b_transpose_) { 1157+ return RET_OK; 1158+ } 1159+ } 1160+ return MatMulFP32BaseCoder::InitBufferB(); 1161+} 1162+ 1163+std::string MatMulFP16BaseCoder::InitMatrixA(NNaclFp32Serializer *const code, NNaclFp32Serializer *const init_code, 1164+ CoderContext *const context, size_t *w_buf) { 1165+ if (vec_matmul_) { 1166+ return allocator_->GetRuntimeAddr(input_tensor_, input_tensor_->IsConst()); 1167+ } 1168+ std::string input_a_str = allocator_->GetRuntimeAddr(input_tensor_); 1169+ std::string input_a_pack_str = "(float16_t *)" + allocator_->GetRuntimeAddr(a_pack_ptr_); 1170+ if (params_->a_const_) { 1171+ init_code->CodeBufferOffsetExpression(a_pack_ptr_, context->weight_name(), context->weight_offset_name(), 1172+ context->weight_size_name(), a_pack_ptr_size_); 1173+ *w_buf = *w_buf + a_pack_ptr_size_; 1174+ } 1175+ NNaclFp32Serializer &pack_node = params_->a_const_ ? 
*init_code : *code; 1176+ if (a_batch_ == 1) { 1177+ if (params_->a_transpose_) { 1178+ if (target_ == kARM64) { 1179+ pack_node.CodeFunction("RowMajor2RowNMajorFp16", input_a_str, input_a_pack_str, params_->deep_, params_->row_); 1180+ } else { 1181+ pack_node.CodeFunction("RowMajor2Row12MajorFp16", input_a_str, input_a_pack_str, params_->deep_, params_->row_, 1182+ false); 1183+ } 1184+ } else { 1185+ if (target_ == kARM64) { 1186+ pack_node.CodeFunction("RowMajor2ColNMajorFp16", input_a_str, input_a_pack_str, params_->row_, params_->deep_); 1187+ } else { 1188+ pack_node.CodeFunction("RowMajor2Col12MajorFp16", input_a_str, input_a_pack_str, params_->row_, params_->deep_, 1189+ false); 1190+ } 1191+ } 1192+ } else { 1193+ pack_node << " for (int i = 0; i < " << a_batch_ << "; ++i) {\n" 1194+ << " float16_t *src = " << input_a_str << " + i * " << params_->deep_ * params_->row_ << ";\n" 1195+ << " float16_t *dst = " << input_a_pack_str << " + i * " << params_->deep_ * params_->row_align_ 1196+ << ";\n"; 1197+ if (params_->a_transpose_) { 1198+ if (target_ == kARM64) { 1199+ pack_node << " RowMajor2RowNMajorFp16(src, dst, " << params_->deep_ << ", " << params_->row_ << ");\n"; 1200+ } else { 1201+ pack_node << " RowMajor2Row12MajorFp16(src, dst, " << params_->deep_ << ", " << params_->row_ 1202+ << ", false);\n"; 1203+ } 1204+ } else { 1205+ if (target_ == kARM64) { 1206+ pack_node << " RowMajor2ColNMajorFp16(src, dst, " << params_->row_ << ", " << params_->deep_ << ");\n"; 1207+ } else { 1208+ pack_node << " RowMajor2Col12MajorFp16(src, dst, " << params_->row_ << ", " << params_->deep_ 1209+ << ", false);\n"; 1210+ } 1211+ } 1212+ pack_node << " }\n"; 1213+ } 1214+ return input_a_pack_str; 1215+} 1216+ 1217+std::string MatMulFP16BaseCoder::InitMatrixB(NNaclFp32Serializer *const code, NNaclFp32Serializer *const init_code, 1218+ CoderContext *const context, size_t *w_buf) { 1219+ bool no_pack = target_ != kARM64 && vec_matmul_ && params_->b_transpose_; 1220+ if 
(no_pack) { 1221+ return allocator_->GetRuntimeAddr(filter_tensor_, filter_tensor_->IsConst()); 1222+ } 1223+ std::string input_b_str = allocator_->GetRuntimeAddr(filter_tensor_); 1224+ std::string input_b_pack_str = "(float16_t *)" + allocator_->GetRuntimeAddr(b_pack_ptr_); 1225+ if (params_->b_const_) { 1226+ init_code->CodeBufferOffsetExpression(b_pack_ptr_, context->weight_name(), context->weight_offset_name(), 1227+ context->weight_size_name(), b_pack_ptr_size_); 1228+ *w_buf = *w_buf + b_pack_ptr_size_; 1229+ } 1230+ NNaclFp32Serializer &pack_node = params_->b_const_ ? *init_code : *code; 1231+ if (target_ != kARM64) { 1232+ if (vec_matmul_) { 1233+ if (b_batch_ == 1) { 1234+ pack_node.CodeFunction("RowMajor2ColMajorFp16", input_b_str, input_b_pack_str, params_->deep_, params_->col_, 1235+ false); 1236+ } else { 1237+ pack_node << " for (int i = 0; i < " << b_batch_ << "; ++i) {\n" 1238+ << " float16_t *src = " << input_b_str << " + i * " << params_->deep_ * params_->col_ << ";\n" 1239+ << " float16_t *dst = " << input_b_pack_str << " + i * " << params_->deep_ * params_->col_ << ";\n" 1240+ << " RowMajor2ColMajorFp16(src, dst, " << params_->deep_ << ", " << params_->col_ << ", " 1241+ << "false);\n" 1242+ << " }\n"; 1243+ } 1244+ return input_b_pack_str; 1245+ } 1246+ } 1247+ 1248+ if (b_batch_ == 1) { 1249+ if (params_->b_transpose_) { 1250+ pack_node.CodeFunction("RowMajor2Col8MajorFp16", input_b_str, input_b_pack_str, params_->col_, params_->deep_, 1251+ false); 1252+ } else { 1253+ pack_node.CodeFunction("RowMajor2Row8MajorFp16", input_b_str, input_b_pack_str, params_->deep_, params_->col_, 1254+ false); 1255+ } 1256+ } else { 1257+ pack_node << " for (int i = 0; i < " << b_batch_ << "; ++i) {\n" 1258+ << " float16_t *src = " << input_b_str << " + i * " << params_->deep_ * params_->col_ << ";\n" 1259+ << " float16_t *dst = " << input_b_pack_str << " + i * " << params_->deep_ * params_->col_align_ 1260+ << ";\n"; 1261+ if (params_->b_transpose_) { 1262+ 
// NOTE(review): the lines below are the tail of the matrix-B pack-code emitter;
// the head of that function lies before this chunk and is reproduced unchanged.
// It emits either a col-major or row-major fp16 repack call into the generated
// source, then returns the name of the generated pack buffer.
      pack_node << " RowMajor2Col8MajorFp16(src, dst, " << params_->col_ << ", " << params_->deep_ << ", false);\n";
    } else {
      pack_node << " RowMajor2Row8MajorFp16(src, dst, " << params_->deep_ << ", " << params_->col_ << ", false);\n";
    }
    pack_node << " }\n";
  }
  return input_b_pack_str;
}

// Validates that both inputs are fp16, picks the row tile for the target ISA,
// fills A/B geometry via the subclass hooks, and allocates the packed
// A / B / bias buffers.  Returns RET_INPUT_PARAM_INVALID for non-fp16 inputs.
int MatMulFP16BaseCoder::Prepare(CoderContext *const context) {
  if (input_tensor_->data_type() != kNumberTypeFloat16 || filter_tensor_->data_type() != kNumberTypeFloat16) {
    MS_LOG(INFO) << "Input tensor data type is invalid";
    return RET_INPUT_PARAM_INVALID;
  }
  row_tile_ = C12NUM;
  if (target_ == kARM64) {
    row_tile_ = C4NUM;
  }
  auto ret = InitAShape();
  MS_CHECK_TRUE_MSG(ret == RET_OK, RET_ERROR, "init A-metrics' info failed");
  ret = InitBShape();
  MS_CHECK_TRUE_MSG(ret == RET_OK, RET_ERROR, "init B-metrics' info failed");
  // A single output row degenerates the matmul into a matrix-vector product.
  if (params_->row_ == 1) {
    vec_matmul_ = true;
  }
  if (vec_matmul_) {
    params_->row_align_ = 1;
    // On ARM64 the vector kernel consumes B packed to a multiple of 8 columns.
    params_->col_align_ = (target_ == kARM64) ? UP_ROUND(params_->col_, C8NUM) : params_->col_;
  } else {
    params_->row_align_ = UP_ROUND(params_->row_, row_tile_);
    params_->col_align_ = UP_ROUND(params_->col_, C8NUM);
  }
  MS_CHECK_RET_CODE(InitBufferA(), "InitBufferA failed");
  MS_CHECK_RET_CODE(InitBufferB(), "InitBufferB failed");
  MS_CHECK_RET_CODE(InitBiasData(), "InitBias failed");
  return RET_OK;
}

// Registers the fp16 pack/matmul C sources plus the per-target assembly
// kernels the generated code links against.
int MatMulFP16BaseCoder::CollectFilesForTarget(CoderContext *const context) {
  Collect(context,
          {
            "nnacl/fp16/pack_fp16.h",
            "nnacl/fp16/matmul_fp16.h",
          },
          {
            "pack_fp16.c",
            "matmul_fp16.c",
          });
  if (target_ == kARM32) {
    Collect(context, {}, {},
            {
              "Matmul12x8Fp16.S",
              "MatVecMulFp16.S",
            });
  } else if (target_ == kARM64) {
    Collect(context, {}, {},
            {
              "MatmulFp16.S",
              "MatmulFp16Opt.S",
              "MatVecMulFp16.S",
              "Matmul12X16Fp16.S",
              "MatmulBaseFp16Neon.S",
              "MatmulWinogradFp16.S",
              "VecMatmulFp16.S",
            });
  }
  return RET_OK;
}

// Emits the batched matmul loop into the runtime code section and the
// bias/weight packing into the init section.  `init_code` runs once at model
// load; `code` runs per inference.
int MatMulFP16BaseCoder::DoCode(CoderContext *const context) {
  CollectFilesForTarget(context);  // NOTE(review): status ignored — always RET_OK in this file; confirm base class.
  NNaclFp32Serializer code, init_code;
  size_t w_buf_size = 0;

  // do bias packing to init
  init_code.CodeBufferOffsetExpression(bias_ptr_, context->weight_name(), context->weight_offset_name(),
                                       context->weight_size_name(), bias_pack_ptr_size_);
  w_buf_size += bias_pack_ptr_size_;
  std::string bias_str = "(float16_t *)" + allocator_->GetRuntimeAddr(bias_ptr_);
  // Three inputs means an explicit bias tensor; otherwise the packed bias
  // buffer is zero-filled.
  if (input_tensors_.size() == DIMENSION_3D) {
    auto origin_bias_str = allocator_->GetRuntimeAddr(bias_tensor_);
    init_code.CodeFunction("memcpy", bias_str, origin_bias_str, bias_tensor_->Size());
  } else {
    init_code.CodeFunction("memset", bias_str, 0, bias_pack_ptr_size_);
  }

  auto input_a_str = InitMatrixA(&code, &init_code, context, &w_buf_size);
  auto input_b_str = InitMatrixB(&code, &init_code, context, &w_buf_size);
  auto output_str = allocator_->GetRuntimeAddr(output_tensor_);
  code << " for (int i = 0; i < " << params_->batch << "; ++i) {\n";
  if (vec_matmul_) {
    // Matrix-vector path: B stride depends on whether B was col-aligned (ARM64).
    code << " const float16_t *batch_a_ptr = " << input_a_str << " + i * " << params_->deep_ << ";\n";
    code << " const float16_t *batch_b_ptr = " << input_b_str << " + i * "
         << params_->deep_ * (target_ == kARM64 ? params_->col_align_ : params_->col_) << ";\n";
    code << " float16_t *batch_c_ptr = " << output_str << " + i * " << params_->row_ * params_->col_ << ";\n ";
    code.CodeFunction(target_ == kARM64 ? "VecMatmulFp16" : "MatVecMulFp16", "batch_a_ptr", "batch_b_ptr",
                      "batch_c_ptr", bias_str, params_->act_type_, params_->deep_, params_->col_);
  } else {
    code << " const float16_t *batch_a_ptr = " << input_a_str << " + i * " << params_->row_align_ * params_->deep_
         << ";\n";
    code << " const float16_t *batch_b_ptr = " << input_b_str << " + i * " << params_->deep_ * params_->col_align_
         << ";\n";
    code << " float16_t *batch_c_ptr = " << output_str << " + i * " << params_->row_ * params_->col_ << ";\n ";
    code.CodeFunction(target_ == kARM64 ? "MatmulBaseFp16Neon" : "MatMulFp16", "batch_a_ptr", "batch_b_ptr",
                      "batch_c_ptr", bias_str, params_->act_type_, params_->deep_, params_->row_, params_->col_,
                      params_->col_, OutType_Nhwc);
  }
  code << " }\n";
  context->AppendInitWeightSizeCode(w_buf_size);
  context->AppendCode(code.str());
  context->AppendInitCode(init_code.str());
  return RET_OK;
}
}  // namespace mindspore::lite::micro::nnacl
diff --git a/mindspore/lite/tools/converter/micro/coder/opcoders/nnacl/fp16/matmul_fp16_base_coder.h b/mindspore/lite/tools/converter/micro/coder/opcoders/nnacl/fp16/matmul_fp16_base_coder.h
new file mode 100644
index 00000000..864f54ae
--- /dev/null
+++ b/mindspore/lite/tools/converter/micro/coder/opcoders/nnacl/fp16/matmul_fp16_base_coder.h
@@ -0,0 +1,58 @@
/**
 * Copyright 2023 Huawei Technologies Co., Ltd
 *
 * Licensed under the Apache License, Version 2.0 (the "License");
 * you may not use this file except in compliance with the License.
 * You may obtain a copy of the License at
 *
 * http://www.apache.org/licenses/LICENSE-2.0
 *
 * Unless required by applicable law or agreed to in writing, software
 * distributed under the License is distributed on an "AS IS" BASIS,
 * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
 * See the License for the specific language governing permissions and
 * limitations under the License.
 */

#ifndef MINDSPORE_LITE_TOOLS_CONVERTER_MICRO_CODER_OPCODERS_NNACL_FP16_MATMUL_FP16_BASE_CODER_H_
#define MINDSPORE_LITE_TOOLS_CONVERTER_MICRO_CODER_OPCODERS_NNACL_FP16_MATMUL_FP16_BASE_CODER_H_

#include <vector>
#include "coder/opcoders/nnacl/fp32/matmul_fp32_base_coder.h"
#include "coder/opcoders/serializers/nnacl_serializer/nnacl_fp32_serializer.h"
#include "nnacl/matmul_parameter.h"

namespace mindspore::lite::micro::nnacl {
// Shared fp16 matmul code generator: packs A/B/bias buffers and emits the
// batched matmul loop.  Concrete subclasses supply A/B shape initialisation.
class MatMulFP16BaseCoder : public MatMulFP32BaseCoder {
 public:
  MatMulFP16BaseCoder(const std::vector<Tensor *> &in_tensors, const std::vector<Tensor *> &out_tensors,
                      const LiteGraph::Node *node, size_t node_index, Target target)
      : MatMulFP32BaseCoder(in_tensors, out_tensors, node, node_index, target) {}

  ~MatMulFP16BaseCoder() override = default;

  int Prepare(CoderContext *const context) override;

  int DoCode(CoderContext *const context) override;

 private:
  int InitBiasData() override;
  int InitBufferA() override;
  int InitBufferB() override;
  // Emit packing code for matrix A/B; return the runtime address string of the
  // packed buffer used by the generated matmul loop.
  std::string InitMatrixA(NNaclFp32Serializer *const code, NNaclFp32Serializer *const init_code,
                          CoderContext *const context, size_t *w_buf);
  std::string InitMatrixB(NNaclFp32Serializer *const code, NNaclFp32Serializer *const init_code,
                          CoderContext *const context, size_t *w_buf);
  int CollectFilesForTarget(CoderContext *const context) override;

 protected:
  // Subclasses fill the A-/B-side geometry (batch, row/col, deep) in params_.
  virtual int InitAShape() = 0;
  virtual int InitBShape() = 0;

 protected:
  int a_batch_ = 1;
  int b_batch_ = 1;
  int bias_count_ = 0;
};
}  // namespace mindspore::lite::micro::nnacl
#endif  // MINDSPORE_LITE_TOOLS_CONVERTER_MICRO_CODER_OPCODERS_NNACL_FP16_MATMUL_FP16_BASE_CODER_H_
diff --git a/mindspore/lite/tools/converter/micro/coder/opcoders/nnacl/fp16/matmul_fp16_coder.cc
b/mindspore/lite/tools/converter/micro/coder/opcoders/nnacl/fp16/matmul_fp16_coder.cc
new file mode 100644
index 00000000..26a3b923
--- /dev/null
+++ b/mindspore/lite/tools/converter/micro/coder/opcoders/nnacl/fp16/matmul_fp16_coder.cc
@@ -0,0 +1,79 @@
/**
 * Copyright 2023 Huawei Technologies Co., Ltd
 *
 * Licensed under the Apache License, Version 2.0 (the "License");
 * you may not use this file except in compliance with the License.
 * You may obtain a copy of the License at
 *
 * http://www.apache.org/licenses/LICENSE-2.0
 *
 * Unless required by applicable law or agreed to in writing, software
 * distributed under the License is distributed on an "AS IS" BASIS,
 * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
 * See the License for the specific language governing permissions and
 * limitations under the License.
 */

#include "coder/opcoders/nnacl/fp16/matmul_fp16_coder.h"
#include <vector>
#include "coder/log.h"
#include "coder/opcoders/file_collector.h"

using mindspore::schema::PrimitiveType_MatMulFusion;

namespace mindspore::lite::micro::nnacl {
// Derives batch / row / deep from the (possibly transposed) A tensor:
// all leading dims fold into batch, the last two give row x deep.
int MatMulFP16Coder::InitAShape() {
  std::vector<int> a_shape = input_tensor_->shape();
  MS_CHECK_TRUE_MSG(a_shape.size() >= DIMENSION_2D, RET_ERROR, "A-metric tensor's shape is invalid.");
  int batch = 1;
  for (size_t i = 0; i < a_shape.size() - DIMENSION_2D; ++i) {
    batch *= a_shape.at(i);
  }
  a_batch_ = batch;
  params_->batch = batch;
  params_->row_ = params_->a_transpose_ ? a_shape[a_shape.size() - C1NUM] : a_shape[a_shape.size() - C2NUM];
  params_->deep_ = params_->a_transpose_ ? a_shape[a_shape.size() - C2NUM] : a_shape[a_shape.size() - C1NUM];
  params_->row_16_ = UP_ROUND(params_->row_, row_tile_);
  return RET_OK;
}

// Derives batch / col / deep from the (possibly transposed) B tensor.
// NOTE(review): this overwrites params_->batch set by InitAShape — relies on
// A-batch == B-batch; confirm against the base coder's contract.
int MatMulFP16Coder::InitBShape() {
  std::vector<int> b_shape = filter_tensor_->shape();
  MS_CHECK_TRUE_MSG(b_shape.size() >= DIMENSION_2D, RET_ERROR, "B-metric tensor's shape is invalid.");
  int batch = 1;
  for (size_t i = 0; i < b_shape.size() - DIMENSION_2D; ++i) {
    batch *= b_shape[i];
  }
  b_batch_ = batch;
  params_->batch = batch;
  params_->col_ = params_->b_transpose_ ? b_shape[b_shape.size() - C2NUM] : b_shape[b_shape.size() - C1NUM];
  params_->col_8_ = UP_ROUND(params_->col_, C8NUM);
  params_->deep_ = params_->b_transpose_ ? b_shape[b_shape.size() - C1NUM] : b_shape[b_shape.size() - C2NUM];
  return RET_OK;
}

// Resolves the weight/bias tensors and const-ness flags, then delegates the
// heavy lifting (tiling, buffer allocation) to the fp16 base coder.
int MatMulFP16Coder::Prepare(CoderContext *const context) {
  if (input_tensor_->data_type() != kNumberTypeFloat16) {
    MS_LOG(INFO) << "Input tensor data type is invalid";
    return RET_INPUT_PARAM_INVALID;
  }
  params_ = reinterpret_cast<MatMulParameter *>(parameter_);
  MS_CHECK_TRUE_RET(input_tensors_.size() >= kBiasIndex, RET_ERROR);
  filter_tensor_ = input_tensors_.at(kWeightIndex);
  MS_CHECK_PTR(filter_tensor_);
  // A third input, when present, is the bias and must carry const data.
  if (input_tensors_.size() == kInputSize2) {
    bias_tensor_ = input_tensors_.at(kBiasIndex);
    MS_CHECK_PTR(bias_tensor_);
    MS_CHECK_PTR(bias_tensor_->data());
  }
  // A tensor with resident data is treated as a compile-time constant.
  params_->a_const_ = (input_tensor_->data() != nullptr);
  params_->b_const_ = (filter_tensor_->data() != nullptr);
  MS_CHECK_RET_CODE(MatMulFP16BaseCoder::Prepare(context), "MatMulFP16Coder prepare failed");
  return RET_OK;
}

int MatMulFP16Coder::DoCode(CoderContext *const context) { return MatMulFP16BaseCoder::DoCode(context); }

REG_OPERATOR_CODER(kARM64, kNumberTypeFloat16, PrimitiveType_MatMulFusion, CPUOpCoderCreator<MatMulFP16Coder>)
REG_OPERATOR_CODER(kARM32, kNumberTypeFloat16, PrimitiveType_MatMulFusion, CPUOpCoderCreator<MatMulFP16Coder>)
}  // namespace mindspore::lite::micro::nnacl
diff --git a/mindspore/lite/tools/converter/micro/coder/opcoders/nnacl/fp16/matmul_fp16_coder.h b/mindspore/lite/tools/converter/micro/coder/opcoders/nnacl/fp16/matmul_fp16_coder.h
new file mode 100644
index 00000000..3a1cb66a
--- /dev/null
+++ b/mindspore/lite/tools/converter/micro/coder/opcoders/nnacl/fp16/matmul_fp16_coder.h
@@ -0,0 +1,44 @@
/**
 * Copyright 2023 Huawei Technologies Co., Ltd
 *
 * Licensed under the Apache License, Version 2.0 (the "License");
 * you may not use this file except in compliance with the License.
 * You may obtain a copy of the License at
 *
 * http://www.apache.org/licenses/LICENSE-2.0
 *
 * Unless required by applicable law or agreed to in writing, software
 * distributed under the License is distributed on an "AS IS" BASIS,
 * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
 * See the License for the specific language governing permissions and
 * limitations under the License.
 */

#ifndef MINDSPORE_LITE_TOOLS_CONVERTER_MICRO_CODER_OPCODERS_NNACL_FP16_MATMUL_FP16_CODER_H_
#define MINDSPORE_LITE_TOOLS_CONVERTER_MICRO_CODER_OPCODERS_NNACL_FP16_MATMUL_FP16_CODER_H_

#include <vector>
#include "coder/opcoders/nnacl/fp16/matmul_fp16_base_coder.h"
#include "nnacl/matmul_parameter.h"

namespace mindspore::lite::micro::nnacl {
// Concrete fp16 MatMulFusion coder: supplies A/B shape initialisation on top
// of MatMulFP16BaseCoder.  Element size is fp16 (2 bytes).
class MatMulFP16Coder final : public MatMulFP16BaseCoder {
 public:
  MatMulFP16Coder(const std::vector<Tensor *> &in_tensors, const std::vector<Tensor *> &out_tensors,
                  const LiteGraph::Node *node, size_t node_index, Target target)
      : MatMulFP16BaseCoder(in_tensors, out_tensors, node, node_index, target) {
    data_type_size_ = sizeof(uint16_t);
  }

  ~MatMulFP16Coder() override = default;

  int Prepare(CoderContext *const context) override;

  int DoCode(CoderContext *const context) override;

 private:
  int InitAShape() override;
  int InitBShape() override;
};
}  // namespace mindspore::lite::micro::nnacl
#endif  // MINDSPORE_LITE_TOOLS_CONVERTER_MICRO_CODER_OPCODERS_NNACL_FP16_MATMUL_FP16_CODER_H_
diff --git a/mindspore/lite/tools/converter/micro/coder/opcoders/nnacl/fp16/reduce_fp16_coder.cc b/mindspore/lite/tools/converter/micro/coder/opcoders/nnacl/fp16/reduce_fp16_coder.cc
new file mode 100644
index 00000000..2f289085
--- /dev/null
+++ b/mindspore/lite/tools/converter/micro/coder/opcoders/nnacl/fp16/reduce_fp16_coder.cc
@@ -0,0 +1,75 @@
/**
 * Copyright 2023 Huawei Technologies Co., Ltd
 *
 * Licensed under the Apache License, Version 2.0 (the "License");
 * you may not use this file except in compliance with the License.
 * You may obtain a copy of the License at
 *
 * http://www.apache.org/licenses/LICENSE-2.0
 *
 * Unless required by applicable law or agreed to in writing, software
 * distributed under the License is distributed on an "AS IS" BASIS,
 * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
 * See the License for the specific language governing permissions and
 * limitations under the License.
 */

#include "coder/opcoders/nnacl/fp16/reduce_fp16_coder.h"
#include "coder/opcoders/file_collector.h"

using mindspore::schema::PrimitiveType_ReduceFusion;
namespace mindspore::lite::micro::nnacl {
// Reuses the fp32 reduce coder's axis handling; only switches the working
// data type and temp buffers to fp16.
int ReduceFP16Coder::Prepare(CoderContext *const context) {
  MS_CHECK_RET_CODE(ReduceBaseCoder::Init(), "init failed");
  data_type_ = ::kNumberTypeFloat16;
  MS_CHECK_RET_CODE(ReduceBaseCoder::ReSize(), "resize failed");
  MS_CHECK_RET_CODE(ReduceFP32Coder::MallocTmpBuffer(kNumberTypeFloat16), "malloc buffer failed");
  return RET_OK;
}

// Selects the fp16 reduce kernel name for the requested mode and delegates
// the actual code emission to the inherited GenerateCode.
int ReduceFP16Coder::DoCode(CoderContext *const context) {
  Collect(context,
          {
            "nnacl/fp16/reduce_fp16.h",
          },
          {
            "reduce_fp16.c",
          });

  // call the op function
  switch (mode_) {
    case static_cast<int>(schema::ReduceMode_ReduceSum): {
      reduce_ = "ReduceSumFp16";
      break;
    }
    case static_cast<int>(schema::ReduceMode_ReduceMean): {
      reduce_ = "ReduceMeanFp16";
      break;
    }
    case static_cast<int>(schema::ReduceMode_ReduceMax): {
      reduce_ = "ReduceMaxFp16";
      break;
    }
    case static_cast<int>(schema::ReduceMode_ReduceMin): {
      reduce_ = "ReduceMinFp16";
      break;
    }
    case static_cast<int>(schema::ReduceMode_ReduceProd): {
      reduce_ = "ReduceProdFp16";
      break;
    }
    case static_cast<int>(schema::ReduceMode_ReduceL2): {
      reduce_ = "ReduceL2NormFp16";
      break;
    }
    default:
      MS_LOG(ERROR) << "Reduce unsupported reduce_ mode: " << mode_;
      return RET_ERROR;
  }
  // NOTE(review): GenerateCode's result (if it returns a status) is ignored
  // here — confirm its signature in ReduceFP32Coder.
  GenerateCode(context);
  return RET_OK;
}

REG_OPERATOR_CODER(kARM32, kNumberTypeFloat16, PrimitiveType_ReduceFusion, CPUOpCoderCreator<ReduceFP16Coder>)
REG_OPERATOR_CODER(kARM64, kNumberTypeFloat16, PrimitiveType_ReduceFusion, CPUOpCoderCreator<ReduceFP16Coder>)
}  // namespace mindspore::lite::micro::nnacl
diff --git a/mindspore/lite/tools/converter/micro/coder/opcoders/nnacl/fp16/reduce_fp16_coder.h b/mindspore/lite/tools/converter/micro/coder/opcoders/nnacl/fp16/reduce_fp16_coder.h
new file mode 100644
index 00000000..2fcf8fb4
--- /dev/null
+++ b/mindspore/lite/tools/converter/micro/coder/opcoders/nnacl/fp16/reduce_fp16_coder.h
@@ -0,0 +1,40 @@
/**
 * Copyright 2023 Huawei Technologies Co., Ltd
 *
 * Licensed under the Apache License, Version 2.0 (the "License");
 * you may not use this file except in compliance with the License.
 * You may obtain a copy of the License at
 *
 * http://www.apache.org/licenses/LICENSE-2.0
 *
 * Unless required by applicable law or agreed to in writing, software
 * distributed under the License is distributed on an "AS IS" BASIS,
 * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
 * See the License for the specific language governing permissions and
 * limitations under the License.
 */

#ifndef MINDSPORE_LITE_TOOLS_CONVERTER_MICRO_CODER_OPCODERS_NNACL_FP16_REDUCE_FP16_CODER_H_
#define MINDSPORE_LITE_TOOLS_CONVERTER_MICRO_CODER_OPCODERS_NNACL_FP16_REDUCE_FP16_CODER_H_

#include <string>
#include <vector>
#include "coder/opcoders/nnacl/fp32/reduce_fp32_coder.h"
#include "coder/opcoders/base/reduce_base_coder.h"
#include "coder/opcoders/op_coder.h"

namespace mindspore::lite::micro::nnacl {
// fp16 ReduceFusion coder: thin specialisation of the fp32 reduce coder that
// swaps in the fp16 kernels and temp buffers.
class ReduceFP16Coder final : public ReduceFP32Coder {
 public:
  ReduceFP16Coder(const std::vector<Tensor *> &in_tensors, const std::vector<Tensor *> &out_tensors,
                  const LiteGraph::Node *node, size_t node_index, Target target)
      : ReduceFP32Coder(in_tensors, out_tensors, node, node_index, target) {}

  ~ReduceFP16Coder() override = default;

  int Prepare(CoderContext *const context) override;

  int DoCode(CoderContext *const context) override;
};
}  // namespace mindspore::lite::micro::nnacl
#endif  // MINDSPORE_LITE_TOOLS_CONVERTER_MICRO_CODER_OPCODERS_NNACL_FP16_REDUCE_FP16_CODER_H_
diff --git a/mindspore/lite/tools/converter/micro/coder/opcoders/nnacl/fp16/resize_fp16_coder.cc b/mindspore/lite/tools/converter/micro/coder/opcoders/nnacl/fp16/resize_fp16_coder.cc
new file mode 100644
index 00000000..b6b07570
--- /dev/null
+++ b/mindspore/lite/tools/converter/micro/coder/opcoders/nnacl/fp16/resize_fp16_coder.cc
@@ -0,0 +1,108 @@
/**
 * Copyright 2023 Huawei Technologies Co., Ltd
 *
 * Licensed under the Apache License, Version 2.0 (the "License");
 * you may not use this file except in compliance with the License.
 * You may obtain a copy of the License at
 *
 * http://www.apache.org/licenses/LICENSE-2.0
 *
 * Unless required by applicable law or agreed to in writing, software
 * distributed under the License is distributed on an "AS IS" BASIS,
 * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
 * See the License for the specific language governing permissions and
 * limitations under the License.
 */

#include "coder/opcoders/nnacl/fp16/resize_fp16_coder.h"
#include <string>
#include <map>
#include <utility>
#include "coder/opcoders/serializers/nnacl_serializer/nnacl_fp32_serializer.h"
#include "coder/opcoders/file_collector.h"
#include "coder/opcoders/parallel.h"
#include "coder/utils/common.h"
#include "nnacl/fp32/resize_fp32.h"

using mindspore::schema::PrimitiveType_Resize;

namespace mindspore::lite::micro::nnacl {
// fp16 element size; used by the shared fp32 base when sizing buffers.
int ResizeFP16Coder::DataTypeLen() { return sizeof(uint16_t); }

// Emits the resize kernel call for the configured method.  The fp32 base
// computed coordinate tables and float weights; the weights are converted to
// fp16 here and embedded as constant arrays in the generated code.
int ResizeFP16Coder::DoCode(CoderContext *const context) {
  Collect(context,
          {
            "nnacl/fp16/resize_fp16.h",
            "nnacl/fp32/resize_fp32.h",
          },
          {
            "resize_fp16.c",
            "resize_fp32.c",
          });
  nnacl::NNaclFp32Serializer code;
  code.CodeArray("input_shape", input_tensor_->shape().data(), input_tensor_->shape().size(), true);
  code.CodeArray("output_shape", output_tensor_->shape().data(), output_tensor_->shape().size(), true);
  // Convert the precomputed float interpolation weights to fp16 once, at
  // code-generation time.
  std::vector<uint16_t> y_weights(y_weight_len_);
  Float32ToFp16(y_weights_, y_weights.data(), y_weight_len_);
  std::vector<uint16_t> x_weights(x_weight_len_);
  Float32ToFp16(x_weights_, x_weights.data(), x_weight_len_);
  // Single-thread micro codegen: kDefaultTaskId/kDefaultThreadNum partition
  // the output rows [h_begin, h_end).
  int unit = UP_DIV(new_height_, kDefaultThreadNum);
  int h_begin = unit * kDefaultTaskId;
  int h_end = std::min(h_begin + unit, new_height_);
  int channel = input_tensor_->Channel();

  switch (method_) {
    case static_cast<int>(schema::ResizeMethod_LINEAR): {
      code.CodeArray("y_bottoms", coordinate_.y_bottoms_, y_len_, true);
      code.CodeArray("y_tops", coordinate_.y_tops_, y_len_, true);
      code.CodeArray("x_lefts", coordinate_.x_lefts_, x_len_, true);
      code.CodeArray("x_rights", coordinate_.x_rights_, x_len_, true);
      code.CodeArray("y_weights", y_weights.data(), y_weight_len_, true);
      code.CodeArray("x_weights", x_weights.data(), x_weight_len_, true);

      code.CodeFunction("PrepareResizeBilinearFp16", "input_shape", "output_shape", calculate_str_, "(int *)y_bottoms",
                        "(int *)y_tops", "(int *)x_lefts", "(int *)x_rights", "(float16_t *)y_weights",
                        "(float16_t *)x_weights");
      // Two scratch lines per task for the bilinear row interpolation.
      code << " float16_t *line0 = (float16_t *)" << MemoryAllocator::GetInstance()->GetRuntimeAddr(line_buffer_)
           << " + " << new_width_ << " * 2 * " << kDefaultTaskId << ";\n";
      code << " float16_t *line1 = line0 + " << new_width_ << " * " << channel << ";\n";
      code.CodeFunction("ResizeBilinearFp16", input_tensor_, output_tensor_, "input_shape", "output_shape", "y_bottoms",
                        "y_tops", "x_lefts", "x_rights", "(float16_t *)y_weights", "(float16_t *)x_weights", "line0",
                        "line1", h_begin, h_end);
      break;
    }
    case static_cast<int>(schema::ResizeMethod_NEAREST): {
      code.CodeFunction("ResizeNearestNeighborFp16", input_tensor_, output_tensor_, "input_shape", "output_shape",
                        calculate_str_, coordinate_transform_mode_, kDefaultTaskId, kDefaultThreadNum);
      break;
    }
    case static_cast<int>(schema::ResizeMethod_CUBIC): {
      code.CodeArray("y_tops", coordinate_.y_tops_, y_len_, true);
      code.CodeArray("x_lefts", coordinate_.x_lefts_, x_len_, true);
      code.CodeArray("y_weights", y_weights.data(), y_weight_len_, true);
      code.CodeArray("x_weights", x_weights.data(), x_weight_len_, true);
      auto resize_parameter = reinterpret_cast<ResizeParameter *>(parameter_);
      MS_CHECK_PTR(resize_parameter);
      auto cubic_coeff_str = "(float16_t)" + std::to_string(resize_parameter->cubic_coeff_);
      code.CodeFunction("PrepareResizeBicubicFp16", "input_shape", "output_shape", calculate_str_, "(int *)y_tops",
                        "(int *)x_lefts", "(float16_t *)y_weights", "(float16_t *)x_weights", cubic_coeff_str);
      // Bicubic uses 4 scratch lines per task.
      auto buffer_str = "(float16_t *)" + MemoryAllocator::GetInstance()->GetRuntimeAddr(line_buffer_) + " + " +
                        std::to_string(new_width_ * channel * 4 * kDefaultTaskId);

      code.CodeFunction("ResizeBicubicFp16", input_tensor_, output_tensor_, "input_shape", "output_shape", "y_tops",
                        "x_lefts", "(float16_t *)y_weights", "(float16_t *)x_weights", buffer_str, h_begin, h_end);
      break;
    }
    default: {
      MS_LOG(ERROR) << "Resize unknown method " << method_;
      return RET_ERROR;
    }
  }

  context->AppendCode(code.str());
  return RET_OK;
}

REG_OPERATOR_CODER(kARM32, kNumberTypeFloat16, PrimitiveType_Resize, CPUOpCoderCreator<ResizeFP16Coder>)
REG_OPERATOR_CODER(kARM64, kNumberTypeFloat16, PrimitiveType_Resize, CPUOpCoderCreator<ResizeFP16Coder>)
}  // namespace mindspore::lite::micro::nnacl
diff --git a/mindspore/lite/tools/converter/micro/coder/opcoders/nnacl/fp16/resize_fp16_coder.h b/mindspore/lite/tools/converter/micro/coder/opcoders/nnacl/fp16/resize_fp16_coder.h
new file mode 100644
index 00000000..0a050f59
--- /dev/null
+++ b/mindspore/lite/tools/converter/micro/coder/opcoders/nnacl/fp16/resize_fp16_coder.h
@@ -0,0 +1,41 @@
/**
 * Copyright 2023 Huawei Technologies Co., Ltd
 *
 * Licensed under the Apache License, Version 2.0 (the "License");
 * you may not use this file except in compliance with the License.
 * You may obtain a copy of the License at
 *
 * http://www.apache.org/licenses/LICENSE-2.0
 *
 * Unless required by applicable law or agreed to in writing, software
 * distributed under the License is distributed on an "AS IS" BASIS,
 * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
 * See the License for the specific language governing permissions and
 * limitations under the License.
 */

#ifndef MINDSPORE_LITE_TOOLS_CONVERTER_MICRO_CODER_OPCODERS_NNACL_FP16_RESIZE_FP16_CODER_H_
#define MINDSPORE_LITE_TOOLS_CONVERTER_MICRO_CODER_OPCODERS_NNACL_FP16_RESIZE_FP16_CODER_H_

#include "coder/opcoders/nnacl/fp32/resize_fp32_coder.h"
#include <vector>
#include <algorithm>
#include <string>
#include "include/errorcode.h"
#include "src/runtime/kernel_exec.h"
#include "nnacl/base/cast_base.h"

namespace mindspore::lite::micro::nnacl {
// fp16 Resize coder: reuses the fp32 base's coordinate/weight preparation and
// overrides only the element size and the kernel emission.
class ResizeFP16Coder : public ResizeFP32Coder {
 public:
  ResizeFP16Coder(const std::vector<Tensor *> &in_tensors, const std::vector<Tensor *> &out_tensors,
                  const LiteGraph::Node *node, size_t node_index, Target target)
      : ResizeFP32Coder(in_tensors, out_tensors, node, node_index, target) {}
  ~ResizeFP16Coder() override { FreeTmpBuffer(); };
  int DoCode(CoderContext *const context) override;

 private:
  int DataTypeLen() override;
};
}  // namespace mindspore::lite::micro::nnacl
#endif  // MINDSPORE_LITE_TOOLS_CONVERTER_MICRO_CODER_OPCODERS_NNACL_FP16_RESIZE_FP16_CODER_H_
diff --git a/mindspore/lite/tools/converter/micro/coder/opcoders/nnacl/fp16/transpose_fp16_coder.cc b/mindspore/lite/tools/converter/micro/coder/opcoders/nnacl/fp16/transpose_fp16_coder.cc
new file mode 100644
index 00000000..cddcac53
--- /dev/null
+++ b/mindspore/lite/tools/converter/micro/coder/opcoders/nnacl/fp16/transpose_fp16_coder.cc
@@ -0,0
+1,140 @@ 1869+/** 1870+ * Copyright 2023 Huawei Technologies Co., Ltd 1871+ * 1872+ * Licensed under the Apache License, Version 2.0 (the "License"); 1873+ * you may not use this file except in compliance with the License. 1874+ * You may obtain a copy of the License at 1875+ * 1876+ * http://www.apache.org/licenses/LICENSE-2.0 1877+ * 1878+ * Unless required by applicable law or agreed to in writing, software 1879+ * distributed under the License is distributed on an "AS IS" BASIS, 1880+ * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. 1881+ * See the License for the specific language governing permissions and 1882+ * limitations under the License. 1883+ */ 1884+ 1885+#include "coder/opcoders/nnacl/fp16/transpose_fp16_coder.h" 1886+#include <vector> 1887+#include <unordered_set> 1888+#include "coder/opcoders/serializers/nnacl_serializer/nnacl_fp32_serializer.h" 1889+#include "coder/opcoders/file_collector.h" 1890+#include "coder/opcoders/parallel.h" 1891+#include "coder/utils/common.h" 1892+ 1893+using mindspore::schema::PrimitiveType_Transpose; 1894+namespace mindspore::lite::micro::nnacl { 1895+int TransposeFp16Coder::Prepare(CoderContext *const context) { 1896+ if (input_tensor_->data_type() != kNumberTypeFloat16) { 1897+ MS_LOG(INFO) << "Input tensor data type is invalid"; 1898+ return lite::RET_INPUT_PARAM_INVALID; 1899+ } 1900+ MS_CHECK_RET_CODE(Init(), "init failed"); 1901+ return RET_OK; 1902+} 1903+ 1904+int TransposeFp16Coder::ResetStatus() { 1905+ param_->num_axes_ = 0; 1906+ if (input_tensors_.size() == C2NUM) { 1907+ param_->num_axes_ = input_tensors_[SECOND_INPUT]->ElementsNum(); 1908+ } 1909+ auto in_shape = input_tensors_[FIRST_INPUT]->shape(); 1910+ if (in_shape.size() > MAX_TRANSPOSE_DIM_SIZE) { 1911+ MS_LOG(ERROR) << "input shape out of range."; 1912+ return RET_ERROR; 1913+ } 1914+ int trans_nd[MAX_TRANSPOSE_DIM_SIZE] = {0, 2, 1}; 1915+ int *perm_data{nullptr}; 1916+ if (in_shape.size() != 
static_cast<size_t>(param_->num_axes_)) { 1917+ perm_data = trans_nd; 1918+ if (in_shape.size() == C3NUM && param_->num_axes_ == C4NUM) { 1919+ param_->num_axes_ = C3NUM; 1920+ } 1921+ if (param_->num_axes_ == 0) { 1922+ for (int i = 0; i < static_cast<int>(in_shape.size()); ++i) { 1923+ trans_nd[i] = static_cast<int>(in_shape.size()) - 1 - i; 1924+ } 1925+ param_->num_axes_ = static_cast<int>(in_shape.size()); 1926+ } 1927+ } else { 1928+ MS_ASSERT(input_tensors_.size() == C2NUM); 1929+ auto perm_tensor = input_tensors_.at(SECOND_INPUT); 1930+ if (perm_tensor->data_type() != kNumberTypeInt32) { 1931+ MS_LOG(ERROR) << "Unsupported type id: " << perm_tensor->data_type() << " of perm tensor."; 1932+ return RET_ERROR; 1933+ } 1934+ perm_data = reinterpret_cast<int *>(perm_tensor->data()); 1935+ MSLITE_CHECK_PTR(perm_data); 1936+ std::vector<int> perm(perm_data, perm_data + input_tensors_[SECOND_INPUT]->ElementsNum()); 1937+ if (perm.size() != std::unordered_set<int>(perm.cbegin(), perm.cend()).size()) { 1938+ MS_LOG(ERROR) << "Invalid perm, the same element exits in perm."; 1939+ return RET_ERROR; 1940+ } 1941+ } 1942+ MS_CHECK_TRUE_MSG(param_->num_axes_ <= MAX_TRANSPOSE_DIM_SIZE, RET_ERROR, "transpose perm is invalid."); 1943+ for (int i = 0; i < param_->num_axes_; ++i) { 1944+ param_->perm_[i] = perm_data[i]; 1945+ } 1946+ return RET_OK; 1947+} 1948+ 1949+int TransposeFp16Coder::ComputeOfflineInfo() { 1950+ auto in_shape = input_tensor_->shape(); 1951+ auto out_shape = output_tensor_->shape(); 1952+ param_->strides_[param_->num_axes_ - 1] = 1; 1953+ param_->out_strides_[param_->num_axes_ - 1] = 1; 1954+ param_->data_num_ = input_tensor_->ElementsNum(); 1955+ for (int i = param_->num_axes_ - 2; i >= 0; i--) { 1956+ param_->strides_[i] = in_shape.at(i + 1) * param_->strides_[i + 1]; 1957+ param_->out_strides_[i] = out_shape.at(i + 1) * param_->out_strides_[i + 1]; 1958+ } 1959+ return RET_OK; 1960+} 1961+ 1962+int TransposeFp16Coder::Resize() { 1963+ auto ret = 
ResetStatus(); 1964+ if (ret != RET_OK) { 1965+ MS_LOG(ERROR) << "Do transpose reset failed."; 1966+ return ret; 1967+ } 1968+ if (input_tensors_[FIRST_INPUT]->shape().size() != static_cast<size_t>(param_->num_axes_)) { 1969+ return RET_OK; 1970+ } 1971+ ret = ComputeOfflineInfo(); 1972+ if (ret != RET_OK) { 1973+ MS_LOG(ERROR) << "Do compute transpose offline info failed."; 1974+ return ret; 1975+ } 1976+ thread_num_ = 1; 1977+ return RET_OK; 1978+} 1979+ 1980+int TransposeFp16Coder::DoCode(CoderContext *const context) { 1981+ Collect(context, 1982+ { 1983+ "nnacl/transpose.h", 1984+ "nnacl/errorcode.h", 1985+ "nnacl/fp16/transpose_fp16.h", 1986+ }, 1987+ { 1988+ "transpose_fp16.c", 1989+ }); 1990+ 1991+ NNaclFp32Serializer code; 1992+ if (input_tensor_->data() != output_tensor_->data()) { 1993+ code.CodeFunction("memcpy", output_tensor_, input_tensor_, input_tensor_->Size()); 1994+ context->AppendCode(code.str()); 1995+ } 1996+ 1997+ auto out_shape = output_tensor_->shape(); 1998+ dims_ = static_cast<int>(out_shape.size()); 1999+ code.CodeArray("output_shape", out_shape.data(), dims_, true); 2000+ code.CodeStruct("trans_param", *param_); 2001+ code.CodeFunction("DoTransposeFp16", input_tensor_, output_tensor_, "output_shape", "&trans_param"); 2002+ context->AppendCode(code.str()); 2003+ return RET_OK; 2004+} 2005+ 2006+REG_OPERATOR_CODER(kARM32, kNumberTypeFloat16, PrimitiveType_Transpose, CPUOpCoderCreator<TransposeFp16Coder>) 2007+REG_OPERATOR_CODER(kARM64, kNumberTypeFloat16, PrimitiveType_Transpose, CPUOpCoderCreator<TransposeFp16Coder>) 2008+} // namespace mindspore::lite::micro::nnacl 2009diff --git a/mindspore/lite/tools/converter/micro/coder/opcoders/nnacl/fp16/transpose_fp16_coder.h b/mindspore/lite/tools/converter/micro/coder/opcoders/nnacl/fp16/transpose_fp16_coder.h 2010new file mode 100644 2011index 00000000..240c470e 2012--- /dev/null 2013+++ b/mindspore/lite/tools/converter/micro/coder/opcoders/nnacl/fp16/transpose_fp16_coder.h 2014@@ -0,0 +1,43 @@ 
2015+/** 2016+ * Copyright 2023 Huawei Technologies Co., Ltd 2017+ * 2018+ * Licensed under the Apache License, Version 2.0 (the "License"); 2019+ * you may not use this file except in compliance with the License. 2020+ * You may obtain a copy of the License at 2021+ * 2022+ * http://www.apache.org/licenses/LICENSE-2.0 2023+ * 2024+ * Unless required by applicable law or agreed to in writing, software 2025+ * distributed under the License is distributed on an "AS IS" BASIS, 2026+ * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. 2027+ * See the License for the specific language governing permissions and 2028+ * limitations under the License. 2029+ */ 2030+ 2031+#ifndef MINDSPORE_LITE_TOOLS_CONVERTER_MICRO_CODER_OPCODERS_NNACL_FP16_TRANSPOSE_FP16_CODER_H_ 2032+#define MINDSPORE_LITE_TOOLS_CONVERTER_MICRO_CODER_OPCODERS_NNACL_FP16_TRANSPOSE_FP16_CODER_H_ 2033+#include <vector> 2034+#include <string> 2035+#include "coder/opcoders/nnacl/fp32/transpose_fp32_coder.h" 2036+#include "nnacl/transpose.h" 2037+namespace mindspore::lite::micro::nnacl { 2038+class TransposeFp16Coder final : public TransposeFp32Coder { 2039+ public: 2040+ TransposeFp16Coder(const std::vector<Tensor *> &in_tensors, const std::vector<Tensor *> &out_tensors, 2041+ const LiteGraph::Node *node, size_t node_index, Target target) 2042+ : TransposeFp32Coder(in_tensors, out_tensors, node, node_index, target) {} 2043+ 2044+ ~TransposeFp16Coder() override = default; 2045+ 2046+ int Prepare(CoderContext *const context) override; 2047+ 2048+ int Resize() override; 2049+ 2050+ int DoCode(CoderContext *const context) override; 2051+ 2052+ private: 2053+ int ResetStatus(); 2054+ int ComputeOfflineInfo(); 2055+}; 2056+} // namespace mindspore::lite::micro::nnacl 2057+#endif // MINDSPORE_LITE_TOOLS_CONVERTER_MICRO_CODER_OPCODERS_NNACL_FP16_TRANSPOSE_FP16_CODER_H_ 2058diff --git a/mindspore/lite/tools/converter/micro/coder/opcoders/nnacl/fp32/activation_fp32_coder.cc 
b/mindspore/lite/tools/converter/micro/coder/opcoders/nnacl/fp32/activation_fp32_coder.cc 2059index 35fc1819..edc442e9 100644 2060--- a/mindspore/lite/tools/converter/micro/coder/opcoders/nnacl/fp32/activation_fp32_coder.cc 2061+++ b/mindspore/lite/tools/converter/micro/coder/opcoders/nnacl/fp32/activation_fp32_coder.cc 2062@@ -14,9 +14,7 @@ 2063 * limitations under the License. 2064 */ 2065 #include "coder/opcoders/nnacl/fp32/activation_fp32_coder.h" 2066-#include <string> 2067 #include "nnacl/fp32/activation_fp32.h" 2068-#include "nnacl/op_base.h" 2069 #include "coder/opcoders/serializers/nnacl_serializer/nnacl_fp32_serializer.h" 2070 #include "coder/opcoders/file_collector.h" 2071 #include "coder/opcoders/parallel.h" 2072@@ -65,9 +63,15 @@ int ActivationFP32Coder::DoCode(CoderContext *const context) { 2073 case schema::ActivationType_HSWISH: 2074 code.CodeFunction("HSwish", input_tensor_, count, output_tensor_); 2075 break; 2076+ case schema::ActivationType_SWISH: 2077+ code.CodeFunction("Swish", input_tensor_, count, output_tensor_); 2078+ break; 2079 case schema::ActivationType_HSIGMOID: 2080 code.CodeFunction("HSigmoid", input_tensor_, count, output_tensor_); 2081 break; 2082+ case schema::ActivationType_ELU: 2083+ code.CodeFunction("Elu", input_tensor_, count, output_tensor_, activation_parameter->alpha_); 2084+ break; 2085 default: 2086 MS_LOG(ERROR) << "Activation type error"; 2087 return RET_ERROR; 2088diff --git a/mindspore/lite/tools/converter/micro/coder/opcoders/nnacl/fp32/activation_fp32_coder.h b/mindspore/lite/tools/converter/micro/coder/opcoders/nnacl/fp32/activation_fp32_coder.h 2089index 67be7e6d..f688d4bd 100644 2090--- a/mindspore/lite/tools/converter/micro/coder/opcoders/nnacl/fp32/activation_fp32_coder.h 2091+++ b/mindspore/lite/tools/converter/micro/coder/opcoders/nnacl/fp32/activation_fp32_coder.h 2092@@ -21,7 +21,7 @@ 2093 #include "coder/opcoders/op_coder.h" 2094 2095 namespace mindspore::lite::micro::nnacl { 2096-class 
ActivationFP32Coder final : public OperatorCoder { 2097+class ActivationFP32Coder : public OperatorCoder { 2098 public: 2099 ActivationFP32Coder(const std::vector<Tensor *> &in_tensors, const std::vector<Tensor *> &out_tensors, 2100 const LiteGraph::Node *node, size_t node_index, Target target) 2101diff --git a/mindspore/lite/tools/converter/micro/coder/opcoders/nnacl/fp32/arithmetic_fp32_coder.cc b/mindspore/lite/tools/converter/micro/coder/opcoders/nnacl/fp32/arithmetic_fp32_coder.cc 2102index d7cc8726..49e53cf9 100644 2103--- a/mindspore/lite/tools/converter/micro/coder/opcoders/nnacl/fp32/arithmetic_fp32_coder.cc 2104+++ b/mindspore/lite/tools/converter/micro/coder/opcoders/nnacl/fp32/arithmetic_fp32_coder.cc 2105@@ -27,8 +27,8 @@ std::string wrap_uint8(const std::string &a) { return "(uint8_t *)(" + a + ")"; 2106 std::string wrap_offset(const std::string &a, int offset) { return "(" + a + "+" + std::to_string(offset) + ")"; } 2107 } // namespace 2108 2109-void ArithmeticFP32Coder::InitRunFunction(int primitive_type) { 2110- ARITHMETIC_FUNC_INFO_FP32 fun_table[] = { 2111+void ArithmeticFP32Coder::InitFunTable() { 2112+ fun_table_ = { 2113 {PrimitiveType_MulFusion, schema::ActivationType_RELU, "ElementMulRelu", "ElementMulReluInt", "", 2114 "ElementOptMulRelu", "ElementOptMulReluInt"}, 2115 {PrimitiveType_MulFusion, schema::ActivationType_RELU6, "ElementMulRelu6", "ElementMulRelu6Int", "", 2116@@ -63,21 +63,23 @@ void ArithmeticFP32Coder::InitRunFunction(int primitive_type) { 2117 "ElementOptModInt"}, 2118 {PrimitiveType_SquaredDifference, schema::ActivationType_NO_ACTIVATION, "ElementSquaredDifference", "", "", "", 2119 ""}}; 2120+} 2121 2122- size_t length = sizeof(fun_table) / sizeof(ARITHMETIC_FUNC_INFO_FP32); 2123- for (size_t i = 0; i < length; i++) { 2124- if (fun_table[i].primitive_type_ == primitive_type && 2125- fun_table[i].activation_type_ == arithmetic_parameter_->activation_type_) { 2126- arithmetic_run_ = fun_table[i].func_; 2127- 
arithmetic_run_int_ = fun_table[i].int_func_; 2128- arithmetic_run_bool_ = fun_table[i].bool_func_; 2129- arithmetic_opt_run_ = fun_table[i].opt_func_; 2130- arithmetic_opt_run_int_ = fun_table[i].opt_int_func_; 2131+void ArithmeticFP32Coder::InitRunFunction(int primitive_type) { 2132+ InitFunTable(); 2133+ for (size_t i = 0; i < fun_table_.size(); i++) { 2134+ if (fun_table_[i].primitive_type_ == primitive_type && 2135+ fun_table_[i].activation_type_ == arithmetic_parameter_->activation_type_) { 2136+ arithmetic_run_ = fun_table_[i].func_; 2137+ arithmetic_run_int_ = fun_table_[i].int_func_; 2138+ arithmetic_run_bool_ = fun_table_[i].bool_func_; 2139+ arithmetic_opt_run_ = fun_table_[i].opt_func_; 2140+ arithmetic_opt_run_int_ = fun_table_[i].opt_int_func_; 2141 } 2142 } 2143 TypeId input_type_id = input_tensor_->data_type(); 2144 data_type_len_ = lite::DataTypeSize(input_tensor_->data_type()); 2145- if (input_type_id == kNumberTypeFloat32 || input_type_id == kNumberTypeFloat) { 2146+ if (input_type_id == kNumberTypeFloat32 || input_type_id == kNumberTypeFloat || input_type_id == kNumberTypeFloat16) { 2147 arithmetic_func_type_ = kArithmeticFuncFloat; 2148 } else if (input_type_id == kNumberTypeBool) { 2149 arithmetic_func_type_ = kArithmeticFuncBool; 2150@@ -122,7 +124,8 @@ int ArithmeticFP32Coder::CheckDataType() { 2151 } 2152 2153 void ArithmeticFP32Coder::ChooseArithmeticFunc(bool is_opt) { 2154- if (input_tensor_->data_type() == kNumberTypeFloat32) { 2155+ if (input_tensor_->data_type() == kNumberTypeFloat32 || input_tensor_->data_type() == kNumberTypeFloat || 2156+ input_tensor_->data_type() == kNumberTypeFloat16) { 2157 if (is_opt) { 2158 arithmetic_func_str_ = wrap_void(arithmetic_opt_run_); 2159 } else { 2160@@ -204,13 +207,8 @@ int ArithmeticFP32Coder::ConstTensorBroadCast(CoderContext *const context) { 2161 } 2162 FreeConstTileBuff(); 2163 NNaclFp32Serializer init_code; 2164- Collect(context, 2165- { 2166- "wrapper/fp32/arithmetic_fp32_wrapper.h", 2167- 
}, 2168- { 2169- "arithmetic_fp32_wrapper.c", 2170- }); 2171+ Collect(context, {"wrapper/fp32/arithmetic_fp32_wrapper.h", "nnacl/fp32/arithmetic_fp32.h"}, 2172+ {"arithmetic_fp32_wrapper.c", "arithmetic_fp32.c"}); 2173 if (input_tensor_->IsConst() && 2174 arithmetic_parameter_->in_elements_num0_ != arithmetic_parameter_->out_elements_num_) { 2175 input0_ptr_ = reinterpret_cast<float *>( 2176diff --git a/mindspore/lite/tools/converter/micro/coder/opcoders/nnacl/fp32/arithmetic_fp32_coder.h b/mindspore/lite/tools/converter/micro/coder/opcoders/nnacl/fp32/arithmetic_fp32_coder.h 2177index e1ec51fe..169ed457 100644 2178--- a/mindspore/lite/tools/converter/micro/coder/opcoders/nnacl/fp32/arithmetic_fp32_coder.h 2179+++ b/mindspore/lite/tools/converter/micro/coder/opcoders/nnacl/fp32/arithmetic_fp32_coder.h 2180@@ -66,7 +66,7 @@ using mindspore::schema::PrimitiveType_Minimum; 2181 2182 using mindspore::schema::PrimitiveType_Mod; 2183 2184-class ArithmeticFP32Coder final : public OperatorCoder { 2185+class ArithmeticFP32Coder : public OperatorCoder { 2186 typedef struct { 2187 int primitive_type_; 2188 int activation_type_; 2189@@ -88,14 +88,7 @@ class ArithmeticFP32Coder final : public OperatorCoder { 2190 2191 int DoCode(CoderContext *const context) override; 2192 2193- private: 2194- int ReSize(CoderContext *const context); 2195- 2196- int ExecuteCode(const std::string &input0, const std::string &input1, const std::string &output, int size, 2197- bool is_opt, CoderContext *const context, NNaclFp32Serializer *const code); 2198- 2199- void InitRunFunction(int primitive_type); 2200- 2201+ protected: 2202 int CheckDataType(); 2203 2204 void ChooseArithmeticFunc(bool is_opt); 2205@@ -108,6 +101,16 @@ class ArithmeticFP32Coder final : public OperatorCoder { 2206 2207 void FreeConstTileBuff(); 2208 2209+ virtual void InitFunTable(); 2210+ 2211+ virtual int ReSize(CoderContext *const context); 2212+ 2213+ virtual void InitRunFunction(int primitive_type); 2214+ 2215+ private: 
2216+ int ExecuteCode(const std::string &input0, const std::string &input1, const std::string &output, int size, 2217+ bool is_opt, CoderContext *const context, NNaclFp32Serializer *const code); 2218+ 2219 int ConstTensorBroadCast(CoderContext *const context); 2220 2221 void ComputeInOutStrides(); 2222@@ -121,7 +124,9 @@ class ArithmeticFP32Coder final : public OperatorCoder { 2223 2224 void CollectFilesForFunc(CoderContext *const context); 2225 2226- private: 2227+ protected: 2228+ std::vector<ARITHMETIC_FUNC_INFO_FP32> fun_table_; 2229+ 2230 int break_pos_{0}; 2231 2232 int outside_{0}; 2233@@ -148,10 +153,6 @@ class ArithmeticFP32Coder final : public OperatorCoder { 2234 2235 Tensor *filter_tensor_{nullptr}; 2236 2237- ArithmeticFuncType arithmetic_func_type_{kArithmeticFuncUnknow}; 2238- 2239- ArithmeticWrapperInfo arithmetic_wrapper_info_{}; 2240- 2241 std::string input0_ptr_str_; 2242 2243 std::string input1_ptr_str_; 2244@@ -169,6 +170,11 @@ class ArithmeticFP32Coder final : public OperatorCoder { 2245 std::string arithmetic_run_bool_; 2246 2247 std::string arithmetic_func_str_; 2248+ 2249+ private: 2250+ ArithmeticFuncType arithmetic_func_type_{kArithmeticFuncUnknow}; 2251+ 2252+ ArithmeticWrapperInfo arithmetic_wrapper_info_{}; 2253 }; 2254 } // namespace mindspore::lite::micro::nnacl 2255 #endif // MINDSPORE_LITE_TOOLS_CONVERTER_MICRO_CODER_OPCODERS_NNACL_FP32_ARITHMETIC_FP32_CODER_H_ 2256diff --git a/mindspore/lite/tools/converter/micro/coder/opcoders/nnacl/fp32/concat_fp32_coder.h b/mindspore/lite/tools/converter/micro/coder/opcoders/nnacl/fp32/concat_fp32_coder.h 2257index 67607e13..6f3f5c71 100644 2258--- a/mindspore/lite/tools/converter/micro/coder/opcoders/nnacl/fp32/concat_fp32_coder.h 2259+++ b/mindspore/lite/tools/converter/micro/coder/opcoders/nnacl/fp32/concat_fp32_coder.h 2260@@ -22,7 +22,7 @@ 2261 #include "nnacl/concat_parameter.h" 2262 2263 namespace mindspore::lite::micro::nnacl { 2264-class ConcatFP32Coder final : public OperatorCoder { 
2265+class ConcatFP32Coder : public OperatorCoder { 2266 public: 2267 ConcatFP32Coder(const std::vector<Tensor *> &in_tensors, const std::vector<Tensor *> &out_tensors, 2268 const LiteGraph::Node *node, size_t node_index, Target target) 2269diff --git a/mindspore/lite/tools/converter/micro/coder/opcoders/nnacl/fp32/exp_fp32_coder.cc b/mindspore/lite/tools/converter/micro/coder/opcoders/nnacl/fp32/exp_fp32_coder.cc 2270index 65334f4b..e9bbca19 100644 2271--- a/mindspore/lite/tools/converter/micro/coder/opcoders/nnacl/fp32/exp_fp32_coder.cc 2272+++ b/mindspore/lite/tools/converter/micro/coder/opcoders/nnacl/fp32/exp_fp32_coder.cc 2273@@ -49,7 +49,7 @@ int ExpFP32Coder::DoCode(CoderContext *ctx) { 2274 }); 2275 nnacl::NNaclFp32Serializer code; 2276 code.CodeStruct("exp_parameter", *exp_parameter_); 2277- code.CodeFunction("exp", input_tensor_, output_tensor_, "(ExpParameter *)&exp_parameter", kDefaultTaskId); 2278+ code.CodeFunction("ExpFusionFp32", input_tensor_, output_tensor_, "(ExpParameter *)&exp_parameter", kDefaultTaskId); 2279 ctx->AppendCode(code.str()); 2280 return RET_OK; 2281 } 2282diff --git a/mindspore/lite/tools/converter/micro/coder/opcoders/nnacl/fp32/gather_fp32_coder.cc b/mindspore/lite/tools/converter/micro/coder/opcoders/nnacl/fp32/gather_fp32_coder.cc 2283index 087d4dde..3c31479c 100644 2284--- a/mindspore/lite/tools/converter/micro/coder/opcoders/nnacl/fp32/gather_fp32_coder.cc 2285+++ b/mindspore/lite/tools/converter/micro/coder/opcoders/nnacl/fp32/gather_fp32_coder.cc 2286@@ -94,4 +94,6 @@ int GatherFP32Coder::DoCode(CoderContext *context) { 2287 } 2288 2289 REG_OPERATOR_CODER(kAllTargets, kNumberTypeFloat32, PrimitiveType_Gather, CPUOpCoderCreator<GatherFP32Coder>) 2290+REG_OPERATOR_CODER(kAllTargets, kNumberTypeInt32, PrimitiveType_Gather, CPUOpCoderCreator<GatherFP32Coder>) 2291+REG_OPERATOR_CODER(kAllTargets, kNumberTypeFloat16, PrimitiveType_Gather, CPUOpCoderCreator<GatherFP32Coder>) 2292 } // namespace mindspore::lite::micro::nnacl 
2293diff --git a/mindspore/lite/tools/converter/micro/coder/opcoders/nnacl/fp32/layernorm_fp32_coder.cc b/mindspore/lite/tools/converter/micro/coder/opcoders/nnacl/fp32/layernorm_fp32_coder.cc 2294new file mode 100644 2295index 00000000..992a58e4 2296--- /dev/null 2297+++ b/mindspore/lite/tools/converter/micro/coder/opcoders/nnacl/fp32/layernorm_fp32_coder.cc 2298@@ -0,0 +1,81 @@ 2299+/** 2300+ * Copyright 2023 Huawei Technologies Co., Ltd 2301+ * 2302+ * Licensed under the Apache License, Version 2.0 (the "License"); 2303+ * you may not use this file except in compliance with the License. 2304+ * You may obtain a copy of the License at 2305+ * 2306+ * http://www.apache.org/licenses/LICENSE-2.0 2307+ * 2308+ * Unless required by applicable law or agreed to in writing, software 2309+ * distributed under the License is distributed on an "AS IS" BASIS, 2310+ * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. 2311+ * See the License for the specific language governing permissions and 2312+ * limitations under the License. 2313+ */ 2314+#include "coder/opcoders/nnacl/fp32/layernorm_fp32_coder.h" 2315+#include "coder/opcoders/serializers/nnacl_serializer/nnacl_fp32_serializer.h" 2316+#include "coder/opcoders/file_collector.h" 2317+#include "coder/opcoders/parallel.h" 2318+ 2319+using mindspore::schema::PrimitiveType_LayerNormFusion; 2320+ 2321+namespace mindspore::lite::micro::nnacl { 2322+namespace { 2323+constexpr size_t kOutputNum = 3; 2324+} 2325+int LayerNormFP32Coder::Prepare(CoderContext *const context) { 2326+ param_ = reinterpret_cast<LayerNormParameter *>(parameter_); 2327+ param_->op_parameter_.thread_num_ = 1; 2328+ auto shape = input_tensor_->shape(); 2329+ param_->begin_norm_axis_ = param_->begin_norm_axis_ >= 0 ? param_->begin_norm_axis_ 2330+ : param_->begin_norm_axis_ + static_cast<int>(shape.size()); 2331+ param_->begin_params_axis_ = param_->begin_params_axis_ >= 0 2332+ ? 
param_->begin_params_axis_ 2333+ : param_->begin_params_axis_ + static_cast<int>(shape.size()); 2334+ MS_CHECK_LT(param_->begin_norm_axis_, static_cast<int>(shape.size()), RET_ERROR); 2335+ MS_CHECK_LT(param_->begin_params_axis_, static_cast<int>(shape.size()), RET_ERROR); 2336+ param_->norm_outer_size_ = 1; 2337+ for (int i = 0; i < param_->begin_norm_axis_; ++i) { 2338+ MS_CHECK_FALSE_MSG(INT_MUL_OVERFLOW(param_->norm_outer_size_, shape.at(i)), RET_ERROR, "mul overflow."); 2339+ param_->norm_outer_size_ *= shape.at(i); 2340+ } 2341+ param_->norm_inner_size_ = 1; 2342+ for (size_t i = param_->begin_norm_axis_; i < shape.size(); ++i) { 2343+ MS_CHECK_FALSE_MSG(INT_MUL_OVERFLOW(param_->norm_inner_size_, shape.at(i)), RET_ERROR, "mul overflow."); 2344+ param_->norm_inner_size_ *= shape.at(i); 2345+ } 2346+ param_->params_outer_size_ = 1; 2347+ for (int i = 0; i < param_->begin_params_axis_; ++i) { 2348+ MS_CHECK_FALSE_MSG(INT_MUL_OVERFLOW(param_->params_outer_size_, shape.at(i)), RET_ERROR, "mul overflow."); 2349+ param_->params_outer_size_ *= shape.at(i); 2350+ } 2351+ param_->params_inner_size_ = 1; 2352+ for (size_t i = param_->begin_params_axis_; i < shape.size(); ++i) { 2353+ MS_CHECK_FALSE_MSG(INT_MUL_OVERFLOW(param_->params_inner_size_, shape.at(i)), RET_ERROR, "mul overflow."); 2354+ param_->params_inner_size_ *= shape.at(i); 2355+ } 2356+ return RET_OK; 2357+} 2358+ 2359+int LayerNormFP32Coder::DoCode(CoderContext *const context) { 2360+ NNaclFp32Serializer code; 2361+ code.CodeStruct("layer_norm_parm", *param_); 2362+ Collect(context, {"nnacl/fp32/layer_norm_fp32.h"}, {"layer_norm_fp32.c"}); 2363+ if (output_tensors_.size() == kOutputNum) { 2364+ code.CodeFunction("LayerNorm", input_tensor_, input_tensors_.at(SECOND_INPUT), input_tensors_.at(THIRD_INPUT), 2365+ output_tensor_, output_tensors_.at(SECOND_INPUT), output_tensors_.at(THIRD_INPUT), 2366+ "&layer_norm_parm", 0); 2367+ } else if (output_tensors_.size() == 1) { 2368+ code.CodeFunction("LayerNorm", 
input_tensor_, input_tensors_.at(SECOND_INPUT), input_tensors_.at(THIRD_INPUT), 2369+ output_tensor_, "NULL", "NULL", "&layer_norm_parm", 0); 2370+ } else { 2371+ return RET_ERROR; 2372+ } 2373+ context->AppendCode(code.str()); 2374+ return RET_OK; 2375+} 2376+ 2377+REG_OPERATOR_CODER(kAllTargets, kNumberTypeFloat32, PrimitiveType_LayerNormFusion, 2378+ CPUOpCoderCreator<LayerNormFP32Coder>) 2379+} // namespace mindspore::lite::micro::nnacl 2380diff --git a/mindspore/lite/tools/converter/micro/coder/opcoders/nnacl/fp32/layernorm_fp32_coder.h b/mindspore/lite/tools/converter/micro/coder/opcoders/nnacl/fp32/layernorm_fp32_coder.h 2381new file mode 100644 2382index 00000000..a14cff57 2383--- /dev/null 2384+++ b/mindspore/lite/tools/converter/micro/coder/opcoders/nnacl/fp32/layernorm_fp32_coder.h 2385@@ -0,0 +1,40 @@ 2386+/** 2387+ * Copyright 2022 Huawei Technologies Co., Ltd 2388+ * 2389+ * Licensed under the Apache License, Version 2.0 (the "License"); 2390+ * you may not use this file except in compliance with the License. 2391+ * You may obtain a copy of the License at 2392+ * 2393+ * http://www.apache.org/licenses/LICENSE-2.0 2394+ * 2395+ * Unless required by applicable law or agreed to in writing, software 2396+ * distributed under the License is distributed on an "AS IS" BASIS, 2397+ * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. 2398+ * See the License for the specific language governing permissions and 2399+ * limitations under the License. 
2400+ */ 2401+ 2402+#ifndef MINDSPORE_LITE_TOOLS_CONVERTER_MICRO_CODER_OPCODERS_NNACL_FP32_LAYERNORM_FP32_CODER_H_ 2403+#define MINDSPORE_LITE_TOOLS_CONVERTER_MICRO_CODER_OPCODERS_NNACL_FP32_LAYERNORM_FP32_CODER_H_ 2404+ 2405+#include <vector> 2406+#include "coder/opcoders/op_coder.h" 2407+#include "nnacl/layer_norm_parameter.h" 2408+ 2409+namespace mindspore::lite::micro::nnacl { 2410+class LayerNormFP32Coder : public OperatorCoder { 2411+ public: 2412+ LayerNormFP32Coder(const std::vector<Tensor *> &in_tensors, const std::vector<Tensor *> &out_tensors, 2413+ const LiteGraph::Node *node, size_t node_index, Target target) 2414+ : OperatorCoder(in_tensors, out_tensors, node, node_index, target) {} 2415+ ~LayerNormFP32Coder() override = default; 2416+ 2417+ int Prepare(CoderContext *const context) override; 2418+ 2419+ int DoCode(CoderContext *const context) override; 2420+ 2421+ protected: 2422+ LayerNormParameter *param_; 2423+}; 2424+} // namespace mindspore::lite::micro::nnacl 2425+#endif // MINDSPORE_LITE_TOOLS_CONVERTER_MICRO_CODER_OPCODERS_NNACL_FP32_LAYERNORM_FP32_CODER_H_ 2426diff --git a/mindspore/lite/tools/converter/micro/coder/opcoders/nnacl/fp32/lstm_fp32_coder.cc b/mindspore/lite/tools/converter/micro/coder/opcoders/nnacl/fp32/lstm_fp32_coder.cc 2427index 3bc8ea4b..561f6259 100644 2428--- a/mindspore/lite/tools/converter/micro/coder/opcoders/nnacl/fp32/lstm_fp32_coder.cc 2429+++ b/mindspore/lite/tools/converter/micro/coder/opcoders/nnacl/fp32/lstm_fp32_coder.cc 2430@@ -75,13 +75,6 @@ int LstmFP32Coder::InitStateWeightBias(CoderContext *const context) { 2431 w_buf_size += weight_h_size; 2432 init_code.CodeFunction("PackLstmWeight", weight_h_ptr_, weight_h, weight_batch_, lstm_param_->hidden_size_, 2433 lstm_param_->hidden_size_, lstm_param_->state_col_align_, "NULL"); 2434- } else { 2435- size_t weight_h_size = weight_h->Size(); 2436- weight_h_ptr_ = 2437- reinterpret_cast<float *>(allocator_->Malloc(kNumberTypeFloat32, weight_h->Size(), 
kOfflinePackWeight)); 2438- MS_CHECK_PTR(weight_h_ptr_); 2439- MS_CHECK_RET_CODE(memcpy_s(weight_h_ptr_, weight_h_size, weight_h->data(), weight_h_size), 2440- "copy weight h data failed"); 2441 } 2442 2443 state_bias_ = reinterpret_cast<float *>(allocator_->Malloc(kNumberTypeFloat32, kOnlineSize, kOnlinePackWeight)); 2444@@ -214,8 +207,15 @@ int LstmFP32Coder::DoCode(CoderContext *context) { 2445 code.CodeArray("buffer", buffers_addr.data(), buffers_addr.size(), false); 2446 code.CodeFunction("memcpy", output_hidden_state, hidden_state, hidden_state->Size()); 2447 code.CodeFunction("memcpy", output_cell_state, cell_state, cell_state->Size()); 2448- code.CodeFunction("Lstm", output_tensor_, input_tensor_, weight_i_ptr_, weight_h_ptr_, input_bias_, state_bias_, 2449- output_hidden_state, output_cell_state, "buffer", "&lstm_param"); 2450+ if (weight_h_ptr_ != nullptr) { 2451+ code.CodeFunction("Lstm", output_tensor_, input_tensor_, weight_i_ptr_, weight_h_ptr_, input_bias_, state_bias_, 2452+ output_hidden_state, output_cell_state, "buffer", "&lstm_param"); 2453+ } else { 2454+ auto *weight_h_tensor = input_tensors().at(kInputSize1); 2455+ auto weight_h = allocator_->GetRuntimeAddr(weight_h_tensor, weight_h_tensor->IsConst()); 2456+ code.CodeFunction("Lstm", output_tensor_, input_tensor_, weight_i_ptr_, weight_h, input_bias_, state_bias_, 2457+ output_hidden_state, output_cell_state, "buffer", "&lstm_param"); 2458+ } 2459 context->AppendCode(code.str()); 2460 return RET_OK; 2461 } 2462diff --git a/mindspore/lite/tools/converter/micro/coder/opcoders/nnacl/fp32/matmul_fp32_base_coder.cc b/mindspore/lite/tools/converter/micro/coder/opcoders/nnacl/fp32/matmul_fp32_base_coder.cc 2463index 26707a3e..790a142e 100644 2464--- a/mindspore/lite/tools/converter/micro/coder/opcoders/nnacl/fp32/matmul_fp32_base_coder.cc 2465+++ b/mindspore/lite/tools/converter/micro/coder/opcoders/nnacl/fp32/matmul_fp32_base_coder.cc 2466@@ -55,7 +55,8 @@ int MatMulFP32BaseCoder::InitBiasData() { 
2467 is_bias_broadcast_ = true; 2468 } 2469 ori_bias_pack_ptr_size_ = bias_tensor_->ElementsNum() * sizeof(float); 2470- bias_ptr_ = reinterpret_cast<float *>(allocator_->Malloc(kNumberTypeFloat32, kOnlineSize, kOnlinePackWeight)); 2471+ bias_ptr_ = allocator_->Malloc(kNumberTypeFloat32, kOnlineSize, kOnlinePackWeight, 2472+ bias_tensor_->tensor_name() + "_online_pack"); 2473 MS_CHECK_PTR(bias_ptr_); 2474 } 2475 return RET_OK; 2476@@ -84,7 +85,14 @@ int MatMulFP32BaseCoder::InitBufferA() { 2477 } 2478 a_pack_ptr_size_ = static_cast<size_t>(params_->batch * params_->row_align_ * params_->deep_ * sizeof(float)); 2479 if (params_->a_const_) { 2480- a_pack_ptr_ = reinterpret_cast<float *>(allocator_->Malloc(kNumberTypeFloat32, kOnlineSize, kOnlinePackWeight)); 2481+ a_pack_ptr_ = reinterpret_cast<float *>(allocator_->GetSharedWeightAddr(input_tensors_.at(0))); 2482+ if (a_pack_ptr_ == nullptr) { 2483+ a_pack_ptr_ = reinterpret_cast<float *>(allocator_->Malloc(kNumberTypeFloat32, kOnlineSize, kOnlinePackWeight, 2484+ input_tensors_.at(0)->tensor_name() + "_online_pack")); 2485+ allocator_->MarkSharedWeight(input_tensors_.at(0), a_pack_ptr_); 2486+ } else { 2487+ a_packed_ = true; 2488+ } 2489 } else { 2490 a_pack_ptr_ = reinterpret_cast<float *>(allocator_->Malloc(kNumberTypeFloat32, a_pack_ptr_size_, kWorkspace)); 2491 } 2492@@ -96,23 +104,30 @@ int MatMulFP32BaseCoder::InitBufferB() { 2493 if (b_pack_ptr_ != nullptr) { 2494 return RET_OK; 2495 } 2496- b_pack_ptr_size_ = static_cast<size_t>(params_->batch * params_->col_align_ * params_->deep_ * sizeof(float)); 2497+ b_pack_ptr_size_ = static_cast<size_t>(params_->batch * params_->col_align_ * params_->deep_ * data_type_size_); 2498 if (params_->b_const_) { 2499- b_pack_ptr_ = reinterpret_cast<float *>(allocator_->Malloc(kNumberTypeFloat32, kOnlineSize, kOnlinePackWeight)); 2500+ b_pack_ptr_ = reinterpret_cast<float *>(allocator_->GetSharedWeightAddr(input_tensors_.at(1))); 2501+ if (b_pack_ptr_ == nullptr) { 2502+ 
b_pack_ptr_ = reinterpret_cast<float *>(allocator_->Malloc(kNumberTypeUInt8, b_pack_ptr_size_, kOnlinePackWeight, 2503+ input_tensors_.at(1)->tensor_name() + "_online_pack")); 2504+ allocator_->MarkSharedWeight(input_tensors_.at(1), b_pack_ptr_); 2505+ } else { 2506+ b_packed_ = true; 2507+ } 2508 } else { 2509- b_pack_ptr_ = reinterpret_cast<float *>(allocator_->Malloc(kNumberTypeFloat32, b_pack_ptr_size_, kWorkspace)); 2510+ b_pack_ptr_ = reinterpret_cast<float *>(allocator_->Malloc(kNumberTypeUInt8, b_pack_ptr_size_, kWorkspace)); 2511 } 2512 MS_CHECK_PTR(b_pack_ptr_); 2513 return RET_OK; 2514 } 2515 2516 int MatMulFP32BaseCoder::InitMatrixA(const float *src_ptr) { 2517- ::InitMatrixA(src_ptr, a_pack_ptr_, params_, vec_matmul_); 2518+ ::InitMatrixA(src_ptr, static_cast<float *>(a_pack_ptr_), params_, vec_matmul_); 2519 return RET_OK; 2520 } 2521 2522 int MatMulFP32BaseCoder::InitMatrixB(const float *src_ptr) { 2523- ::InitMatrixB(src_ptr, b_pack_ptr_, params_, vec_matmul_); 2524+ ::InitMatrixB(src_ptr, static_cast<float *>(b_pack_ptr_), params_, vec_matmul_); 2525 return RET_OK; 2526 } 2527 2528@@ -179,12 +194,11 @@ int MatMulFP32BaseCoder::DoCode(CoderContext *const context) { 2529 NNaclFp32Serializer code, init_code; 2530 size_t w_buf_size = 0; 2531 std::string param_name = "mat_mul_parameter"; 2532- 2533+ std::string bias_ptr_str = "((float *)(" + allocator_->GetRuntimeAddr(bias_ptr_) + "))"; 2534 code.CodeStruct(param_name, *params_); 2535 if (support_parallel_) { 2536 code << " " << param_name << ".op_parameter_.thread_num_ = 1;\n"; 2537 } 2538- init_code.CodeStruct("mat_mul_parameter", *params_); 2539 // do bias packing to init 2540 if (input_tensors_.size() == DIMENSION_3D) { 2541 init_code.CodeBufferOffsetExpression(bias_ptr_, context->weight_name(), context->weight_offset_name(), 2542@@ -193,7 +207,6 @@ int MatMulFP32BaseCoder::DoCode(CoderContext *const context) { 2543 int max_bias_data = params_->col_align_; 2544 if (is_bias_broadcast_) { 2545 float 
broad_cast_data = (reinterpret_cast<float *>(bias_tensor_->data()))[0]; 2546- std::string bias_ptr_str = "((float *)(" + allocator_->GetRuntimeAddr(bias_ptr_) + "))"; 2547 init_code << "\t for (int i = 0; i < " << max_bias_data << "; ++i) {\n"; 2548 init_code << "\t\t " << bias_ptr_str << "[i] = " << broad_cast_data << ";\n"; 2549 init_code << " }\n"; 2550@@ -209,44 +222,43 @@ int MatMulFP32BaseCoder::DoCode(CoderContext *const context) { 2551 std::string a_pack_str = allocator_->GetRuntimeAddr(a_pack_ptr_); 2552 std::string b_pack_str = allocator_->GetRuntimeAddr(b_pack_ptr_); 2553 // do const value packing to init 2554- if (!params_->a_const_) { 2555- code.CodeFunction("InitMatrixA", input_tensor_, a_pack_ptr_, "&mat_mul_parameter", vec_matmul_); 2556- if (!params_->b_const_) { 2557- init_code.CodeMallocExpression(b_pack_ptr_, b_pack_ptr_size_); 2558- init_code.CodeFunction("memset", b_pack_ptr_, 0, b_pack_ptr_size_); 2559- } else { 2560- init_code.CodeBufferOffsetExpression(b_pack_ptr_, context->weight_name(), context->weight_offset_name(), 2561- context->weight_size_name(), b_pack_ptr_size_); 2562- w_buf_size += b_pack_ptr_size_; 2563- } 2564- std::string b_src_str = b_str; 2565- if (de_quant_flag_) { 2566- // reuse to b_pack_str 2567- b_src_str = Dequant::GetInstance()->de_quant_buffer_str(); 2568- std::string de_quant_function = Dequant::GetInstance()->GetMicroDeQuantFunction(filter_tensor_, b_str); 2569- init_code << de_quant_function; 2570- } 2571- // b_pack_str has been memset, no need to memset 2572- init_code.CodeFunction("InitMatrixB", b_src_str, b_pack_ptr_, "&mat_mul_parameter", vec_matmul_); 2573+ if ((params_->a_const_ && !a_packed_) || (params_->b_const_ && !b_packed_)) { 2574+ init_code.CodeStruct("mat_mul_parameter", *params_); 2575 } 2576- if (!params_->b_const_) { 2577- if (!params_->a_const_) { 2578- init_code.CodeMallocExpression(a_pack_str, a_pack_ptr_size_); 2579- init_code.CodeFunction("memset", a_pack_ptr_, 0, a_pack_ptr_size_); 2580- } 
else { 2581+ if (params_->a_const_) { 2582+ if (!a_packed_) { 2583 init_code.CodeBufferOffsetExpression(a_pack_ptr_, context->weight_name(), context->weight_offset_name(), 2584 context->weight_size_name(), a_pack_ptr_size_); 2585 w_buf_size += a_pack_ptr_size_; 2586+ std::string a_src_str = a_str; 2587+ if (de_quant_flag_) { 2588+ // reuse to a_pack_str 2589+ a_src_str = Dequant::GetInstance()->de_quant_buffer_str(); 2590+ std::string de_quant_function = Dequant::GetInstance()->GetMicroDeQuantFunction(input_tensor_, a_str); 2591+ init_code << de_quant_function; 2592+ } 2593+ // a_pack_str has been memset, no need to memset 2594+ init_code.CodeFunction("InitMatrixA", a_src_str, a_pack_ptr_, "&mat_mul_parameter", vec_matmul_); 2595 } 2596- std::string a_src_str = a_str; 2597- if (de_quant_flag_) { 2598- // reuse to a_pack_str 2599- a_src_str = Dequant::GetInstance()->de_quant_buffer_str(); 2600- std::string de_quant_function = Dequant::GetInstance()->GetMicroDeQuantFunction(input_tensor_, a_str); 2601- init_code << de_quant_function; 2602+ } else { 2603+ code.CodeFunction("InitMatrixA", input_tensor_, a_pack_ptr_, "&mat_mul_parameter", vec_matmul_); 2604+ } 2605+ if (params_->b_const_) { 2606+ if (!b_packed_) { 2607+ init_code.CodeBufferOffsetExpression(b_pack_ptr_, context->weight_name(), context->weight_offset_name(), 2608+ context->weight_size_name(), b_pack_ptr_size_); 2609+ w_buf_size += b_pack_ptr_size_; 2610+ std::string b_src_str = b_str; 2611+ if (de_quant_flag_) { 2612+ // reuse to b_pack_str 2613+ b_src_str = Dequant::GetInstance()->de_quant_buffer_str(); 2614+ std::string de_quant_function = Dequant::GetInstance()->GetMicroDeQuantFunction(filter_tensor_, b_str); 2615+ init_code << de_quant_function; 2616+ } 2617+ // b_pack_str has been memset, no need to memset 2618+ init_code.CodeFunction("InitMatrixB", b_src_str, b_pack_ptr_, "&mat_mul_parameter", vec_matmul_); 2619 } 2620- // a_pack_str has been memset, no need to memset 2621- 
init_code.CodeFunction("InitMatrixA", a_src_str, a_pack_ptr_, "&mat_mul_parameter", vec_matmul_); 2622+ } else { 2623 code.CodeFunction("InitMatrixB", filter_tensor_, b_pack_ptr_, "&mat_mul_parameter", vec_matmul_); 2624 } 2625 int current_stride_oc = thread_stride_ * col_tile_; 2626@@ -257,18 +269,18 @@ int MatMulFP32BaseCoder::DoCode(CoderContext *const context) { 2627 if (vec_matmul_) { 2628 code << " const float *batch_a_ptr = " << a_pack_str << " + i * " << params_->deep_ << ";\n"; 2629 code << " const float *batch_b_ptr = " << b_pack_str << " + i * " << params_->deep_ * params_->col_ << ";\n"; 2630- code << " float *batch_c_ptr = " << c_str << " + i * " << params_->row_ * params_->col_ << ";\n"; 2631+ code << " float *batch_c_ptr = " << c_str << " + i * " << params_->row_ * params_->col_ << ";\n "; 2632 2633- code.CodeFunction("MatVecMulFp32", "batch_a_ptr", "batch_b_ptr", "batch_c_ptr", bias_ptr_, params_->act_type_, 2634+ code.CodeFunction("MatVecMulFp32", "batch_a_ptr", "batch_b_ptr", "batch_c_ptr", bias_ptr_str, params_->act_type_, 2635 params_->deep_, cur_oc); 2636 } else { 2637 code << " const float *batch_a_ptr = " << a_pack_str << " + i * " << params_->row_align_ * params_->deep_ 2638 << ";\n"; 2639 code << " const float *batch_b_ptr = " << b_pack_str << " + i * " << params_->deep_ * params_->col_align_ 2640 << ";\n"; 2641- code << " float *batch_c_ptr = " << c_str << " + i * " << params_->row_ * params_->col_ << ";\n"; 2642+ code << " float *batch_c_ptr = " << c_str << " + i * " << params_->row_ * params_->col_ << ";\n "; 2643 2644- code.CodeFunction("MatMulOpt", "batch_a_ptr", "batch_b_ptr", "batch_c_ptr", bias_ptr_, params_->act_type_, 2645+ code.CodeFunction("MatMulOpt", "batch_a_ptr", "batch_b_ptr", "batch_c_ptr", bias_ptr_str, params_->act_type_, 2646 params_->deep_, params_->row_, cur_oc, params_->col_, "OutType_Nhwc"); 2647 } 2648 code << " }\n"; 2649diff --git 
a/mindspore/lite/tools/converter/micro/coder/opcoders/nnacl/fp32/matmul_fp32_base_coder.h b/mindspore/lite/tools/converter/micro/coder/opcoders/nnacl/fp32/matmul_fp32_base_coder.h 2650index 4f35254d..68b2658a 100644 2651--- a/mindspore/lite/tools/converter/micro/coder/opcoders/nnacl/fp32/matmul_fp32_base_coder.h 2652+++ b/mindspore/lite/tools/converter/micro/coder/opcoders/nnacl/fp32/matmul_fp32_base_coder.h 2653@@ -36,30 +36,30 @@ class MatMulFP32BaseCoder : public OperatorCoder { 2654 2655 virtual int ReSize(); 2656 2657+ protected: 2658+ virtual void ResizeParameter(); 2659+ virtual int InitBiasData(); 2660+ virtual int InitBufferA(); 2661+ virtual int InitBufferB(); 2662+ virtual int CollectFilesForTarget(CoderContext *const context); 2663+ virtual int Init(); 2664+ virtual void InitParameter(); 2665+ 2666 private: 2667- void ResizeParameter(); 2668- int InitBiasData(); 2669- int InitBufferA(); 2670- int InitBufferB(); 2671 int InitMatrixA(const float *src_ptr); 2672 int InitMatrixB(const float *src_ptr); 2673- int CollectFilesForTarget(CoderContext *const context); 2674- 2675- protected: 2676- virtual int Init(); 2677- void InitParameter(); 2678 2679 protected: 2680 Tensor *filter_tensor_{nullptr}; 2681 Tensor *bias_tensor_{nullptr}; 2682 MatMulParameter *params_{nullptr}; 2683- float *a_pack_ptr_ = nullptr; 2684- float *b_pack_ptr_ = nullptr; 2685- float *bias_ptr_{nullptr}; 2686+ void *a_pack_ptr_ = nullptr; 2687+ void *b_pack_ptr_ = nullptr; 2688+ void *bias_ptr_{nullptr}; 2689 bool vec_matmul_{false}; 2690 bool de_quant_flag_{false}; 2691- 2692- private: 2693+ bool a_packed_{false}; 2694+ bool b_packed_{false}; 2695 int col_tile_{0}; 2696 int row_tile_{0}; 2697 int thread_stride_{0}; 2698@@ -69,6 +69,7 @@ class MatMulFP32BaseCoder : public OperatorCoder { 2699 size_t a_pack_ptr_size_{0}; 2700 size_t b_pack_ptr_size_{0}; 2701 bool is_bias_broadcast_{false}; 2702+ size_t data_type_size_{C4NUM}; 2703 }; 2704 } // namespace mindspore::lite::micro::nnacl 2705 
#endif // MINDSPORE_LITE_TOOLS_CONVERTER_MICRO_CODER_OPCODERS_NNACL_FP32_MATMUL_FP32_BASE_CODER_H_ 2706diff --git a/mindspore/lite/tools/converter/micro/coder/opcoders/nnacl/fp32/pooling_fp32_coder.h b/mindspore/lite/tools/converter/micro/coder/opcoders/nnacl/fp32/pooling_fp32_coder.h 2707index df08dcbe..9f4e0026 100644 2708--- a/mindspore/lite/tools/converter/micro/coder/opcoders/nnacl/fp32/pooling_fp32_coder.h 2709+++ b/mindspore/lite/tools/converter/micro/coder/opcoders/nnacl/fp32/pooling_fp32_coder.h 2710@@ -21,7 +21,7 @@ 2711 #include "coder/opcoders/op_coder.h" 2712 2713 namespace mindspore::lite::micro::nnacl { 2714-class PoolingFP32Coder final : public OperatorCoder { 2715+class PoolingFP32Coder : public OperatorCoder { 2716 public: 2717 PoolingFP32Coder(const std::vector<Tensor *> &in_tensors, const std::vector<Tensor *> &out_tensors, 2718 const LiteGraph::Node *node, size_t node_index, Target target) 2719diff --git a/mindspore/lite/tools/converter/micro/coder/opcoders/nnacl/fp32/reduce_fp32_coder.cc b/mindspore/lite/tools/converter/micro/coder/opcoders/nnacl/fp32/reduce_fp32_coder.cc 2720index 661881af..11e8a3ec 100644 2721--- a/mindspore/lite/tools/converter/micro/coder/opcoders/nnacl/fp32/reduce_fp32_coder.cc 2722+++ b/mindspore/lite/tools/converter/micro/coder/opcoders/nnacl/fp32/reduce_fp32_coder.cc 2723@@ -16,7 +16,6 @@ 2724 2725 #include "coder/opcoders/nnacl/fp32/reduce_fp32_coder.h" 2726 #include <string> 2727-#include "coder/log.h" 2728 #include "coder/opcoders/serializers/nnacl_serializer/nnacl_fp32_serializer.h" 2729 #include "coder/opcoders/file_collector.h" 2730 2731@@ -25,14 +24,14 @@ namespace mindspore::lite::micro::nnacl { 2732 int ReduceFP32Coder::Prepare(CoderContext *const context) { 2733 MS_CHECK_RET_CODE(ReduceBaseCoder::Init(), "init failed"); 2734 MS_CHECK_RET_CODE(ReSize(), "resize failed"); 2735- MS_CHECK_RET_CODE(MallocTmpBuffer(), "malloc buffer failed"); 2736+ MS_CHECK_RET_CODE(MallocTmpBuffer(kNumberTypeFloat32), "malloc 
buffer failed"); 2737 return RET_OK; 2738 } 2739 2740-int ReduceFP32Coder::MallocTmpBuffer() { 2741+int ReduceFP32Coder::MallocTmpBuffer(mindspore::TypeId type_id) { 2742 data_buffers_.clear(); 2743 for (auto size : buffer_sizes_) { 2744- auto *buffer = static_cast<float *>(allocator_->Malloc(kNumberTypeFloat, size * sizeof(float), kWorkspace)); 2745+ auto *buffer = static_cast<float *>(allocator_->Malloc(type_id, size * lite::DataTypeSize(type_id), kWorkspace)); 2746 MS_CHECK_PTR(buffer); 2747 data_buffers_.emplace_back(buffer); 2748 } 2749@@ -57,41 +56,42 @@ int ReduceFP32Coder::DoCode(CoderContext *const context) { 2750 "reduce_fp32.c", 2751 }); 2752 2753- NNaclFp32Serializer code; 2754 // call the op function 2755- std::string reduce; 2756- std::string int_reduce; 2757 switch (mode_) { 2758 case static_cast<int>(schema::ReduceMode_ReduceSum): { 2759- reduce = "ReduceSum"; 2760+ reduce_ = "ReduceSum"; 2761 break; 2762 } 2763 case static_cast<int>(schema::ReduceMode_ReduceMean): { 2764- reduce = "ReduceMean"; 2765+ reduce_ = "ReduceMean"; 2766 break; 2767 } 2768 case static_cast<int>(schema::ReduceMode_ReduceMax): { 2769- reduce = "ReduceMax"; 2770+ reduce_ = "ReduceMax"; 2771 break; 2772 } 2773 case static_cast<int>(schema::ReduceMode_ReduceMin): { 2774- reduce = "ReduceMin"; 2775+ reduce_ = "ReduceMin"; 2776 break; 2777 } 2778 case static_cast<int>(schema::ReduceMode_ReduceProd): { 2779- reduce = "ReduceProd"; 2780- int_reduce = "IntReduceProd"; 2781+ reduce_ = "ReduceProd"; 2782+ int_reduce_ = "IntReduceProd"; 2783 break; 2784 } 2785 case static_cast<int>(schema::ReduceMode_ReduceSumSquare): { 2786- reduce = "ReduceSumSquare"; 2787+ reduce_ = "ReduceSumSquare"; 2788 break; 2789 } 2790 default: 2791- MS_LOG(ERROR) << "Reduce unsupported reduce mode: " << mode_; 2792+ MS_LOG(ERROR) << "Reduce unsupported reduce_ mode: " << mode_; 2793 return RET_ERROR; 2794 } 2795- 2796+ GenerateCode(context); 2797+ return RET_OK; 2798+} 2799+void 
ReduceFP32Coder::GenerateCode(CoderContext *const context) { 2800+ NNaclFp32Serializer code; 2801 std::string src_addr = allocator_->GetRuntimeAddr(input_tensor_); 2802 std::string dst_addr; 2803 for (int i = 0; i < num_axes_; ++i) { 2804@@ -103,16 +103,16 @@ int ReduceFP32Coder::DoCode(CoderContext *const context) { 2805 outer_size_ = outer_sizes_.at(i); 2806 inner_size_ = inner_sizes_.at(i); 2807 axis_size_ = axis_sizes_.at(i); 2808- if (data_type_ == ::kNumberTypeFloat32) { 2809- code.CodeFunction(reduce, outer_size_, inner_size_, axis_size_, src_addr, dst_addr, 0, thread_num_); 2810+ if (data_type_ == ::kNumberTypeInt32) { 2811+ code.CodeFunction(int_reduce_, outer_size_, inner_size_, axis_size_, src_addr, dst_addr, 0, thread_num_); 2812 } else { 2813- code.CodeFunction(int_reduce, outer_size_, inner_size_, axis_size_, src_addr, dst_addr, 0, thread_num_); 2814+ code.CodeFunction(reduce_, outer_size_, inner_size_, axis_size_, src_addr, dst_addr, 0, thread_num_); 2815 } 2816 src_addr = dst_addr; 2817 } 2818 context->AppendCode(code.str()); 2819- return RET_OK; 2820 } 2821 2822 REG_OPERATOR_CODER(kAllTargets, kNumberTypeFloat32, PrimitiveType_ReduceFusion, CPUOpCoderCreator<ReduceFP32Coder>) 2823+REG_OPERATOR_CODER(kAllTargets, kNumberTypeInt32, PrimitiveType_ReduceFusion, CPUOpCoderCreator<ReduceFP32Coder>) 2824 } // namespace mindspore::lite::micro::nnacl 2825diff --git a/mindspore/lite/tools/converter/micro/coder/opcoders/nnacl/fp32/reduce_fp32_coder.h b/mindspore/lite/tools/converter/micro/coder/opcoders/nnacl/fp32/reduce_fp32_coder.h 2826index a62f35ec..5b9ccd2b 100644 2827--- a/mindspore/lite/tools/converter/micro/coder/opcoders/nnacl/fp32/reduce_fp32_coder.h 2828+++ b/mindspore/lite/tools/converter/micro/coder/opcoders/nnacl/fp32/reduce_fp32_coder.h 2829@@ -23,7 +23,7 @@ 2830 #include "coder/opcoders/op_coder.h" 2831 2832 namespace mindspore::lite::micro::nnacl { 2833-class ReduceFP32Coder final : public ReduceBaseCoder { 2834+class ReduceFP32Coder : public 
ReduceBaseCoder { 2835 public: 2836 ReduceFP32Coder(const std::vector<Tensor *> &in_tensors, const std::vector<Tensor *> &out_tensors, 2837 const LiteGraph::Node *node, size_t node_index, Target target) 2838@@ -35,11 +35,17 @@ class ReduceFP32Coder final : public ReduceBaseCoder { 2839 2840 int DoCode(CoderContext *const context) override; 2841 2842- private: 2843- int ReSize() override; 2844- int MallocTmpBuffer(); 2845+ protected: 2846+ void GenerateCode(CoderContext *const context); 2847+ int MallocTmpBuffer(mindspore::TypeId type_id); 2848+ 2849+ std::string reduce_; 2850+ std::string int_reduce_; 2851 TypeIdC data_type_{::kNumberTypeFloat32}; 2852 std::vector<float *> data_buffers_; 2853+ 2854+ private: 2855+ int ReSize() override; 2856 }; 2857 } // namespace mindspore::lite::micro::nnacl 2858 #endif // MINDSPORE_LITE_TOOLS_CONVERTER_MICRO_CODER_OPCODERS_NNACL_FP32_REDUCE_FP32_CODER_H_ 2859diff --git a/mindspore/lite/tools/converter/micro/coder/opcoders/nnacl/fp32/resize_fp32_coder.cc b/mindspore/lite/tools/converter/micro/coder/opcoders/nnacl/fp32/resize_fp32_coder.cc 2860index a5acf689..d84d0c60 100644 2861--- a/mindspore/lite/tools/converter/micro/coder/opcoders/nnacl/fp32/resize_fp32_coder.cc 2862+++ b/mindspore/lite/tools/converter/micro/coder/opcoders/nnacl/fp32/resize_fp32_coder.cc 2863@@ -68,7 +68,9 @@ int ResizeFP32Coder::ReSize() { 2864 } 2865 2866 MS_CHECK_RET_CODE_WITH_EXE(MallocTmpBuffer(), "MallocTmpBuffer failed", FreeTmpBuffer()); 2867- MS_CHECK_RET_CODE_WITH_EXE(ResizePrepare(), "ResizePrepare failed", FreeTmpBuffer()); 2868+ if (input_tensor_->data_type() == kNumberTypeFloat32 || input_tensor_->data_type() == kNumberTypeFloat) { 2869+ MS_CHECK_RET_CODE_WITH_EXE(ResizePrepare(), "ResizePrepare failed", FreeTmpBuffer()); 2870+ } 2871 2872 return RET_OK; 2873 } 2874@@ -128,8 +130,8 @@ int ResizeFP32Coder::MallocTmpBuffer() { 2875 } 2876 2877 { 2878- size_t line_buffer_size = sizeof(float) * x_len_ * input_tensor_->Channel() * kTwo * 
kMaxThreadNumSupported; 2879- line_buffer_ = reinterpret_cast<float *>(allocator_->Malloc(kNumberTypeFloat32, line_buffer_size, kWorkspace)); 2880+ size_t line_buffer_size = DataTypeLen() * x_len_ * input_tensor_->Channel() * kTwo * kMaxThreadNumSupported; 2881+ line_buffer_ = allocator_->Malloc(kNumberTypeUInt8, line_buffer_size, kWorkspace); 2882 CHECK_MALLOC_RES(line_buffer_, RET_NULL_PTR); 2883 } 2884 return RET_OK; 2885@@ -168,12 +170,12 @@ int ResizeFP32Coder::DoCode(CoderContext *const context) { 2886 2887 switch (method_) { 2888 case static_cast<int>(schema::ResizeMethod_LINEAR): { 2889- code.CodeArray("y_bottoms", coordinate_.y_bottoms_, sizeof(int) * y_len_, true); 2890- code.CodeArray("y_tops", coordinate_.y_tops_, sizeof(int) * y_len_, true); 2891- code.CodeArray("x_lefts", coordinate_.x_lefts_, sizeof(int) * x_len_, true); 2892- code.CodeArray("x_rights", coordinate_.x_rights_, sizeof(int) * x_len_, true); 2893- code.CodeArray("y_weights", y_weights_, sizeof(float) * y_weight_len_, true); 2894- code.CodeArray("x_weights", x_weights_, sizeof(float) * x_weight_len_, true); 2895+ code.CodeArray("y_bottoms", coordinate_.y_bottoms_, y_len_, true); 2896+ code.CodeArray("y_tops", coordinate_.y_tops_, y_len_, true); 2897+ code.CodeArray("x_lefts", coordinate_.x_lefts_, x_len_, true); 2898+ code.CodeArray("x_rights", coordinate_.x_rights_, x_len_, true); 2899+ code.CodeArray("y_weights", y_weights_, y_weight_len_, true); 2900+ code.CodeArray("x_weights", x_weights_, x_weight_len_, true); 2901 2902 int c = input_tensor_->shape().at(kNHWC_C); 2903 code << "float *line0 = " << MemoryAllocator::GetInstance()->GetRuntimeAddr(line_buffer_) << ";\n"; 2904@@ -188,12 +190,13 @@ int ResizeFP32Coder::DoCode(CoderContext *const context) { 2905 break; 2906 } 2907 case static_cast<int>(schema::ResizeMethod_CUBIC): { 2908- code.CodeArray("y_tops", coordinate_.y_tops_, sizeof(int) * y_len_, true); 2909- code.CodeArray("x_lefts", coordinate_.x_lefts_, sizeof(int) * x_len_, 
true); 2910- code.CodeArray("y_weights", y_weights_, sizeof(float) * y_weight_len_, true); 2911- code.CodeArray("x_weights", x_weights_, sizeof(float) * x_weight_len_, true); 2912+ code.CodeArray("y_tops", coordinate_.y_tops_, y_len_, true); 2913+ code.CodeArray("x_lefts", coordinate_.x_lefts_, x_len_, true); 2914+ code.CodeArray("y_weights", y_weights_, y_weight_len_, true); 2915+ code.CodeArray("x_weights", x_weights_, x_weight_len_, true); 2916+ auto buffer_str = "(float *)" + MemoryAllocator::GetInstance()->GetRuntimeAddr(line_buffer_); 2917 code.CodeFunction("ResizeBicubic", input_tensor_, output_tensor_, "input_shape", "output_shape", "y_tops", 2918- "x_lefts", "y_weights", "x_weights", line_buffer_, 0, new_height_); 2919+ "x_lefts", "y_weights", "x_weights", buffer_str, 0, new_height_); 2920 break; 2921 } 2922 default: { 2923diff --git a/mindspore/lite/tools/converter/micro/coder/opcoders/nnacl/fp32/resize_fp32_coder.h b/mindspore/lite/tools/converter/micro/coder/opcoders/nnacl/fp32/resize_fp32_coder.h 2924index 54594c62..34dffd50 100644 2925--- a/mindspore/lite/tools/converter/micro/coder/opcoders/nnacl/fp32/resize_fp32_coder.h 2926+++ b/mindspore/lite/tools/converter/micro/coder/opcoders/nnacl/fp32/resize_fp32_coder.h 2927@@ -27,7 +27,7 @@ 2928 #include "src/runtime/kernel/cpu/fp32/resize_fp32.h" 2929 2930 namespace mindspore::lite::micro::nnacl { 2931-class ResizeFP32Coder final : public ResizeBaseCoder { 2932+class ResizeFP32Coder : public ResizeBaseCoder { 2933 public: 2934 ResizeFP32Coder(const std::vector<Tensor *> &in_tensors, const std::vector<Tensor *> &out_tensors, 2935 const LiteGraph::Node *node, size_t node_index, Target target) 2936@@ -37,12 +37,12 @@ class ResizeFP32Coder final : public ResizeBaseCoder { 2937 int ReSize(); 2938 int DoCode(CoderContext *const context) override; 2939 2940- private: 2941+ protected: 2942 int SelectCalculatorFunc(); 2943 void CalTmpBufferLen(); 2944 int MallocTmpBuffer(); 2945 void FreeTmpBuffer(); 2946- int 
ResizePrepare(); 2947+ virtual int DataTypeLen() { return sizeof(float); } 2948 2949 ResizeCoordinate coordinate_; 2950 size_t x_len_{0}; 2951@@ -52,9 +52,12 @@ class ResizeFP32Coder final : public ResizeBaseCoder { 2952 2953 float *y_weights_{nullptr}; 2954 float *x_weights_{nullptr}; 2955- float *line_buffer_{nullptr}; 2956+ void *line_buffer_{nullptr}; 2957 CalculateOriginalCoordinate calculate_{nullptr}; 2958 std::string calculate_str_; 2959+ 2960+ private: 2961+ int ResizePrepare(); 2962 }; 2963 } // namespace mindspore::lite::micro::nnacl 2964 #endif // MINDSPORE_LITE_TOOLS_CONVERTER_MICRO_CODER_OPCODERS_NNACL_FP32_RESIZE_FP32_CODER_H_ 2965diff --git a/mindspore/lite/tools/converter/micro/coder/opcoders/nnacl/fp32/scale_fp32_coder.cc b/mindspore/lite/tools/converter/micro/coder/opcoders/nnacl/fp32/scale_fp32_coder.cc 2966index ae28fe2a..9375a71a 100644 2967--- a/mindspore/lite/tools/converter/micro/coder/opcoders/nnacl/fp32/scale_fp32_coder.cc 2968+++ b/mindspore/lite/tools/converter/micro/coder/opcoders/nnacl/fp32/scale_fp32_coder.cc 2969@@ -28,36 +28,14 @@ int ScaleFP32Coder::InitScaleOffset() { 2970 MS_CHECK_PTR(scale_tensor); 2971 if (scale_tensor->data() != nullptr) { 2972 scale_param_->const_scale_ = true; 2973- scale_ = 2974- reinterpret_cast<float *>(allocator_->Malloc(kNumberTypeFloat32, scale_tensor->Size(), kOfflinePackWeight)); 2975- MS_CHECK_PTR(scale_); 2976- MS_CHECK_TRUE(scale_tensor->Size() > 0, "invalid scale tensor size"); 2977- MS_CHECK_RET_CODE(memcpy_s(scale_, scale_tensor->Size(), scale_tensor->data(), scale_tensor->Size()), 2978- "memcpy scale failed"); 2979 } else { 2980 scale_param_->const_scale_ = false; 2981- scale_ = nullptr; 2982 } 2983 2984- if (input_tensors_.size() == DIMENSION_2D) { 2985+ if (input_tensors_.size() == DIMENSION_3D && input_tensors_.at(kBiasIndex)->data() != nullptr) { 2986 scale_param_->const_offset_ = true; 2987- offset_ = 2988- reinterpret_cast<float *>(allocator_->Malloc(kNumberTypeFloat32, 
scale_tensor->Size(), kOfflinePackWeight)); 2989- MS_CHECK_PTR(offset_); 2990- MS_CHECK_RET_CODE(memset_s(offset_, scale_tensor->Size(), 0, scale_tensor->Size()), "memset_s failed!"); 2991- } else if (input_tensors_.size() == DIMENSION_3D && input_tensors_.at(kBiasIndex)->data() != nullptr) { 2992- scale_param_->const_offset_ = true; 2993- Tensor *offset_tensor = input_tensors_.at(kBiasIndex); 2994- MS_CHECK_PTR(offset_tensor); 2995- offset_ = 2996- reinterpret_cast<float *>(allocator_->Malloc(kNumberTypeFloat32, offset_tensor->Size(), kOfflinePackWeight)); 2997- MS_CHECK_PTR(offset_); 2998- MS_CHECK_TRUE(offset_tensor->Size() > 0, "invalid offset tensor size"); 2999- MS_CHECK_RET_CODE(memcpy_s(offset_, offset_tensor->Size(), offset_tensor->data(), offset_tensor->Size()), 3000- "memcpy_s failed!"); 3001 } else { 3002 scale_param_->const_offset_ = false; 3003- offset_ = nullptr; 3004 } 3005 return RET_OK; 3006 } 3007@@ -125,25 +103,29 @@ int ScaleFP32Coder::DoCode(CoderContext *const context) { 3008 3009 NNaclFp32Serializer code; 3010 code.CodeStruct("scale_parameter", *scale_param_); 3011- 3012+ auto scale = allocator_->GetRuntimeAddr(input_tensors_.at(kWeightIndex), scale_param_->const_scale_); 3013+ std::string offset{"NULL"}; 3014+ if (input_tensors_.size() == DIMENSION_3D) { 3015+ offset = allocator_->GetRuntimeAddr(input_tensors_.at(kBiasIndex), scale_param_->const_offset_); 3016+ } 3017 switch (scale_param_->activation_type_) { 3018 case schema::ActivationType_RELU6: 3019- code.CodeFunction("DoScaleRelu6", input_tensor_, output_tensor_, scale_, offset_, kDefaultTaskId, 3020+ code.CodeFunction("DoScaleRelu6", input_tensor_, output_tensor_, scale, offset, kDefaultTaskId, 3021 "&scale_parameter"); 3022 break; 3023 case schema::ActivationType_RELU: { 3024 if (!support_parallel_) { 3025- code.CodeFunction("DoScaleRelu", input_tensor_, output_tensor_, scale_, offset_, kDefaultTaskId, 3026+ code.CodeFunction("DoScaleRelu", input_tensor_, output_tensor_, scale, 
offset, kDefaultTaskId, 3027 "&scale_parameter"); 3028 } else { 3029- code.CodeBaseStruct("ScaleFp32Args", kRunArgs, input_tensor_, output_tensor_, scale_, offset_, 3030+ code.CodeBaseStruct("ScaleFp32Args", kRunArgs, input_tensor_, output_tensor_, scale, offset, 3031 "&scale_parameter"); 3032 code.CodeFunction(kParallelLaunch, "DoScaleReluRun", kRunArgsAddr, "scale_parameter.op_parameter_.thread_num_"); 3033 } 3034 break; 3035 } 3036 case schema::ActivationType_NO_ACTIVATION: 3037- code.CodeFunction("DoScale", input_tensor_, output_tensor_, scale_, offset_, kDefaultTaskId, "&scale_parameter"); 3038+ code.CodeFunction("DoScale", input_tensor_, output_tensor_, scale, offset, kDefaultTaskId, "&scale_parameter"); 3039 break; 3040 default: 3041 MS_LOG(ERROR) << "Scale does not support activation type " << scale_param_->activation_type_; 3042diff --git a/mindspore/lite/tools/converter/micro/coder/opcoders/nnacl/fp32/scale_fp32_coder.h b/mindspore/lite/tools/converter/micro/coder/opcoders/nnacl/fp32/scale_fp32_coder.h 3043index 7f8e6242..319ad35a 100644 3044--- a/mindspore/lite/tools/converter/micro/coder/opcoders/nnacl/fp32/scale_fp32_coder.h 3045+++ b/mindspore/lite/tools/converter/micro/coder/opcoders/nnacl/fp32/scale_fp32_coder.h 3046@@ -39,8 +39,6 @@ class ScaleFP32Coder final : public OperatorCoder { 3047 3048 private: 3049 ScaleParameter *scale_param_{nullptr}; 3050- float *scale_{nullptr}; 3051- float *offset_{nullptr}; 3052 }; 3053 } // namespace mindspore::lite::micro::nnacl 3054 #endif // MICRO_CODER_OPCODERS_FP32__CODER_H_ 3055diff --git a/mindspore/lite/tools/converter/micro/coder/opcoders/nnacl/fp32/split_fp32_coder.cc b/mindspore/lite/tools/converter/micro/coder/opcoders/nnacl/fp32/split_fp32_coder.cc 3056new file mode 100644 3057index 00000000..6f817386 3058--- /dev/null 3059+++ b/mindspore/lite/tools/converter/micro/coder/opcoders/nnacl/fp32/split_fp32_coder.cc 3060@@ -0,0 +1,77 @@ 3061+/** 3062+ * Copyright 2022 Huawei Technologies Co., Ltd 3063+ * 
3064+ * Licensed under the Apache License, Version 2.0 (the "License"); 3065+ * you may not use this file except in compliance with the License. 3066+ * You may obtain a copy of the License at 3067+ * 3068+ * http://www.apache.org/licenses/LICENSE-2.0 3069+ * 3070+ * Unless required by applicable law or agreed to in writing, software 3071+ * distributed under the License is distributed on an "AS IS" BASIS, 3072+ * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. 3073+ * See the License for the specific language governing permissions and 3074+ * limitations under the License. 3075+ */ 3076+#include "coder/opcoders/nnacl/fp32/split_fp32_coder.h" 3077+#include "coder/opcoders/serializers/nnacl_serializer/nnacl_fp32_serializer.h" 3078+#include "coder/opcoders/file_collector.h" 3079+#include "coder/opcoders/parallel.h" 3080+#include "src/runtime/kernel/cpu/base/split_base.h" 3081+ 3082+using mindspore::schema::PrimitiveType_Split; 3083+ 3084+namespace mindspore::lite::micro::nnacl { 3085+int SplitFP32Coder::Prepare(CoderContext *const context) { 3086+ auto status = mindspore::kernel::SplitBaseCPUKernel::CheckAndInitSplitParam( 3087+ *input_tensor_, reinterpret_cast<SplitParameter *>(parameter_)); 3088+ if (RET_OK != status) { 3089+ MS_LOG(ERROR) << "CheckAndInitSplitParam failed"; 3090+ return status; 3091+ } 3092+ return RET_OK; 3093+} 3094+ 3095+int SplitFP32Coder::DoCode(CoderContext *const context) { 3096+ Collect(context, {"nnacl/base/split_base.h"}, {"split_base.c"}); 3097+ if (support_parallel_) { 3098+ Collect(context, {"wrapper/fp32/split_fp32_wrapper.h"}, {"split_fp32_wrapper.c"}); 3099+ } 3100+ auto param = reinterpret_cast<SplitParameter *>(parameter_); 3101+ int num_unit = param->split_count_ * param->num_split_; 3102+ 3103+ NNaclFp32Serializer code; 3104+ code << " void *output_ptrs[" << output_tensors_.size() << "] = {"; 3105+ for (int i = 0; i < param->num_split_; i++) { 3106+ code << 
allocator_->GetRuntimeAddr(output_tensors_.at(i)) << ","; 3107+ } 3108+ code << "};\n"; 3109+ code << " int input_dim[" << input_tensor_->shape().size() << "] = {"; 3110+ for (auto &dim : input_tensor_->shape()) { 3111+ code << dim << ","; 3112+ } 3113+ code << "};\n"; 3114+ code << " int split_sizes[" << param->num_split_ << "] = {"; 3115+ for (int i = 0; i < param->num_split_; i++) { 3116+ code << param->split_sizes_[i] << ","; 3117+ } 3118+ code << "};\n"; 3119+ 3120+ code.CodeStruct("split_param", *param); 3121+ if (!support_parallel_) { 3122+ code.CodeFunction("DoSplit", input_tensor_, "(void *)output_ptrs", "input_dim", "0", num_unit, "&split_param", 3123+ lite::DataTypeSize(input_tensor_->data_type())); 3124+ } else { 3125+ code.CodeBaseStruct("SplitFp32Args", kRunArgs, input_tensor_, "(void *)output_ptrs", "input_dim", num_unit, 3126+ lite::DataTypeSize(input_tensor_->data_type()), "&split_param"); 3127+ code.CodeFunction(kParallelLaunch, "DoSplitRun", kRunArgsAddr, "split_param.op_parameter_.thread_num_"); 3128+ } 3129+ 3130+ context->AppendCode(code.str()); 3131+ return RET_OK; 3132+} 3133+ 3134+REG_OPERATOR_CODER(kAllTargets, kNumberTypeFloat32, PrimitiveType_Split, CPUOpCoderCreator<SplitFP32Coder>) 3135+REG_OPERATOR_CODER(kAllTargets, kNumberTypeInt32, PrimitiveType_Split, CPUOpCoderCreator<SplitFP32Coder>) 3136+REG_OPERATOR_CODER(kAllTargets, kNumberTypeFloat16, PrimitiveType_Split, CPUOpCoderCreator<SplitFP32Coder>) 3137+} // namespace mindspore::lite::micro::nnacl 3138diff --git a/mindspore/lite/tools/converter/micro/coder/opcoders/nnacl/fp32/split_fp32_coder.h b/mindspore/lite/tools/converter/micro/coder/opcoders/nnacl/fp32/split_fp32_coder.h 3139new file mode 100644 3140index 00000000..f65214c1 3141--- /dev/null 3142+++ b/mindspore/lite/tools/converter/micro/coder/opcoders/nnacl/fp32/split_fp32_coder.h 3143@@ -0,0 +1,37 @@ 3144+/** 3145+ * Copyright 2022 Huawei Technologies Co., Ltd 3146+ * 3147+ * Licensed under the Apache License, Version 2.0 
(the "License"); 3148+ * you may not use this file except in compliance with the License. 3149+ * You may obtain a copy of the License at 3150+ * 3151+ * http://www.apache.org/licenses/LICENSE-2.0 3152+ * 3153+ * Unless required by applicable law or agreed to in writing, software 3154+ * distributed under the License is distributed on an "AS IS" BASIS, 3155+ * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. 3156+ * See the License for the specific language governing permissions and 3157+ * limitations under the License. 3158+ */ 3159+ 3160+#ifndef MINDSPORE_LITE_TOOLS_CONVERTER_MICRO_CODER_OPCODERS_NNACL_FP32_SPLIT_FP32_CODER_H_ 3161+#define MINDSPORE_LITE_TOOLS_CONVERTER_MICRO_CODER_OPCODERS_NNACL_FP32_SPLIT_FP32_CODER_H_ 3162+ 3163+#include <vector> 3164+#include "coder/opcoders/op_coder.h" 3165+#include "nnacl/split_parameter.h" 3166+ 3167+namespace mindspore::lite::micro::nnacl { 3168+class SplitFP32Coder : public OperatorCoder { 3169+ public: 3170+ SplitFP32Coder(const std::vector<Tensor *> &in_tensors, const std::vector<Tensor *> &out_tensors, 3171+ const LiteGraph::Node *node, size_t node_index, Target target) 3172+ : OperatorCoder(in_tensors, out_tensors, node, node_index, target) {} 3173+ ~SplitFP32Coder() override = default; 3174+ 3175+ int Prepare(CoderContext *const context) override; 3176+ 3177+ int DoCode(CoderContext *const context) override; 3178+}; 3179+} // namespace mindspore::lite::micro::nnacl 3180+#endif // MINDSPORE_LITE_TOOLS_CONVERTER_MICRO_CODER_OPCODERS_NNACL_FP32_SPLIT_FP32_CODER_H_ 3181diff --git a/mindspore/lite/tools/converter/micro/coder/opcoders/nnacl/fp32/transpose_fp32_coder.cc b/mindspore/lite/tools/converter/micro/coder/opcoders/nnacl/fp32/transpose_fp32_coder.cc 3182index 2512c9a7..a5882722 100644 3183--- a/mindspore/lite/tools/converter/micro/coder/opcoders/nnacl/fp32/transpose_fp32_coder.cc 3184+++ b/mindspore/lite/tools/converter/micro/coder/opcoders/nnacl/fp32/transpose_fp32_coder.cc 3185@@ -48,10 
+48,6 @@ int TransposeFp32Coder::Resize() { 3186 param_->out_strides_[i] = out_shape.at(i + 1) * param_->out_strides_[i + 1]; 3187 } 3188 3189- out_shape_ = 3190- reinterpret_cast<int *>(allocator_->Malloc(kNumberTypeInt32, out_shape.size() * sizeof(int), kOfflinePackWeight)); 3191- MS_CHECK_PTR(out_shape_); 3192- memcpy(out_shape_, out_shape.data(), in_shape.size() * sizeof(int)); 3193 return RET_OK; 3194 } 3195 3196@@ -141,7 +137,9 @@ int TransposeFp32Coder::DoCode(CoderContext *const context) { 3197 } 3198 3199 code.CodeStruct("trans_param", *param_); 3200- dims_ = output_tensor_->shape().size(); 3201+ auto out_shape = output_tensor_->shape(); 3202+ dims_ = static_cast<int>(out_shape.size()); 3203+ code.CodeArray("output_shape", out_shape.data(), dims_, true); 3204 if (dims_ > MAX_TRANSPOSE_DIM_SIZE) { 3205 int *dim_size = reinterpret_cast<int *>(malloc(dims_ * sizeof(int))); 3206 if (dim_size == nullptr) { 3207@@ -149,7 +147,7 @@ int TransposeFp32Coder::DoCode(CoderContext *const context) { 3208 } 3209 *(dim_size + dims_ - 1) = 1; 3210 for (int i = dims_ - 1; i > 0; --i) { 3211- *(dim_size + i - 1) = *(dim_size + i) * out_shape_[i]; 3212+ *(dim_size + i - 1) = *(dim_size + i) * out_shape[i]; 3213 } 3214 code.CodeArray("dim_size", dim_size, dims_); 3215 int *position = reinterpret_cast<int *>(malloc(dims_ * thread_num_ * sizeof(int))); 3216@@ -158,12 +156,12 @@ int TransposeFp32Coder::DoCode(CoderContext *const context) { 3217 return RET_NULL_PTR; 3218 } 3219 code.CodeArray("position", position, dims_ * thread_num_); 3220- code.CodeFunction("TransposeDimsFp32", input_tensor_, output_tensor_, out_shape_, "dim_size", "position", 3221+ code.CodeFunction("TransposeDimsFp32", input_tensor_, output_tensor_, "output_shape", "dim_size", "position", 3222 "&trans_param", kDefaultTaskId, thread_num_); 3223 free(dim_size); 3224 free(position); 3225 } else { 3226- code.CodeFunction("DoTransposeFp32", input_tensor_, output_tensor_, out_shape_, "&trans_param"); 3227+ 
code.CodeFunction("DoTransposeFp32", input_tensor_, output_tensor_, "output_shape", "&trans_param"); 3228 } 3229 context->AppendCode(code.str()); 3230 return RET_OK; 3231diff --git a/mindspore/lite/tools/converter/micro/coder/opcoders/nnacl/fp32/transpose_fp32_coder.h b/mindspore/lite/tools/converter/micro/coder/opcoders/nnacl/fp32/transpose_fp32_coder.h 3232index c4cd37a9..0fdbb407 100644 3233--- a/mindspore/lite/tools/converter/micro/coder/opcoders/nnacl/fp32/transpose_fp32_coder.h 3234+++ b/mindspore/lite/tools/converter/micro/coder/opcoders/nnacl/fp32/transpose_fp32_coder.h 3235@@ -21,7 +21,7 @@ 3236 #include "coder/opcoders/op_coder.h" 3237 #include "nnacl/transpose.h" 3238 namespace mindspore::lite::micro::nnacl { 3239-class TransposeFp32Coder final : public OperatorCoder { 3240+class TransposeFp32Coder : public OperatorCoder { 3241 public: 3242 TransposeFp32Coder(const std::vector<Tensor *> &in_tensors, const std::vector<Tensor *> &out_tensors, 3243 const LiteGraph::Node *node, size_t node_index, Target target) 3244@@ -33,18 +33,18 @@ class TransposeFp32Coder final : public OperatorCoder { 3245 3246 int DoCode(CoderContext *const context) override; 3247 3248- int Resize(); 3249+ virtual int Resize(); 3250 3251 int Init(); 3252 3253+ protected: 3254+ TransposeParameter *param_{nullptr}; 3255+ int dims_{0}; 3256+ 3257 private: 3258 void GetNHNCTransposeFunc(); 3259- 3260- TransposeParameter *param_{nullptr}; 3261- int *out_shape_{nullptr}; 3262 std::string NHNCTransposeFunc_; 3263 int nhnc_param_[3]; 3264- int dims_{0}; 3265 }; 3266 } // namespace mindspore::lite::micro::nnacl 3267 #endif // MINDSPORE_LITE_TOOLS_CONVERTER_MICRO_CODER_OPCODERS_NNACL_FP32_TRANSPOSE_FP32_CODER_H_ 3268diff --git a/mindspore/lite/tools/converter/micro/coder/opcoders/serializers/nnacl_serializer/nnacl_fp32_serializer.cc b/mindspore/lite/tools/converter/micro/coder/opcoders/serializers/nnacl_serializer/nnacl_fp32_serializer.cc 3269index 49314886..c333b621 100644 3270--- 
a/mindspore/lite/tools/converter/micro/coder/opcoders/serializers/nnacl_serializer/nnacl_fp32_serializer.cc 3271+++ b/mindspore/lite/tools/converter/micro/coder/opcoders/serializers/nnacl_serializer/nnacl_fp32_serializer.cc 3272@@ -177,6 +177,25 @@ void NNaclFp32Serializer::CodeStruct(const std::string &name, const OpParameter 3273 op_param.is_train_session_, op_param.is_zero_shape_); 3274 } 3275 3276+void NNaclFp32Serializer::CodeStruct(const std::string &name, const SplitParameter &split_parameter) { 3277+ CodeBaseStruct("SplitParameter", name, split_parameter.op_parameter_, split_parameter.num_split_, "split_sizes", 3278+ split_parameter.split_dim_, ToString(split_parameter.strides_), "{0}", split_parameter.n_dims_, 3279+ split_parameter.split_count_); 3280+} 3281+ 3282+void NNaclFp32Serializer::CodeStruct(const std::string &name, const LayerNormParameter &op_param) { 3283+ CodeBaseStruct<false>("LayerNormParameter", name, op_param.op_parameter_, op_param.epsilon_, 3284+ op_param.elementwise_mode_, op_param.elementwise_affine_, op_param.begin_norm_axis_, 3285+ op_param.begin_params_axis_, op_param.norm_inner_size_, op_param.norm_outer_size_, 3286+ op_param.params_inner_size_, op_param.params_outer_size_, op_param.normalized_dims_, 3287+ ToString(op_param.normalized_shape_), op_param.thread_count_, op_param.thread_outsize_); 3288+} 3289+ 3290+void NNaclFp32Serializer::CodeStruct(const std::string &name, const BroadcastShapeInfo &op_param) { 3291+ CodeBaseStruct<false>("BroadcastShapeInfo", name, ToString(op_param.input_shape_), op_param.input_shape_size_, 3292+ ToString(op_param.output_shape_), op_param.output_shape_size_); 3293+} 3294+ 3295 void NNaclFp32Serializer::CodeArrayStruct(const std::string &name, TensorC *tensorC, std::vector<Tensor *> tensor) { 3296 std::vector<std::string> tensor_names; 3297 int size = tensor.size(); 3298diff --git a/mindspore/lite/tools/converter/micro/coder/opcoders/serializers/nnacl_serializer/nnacl_fp32_serializer.h 
b/mindspore/lite/tools/converter/micro/coder/opcoders/serializers/nnacl_serializer/nnacl_fp32_serializer.h 3299index 8e1350f5..f52ced20 100644 3300--- a/mindspore/lite/tools/converter/micro/coder/opcoders/serializers/nnacl_serializer/nnacl_fp32_serializer.h 3301+++ b/mindspore/lite/tools/converter/micro/coder/opcoders/serializers/nnacl_serializer/nnacl_fp32_serializer.h 3302@@ -41,6 +41,9 @@ 3303 #include "wrapper/fp32/arithmetic_fp32_wrapper.h" 3304 #include "wrapper/base/affine_wrapper.h" 3305 #include "wrapper/fp32/conv_winograd_fp32_wrapper.h" 3306+#include "nnacl/layer_norm_parameter.h" 3307+#include "nnacl/broadcast_to_parameter.h" 3308+#include "nnacl/split_parameter.h" 3309 3310 namespace mindspore::lite::micro::nnacl { 3311 class NNaclFp32Serializer : public Serializer { 3312@@ -68,6 +71,9 @@ class NNaclFp32Serializer : public Serializer { 3313 void CodeStruct(const std::string &name, const GroupNormParameter &gn_param); 3314 void CodeStruct(const std::string &name, const ActivationParameter &activation_parameter); 3315 void CodeStruct(const std::string &name, const OpParameter &op_param); 3316+ void CodeStruct(const std::string &name, const SplitParameter &split_parameter); 3317+ void CodeStruct(const std::string &name, const LayerNormParameter ¶m); 3318+ void CodeStruct(const std::string &name, const BroadcastShapeInfo ¶m); 3319 void CodeArrayStruct(const std::string &name, TensorC *tensorC, std::vector<Tensor *> tensor); 3320 3321 private: 3322diff --git a/mindspore/lite/tools/converter/micro/coder/session.cc b/mindspore/lite/tools/converter/micro/coder/session.cc 3323index 10dc2dc6..471f1491 100644 3324--- a/mindspore/lite/tools/converter/micro/coder/session.cc 3325+++ b/mindspore/lite/tools/converter/micro/coder/session.cc 3326@@ -119,12 +119,13 @@ int CoderSession::GenerateCode() { 3327 return ret; 3328 } 3329 3330-int CoderSession::Init(const void *content, int size) { 3331+int CoderSession::Init(const void *content, int size, bool enableFp16) { 
3332 MS_LOG(INFO) << "CoderSession::Init start"; 3333 Model *model = lite::Model::Import(static_cast<const char *>(content), size); 3334 MS_CHECK_PTR(model); 3335 coder_graph_ = std::make_unique<CoderGraph>(model); 3336 context_ = std::make_unique<CoderContext>(); 3337+ enableFp16_ = enableFp16; 3338 MS_LOG(INFO) << "CoderSession::Init done"; 3339 return RET_OK; 3340 } 3341@@ -299,7 +300,7 @@ int CoderSession::CreateOpCoders() { 3342 } 3343 3344 int CoderSession::InitCodeGraph() { 3345- MS_CHECK_RET_CODE(coder_graph_->ConvertTensors(), "convert tensors failed"); 3346+ MS_CHECK_RET_CODE(coder_graph_->ConvertTensors(enableFp16_), "convert tensors failed"); 3347 MS_CHECK_RET_CODE(coder_graph_->InitGraphInOutTensors(), "init graph inputs and outputs failed"); 3348 return RET_OK; 3349 } 3350diff --git a/mindspore/lite/tools/converter/micro/coder/session.h b/mindspore/lite/tools/converter/micro/coder/session.h 3351index f1039af0..3a8f7290 100644 3352--- a/mindspore/lite/tools/converter/micro/coder/session.h 3353+++ b/mindspore/lite/tools/converter/micro/coder/session.h 3354@@ -34,7 +34,7 @@ class CoderSession { 3355 3356 ~CoderSession(); 3357 3358- int Init(const void *content, int size); 3359+ int Init(const void *content, int size, bool enableFp16); 3360 3361 int Build(); 3362 3363@@ -57,6 +57,7 @@ class CoderSession { 3364 MemoryAllocator *allocator_{nullptr}; 3365 std::vector<std::unique_ptr<OperatorCoder>> op_coders_; 3366 int schema_version_ = SCHEMA_VERSION::SCHEMA_CUR; 3367+ bool enableFp16_{false}; 3368 }; 3369 3370 std::shared_ptr<CoderSession> CreateCoderSession(); 3371-- 33722.17.1 3373 3374