/*
 * Copyright (c) 2023 Huawei Device Co., Ltd.
 * Licensed under the Apache License, Version 2.0 (the "License");
 * you may not use this file except in compliance with the License.
 * You may obtain a copy of the License at
 *
 *     http://www.apache.org/licenses/LICENSE-2.0
 *
 * Unless required by applicable law or agreed to in writing, software
 * distributed under the License is distributed on an "AS IS" BASIS,
 * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
 * See the License for the specific language governing permissions and
 * limitations under the License.
 */

#ifndef NEURAL_NETWORK_RUNTIME_NNCOMPILER_H
#define NEURAL_NETWORK_RUNTIME_NNCOMPILER_H

#include <cstddef>
#include <cstdint>
#include <memory>
#include <string>
#include <unordered_map>
#include <utility>
#include <vector>

#include "compiler.h"

#include "mindir.h"
#include "device.h"
#include "inner_model.h"
#include "prepared_model.h"
#include "nnexecutor.h"

namespace OHOS {
namespace NeuralNetworkRuntime {

class NNCompiler : public Compiler {
public:
    NNCompiler() = delete;
    NNCompiler(std::shared_ptr<Device> device, size_t backendID);
    NNCompiler(const void* model, std::shared_ptr<Device> device, size_t backendID);
    ~NNCompiler() override;

    size_t GetBackendID() const override;

    OH_NN_ReturnCode SetCacheDir(const std::string& cacheModelPath, uint32_t version) override;
    OH_NN_ReturnCode SetPerformance(OH_NN_PerformanceMode performance) override;
    OH_NN_ReturnCode SetPriority(OH_NN_Priority priority) override;
    OH_NN_ReturnCode SetEnableFp16(bool isFp16) override;

    bool IsBuild() const override;
    OH_NN_ReturnCode Build() override;

    OH_NN_ReturnCode SaveToCacheFile() const override;
    OH_NN_ReturnCode RestoreFromCacheFile() override;
    OH_NN_ReturnCode SaveToCacheBuffer(const void* buffer, size_t length, size_t* modelSize) const override;
    OH_NN_ReturnCode RestoreFromCacheBuffer(const void* buffer, size_t length) override;

    OH_NN_ReturnCode SetExtensionConfig(const std::unordered_map<std::string, std::vector<char>>& configs) override;
    OH_NN_ReturnCode SetOptions(const std::vector<std::shared_ptr<void>>& options) override;
    OH_NN_ReturnCode GetModelName(std::string& modelName) override;
    size_t GetModelSize() override;
    size_t GetOnlineModelID() override;

    NNExecutor* CreateExecutor();

private:
    void ReleaseBuffer(std::vector<Buffer>& buffers) const;
    void ReleaseBufferByDevice(std::vector<Buffer>& buffers) const;
    OH_NN_ReturnCode SerializeTensorsToBuffer(
        const std::vector<std::pair<std::shared_ptr<TensorDesc>, OH_NN_TensorType>>& tensorDescs,
        Buffer& buffer) const;
    OH_NN_ReturnCode DeserializedTensorsFromBuffer(
        const Buffer& buffer, std::vector<std::pair<std::shared_ptr<TensorDesc>, OH_NN_TensorType>>& tensorDescs);

    OH_NN_ReturnCode OnlineBuild();
    OH_NN_ReturnCode NormalBuild();
    OH_NN_ReturnCode BuildOfflineModel();
    OH_NN_ReturnCode CheckModelParameter() const;
    OH_NN_ReturnCode IsOfflineModel(bool& isOfflineModel) const;
    OH_NN_ReturnCode IsSupportedModel(const std::shared_ptr<mindspore::lite::LiteGraph>& liteGraph,
        bool& isSupportedModel) const;

    size_t GetModelSizeFromCache(std::string& path, const std::string& modelName);
    size_t GetModelSizeFromFile(std::string& path);
    size_t GetModelSizeFromModel(InnerModel* innerModel);
    OH_NN_ReturnCode GetNNRtModelIDFromCache(const std::string& path, const std::string& modelName,
        size_t& nnrtModelID);
    OH_NN_ReturnCode GetNNRtModelIDFromModel(InnerModel* innerModel, size_t& nnrtModelID);
    size_t GetOnlineModelID(const std::shared_ptr<mindspore::lite::LiteGraph>& liteGraph);
    std::vector<mindspore::lite::LiteGraph::Node*> GetNodeIndices(
        const std::shared_ptr<mindspore::lite::LiteGraph>& liteGraph, size_t layer);
    size_t DataTypeSize(mindspore::lite::DataType dataType);
    size_t GetFileSize(const char* fileName);

private:
    bool m_isBuild {false};
    bool m_enableFp16 {false};
    std::string m_cachePath;
    uint32_t m_cacheVersion {0};
    std::shared_ptr<Device> m_device {nullptr};
    size_t m_backendID {0};
    OH_NN_Priority m_priority {OH_NN_PRIORITY_NONE};
    OH_NN_PerformanceMode m_performance {OH_NN_PERFORMANCE_NONE};
    std::shared_ptr<PreparedModel> m_preparedModel {nullptr};
    void* m_metaGraph {nullptr};
    InnerModel* m_innerModel {nullptr};
    std::shared_ptr<mindspore::lite::LiteGraph> m_liteGraph {nullptr};
    std::vector<std::pair<std::shared_ptr<TensorDesc>, OH_NN_TensorType>> m_inputTensorDescs;
    std::vector<std::pair<std::shared_ptr<TensorDesc>, OH_NN_TensorType>> m_outputTensorDescs;
    ExtensionConfig m_extensionConfig;
};
} // namespace NeuralNetworkRuntime
} // namespace OHOS

#endif // NEURAL_NETWORK_RUNTIME_NNCOMPILER_H
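
/*
 * Usage sketch (illustrative only, not part of the upstream header): a minimal
 * build-then-execute flow through this API. It assumes the caller already
 * holds a Device from the backend registry and a model pointer accepted by the
 * second constructor; the cache path below and the assumption that the
 * returned NNExecutor is caller-owned are hypothetical.
 */
#if 0  // example only, excluded from compilation
using namespace OHOS::NeuralNetworkRuntime;

OH_NN_ReturnCode CompileAndRun(const void* model, std::shared_ptr<Device> device, size_t backendID)
{
    NNCompiler compiler(model, device, backendID);

    // All tuning happens before Build(): cache location and version,
    // performance mode, scheduling priority, and fp16 inference.
    compiler.SetCacheDir("/data/nnrt_cache", 1);
    compiler.SetPerformance(OH_NN_PERFORMANCE_HIGH);
    compiler.SetPriority(OH_NN_PRIORITY_MEDIUM);
    compiler.SetEnableFp16(true);

    OH_NN_ReturnCode ret = compiler.Build();
    if (ret != OH_NN_SUCCESS) {
        return ret;
    }

    // Persist the compiled model so a later run can skip Build() and call
    // RestoreFromCacheFile() instead.
    compiler.SaveToCacheFile();

    NNExecutor* executor = compiler.CreateExecutor();
    if (executor == nullptr) {
        return OH_NN_FAILED;
    }
    // ... bind input/output tensors on the executor and run inference ...
    delete executor;  // ownership of the executor is assumed to pass to the caller
    return OH_NN_SUCCESS;
}
#endif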