1 /* Copyright 2020 The TensorFlow Authors. All Rights Reserved.
2
3 Licensed under the Apache License, Version 2.0 (the "License");
4 you may not use this file except in compliance with the License.
5 You may obtain a copy of the License at
6
7 http://www.apache.org/licenses/LICENSE-2.0
8
9 Unless required by applicable law or agreed to in writing, software
10 distributed under the License is distributed on an "AS IS" BASIS,
11 WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
12 See the License for the specific language governing permissions and
13 limitations under the License.
14 ==============================================================================*/
15 #include "tensorflow/lite/tools/optimize/modify_model_interface.h"
16
17 #include <memory>
18
19 #include <gmock/gmock.h>
20 #include <gtest/gtest.h>
21 #include "absl/memory/memory.h"
22 #include "tensorflow/lite/model.h"
23 #include "tensorflow/lite/schema/schema_generated.h"
24 #include "tensorflow/lite/schema/schema_utils.h"
25
26 namespace tflite {
27 namespace optimize {
28 namespace {
29
30 // Create a model with 1 quant, 1 FC, 1 dequant
CreateQuantizedModelSingleInputOutput(const TensorType & quantization_type)31 std::unique_ptr<ModelT> CreateQuantizedModelSingleInputOutput(
32 const TensorType& quantization_type) {
33 auto model = absl::make_unique<ModelT>();
34 auto subgraph = absl::make_unique<tflite::SubGraphT>();
35 auto buffer = absl::make_unique<tflite::BufferT>();
36 auto quant_op_code = absl::make_unique<OperatorCodeT>();
37 auto quant_op = absl::make_unique<OperatorT>();
38 auto fc_op_code = absl::make_unique<OperatorCodeT>();
39 auto fc_op = absl::make_unique<OperatorT>();
40 auto dequant_op_code = absl::make_unique<OperatorCodeT>();
41 auto dequant_op = absl::make_unique<OperatorT>();
42
43 model->subgraphs.push_back(std::move(subgraph));
44
45 // Op code
46 quant_op_code->builtin_code = BuiltinOperator_QUANTIZE;
47 quant_op_code->deprecated_builtin_code =
48 static_cast<int8_t>(BuiltinOperator_QUANTIZE);
49 quant_op_code->version = 2;
50
51 fc_op_code->builtin_code = BuiltinOperator_FULLY_CONNECTED;
52 fc_op_code->deprecated_builtin_code =
53 static_cast<int8_t>(BuiltinOperator_FULLY_CONNECTED);
54 fc_op_code->version = 2;
55
56 dequant_op_code->builtin_code = BuiltinOperator_DEQUANTIZE;
57 dequant_op_code->deprecated_builtin_code =
58 static_cast<int8_t>(BuiltinOperator_DEQUANTIZE);
59 dequant_op_code->version = 2;
60
61 // Op.
62 quant_op->opcode_index = 0;
63 quant_op->inputs = {0};
64 quant_op->outputs = {1};
65
66 fc_op->opcode_index = 1;
67 fc_op->inputs = {1};
68 fc_op->outputs = {2};
69
70 dequant_op->opcode_index = 2;
71 dequant_op->inputs = {2};
72 dequant_op->outputs = {3};
73
74 model->subgraphs[0]->operators.push_back(std::move(quant_op));
75 model->subgraphs[0]->operators.push_back(std::move(fc_op));
76 model->subgraphs[0]->operators.push_back(std::move(dequant_op));
77
78 model->operator_codes.push_back(std::move(quant_op_code));
79 model->operator_codes.push_back(std::move(fc_op_code));
80 model->operator_codes.push_back(std::move(dequant_op_code));
81
82 // Model input/output.
83 model->subgraphs[0]->inputs = {0};
84 model->subgraphs[0]->outputs = {3};
85
86 // Tensors
87 auto tensor_0 = absl::make_unique<TensorT>();
88 tensor_0->name = "tensor_0";
89 tensor_0->shape = {};
90 tensor_0->type = TensorType_FLOAT32;
91
92 auto tensor_1 = absl::make_unique<TensorT>();
93 tensor_1->quantization = absl::make_unique<QuantizationParametersT>();
94 tensor_1->quantization->scale.push_back(0.35);
95 tensor_1->quantization->zero_point.push_back(28);
96 tensor_1->name = "tensor_1";
97 tensor_1->shape = {};
98 tensor_1->type = quantization_type;
99
100 auto tensor_2 = absl::make_unique<TensorT>();
101 tensor_2->quantization = absl::make_unique<QuantizationParametersT>();
102 tensor_2->quantization->scale.push_back(0.12);
103 tensor_2->quantization->zero_point.push_back(50);
104 tensor_2->name = "tensor_2";
105 tensor_2->shape = {};
106 tensor_2->type = quantization_type;
107
108 auto tensor_3 = absl::make_unique<TensorT>();
109 tensor_3->name = "tensor_3";
110 tensor_3->shape = {};
111 tensor_3->type = TensorType_FLOAT32;
112
113 model->subgraphs[0]->tensors.push_back(std::move(tensor_0));
114 model->subgraphs[0]->tensors.push_back(std::move(tensor_1));
115 model->subgraphs[0]->tensors.push_back(std::move(tensor_2));
116 model->subgraphs[0]->tensors.push_back(std::move(tensor_3));
117
118 // Buffer
119 model->buffers.push_back(std::move(buffer));
120
121 return model;
122 }
123
124 // Create a model with 2 quant, 1 FC, 2 dequant
125 // The model mimics the behavior of the quantize_model.cc.
CreateQuantizedModelMultipleInputOutput(const TensorType & quantization_type)126 std::unique_ptr<ModelT> CreateQuantizedModelMultipleInputOutput(
127 const TensorType& quantization_type) {
128 auto model = absl::make_unique<ModelT>();
129 auto subgraph = absl::make_unique<tflite::SubGraphT>();
130 auto buffer = absl::make_unique<tflite::BufferT>();
131 auto quant_op_code = absl::make_unique<OperatorCodeT>();
132 auto quant_op_1 = absl::make_unique<OperatorT>();
133 auto quant_op_2 = absl::make_unique<OperatorT>();
134 auto fc_op_code = absl::make_unique<OperatorCodeT>();
135 auto fc_op = absl::make_unique<OperatorT>();
136 auto dequant_op_code = absl::make_unique<OperatorCodeT>();
137 auto dequant_op_1 = absl::make_unique<OperatorT>();
138 auto dequant_op_2 = absl::make_unique<OperatorT>();
139
140 model->subgraphs.push_back(std::move(subgraph));
141
142 // Op code
143 quant_op_code->builtin_code = BuiltinOperator_QUANTIZE;
144 quant_op_code->deprecated_builtin_code =
145 static_cast<int8_t>(BuiltinOperator_QUANTIZE);
146 quant_op_code->version = 2;
147
148 fc_op_code->builtin_code = BuiltinOperator_FULLY_CONNECTED;
149 fc_op_code->deprecated_builtin_code =
150 static_cast<int8_t>(BuiltinOperator_FULLY_CONNECTED);
151 fc_op_code->version = 2;
152
153 dequant_op_code->builtin_code = BuiltinOperator_DEQUANTIZE;
154 dequant_op_code->deprecated_builtin_code =
155 static_cast<int8_t>(BuiltinOperator_DEQUANTIZE);
156 dequant_op_code->version = 2;
157
158 // Op.
159 quant_op_1->opcode_index = 0;
160 quant_op_1->inputs = {0};
161 quant_op_1->outputs = {2};
162 quant_op_2->opcode_index = 0;
163 quant_op_2->inputs = {1};
164 quant_op_2->outputs = {3};
165
166 fc_op->opcode_index = 1;
167 fc_op->inputs = {2, 3};
168 fc_op->outputs = {4, 5};
169
170 dequant_op_1->opcode_index = 2;
171 dequant_op_1->inputs = {4};
172 dequant_op_1->outputs = {6};
173 dequant_op_2->opcode_index = 2;
174 dequant_op_2->inputs = {5};
175 dequant_op_2->outputs = {7};
176
177 model->subgraphs[0]->operators.push_back(std::move(quant_op_1));
178 model->subgraphs[0]->operators.push_back(std::move(quant_op_2));
179 model->subgraphs[0]->operators.push_back(std::move(fc_op));
180 model->subgraphs[0]->operators.push_back(std::move(dequant_op_1));
181 model->subgraphs[0]->operators.push_back(std::move(dequant_op_2));
182
183 model->operator_codes.push_back(std::move(quant_op_code));
184 model->operator_codes.push_back(std::move(fc_op_code));
185 model->operator_codes.push_back(std::move(dequant_op_code));
186
187 // Model input/output.
188 model->subgraphs[0]->inputs = {0, 1};
189 model->subgraphs[0]->outputs = {6, 7};
190
191 // Tensors
192 auto tensor_0 = absl::make_unique<TensorT>();
193 tensor_0->name = "tensor_0";
194 tensor_0->shape = {};
195 tensor_0->type = TensorType_FLOAT32;
196
197 auto tensor_1 = absl::make_unique<TensorT>();
198 tensor_1->name = "tensor_1";
199 tensor_1->shape = {};
200 tensor_1->type = TensorType_FLOAT32;
201
202 auto tensor_2 = absl::make_unique<TensorT>();
203 tensor_2->quantization = absl::make_unique<QuantizationParametersT>();
204 tensor_2->quantization->scale.push_back(0.35);
205 tensor_2->quantization->zero_point.push_back(28);
206 tensor_2->name = "tensor_2";
207 tensor_2->shape = {};
208 tensor_2->type = quantization_type;
209
210 auto tensor_3 = absl::make_unique<TensorT>();
211 tensor_3->quantization = absl::make_unique<QuantizationParametersT>();
212 tensor_3->quantization->scale.push_back(0.12);
213 tensor_3->quantization->zero_point.push_back(50);
214 tensor_3->name = "tensor_3";
215 tensor_3->shape = {};
216 tensor_3->type = quantization_type;
217
218 auto tensor_4 = absl::make_unique<TensorT>();
219 tensor_4->quantization = absl::make_unique<QuantizationParametersT>();
220 tensor_4->quantization->scale.push_back(0.45);
221 tensor_4->quantization->zero_point.push_back(28);
222 tensor_4->name = "tensor_4";
223 tensor_4->shape = {};
224 tensor_4->type = quantization_type;
225
226 auto tensor_5 = absl::make_unique<TensorT>();
227 tensor_5->quantization = absl::make_unique<QuantizationParametersT>();
228 tensor_5->quantization->scale.push_back(0.22);
229 tensor_5->quantization->zero_point.push_back(50);
230 tensor_5->name = "tensor_5";
231 tensor_5->shape = {};
232 tensor_5->type = quantization_type;
233
234 auto tensor_6 = absl::make_unique<TensorT>();
235 tensor_6->name = "tensor_6";
236 tensor_6->shape = {};
237 tensor_6->type = TensorType_FLOAT32;
238
239 auto tensor_7 = absl::make_unique<TensorT>();
240 tensor_7->name = "tensor_7";
241 tensor_7->shape = {};
242 tensor_7->type = TensorType_FLOAT32;
243
244 model->subgraphs[0]->tensors.push_back(std::move(tensor_0));
245 model->subgraphs[0]->tensors.push_back(std::move(tensor_1));
246 model->subgraphs[0]->tensors.push_back(std::move(tensor_2));
247 model->subgraphs[0]->tensors.push_back(std::move(tensor_3));
248 model->subgraphs[0]->tensors.push_back(std::move(tensor_4));
249 model->subgraphs[0]->tensors.push_back(std::move(tensor_5));
250 model->subgraphs[0]->tensors.push_back(std::move(tensor_6));
251 model->subgraphs[0]->tensors.push_back(std::move(tensor_7));
252
253 // Buffer
254 model->buffers.push_back(std::move(buffer));
255
256 return model;
257 }
258
259 // Create a model with 1 FC.
CreateFloatModel()260 std::unique_ptr<ModelT> CreateFloatModel() {
261 auto model = absl::make_unique<ModelT>();
262 auto subgraph = absl::make_unique<tflite::SubGraphT>();
263 auto buffer = absl::make_unique<tflite::BufferT>();
264 auto fc_op_code = absl::make_unique<OperatorCodeT>();
265 auto fc_op = absl::make_unique<OperatorT>();
266
267 model->subgraphs.push_back(std::move(subgraph));
268
269 // Op code
270 fc_op_code->builtin_code = BuiltinOperator_FULLY_CONNECTED;
271 fc_op_code->deprecated_builtin_code =
272 static_cast<int8_t>(BuiltinOperator_FULLY_CONNECTED);
273 fc_op_code->version = 2;
274
275 // Op.
276 fc_op->opcode_index = 0;
277 fc_op->inputs = {0};
278 fc_op->outputs = {1};
279
280 model->subgraphs[0]->operators.push_back(std::move(fc_op));
281 model->operator_codes.push_back(std::move(fc_op_code));
282
283 // Model input/output.
284 model->subgraphs[0]->inputs = {0};
285 model->subgraphs[0]->outputs = {1};
286
287 // Tensors
288 auto tensor_0 = absl::make_unique<TensorT>();
289 tensor_0->name = "tensor_0";
290 tensor_0->shape = {};
291 tensor_0->type = TensorType_FLOAT32;
292
293 auto tensor_1 = absl::make_unique<TensorT>();
294 tensor_1->name = "tensor_1";
295 tensor_1->shape = {};
296 tensor_1->type = TensorType_FLOAT32;
297
298 model->subgraphs[0]->tensors.push_back(std::move(tensor_0));
299 model->subgraphs[0]->tensors.push_back(std::move(tensor_1));
300
301 // Buffer
302 model->buffers.push_back(std::move(buffer));
303
304 return model;
305 }
306
307 struct ModelInterface : ::testing::TestWithParam<tflite::TensorType> {};
308
// ModifyModelInterface with matching input/output type: the boundary
// quantize/dequantize ops are removed and the quantized tensors become the
// model interface.
TEST_P(ModelInterface, SingleInputOutput) {
  const TensorType quantization_type = GetParam();

  auto model = CreateQuantizedModelSingleInputOutput(quantization_type);

  // Rewrite the model interface to the requested quantized type.
  flatbuffers::FlatBufferBuilder builder;
  EXPECT_EQ(ModifyModelInterface(&builder, model.get(), quantization_type,
                                 quantization_type),
            kTfLiteOk);

  // Verify results: only the FC op remains.
  EXPECT_EQ(model->subgraphs.size(), 1);
  auto& graph = *model->subgraphs[0];
  // TODO(mnatraj): The float input tensor has not been removed.
  // EXPECT_EQ(graph.tensors.size(), 2);
  EXPECT_EQ(graph.tensors.size(), 3);
  EXPECT_EQ(graph.inputs.size(), 1);
  EXPECT_EQ(graph.inputs[0], 1);
  EXPECT_EQ(graph.outputs.size(), 1);
  EXPECT_EQ(graph.outputs[0], 2);
  EXPECT_EQ(model->operator_codes.size(), 3);
  EXPECT_EQ(graph.operators.size(), 1);
  EXPECT_EQ(graph.operators[0]->opcode_index, 1);

  const OperatorT* fc = graph.operators[0].get();

  // The FC input/output keep their original quantization parameters.
  const TensorT* in = graph.tensors[fc->inputs[0]].get();
  EXPECT_EQ(in->name, "tensor_1");
  EXPECT_EQ(in->type, quantization_type);
  EXPECT_FLOAT_EQ(in->quantization->scale[0], 0.35);
  EXPECT_EQ(in->quantization->zero_point[0], 28);

  const TensorT* out = graph.tensors[fc->outputs[0]].get();
  EXPECT_EQ(out->name, "tensor_2");
  EXPECT_EQ(out->type, quantization_type);
  EXPECT_FLOAT_EQ(out->quantization->scale[0], 0.12);
  EXPECT_EQ(out->quantization->zero_point[0], 50);
}
347
// Same as SingleInputOutput but with two inputs and two outputs.
// (Test name keeps the historical "Mutiple" spelling: it is part of the
// registered test identity used by filters.)
TEST_P(ModelInterface, MutipleInputOutput) {
  const TensorType quantization_type = GetParam();

  auto model = CreateQuantizedModelMultipleInputOutput(quantization_type);

  // Rewrite the model interface to the requested quantized type.
  flatbuffers::FlatBufferBuilder builder;
  EXPECT_EQ(ModifyModelInterface(&builder, model.get(), quantization_type,
                                 quantization_type),
            kTfLiteOk);

  // Verify results: only the FC op remains.
  EXPECT_EQ(model->subgraphs.size(), 1);
  auto& graph = *model->subgraphs[0];
  // TODO (b/158254056): Remove unused inputs and outputs from tensor list
  // EXPECT_EQ(graph.tensors.size(), 4);
  EXPECT_EQ(graph.tensors.size(), 6);
  EXPECT_EQ(graph.inputs.size(), 2);
  EXPECT_EQ(graph.inputs[0], 2);
  EXPECT_EQ(graph.inputs[1], 3);
  EXPECT_EQ(graph.outputs.size(), 2);
  EXPECT_EQ(graph.outputs[0], 4);
  EXPECT_EQ(graph.outputs[1], 5);
  EXPECT_EQ(model->operator_codes.size(), 3);
  EXPECT_EQ(graph.operators.size(), 1);
  EXPECT_EQ(graph.operators[0]->opcode_index, 1);

  const OperatorT* fc = graph.operators[0].get();

  // All four interface tensors keep their original quantization parameters.
  const TensorT* in_1 = graph.tensors[fc->inputs[0]].get();
  EXPECT_EQ(in_1->name, "tensor_2");
  EXPECT_EQ(in_1->type, quantization_type);
  EXPECT_FLOAT_EQ(in_1->quantization->scale[0], 0.35);
  EXPECT_EQ(in_1->quantization->zero_point[0], 28);

  const TensorT* in_2 = graph.tensors[fc->inputs[1]].get();
  EXPECT_EQ(in_2->name, "tensor_3");
  EXPECT_EQ(in_2->type, quantization_type);
  EXPECT_FLOAT_EQ(in_2->quantization->scale[0], 0.12);
  EXPECT_EQ(in_2->quantization->zero_point[0], 50);

  const TensorT* out_1 = graph.tensors[fc->outputs[0]].get();
  EXPECT_EQ(out_1->name, "tensor_4");
  EXPECT_EQ(out_1->type, quantization_type);
  EXPECT_FLOAT_EQ(out_1->quantization->scale[0], 0.45);
  EXPECT_EQ(out_1->quantization->zero_point[0], 28);

  const TensorT* out_2 = graph.tensors[fc->outputs[1]].get();
  EXPECT_EQ(out_2->name, "tensor_5");
  EXPECT_EQ(out_2->type, quantization_type);
  EXPECT_FLOAT_EQ(out_2->quantization->scale[0], 0.22);
  EXPECT_EQ(out_2->quantization->zero_point[0], 50);
}
400
// Run the parameterized tests above for int8 and int16 quantization.
INSTANTIATE_TEST_SUITE_P(MultipleInputOutputTests, ModelInterface,
                         ::testing::Values(TensorType_INT8, TensorType_INT16));
403
// Mixed interface types: uint8 input, int8 output on an int8 model.
TEST(ModelInterface, MixedTypeSingleInputOutput) {
  auto model = CreateQuantizedModelSingleInputOutput(TensorType_INT8);

  // Rewrite the interface: uint8 in, int8 out.
  flatbuffers::FlatBufferBuilder builder;
  EXPECT_EQ(ModifyModelInterface(&builder, model.get(), TensorType_UINT8,
                                 TensorType_INT8),
            kTfLiteOk);

  // Verify results: a quantize op (opcode 0) remains in front of the FC,
  // while the trailing dequantize is gone.
  EXPECT_EQ(model->subgraphs.size(), 1);
  auto& graph = *model->subgraphs[0];
  EXPECT_EQ(graph.tensors.size(), 3);
  EXPECT_EQ(graph.inputs.size(), 1);
  EXPECT_EQ(graph.inputs[0], 0);
  EXPECT_EQ(graph.outputs.size(), 1);
  EXPECT_EQ(graph.outputs[0], 2);
  EXPECT_EQ(model->operator_codes.size(), 3);
  EXPECT_EQ(graph.operators.size(), 2);
  EXPECT_EQ(graph.operators[0]->opcode_index, 0);
  EXPECT_EQ(graph.operators[1]->opcode_index, 1);

  // Input tensor is now uint8 with the zero point shifted by 128
  // (28 -> 156); the scale is unchanged.
  const OperatorT* quant = graph.operators[0].get();
  const TensorT* in = graph.tensors[quant->inputs[0]].get();
  EXPECT_EQ(in->name, "tensor_0");
  EXPECT_EQ(in->type, TensorType_UINT8);
  EXPECT_FLOAT_EQ(in->quantization->scale[0], 0.35);
  EXPECT_EQ(in->quantization->zero_point[0], 156);

  // Output stays int8 with unchanged quantization parameters.
  const OperatorT* fc = graph.operators[1].get();
  const TensorT* out = graph.tensors[fc->outputs[0]].get();
  EXPECT_EQ(out->name, "tensor_2");
  EXPECT_EQ(out->type, TensorType_INT8);
  EXPECT_FLOAT_EQ(out->quantization->scale[0], 0.12);
  EXPECT_EQ(out->quantization->zero_point[0], 50);
}
439
// Uint8 interface on an int8 model: both boundary ops remain quantize ops
// (opcode 0) converting between uint8 and int8.
TEST(ModelInterface, Uint8SingleInputOutput) {
  auto model = CreateQuantizedModelSingleInputOutput(TensorType_INT8);

  // Rewrite the interface to uint8 on both ends.
  flatbuffers::FlatBufferBuilder builder;
  EXPECT_EQ(ModifyModelInterface(&builder, model.get(), TensorType_UINT8,
                                 TensorType_UINT8),
            kTfLiteOk);

  // Verify results: quantize -> FC -> quantize.
  EXPECT_EQ(model->subgraphs.size(), 1);
  auto& graph = *model->subgraphs[0];
  EXPECT_EQ(graph.tensors.size(), 4);
  EXPECT_EQ(graph.inputs.size(), 1);
  EXPECT_EQ(graph.inputs[0], 0);
  EXPECT_EQ(graph.outputs.size(), 1);
  EXPECT_EQ(graph.outputs[0], 3);
  EXPECT_EQ(model->operator_codes.size(), 3);
  EXPECT_EQ(graph.operators.size(), 3);
  EXPECT_EQ(graph.operators[0]->opcode_index, 0);
  EXPECT_EQ(graph.operators[1]->opcode_index, 1);
  EXPECT_EQ(graph.operators[2]->opcode_index, 0);

  // Input: uint8, zero point shifted by 128 (28 -> 156), scale unchanged.
  const OperatorT* in_quant = graph.operators[0].get();
  const TensorT* in = graph.tensors[in_quant->inputs[0]].get();
  EXPECT_EQ(in->name, "tensor_0");
  EXPECT_EQ(in->type, TensorType_UINT8);
  EXPECT_FLOAT_EQ(in->quantization->scale[0], 0.35);
  EXPECT_EQ(in->quantization->zero_point[0], 156);

  // Output: uint8, zero point shifted by 128 (50 -> 178), scale unchanged.
  const OperatorT* out_quant = graph.operators[2].get();
  const TensorT* out = graph.tensors[out_quant->outputs[0]].get();
  EXPECT_EQ(out->name, "tensor_3");
  EXPECT_EQ(out->type, TensorType_UINT8);
  EXPECT_FLOAT_EQ(out->quantization->scale[0], 0.12);
  EXPECT_EQ(out->quantization->zero_point[0], 178);
}
476
// Uint8 interface on an int8 model with multiple inputs/outputs: every
// boundary op remains a quantize op (opcode 0).
TEST(ModelInterface, Uint8MutipleInputOutput) {
  auto model = CreateQuantizedModelMultipleInputOutput(TensorType_INT8);

  // Rewrite the interface to uint8 on both ends.
  flatbuffers::FlatBufferBuilder builder;
  EXPECT_EQ(ModifyModelInterface(&builder, model.get(), TensorType_UINT8,
                                 TensorType_UINT8),
            kTfLiteOk);

  // Verify results: 2x quantize -> FC -> 2x quantize.
  EXPECT_EQ(model->subgraphs.size(), 1);
  auto& graph = *model->subgraphs[0];
  EXPECT_EQ(graph.tensors.size(), 8);
  EXPECT_EQ(graph.inputs.size(), 2);
  EXPECT_EQ(graph.inputs[0], 0);
  EXPECT_EQ(graph.inputs[1], 1);
  EXPECT_EQ(graph.outputs.size(), 2);
  EXPECT_EQ(graph.outputs[0], 6);
  EXPECT_EQ(graph.outputs[1], 7);
  EXPECT_EQ(model->operator_codes.size(), 3);
  EXPECT_EQ(graph.operators.size(), 5);
  EXPECT_EQ(graph.operators[0]->opcode_index, 0);
  EXPECT_EQ(graph.operators[1]->opcode_index, 0);
  EXPECT_EQ(graph.operators[2]->opcode_index, 1);
  EXPECT_EQ(graph.operators[3]->opcode_index, 0);
  EXPECT_EQ(graph.operators[4]->opcode_index, 0);

  // Inputs: uint8, zero points shifted by 128 (28 -> 156, 50 -> 178).
  const OperatorT* in_quant_1 = graph.operators[0].get();
  const TensorT* in_1 = graph.tensors[in_quant_1->inputs[0]].get();
  EXPECT_EQ(in_1->name, "tensor_0");
  EXPECT_EQ(in_1->type, TensorType_UINT8);
  EXPECT_FLOAT_EQ(in_1->quantization->scale[0], 0.35);
  EXPECT_EQ(in_1->quantization->zero_point[0], 156);

  const OperatorT* in_quant_2 = graph.operators[1].get();
  const TensorT* in_2 = graph.tensors[in_quant_2->inputs[0]].get();
  EXPECT_EQ(in_2->name, "tensor_1");
  EXPECT_EQ(in_2->type, TensorType_UINT8);
  EXPECT_FLOAT_EQ(in_2->quantization->scale[0], 0.12);
  EXPECT_EQ(in_2->quantization->zero_point[0], 178);

  // Outputs: uint8, zero points shifted by 128 (28 -> 156, 50 -> 178).
  const OperatorT* out_quant_1 = graph.operators[3].get();
  const TensorT* out_1 = graph.tensors[out_quant_1->outputs[0]].get();
  EXPECT_EQ(out_1->name, "tensor_6");
  EXPECT_EQ(out_1->type, TensorType_UINT8);
  EXPECT_FLOAT_EQ(out_1->quantization->scale[0], 0.45);
  EXPECT_EQ(out_1->quantization->zero_point[0], 156);

  const OperatorT* out_quant_2 = graph.operators[4].get();
  const TensorT* out_2 = graph.tensors[out_quant_2->outputs[0]].get();
  EXPECT_EQ(out_2->name, "tensor_7");
  EXPECT_EQ(out_2->type, TensorType_UINT8);
  EXPECT_FLOAT_EQ(out_2->quantization->scale[0], 0.22);
  EXPECT_EQ(out_2->quantization->zero_point[0], 178);
}
533
// Int8 interface on an int8 model: the boundary ops are removed outright
// and the quantized tensors become the model interface.
TEST(ModelInterface, Int8MutipleInputOutput) {
  auto model = CreateQuantizedModelMultipleInputOutput(TensorType_INT8);

  // Rewrite the interface to int8 on both ends.
  flatbuffers::FlatBufferBuilder builder;
  EXPECT_EQ(ModifyModelInterface(&builder, model.get(), TensorType_INT8,
                                 TensorType_INT8),
            kTfLiteOk);

  // Verify results: only the FC op remains.
  EXPECT_EQ(model->subgraphs.size(), 1);
  auto& graph = *model->subgraphs[0];
  // TODO(mnatraj): The two float input tensors have not been removed.
  // EXPECT_EQ(graph.tensors.size(), 4);
  EXPECT_EQ(graph.tensors.size(), 6);
  EXPECT_EQ(graph.inputs.size(), 2);
  EXPECT_EQ(graph.inputs[0], 2);
  EXPECT_EQ(graph.inputs[1], 3);
  EXPECT_EQ(graph.outputs.size(), 2);
  EXPECT_EQ(graph.outputs[0], 4);
  EXPECT_EQ(graph.outputs[1], 5);
  EXPECT_EQ(model->operator_codes.size(), 3);
  EXPECT_EQ(graph.operators.size(), 1);
  EXPECT_EQ(graph.operators[0]->opcode_index, 1);

  const OperatorT* fc = graph.operators[0].get();

  // All four interface tensors keep their original quantization parameters.
  const TensorT* in_1 = graph.tensors[fc->inputs[0]].get();
  EXPECT_EQ(in_1->name, "tensor_2");
  EXPECT_EQ(in_1->type, TensorType_INT8);
  EXPECT_FLOAT_EQ(in_1->quantization->scale[0], 0.35);
  EXPECT_EQ(in_1->quantization->zero_point[0], 28);

  const TensorT* in_2 = graph.tensors[fc->inputs[1]].get();
  EXPECT_EQ(in_2->name, "tensor_3");
  EXPECT_EQ(in_2->type, TensorType_INT8);
  EXPECT_FLOAT_EQ(in_2->quantization->scale[0], 0.12);
  EXPECT_EQ(in_2->quantization->zero_point[0], 50);

  const TensorT* out_1 = graph.tensors[fc->outputs[0]].get();
  EXPECT_EQ(out_1->name, "tensor_4");
  EXPECT_EQ(out_1->type, TensorType_INT8);
  EXPECT_FLOAT_EQ(out_1->quantization->scale[0], 0.45);
  EXPECT_EQ(out_1->quantization->zero_point[0], 28);

  const TensorT* out_2 = graph.tensors[fc->outputs[1]].get();
  EXPECT_EQ(out_2->name, "tensor_5");
  EXPECT_EQ(out_2->type, TensorType_INT8);
  EXPECT_FLOAT_EQ(out_2->quantization->scale[0], 0.22);
  EXPECT_EQ(out_2->quantization->zero_point[0], 50);
}
584
// Uint8QuantizeModelInputsOutputs on a float model: new uint8 interface
// tensors are added and wired through dequantize/quantize ops.
TEST(ModelInterface, Float) {
  // Build a float model and serialize it so we can hand a packed Model* to
  // the API under test.
  std::unique_ptr<ModelT> input_model_t = CreateFloatModel();
  flatbuffers::FlatBufferBuilder builder_temp;
  flatbuffers::Offset<Model> output_model_location =
      Model::Pack(builder_temp, input_model_t.get());
  FinishModelBuffer(builder_temp, output_model_location);
  const Model* input_model = GetModel(builder_temp.GetBufferPointer());

  // Attach uint8 quantization to the named input and output tensors.
  flatbuffers::FlatBufferBuilder builder;
  EXPECT_EQ(Uint8QuantizeModelInputsOutputs(&builder, input_model,
                                            {{"tensor_0", {0.4, 2}}},
                                            {{"tensor_1", {0.5, -5}}}),
            kTfLiteOk);

  // Unpack the rewritten model for inspection.
  std::unique_ptr<ModelT> model(GetModel(builder.GetBufferPointer())->UnPack());

  // Verify results: dequantize and quantize op codes were appended.
  EXPECT_EQ(model->subgraphs.size(), 1);
  auto& graph = *model->subgraphs[0];
  EXPECT_EQ(graph.tensors.size(), 4);
  EXPECT_EQ(graph.inputs.size(), 1);
  EXPECT_EQ(graph.inputs[0], 0);
  EXPECT_EQ(graph.outputs.size(), 1);
  EXPECT_EQ(graph.outputs[0], 1);
  EXPECT_EQ(model->operator_codes.size(), 3);
  EXPECT_EQ(GetBuiltinCode(model->operator_codes[0].get()),
            BuiltinOperator_FULLY_CONNECTED);
  EXPECT_EQ(GetBuiltinCode(model->operator_codes[1].get()),
            BuiltinOperator_DEQUANTIZE);
  EXPECT_EQ(GetBuiltinCode(model->operator_codes[2].get()),
            BuiltinOperator_QUANTIZE);
  EXPECT_EQ(graph.operators.size(), 3);

  // The new uint8 input feeds a dequantize op and carries the requested
  // quantization parameters.
  const OperatorT* dequant = graph.operators[0].get();
  const TensorT* in = graph.tensors[dequant->inputs[0]].get();
  EXPECT_EQ(in->name, "tensor_0_uint8");
  EXPECT_EQ(in->type, TensorType_UINT8);
  EXPECT_FLOAT_EQ(in->quantization->scale[0], 0.4);
  EXPECT_EQ(in->quantization->zero_point[0], 2);

  // A quantize op produces the new uint8 output.
  const OperatorT* quant = graph.operators[2].get();
  const TensorT* out = graph.tensors[quant->outputs[0]].get();
  EXPECT_EQ(out->name, "tensor_1_uint8");
  EXPECT_EQ(out->type, TensorType_UINT8);
  EXPECT_FLOAT_EQ(out->quantization->scale[0], 0.5);
  EXPECT_EQ(out->quantization->zero_point[0], -5);
}
637
638 } // namespace
639 } // namespace optimize
640 } // namespace tflite
641
// Test entry point: hand command-line flags to gtest, then run all tests.
int main(int argc, char** argv) {
  ::testing::InitGoogleTest(&argc, argv);
  return RUN_ALL_TESTS();
}
646