ONE - On-device Neural Engine
Quantize.cpp
/*
 * Copyright (c) 2022 Samsung Electronics Co., Ltd. All Rights Reserved
 *
 * Licensed under the Apache License, Version 2.0 (the "License");
 * you may not use this file except in compliance with the License.
 * You may obtain a copy of the License at
 *
 *    http://www.apache.org/licenses/LICENSE-2.0
 *
 * Unless required by applicable law or agreed to in writing, software
 * distributed under the License is distributed on an "AS IS" BASIS,
 * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
 * See the License for the specific language governing permissions and
 * limitations under the License.
 */

#include "kernels/Quantize.h"
#include "kernels/Utils.h"
#include "PALQuantize.h"

namespace luci_interpreter
{
namespace kernels
{

namespace
{

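// Rescales data that is already quantized (S8 / U8 / S16) to the output tensor's scale and
// zero point. The effective rescale factor (input_scale / output_scale) is folded into a
// 32-bit fixed-point multiplier and a power-of-two shift by quantizeMultiplier(), and the
// per-element work is delegated to the PAL Requantize routine.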
template <typename input_dtype> void call_requantize(const Tensor *input, Tensor *output)
{
  int32_t multiplier;
  int shift;

  const double effective_output_scale = input->scale() / output->scale();
  quantizeMultiplier(effective_output_scale, &multiplier, &shift);

  const auto input_shape = getTensorShape(input);
  const auto output_shape = getTensorShape(output);
  const auto size = tflite::MatchingFlatSize(input_shape, output_shape);

  const auto input_data = getTensorData<input_dtype>(input);

  switch (output->element_type())
  {
    case loco::DataType::S8:
      luci_interpreter_pal::Requantize(input_data, size, multiplier, shift, input->zero_point(),
                                       output->zero_point(), getTensorData<int8_t>(output));
      break;
    case loco::DataType::U8:
      luci_interpreter_pal::Requantize(input_data, size, multiplier, shift, input->zero_point(),
                                       output->zero_point(), getTensorData<uint8_t>(output));
      break;
    case loco::DataType::S16:
      luci_interpreter_pal::Requantize(input_data, size, multiplier, shift, input->zero_point(),
                                       output->zero_point(), getTensorData<int16_t>(output));
      break;
    default:
      throw std::runtime_error("Unsupported quantized type, yet!");
  }
}

} // namespace

Quantize::Quantize(const Tensor *input, Tensor *output) : Kernel({input}, {output}) {}

// configure() checks that the requested input/output type combination is supported and
// resizes the output tensor to the input shape.
void Quantize::configure()
{

  if (input()->element_type() == loco::DataType::S16)
    LUCI_INTERPRETER_CHECK(input()->zero_point() == 0);

  switch (input()->element_type())
  {
    case loco::DataType::FLOAT32:
    {
      LUCI_INTERPRETER_CHECK(output()->element_type() == loco::DataType::U8 ||
                             output()->element_type() == loco::DataType::S8 ||
                             output()->element_type() == loco::DataType::S16);
      break;
    }
    case loco::DataType::S16:
    case loco::DataType::S8:
    case loco::DataType::U8:
    {
      LUCI_INTERPRETER_CHECK(output()->element_type() == loco::DataType::S8 ||
                             output()->element_type() == loco::DataType::U8 ||
                             output()->element_type() == loco::DataType::S16);
      if (output()->element_type() == loco::DataType::S16)
      {
        LUCI_INTERPRETER_CHECK(output()->zero_point() == 0);
      }
      break;
    }
    default:
      throw std::runtime_error("Unsupported type");
  }

  output()->resize(input()->shape());
}

// execute() dispatches on the input element type: FLOAT32 data is quantized with the PAL
// Quantize routine, while already-quantized data is rescaled through call_requantize().
void Quantize::execute() const
{
  switch (input()->element_type())
  {
    case loco::DataType::FLOAT32:
    {
      tflite::QuantizationParams op_params;
      op_params.zero_point = output()->zero_point();
      op_params.scale = output()->scale();
      const auto input_data = getTensorData<float>(input());

      switch (output()->element_type())
      {
        case loco::DataType::S8:
        {
          luci_interpreter_pal::Quantize(op_params, getTensorShape(input()), input_data,
                                         getTensorShape(output()), getTensorData<int8_t>(output()));
          break;
        }
        case loco::DataType::U8:
        {
          luci_interpreter_pal::Quantize(op_params, getTensorShape(input()), input_data,
                                         getTensorShape(output()),
                                         getTensorData<uint8_t>(output()));
          break;
        }
        case loco::DataType::S16:
        {
          luci_interpreter_pal::Quantize(op_params, getTensorShape(input()), input_data,
                                         getTensorShape(output()),
                                         getTensorData<int16_t>(output()));
          break;
        }
        default:
          throw std::runtime_error("luci-intp Quantize(1) Unsupported type.");
      }
      break;
    }
    case loco::DataType::S16:
    {
      call_requantize<int16_t>(input(), output());
      break;
    }
    case loco::DataType::S8:
    {
      call_requantize<int8_t>(input(), output());
      break;
    }
    case loco::DataType::U8:
    {
      call_requantize<uint8_t>(input(), output());
      break;
    }
    default:
      throw std::runtime_error("luci-intp Quantize(2) Unsupported type.");
  }
}

} // namespace kernels
} // namespace luci_interpreter
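As a quick reference for the arithmetic these PAL calls stand for: quantization maps a real value x to q = round(x / scale) + zero_point, and requantization rescales an already-quantized value by the effective scale input_scale / output_scale. The sketch below is a minimal scalar illustration of both paths, assuming int8 output for simplicity; it is not the luci_interpreter_pal implementation (which operates on whole tensors and performs requantization in fixed-point integer arithmetic), and the helpers quantize_value and requantize_value are hypothetical names introduced only for this example.

#include <algorithm>
#include <cmath>
#include <cstdint>
#include <iostream>

// Float -> quantized: q = clamp(round(x / scale) + zero_point), clamped to the int8 range here.
std::int8_t quantize_value(float x, float scale, std::int32_t zero_point)
{
  const std::int32_t q = static_cast<std::int32_t>(std::round(x / scale)) + zero_point;
  return static_cast<std::int8_t>(std::min<std::int32_t>(127, std::max<std::int32_t>(-128, q)));
}

// Quantized -> quantized: rescale by effective_scale = in_scale / out_scale, the same factor
// that call_requantize() above turns into a fixed-point multiplier and shift.
std::int8_t requantize_value(std::int32_t q_in, std::int32_t in_zero_point, float in_scale,
                             std::int32_t out_zero_point, float out_scale)
{
  const float effective_scale = in_scale / out_scale;
  const std::int32_t q =
    static_cast<std::int32_t>(std::round((q_in - in_zero_point) * effective_scale)) +
    out_zero_point;
  return static_cast<std::int8_t>(std::min<std::int32_t>(127, std::max<std::int32_t>(-128, q)));
}

int main()
{
  // 0.5 with scale 0.05 and zero point -10 quantizes to round(0.5 / 0.05) - 10 = 0.
  std::cout << static_cast<int>(quantize_value(0.5f, 0.05f, -10)) << "\n";
  // q = 20 under (scale 0.05, zero point -10) represents 1.5; requantizing to
  // (scale 0.1, zero point 0) gives round((20 + 10) * 0.5) = 15, the same real value.
  std::cout << static_cast<int>(requantize_value(20, -10, 0.05f, 0, 0.1f)) << "\n";
  return 0;
}

In the kernel itself, quantizeMultiplier() converts effective_scale into an integer multiplier and shift once per call, so the per-element requantization loop can avoid floating-point math.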