ONE - On-device Neural Engine
BinaryArithmeticLayer.cc
/*
 * Copyright (c) 2020 Samsung Electronics Co., Ltd. All Rights Reserved
 *
 * Licensed under the Apache License, Version 2.0 (the "License");
 * you may not use this file except in compliance with the License.
 * You may obtain a copy of the License at
 *
 *      http://www.apache.org/licenses/LICENSE-2.0
 *
 * Unless required by applicable law or agreed to in writing, software
 * distributed under the License is distributed on an "AS IS" BASIS,
 * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
 * See the License for the specific language governing permissions and
 * limitations under the License.
 */

#include "BinaryArithmeticLayer.h"

#include <cker/operation/BinaryArithmeticOps.h>

namespace onert::backend::cpu::ops
{

namespace
{

template <nnfw::cker::BinaryArithmeticOpType arithmetic_type, typename T> struct Eval
{
  nnfw::cker::Shape _lhs_shape;
  nnfw::cker::Shape _rhs_shape;
  nnfw::cker::Shape _output_shape;
  nnfw::cker::BinaryArithmeticOpParam _op_params;
  bool _need_broadcast;

  Eval(const IPortableTensor *lhs, const IPortableTensor *rhs, IPortableTensor *output,
       nnfw::cker::BinaryArithmeticOpParam op_params)
    : _op_params(std::move(op_params)), _need_broadcast(false)
  {
    if (!output->is_dynamic())
      updateCache(lhs, rhs, output);
  }

  void updateCache(const IPortableTensor *lhs, const IPortableTensor *rhs, IPortableTensor *output)
  {
    _lhs_shape.ReplaceWith(getShape(lhs));
    _rhs_shape.ReplaceWith(getShape(rhs));
    _output_shape.ReplaceWith(getShape(output));
    _need_broadcast = nnfw::cker::ProcessBroadcastShapes(_lhs_shape, _rhs_shape, &_op_params);
  }

  void operator()(const IPortableTensor *lhs, const IPortableTensor *rhs, IPortableTensor *output)
  {
    // Assume dynamic tensors never become static and static ones never change shape since
    // configure()
    if (output->is_dynamic())
      updateCache(lhs, rhs, output);
    else
      assert(_lhs_shape == getShape(lhs) && _rhs_shape == getShape(rhs) &&
             _output_shape == getShape(output));
    auto lhs_buffer = getBuffer<T>(lhs);
    auto rhs_buffer = getBuffer<T>(rhs);
    auto output_buffer = getBuffer<T>(output);
    if (_need_broadcast)
    {
      nnfw::cker::BroadcastBinaryArithmeticOp<arithmetic_type>(
        _op_params, _lhs_shape, lhs_buffer, _rhs_shape, rhs_buffer, _output_shape, output_buffer);
    }
    else
    {
      nnfw::cker::BinaryArithmeticOp<arithmetic_type>(
        _op_params, _lhs_shape, lhs_buffer, _rhs_shape, rhs_buffer, _output_shape, output_buffer);
    }
  }
};
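
// Illustrative note (not part of the original source): for static tensors the Eval
// functor above caches the shapes once at construction. ProcessBroadcastShapes
// compares the two input shapes and returns true only when broadcasting is needed,
// e.g. with assumed shapes:
//   lhs {2, 3}, rhs {2, 3} -> _need_broadcast == false, element-wise kernel is used
//   lhs {2, 3}, rhs {1, 3} -> _need_broadcast == true,  broadcast kernel is used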

template <nnfw::cker::BinaryArithmeticOpType arithmetic_type>
std::function<void(const IPortableTensor *, const IPortableTensor *, IPortableTensor *)>
generateKernelGeneric(const IPortableTensor *lhs, const IPortableTensor *rhs,
                      IPortableTensor *output, const ir::Activation activation,
                      nnfw::cker::BinaryArithmeticOpParam op_params)
{
  switch (lhs->data_type())
  {
    case OperandType::FLOAT32:
    {
      float output_activation_min = 0, output_activation_max = 0;
      CalculateActivationRange(activation, &output_activation_min, &output_activation_max);
      op_params.float_activation_max = output_activation_max;
      op_params.float_activation_min = output_activation_min;
      return Eval<arithmetic_type, float>(lhs, rhs, output, op_params);
      break;
    }
    case OperandType::INT32:
    {
      int32_t output_activation_min = 0, output_activation_max = 0;
      CalculateActivationRange(activation, &output_activation_min, &output_activation_max);
      op_params.quantized_activation_max = output_activation_max;
      op_params.quantized_activation_min = output_activation_min;
      return Eval<arithmetic_type, int32_t>(lhs, rhs, output, op_params);
      break;
    }
    case OperandType::INT64:
    {
      int64_t output_activation_min = 0, output_activation_max = 0;
      CalculateActivationRange(activation, &output_activation_min, &output_activation_max);
      op_params.int64_activation_max = output_activation_max;
      op_params.int64_activation_min = output_activation_min;
      return Eval<arithmetic_type, int64_t>(lhs, rhs, output, op_params);
      break;
    }
    case OperandType::BOOL8:
    {
      if (activation != ir::Activation::NONE)
        throw std::runtime_error(
          "BinaryArithmetic(generic): Fused activation is not supported with bool8 type");
      int32_t output_activation_min = 0, output_activation_max = 0;
      CalculateActivationRange(activation, &output_activation_min, &output_activation_max);
      static_assert(sizeof(bool) == 1, "cpu backend supports bool type which is 1 byte");
      return Eval<arithmetic_type, bool>(lhs, rhs, output, op_params);
      break;
    }
    default:
      throw std::runtime_error{"BinaryArithmetic(generic): Unsupported data type"};
  }
}
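
// Illustrative example for generateKernelGeneric above (assumed mapping, not part of
// the original source): CalculateActivationRange turns the fused activation into a
// clamp range for the kernel, e.g. for FLOAT32:
//   ir::Activation::NONE  -> [lowest float, max float] (effectively no clamp)
//   ir::Activation::RELU  -> [0, max float]
//   ir::Activation::RELU6 -> [0, 6]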

void setAddOrSubQuant8Params(const IPortableTensor *lhs, const IPortableTensor *rhs,
                             IPortableTensor *output, ir::Activation activation,
                             nnfw::cker::BinaryArithmeticOpParam *params)
{
  int32_t output_activation_min, output_activation_max;
  CalculateActivationRangeQuantized(activation, output, &output_activation_min,
                                    &output_activation_max);
  nnfw::cker::BinaryArithmeticOpParam &op_params = *params;
  op_params.quantized_activation_max = output_activation_max;
  op_params.quantized_activation_min = output_activation_min;
  // Parameters for scaled quantized computation
  op_params.left_shift = 20;
  // Zero-points of input and output tensors
  op_params.input1_offset = -lhs->data_zero_point();
  op_params.input2_offset = -rhs->data_zero_point();
  op_params.output_offset = output->data_zero_point();

  // Compute normalized scales for the lhs and rhs values,
  // and represent them in 32-bit fixed point
  const double norm_max_scale = 2 * std::max(lhs->data_scale(), rhs->data_scale());
  const double real_lhs_scale = lhs->data_scale() / norm_max_scale;
  const double real_rhs_scale = rhs->data_scale() / norm_max_scale;
  // The output scale is used to normalize the final result, so we invert the scale here
  const double real_output_scale =
    norm_max_scale / (output->data_scale() * (1 << op_params.left_shift));

  // Represent the scales as fixed int32_t multipliers and int32_t shifts
  QuantizeMultiplier(real_lhs_scale, &op_params.input1_multiplier, &op_params.input1_shift);
  QuantizeMultiplier(real_rhs_scale, &op_params.input2_multiplier, &op_params.input2_shift);
  QuantizeMultiplier(real_output_scale, &op_params.output_multiplier, &op_params.output_shift);
}
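
// Worked example for setAddOrSubQuant8Params above (assumed scales, not part of the
// original source):
//   lhs scale = 0.5, rhs scale = 0.25, output scale = 1.0
//   norm_max_scale    = 2 * max(0.5, 0.25)        = 1.0
//   real_lhs_scale    = 0.5  / 1.0                = 0.5
//   real_rhs_scale    = 0.25 / 1.0                = 0.25
//   real_output_scale = 1.0 / (1.0 * (1 << 20))  ~= 9.54e-7
// QuantizeMultiplier encodes each real scale as a Q31 integer multiplier plus a
// power-of-two shift. The kernel shifts the zero-point-adjusted inputs left by 20 bits,
// applies the per-input multipliers, adds the two terms, then rescales the sum with
// the output multiplier and adds the output zero point.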

void setMulQuant8Params(const IPortableTensor *lhs, const IPortableTensor *rhs,
                        IPortableTensor *output, ir::Activation activation,
                        nnfw::cker::BinaryArithmeticOpParam *params)
{
  int32_t output_activation_min, output_activation_max;
  CalculateActivationRangeQuantized(activation, output, &output_activation_min,
                                    &output_activation_max);
  nnfw::cker::BinaryArithmeticOpParam &op_params = *params;

  op_params.quantized_activation_max = output_activation_max;
  op_params.quantized_activation_min = output_activation_min;
  op_params.input1_offset = -lhs->data_zero_point();
  op_params.input2_offset = -rhs->data_zero_point();
  op_params.output_offset = output->data_zero_point();

  double real_multiplier = lhs->data_scale() * rhs->data_scale() / output->data_scale();
  QuantizeMultiplier(real_multiplier, &op_params.output_multiplier, &op_params.output_shift);
}
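
// Illustrative note for setMulQuant8Params above (assumed scales, not part of the
// original source): for quantized MUL the combined rescale is simply
// (lhs_scale * rhs_scale) / output_scale. With scales 0.5, 0.25 and 0.1 the real
// multiplier is 1.25, which QuantizeMultiplier encodes as a Q31 multiplier for 0.625
// together with a left shift of 1.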

} // namespace

void BinaryArithmeticLayer::configure(const IPortableTensor *lhs, const IPortableTensor *rhs,
                                      IPortableTensor *output, const ir::Activation activation,
                                      const ArithmeticType arithmetic_type)
{
  assert(lhs != nullptr);
  assert(rhs != nullptr);
  assert(output != nullptr);

  _lhs = lhs;
  _rhs = rhs;
  _output = output;

  nnfw::cker::BinaryArithmeticOpParam op_params;
  switch (arithmetic_type)
  {
    case ArithmeticType::kAdd:
      if (_lhs->data_type() == OperandType::QUANT_UINT8_ASYMM)
      {
        setAddOrSubQuant8Params(_lhs, _rhs, _output, activation, &op_params);
        _kernel =
          Eval<nnfw::cker::BinaryArithmeticOpType::ADD, uint8_t>(_lhs, _rhs, _output, op_params);
      }
      else if (_lhs->data_type() == OperandType::QUANT_INT8_ASYMM)
      {
        setAddOrSubQuant8Params(_lhs, _rhs, _output, activation, &op_params);
        _kernel =
          Eval<nnfw::cker::BinaryArithmeticOpType::ADD, int8_t>(_lhs, _rhs, _output, op_params);
      }
      else
      {
        _kernel = generateKernelGeneric<nnfw::cker::BinaryArithmeticOpType::ADD>(
          _lhs, _rhs, _output, activation, op_params);
      }
      break;
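    // Note (explanatory comment, not in the original source): the quantized SUB path
    // below reuses the ADD parameter setup and negates the second input's fixed-point
    // multiplier, so the same scaled-accumulate kernel computes lhs - rhs.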
    case ArithmeticType::kSub:
      if (_lhs->data_type() == OperandType::QUANT_UINT8_ASYMM)
      {
        setAddOrSubQuant8Params(_lhs, _rhs, _output, activation, &op_params);
        op_params.input2_multiplier *= -1;
        _kernel =
          Eval<nnfw::cker::BinaryArithmeticOpType::SUB, uint8_t>(_lhs, _rhs, _output, op_params);
      }
      else if (_lhs->data_type() == OperandType::QUANT_INT8_ASYMM)
      {
        setAddOrSubQuant8Params(_lhs, _rhs, _output, activation, &op_params);
        op_params.input2_multiplier *= -1;
        _kernel =
          Eval<nnfw::cker::BinaryArithmeticOpType::SUB, int8_t>(_lhs, _rhs, _output, op_params);
      }
      else
      {
        _kernel = generateKernelGeneric<nnfw::cker::BinaryArithmeticOpType::SUB>(
          _lhs, _rhs, _output, activation, op_params);
      }
      break;
    case ArithmeticType::kMul:
      if (_lhs->data_type() == OperandType::QUANT_UINT8_ASYMM)
      {
        setMulQuant8Params(_lhs, _rhs, _output, activation, &op_params);
        _kernel =
          Eval<nnfw::cker::BinaryArithmeticOpType::MUL, uint8_t>(_lhs, _rhs, _output, op_params);
      }
      else if (_lhs->data_type() == OperandType::QUANT_INT8_ASYMM)
      {
        setMulQuant8Params(_lhs, _rhs, _output, activation, &op_params);
        _kernel =
          Eval<nnfw::cker::BinaryArithmeticOpType::MUL, int8_t>(_lhs, _rhs, _output, op_params);
      }
      else
      {
        _kernel = generateKernelGeneric<nnfw::cker::BinaryArithmeticOpType::MUL>(
          _lhs, _rhs, _output, activation, op_params);
      }
      break;
    case ArithmeticType::kDiv:
      if (_lhs->data_type() == OperandType::FLOAT32)
      {
        _kernel = generateKernelGeneric<nnfw::cker::BinaryArithmeticOpType::DIV>(
          _lhs, _rhs, _output, activation, op_params);
      }
      else
      {
        // TODO Support quantized type
        // TODO Support integer type with zero check
        throw std::runtime_error{
          "BinaryArithmetic(Div): Div operation does not support non-float data types yet"};
      }
      break;
    default:
      throw std::runtime_error{"BinaryArithmetic: Unsupported BinaryArithmetic type"};
  }
}

void BinaryArithmeticLayer::run() { _kernel(_lhs, _rhs, _output); }

} // namespace onert::backend::cpu::ops
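
Usage sketch (illustrative, not part of BinaryArithmeticLayer.cc): the cpu backend typically constructs the layer, calls configure() once with the operand tensors, the fused activation and the arithmetic type, and then invokes run() for every execution. The tensor pointers lhs, rhs and out below are assumed to come from the backend's tensor registry; the default-constructed layer and the ArithmeticType spelling are assumptions based on the calls visible in this file.

// Hypothetical caller code; tensor variables are assumed, not defined in this file.
using namespace onert::backend::cpu::ops;

auto layer = std::make_unique<BinaryArithmeticLayer>();
layer->configure(lhs, rhs, out, ir::Activation::NONE, ArithmeticType::kAdd);
layer->run(); // executes the selected kernel: out = lhs + rhs (broadcast if needed)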