ONE - On-device Neural Engine
Loading...
Searching...
No Matches
BinaryArithmeticOps.h
Go to the documentation of this file.
1/*
2 * Copyright (c) 2020 Samsung Electronics Co., Ltd. All Rights Reserved
3 * Copyright 2017 The TensorFlow Authors. All Rights Reserved.
4 *
5 * Licensed under the Apache License, Version 2.0 (the "License");
6 * you may not use this file except in compliance with the License.
7 * You may obtain a copy of the License at
8 *
9 * http://www.apache.org/licenses/LICENSE-2.0
10 *
11 * Unless required by applicable law or agreed to in writing, software
12 * distributed under the License is distributed on an "AS IS" BASIS,
13 * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
14 * See the License for the specific language governing permissions and
15 * limitations under the License.
16 */
17
18#ifndef __NNFW_CKER_REFERENCE_BINARYARITHMETICOPS_H__
19#define __NNFW_CKER_REFERENCE_BINARYARITHMETICOPS_H__
20
#include "cker/Shape.h"
#include "cker/Types.h"
#include "cker/Utils.h"

#include <cmath>
#include <cstdint>
#include <functional>
26
27namespace nnfw
28{
29namespace cker
30{
31namespace reference
32{
33
34// Maximum dimension supported by the broadcast operation.
35constexpr int kMaxBroadcastDim = 6;
36
37template <typename T>
38inline void BinaryArithmeticOp(const BinaryArithmeticOpParam &params, const Shape &input1_shape,
39 const T *input1_data, const Shape &input2_shape,
40 const T *input2_data, const Shape &output_shape, T *output_data,
41 const std::function<T(const T &, const T &)> &fn)
42{
43 const int32_t flat_size = MatchingElementsSize(input1_shape, input2_shape, output_shape);
44 for (int i = 0; i < flat_size; ++i)
45 {
46 output_data[i] = ActivationFunctionWithMinMax(fn(input1_data[i], input2_data[i]),
49 }
50}
51
52template <>
53inline void BinaryArithmeticOp(const BinaryArithmeticOpParam &params, const Shape &input1_shape,
54 const float *input1_data, const Shape &input2_shape,
55 const float *input2_data, const Shape &output_shape,
56 float *output_data,
57 const std::function<float(const float &, const float &)> &fn)
58{
59 const int size = MatchingElementsSize(input1_shape, input2_shape, output_shape);
60 for (int i = 0; i < size; i++)
61 {
62 output_data[i] = ActivationFunctionWithMinMax(
63 fn(input1_data[i], input2_data[i]), params.float_activation_min, params.float_activation_max);
64 }
65}
66
67template <>
68inline void BinaryArithmeticOp(const BinaryArithmeticOpParam &, const Shape &input1_shape,
69 const bool *input1_data, const Shape &input2_shape,
70 const bool *input2_data, const Shape &output_shape,
71 bool *output_data,
72 const std::function<bool(const bool &, const bool &)> &fn)
73{
74 const int size = MatchingElementsSize(input1_shape, input2_shape, output_shape);
75 for (int i = 0; i < size; i++)
76 {
77 output_data[i] = fn(input1_data[i], input2_data[i]);
78 }
79}
80
81template <>
82inline void BinaryArithmeticOp(const BinaryArithmeticOpParam &params, const Shape &input1_shape,
83 const int64_t *input1_data, const Shape &input2_shape,
84 const int64_t *input2_data, const Shape &output_shape,
85 int64_t *output_data,
86 const std::function<int64_t(const int64_t &, const int64_t &)> &fn)
87{
88 const int flat_size = MatchingElementsSize(input1_shape, input2_shape, output_shape);
89 for (int i = 0; i < flat_size; ++i)
90 {
91 output_data[i] = ActivationFunctionWithMinMax(
92 fn(input1_data[i], input2_data[i]), params.int64_activation_min, params.int64_activation_max);
93 }
94}
95
96template <typename T>
97inline typename std::enable_if_t<is_quant8<T>::value> BroadcastBinaryArithmeticOpSlow(
98 const BinaryArithmeticOpParam &params, const Shape &input1_shape, const T *input1_data,
99 const Shape &input2_shape, const T *input2_data, const Shape &output_shape, T *output_data,
100 const std::function<T(const BinaryArithmeticOpParam &params, const T &, const T &)> &fn)
101{
104 NdArrayDescsForElementwiseBroadcast(input1_shape, input2_shape, &desc1, &desc2);
105 const Shape extended_output_shape = Shape::ExtendedShape(kMaxBroadcastDim, output_shape);
106
107 // Comment from tensorflow lite:
108 //
109 // In Tensorflow, the dimensions are canonically named (batch_number, row,
110 // col, channel), with extents (batches, height, width, depth), with the
111 // trailing dimension changing most rapidly (channels has the smallest stride,
112 // typically 1 element).
113 //
114 // In generated C code, we store arrays with the dimensions reversed. The
115 // first dimension has smallest stride.
116 //
117 // We name our variables by their Tensorflow convention, but generate C code
118 // nesting loops such that the innermost loop has the smallest stride for the
119 // best cache behavior.
120 for (int d0 = 0; d0 < extended_output_shape.Dims(0); ++d0)
121 {
122 for (int d1 = 0; d1 < extended_output_shape.Dims(1); ++d1)
123 {
124 for (int d2 = 0; d2 < extended_output_shape.Dims(2); ++d2)
125 {
126 for (int d3 = 0; d3 < extended_output_shape.Dims(3); ++d3)
127 {
128 for (int d4 = 0; d4 < extended_output_shape.Dims(4); ++d4)
129 {
130 for (int d5 = 0; d5 < extended_output_shape.Dims(5); ++d5)
131 {
132 output_data[Offset(extended_output_shape, d0, d1, d2, d3, d4, d5)] =
133 ActivationFunctionWithMinMax<T>(
134 fn(params, input1_data[SubscriptToIndex(desc1, d0, d1, d2, d3, d4, d5)],
135 input2_data[SubscriptToIndex(desc2, d0, d1, d2, d3, d4, d5)]),
137 }
138 }
139 }
140 }
141 }
142 }
143}
144template <typename T>
146 const Shape &input1_shape, const T *input1_data,
147 const Shape &input2_shape, const T *input2_data,
148 const Shape &output_shape, T *output_data,
149 const std::function<T(const T &, const T &)> &fn)
150{
153 NdArrayDescsForElementwiseBroadcast(input1_shape, input2_shape, &desc1, &desc2);
154 const Shape extended_output_shape = Shape::ExtendedShape(kMaxBroadcastDim, output_shape);
155
156 // Comment from tensorflow lite:
157 //
158 // In Tensorflow, the dimensions are canonically named (batch_number, row,
159 // col, channel), with extents (batches, height, width, depth), with the
160 // trailing dimension changing most rapidly (channels has the smallest stride,
161 // typically 1 element).
162 //
163 // In generated C code, we store arrays with the dimensions reversed. The
164 // first dimension has smallest stride.
165 //
166 // We name our variables by their Tensorflow convention, but generate C code
167 // nesting loops such that the innermost loop has the smallest stride for the
168 // best cache behavior.
169 for (int d0 = 0; d0 < extended_output_shape.Dims(0); ++d0)
170 {
171 for (int d1 = 0; d1 < extended_output_shape.Dims(1); ++d1)
172 {
173 for (int d2 = 0; d2 < extended_output_shape.Dims(2); ++d2)
174 {
175 for (int d3 = 0; d3 < extended_output_shape.Dims(3); ++d3)
176 {
177 for (int d4 = 0; d4 < extended_output_shape.Dims(4); ++d4)
178 {
179 for (int d5 = 0; d5 < extended_output_shape.Dims(5); ++d5)
180 {
181 output_data[Offset(extended_output_shape, d0, d1, d2, d3, d4, d5)] =
182 ActivationFunctionWithMinMax<T>(
183 fn(input1_data[SubscriptToIndex(desc1, d0, d1, d2, d3, d4, d5)],
184 input2_data[SubscriptToIndex(desc2, d0, d1, d2, d3, d4, d5)]),
186 }
187 }
188 }
189 }
190 }
191 }
192}
193
194template <>
196 const BinaryArithmeticOpParam &params, const Shape &input1_shape, const float *input1_data,
197 const Shape &input2_shape, const float *input2_data, const Shape &output_shape,
198 float *output_data, const std::function<float(const float &, const float &)> &fn)
199{
202 NdArrayDescsForElementwiseBroadcast(input1_shape, input2_shape, &desc1, &desc2);
203 const Shape extended_output_shape = Shape::ExtendedShape(kMaxBroadcastDim, output_shape);
204
205 for (int d0 = 0; d0 < extended_output_shape.Dims(0); ++d0)
206 {
207 for (int d1 = 0; d1 < extended_output_shape.Dims(1); ++d1)
208 {
209 for (int d2 = 0; d2 < extended_output_shape.Dims(2); ++d2)
210 {
211 for (int d3 = 0; d3 < extended_output_shape.Dims(3); ++d3)
212 {
213 for (int d4 = 0; d4 < extended_output_shape.Dims(4); ++d4)
214 {
215 for (int d5 = 0; d5 < extended_output_shape.Dims(5); ++d5)
216 {
217 output_data[Offset(extended_output_shape, d0, d1, d2, d3, d4, d5)] =
219 fn(input1_data[SubscriptToIndex(desc1, d0, d1, d2, d3, d4, d5)],
220 input2_data[SubscriptToIndex(desc2, d0, d1, d2, d3, d4, d5)]),
222 }
223 }
224 }
225 }
226 }
227 }
228}
229
230template <>
232 const BinaryArithmeticOpParam &, const Shape &input1_shape, const bool *input1_data,
233 const Shape &input2_shape, const bool *input2_data, const Shape &output_shape, bool *output_data,
234 const std::function<bool(const bool &, const bool &)> &fn)
235{
238 NdArrayDescsForElementwiseBroadcast(input1_shape, input2_shape, &desc1, &desc2);
239 const Shape extended_output_shape = Shape::ExtendedShape(kMaxBroadcastDim, output_shape);
240
241 for (int d0 = 0; d0 < extended_output_shape.Dims(0); ++d0)
242 {
243 for (int d1 = 0; d1 < extended_output_shape.Dims(1); ++d1)
244 {
245 for (int d2 = 0; d2 < extended_output_shape.Dims(2); ++d2)
246 {
247 for (int d3 = 0; d3 < extended_output_shape.Dims(3); ++d3)
248 {
249 for (int d4 = 0; d4 < extended_output_shape.Dims(4); ++d4)
250 {
251 for (int d5 = 0; d5 < extended_output_shape.Dims(5); ++d5)
252 {
253 output_data[Offset(extended_output_shape, d0, d1, d2, d3, d4, d5)] =
254 fn(input1_data[SubscriptToIndex(desc1, d0, d1, d2, d3, d4, d5)],
255 input2_data[SubscriptToIndex(desc2, d0, d1, d2, d3, d4, d5)]);
256 }
257 }
258 }
259 }
260 }
261 }
262}
263
264template <>
266 const BinaryArithmeticOpParam &params, const Shape &input1_shape, const int64_t *input1_data,
267 const Shape &input2_shape, const int64_t *input2_data, const Shape &output_shape,
268 int64_t *output_data, const std::function<int64_t(const int64_t &, const int64_t &)> &fn)
269{
272 NdArrayDescsForElementwiseBroadcast(input1_shape, input2_shape, &desc1, &desc2);
273 const Shape extended_output_shape = Shape::ExtendedShape(kMaxBroadcastDim, output_shape);
274
275 for (int d0 = 0; d0 < extended_output_shape.Dims(0); ++d0)
276 {
277 for (int d1 = 0; d1 < extended_output_shape.Dims(1); ++d1)
278 {
279 for (int d2 = 0; d2 < extended_output_shape.Dims(2); ++d2)
280 {
281 for (int d3 = 0; d3 < extended_output_shape.Dims(3); ++d3)
282 {
283 for (int d4 = 0; d4 < extended_output_shape.Dims(4); ++d4)
284 {
285 for (int d5 = 0; d5 < extended_output_shape.Dims(5); ++d5)
286 {
287 output_data[Offset(extended_output_shape, d0, d1, d2, d3, d4, d5)] =
289 fn(input1_data[SubscriptToIndex(desc1, d0, d1, d2, d3, d4, d5)],
290 input2_data[SubscriptToIndex(desc2, d0, d1, d2, d3, d4, d5)]),
292 }
293 }
294 }
295 }
296 }
297 }
298}
299
300} // namespace reference
301} // namespace cker
302} // namespace nnfw
303
304#endif // __NNFW_CKER_REFERENCE_BINARYARITHMETICOPS_H__
int32_t Dims(int i) const
Definition Shape.h:106
NdArrayDesc< 4 > desc1
const luci_interpreter::RuntimeShape output_shape
NdArrayDesc< 4 > desc2
std::enable_if_t< is_quant8< T >::value > BroadcastBinaryArithmeticOpSlow(const BinaryArithmeticOpParam &params, const Shape &input1_shape, const T *input1_data, const Shape &input2_shape, const T *input2_data, const Shape &output_shape, T *output_data, const std::function< T(const BinaryArithmeticOpParam &params, const T &, const T &)> &fn)
void BinaryArithmeticOp(const BinaryArithmeticOpParam &params, const Shape &input1_shape, const T *input1_data, const Shape &input2_shape, const T *input2_data, const Shape &output_shape, T *output_data, const std::function< T(const T &, const T &)> &fn)
int Offset(const Shape &shape, int i0, int i1, int i2, int i3)
Definition Shape.h:325
void NdArrayDescsForElementwiseBroadcast(const Shape &input0_shape, const Shape &input1_shape, NdArrayDesc< N > *desc0_out, NdArrayDesc< N > *desc1_out)
Definition Utils.h:314
T ActivationFunctionWithMinMax(T x, T output_activation_min, T output_activation_max)
Definition Utils.h:43
int MatchingElementsSize(const Shape &shape, const Shape &check_shape_0, const Shape &check_shape_1)
Definition Shape.h:448
int SubscriptToIndex(const NdArrayDesc< 4 > &desc, int i0, int i1, int i2, int i3)
Definition Utils.h:255
Definition topk_v2.h:30
int32_t size[5]
Definition Slice.cpp:35