ONE/luci-interpreter_2pal_2common_2_p_a_l_tanh_8h_source.html

/*

 * Copyright (c) 2023 Samsung Electronics Co., Ltd. All Rights Reserved

 * Copyright 2020 The TensorFlow Authors. All Rights Reserved.

 *

 * Licensed under the Apache License, Version 2.0 (the "License");

 * you may not use this file except in compliance with the License.

 * You may obtain a copy of the License at

 *

 *    http://www.apache.org/licenses/LICENSE-2.0

 *

 * Unless required by applicable law or agreed to in writing, software

 * distributed under the License is distributed on an "AS IS" BASIS,

 * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.

 * See the License for the specific language governing permissions and

 * limitations under the License.

 */


#ifndef LUCI_INTERPRETER_PAL_TANH_H

#define LUCI_INTERPRETER_PAL_TANH_H


#include "PALUtils.h"


namespace luci_interpreter_pal

{


/**
 * @brief Element-wise hyperbolic tangent over a flat float buffer.
 *
 * @param flat_size   Number of elements to process; nothing is read or
 *                    written when it is zero or negative.
 * @param input_data  Source buffer, read at indices [0, flat_size).
 * @param output_data Destination buffer, written at indices [0, flat_size).
 */
inline void Tanh(const int flat_size, const float *input_data, float *output_data)
{
  const float *src = input_data;
  float *dst = output_data;

  // Walk both buffers in lock-step, one element per remaining count.
  for (int remaining = flat_size; remaining > 0; --remaining)
  {
    *dst++ = std::tanh(*src++);
  }
}

inline void Tanh(const int flat_size, const float *input_data, float *output_data) {…}


/**
 * @brief Quantized int16 tanh built on the sigmoid lookup table.
 *
 * Relies on the identity tanh(x) = 2*sigmoid(2*x) - 1, so the sigmoid LUT
 * (sigmoid_table_uint16) can be reused for tanh.
 *
 * @param input_multiplier Scale applied to every input sample. A value of 0
 *                         selects the power-of-two case, in which the
 *                         multiplier becomes 3 << input_left_shift and the
 *                         shift is cleared.
 * @param input_left_shift Amount the scaled input is shifted right by (after
 *                         adding a rounding term).
 * @param flat_size        Number of elements to process.
 * @param ptr_input_data   Source int16 buffer, read at [0, flat_size).
 * @param ptr_output_data  Destination int16 buffer, written at [0, flat_size).
 */
inline void Tanh(int32_t input_multiplier, int32_t input_left_shift, const int flat_size,
                 const int16_t *ptr_input_data, int16_t *ptr_output_data)
{
  // The input is scaled by 3/4 so that the table's [-8, 8] domain covers
  // roughly [-10.7, 10.7]. For a general (non power-of-two) scale the factor
  // 3 is already folded into input_multiplier by the TanhPrepare function.
  if (input_multiplier == 0)
  {
    // Power-of-two case: fold the shift into the multiplier.
    input_multiplier = 3 << input_left_shift;
    input_left_shift = 0;
  }

  // Half of the divisor implied by the right shift; zero when no shift is applied.
  int32_t rounding = 0;
  if (input_left_shift > 0)
  {
    rounding = 1 << (input_left_shift - 1);
  }

  for (int idx = 0; idx < flat_size; ++idx)
  {
    const int32_t scaled = (ptr_input_data[idx] * input_multiplier + rounding) >> input_left_shift;

    // The table is indexed by magnitude only; the sign is re-applied below.
    const uint32_t magnitude = abs(scaled);
    const uint32_t table_index = magnitude >> 8;

    int32_t interpolated;
    if (table_index < 255)
    {
      // Linear interpolation between neighbouring table entries, using the
      // low 8 bits of the magnitude as the fractional weight.
      const uint32_t lower = sigmoid_table_uint16[table_index];
      const uint32_t upper = sigmoid_table_uint16[table_index + 1];
      const uint8_t fraction = magnitude & 0xFF;

      interpolated = (lower << 8) + fraction * (upper - lower);
    }
    else
    {
      // Beyond the last usable table slot: saturate to maximum.
      interpolated = 0xFFFF << 8;
    }

    // Re-centre around zero and add the rounding offset; negative inputs use
    // the mirrored expression.
    int32_t centered;
    if (scaled >= 0)
    {
      centered = interpolated - (1 << (14 + 9)) + (1 << (9 - 2));
    }
    else
    {
      centered = -interpolated + (1 << (14 + 9)) + (1 << (9 - 2)) - 1;
    }

    // Convert back to 16-bit.
    ptr_output_data[idx] = centered >> (9 - 1);
  }
}

inline void Tanh(int32_t input_multiplier, int32_t input_left_shift, const int flat_size, {…}


#if 0

// Quantized int8 tanh. This overload sits inside an `#if 0` region of this
// file, so it is currently not compiled.
//
// Parameters:
//   input_zero_point   - subtracted from every input sample before processing.
//   input_range_radius - samples whose zero-point-adjusted value is at or
//                        beyond +/- this radius are written as int8 max / min.
//   input_multiplier,
//   input_shift        - forwarded to multiplyByQuantizedMultiplier() to
//                        rescale the zero-point-adjusted input.
//   flat_size          - number of elements processed.
//   input_data         - source buffer, read at [0, flat_size).
//   output_data        - destination buffer, written at [0, flat_size).
inline void Tanh(int32_t input_zero_point, int32_t input_range_radius,

                 int32_t input_multiplier, int32_t input_shift,

                 const int flat_size, const int8_t* input_data, int8_t* output_data) {

  // Integer bits must be in sync with Prepare() function.
  // NOTE(review): kInputIntegerBits is declared here but not referenced
  // anywhere else in this function body.

  static constexpr int32_t kInputIntegerBits = 4;

  static constexpr int32_t kOutputScale = 7;

  static constexpr int32_t kMinInt8 = std::numeric_limits<int8_t>::min();

  static constexpr int32_t kMaxInt8 = std::numeric_limits<int8_t>::max();


  for (int i = 0; i < flat_size; ++i) {

    // Remove the zero point so the value is centred on zero.
    const int32_t input =

      static_cast<int32_t>(input_data[i]) - input_zero_point;

    // Inputs outside the open interval (-radius, radius) saturate directly.
    if (input <= -input_range_radius) {

      output_data[i] = kMinInt8;

    } else if (input >= input_range_radius) {

      output_data[i] = kMaxInt8;

    } else {

      const int32_t input_in_q4 =

        multiplyByQuantizedMultiplier(input, input_multiplier, input_shift);

      // NOTE(review): std::tanh is applied to the raw int32_t value and the
      // floating-point result is converted straight back to int32_t, so
      // output_in_q0 can only be -1, 0 or 1. The variable names suggest a
      // fixed-point tanh was intended here - presumably the reason this
      // overload is disabled; confirm before enabling it.
      const int32_t output_in_q0 = std::tanh(input_in_q4);


      // Rescale by 2^(31 - kOutputScale) and clamp into the int8 range
      // before narrowing.
      int32_t output_in_q24 =

        roundingDivideByPOT(output_in_q0, 31 - kOutputScale);

      output_in_q24 = std::min(std::max(output_in_q24, kMinInt8), kMaxInt8);

      output_data[i] = static_cast<int8_t>(output_in_q24);

    }

  }

}

#endif // 0


} // namespace luci_interpreter_pal


#endif // LUCI_INTERPRETER_PAL_TANH_H

luci_interpreter_pal
Definition PALArgMax.h:23

luci_interpreter_pal::Tanh
void Tanh(const int flat_size, const float *input_data, float *output_data)
Definition PALTanh.h:26

luci_interpreter_pal::roundingDivideByPOT
int32_t roundingDivideByPOT(int32_t x, int32_t exponent)
Definition PALUtils.h:65

luci_interpreter_pal::multiplyByQuantizedMultiplier
int32_t multiplyByQuantizedMultiplier(int32_t x, int32_t quantized_multiplier, int shift)
Definition PALUtils.h:77

part_eval_one.output_data
output_data
Definition part_eval_one.py:112

PALUtils.h