17#include "kernels/InstanceNorm.h"
19#include "kernels/Utils.h"
21#include <tensorflow/lite/kernels/internal/common.h>
39 if (
input()->shape().num_dims() == 4)
44 gamma()->shape().dim(0) == 1);
48 beta()->shape().dim(0) == 1);
50 else if (
input()->shape().num_dims() == 3)
57 gamma()->shape().dim(0) == 1);
61 beta()->shape().dim(0) == 1);
71 switch (
input()->element_type())
73 case DataType::FLOAT32:
77 throw std::runtime_error(
"luci-intp InstanceNorm Unsupported type.");
81void InstanceNorm::evalFloat()
const
83 float activation_min, activation_max;
88 const float *input_data = getTensorData<float>(
input());
89 const float *gamma_data = getTensorData<float>(
gamma());
91 bool single_gamma = gamma_shape.DimensionsCount() == 1 && gamma_shape.Dims(0) == 1;
92 const float *beta_data = getTensorData<float>(
beta());
94 bool single_beta = beta_shape.DimensionsCount() == 1 && beta_shape.Dims(0) == 1;
95 float *output_data = getTensorData<float>(
output());
97 if (input_shape.DimensionsCount() == 4)
100 const int32_t batches = tflite::MatchingDim(input_shape, 0,
output_shape, 0);
101 const int32_t heights = tflite::MatchingDim(input_shape, 1,
output_shape, 1);
102 const int32_t widths = tflite::MatchingDim(input_shape, 2,
output_shape, 2);
103 const int32_t channels = tflite::MatchingDim(input_shape, 3,
output_shape, 3);
104 for (int32_t batch = 0; batch < batches; batch++)
106 for (int32_t channel = 0; channel < channels; channel++)
109 double square_sum = 0.0f;
110 int32_t
size = heights * widths;
111 for (int32_t height = 0; height < heights; height++)
113 for (int32_t width = 0; width < widths; width++)
116 input_data[tflite::Offset(input_shape, batch, height, width, channel)];
118 square_sum += (input_val * input_val);
121 double mean = sum /
size;
122 double var = square_sum /
size - mean * mean;
124 double gamma = single_gamma ? gamma_data[0] : gamma_data[channel];
125 double beta = single_beta ? beta_data[0] : beta_data[channel];
126 double a =
gamma / (std::sqrt(var +
params().epsilon));
127 double b = -mean * a +
beta;
129 for (int32_t height = 0; height < heights; height++)
131 for (int32_t width = 0; width < widths; width++)
134 input_data[tflite::Offset(
output_shape, batch, height, width, channel)];
135 double output_value = input_value * a + b;
136 output_data[tflite::Offset(
output_shape, batch, height, width, channel)] =
137 tflite::ActivationFunctionWithMinMax((
float)output_value, activation_min,
144 else if (input_shape.DimensionsCount() == 3)
147 const int32_t batches = tflite::MatchingDim(input_shape, 0,
output_shape, 0);
148 const int32_t channels = tflite::MatchingDim(input_shape, 1,
output_shape, 1);
150 for (int32_t batch = 0; batch < batches; batch++)
152 for (int32_t channel = 0; channel < channels; channel++)
155 double square_sum = 0.0f;
157 static_cast<size_t>(batch * channels *
size) +
static_cast<size_t>(channel *
size);
158 for (int32_t i = 0; i <
size; i++)
162 square_sum += (input_val * input_val);
165 double var = square_sum /
size - mean * mean;
167 double gamma = single_gamma ? gamma_data[0] : gamma_data[channel];
168 double beta = single_beta ? beta_data[0] : beta_data[channel];
169 double a =
gamma / (std::sqrt(var +
params().epsilon));
170 double b = -mean * a +
beta;
172 for (int32_t i = 0; i <
size; i++)
175 double output_value = input_value * a +
b;
177 (
float)output_value, activation_min, activation_max);
183 throw std::runtime_error(
"luci-intp InstanceNorm unsupported rank.");
// NOTE(review): the lines below are bodiless declaration fragments and are
// extraction artifacts, not part of this .cpp file's logic. They look like
// signatures pulled from InstanceNorm.h / Utils.h (params, resize, execute,
// accessors, constructor, LUCI_INTERPRETER_CHECK, getTensorShape,
// calculateActivationRange) plus an unrelated OpenCL helper (`__global uchar *
// offset`). As written here they are not valid C++ at namespace scope in a
// source file — confirm against the original headers and drop or restore them
// before building.
const InstanceNormParams & params() const
void resize(const Shape &new_shape)
void execute() const override
const Tensor * beta() const
const Tensor * input() const
void configure() override
const Tensor * gamma() const
InstanceNorm(const Tensor *input, const Tensor *gamma, const Tensor *beta, Tensor *output, const InstanceNormParams &params)
#define LUCI_INTERPRETER_CHECK(cond)
__global uchar * offset(const Image *img, int x, int y)
const luci_interpreter::RuntimeShape output_shape
tflite::RuntimeShape getTensorShape(const Tensor *tensor)
void calculateActivationRange(Activation activation, T *activation_min, T *activation_max)