ONE/compute_2cker_2include_2cker_2operation_2_resize_bilinear_8h_source.html

/*

 * Copyright (c) 2020 Samsung Electronics Co., Ltd. All Rights Reserved

 * Copyright 2017 The TensorFlow Authors. All Rights Reserved.

 *

 * Licensed under the Apache License, Version 2.0 (the "License");

 * you may not use this file except in compliance with the License.

 * You may obtain a copy of the License at

 *

 *      http://www.apache.org/licenses/LICENSE-2.0

 *

 * Unless required by applicable law or agreed to in writing, software

 * distributed under the License is distributed on an "AS IS" BASIS,

 * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.

 * See the License for the specific language governing permissions and

 * limitations under the License.

 */


#ifndef __NNFW_CKER_RESIZEBILINEAR_H__

#define __NNFW_CKER_RESIZEBILINEAR_H__


#include "cker/Shape.h"
#include "cker/Types.h"

#include <algorithm>
#include <cassert>
#include <cmath>
#include <cstdint>
#include <cstring>


namespace nnfw

{

namespace cker

{


/**
 * @brief Writes the 2x2 output patch anchored at output pixel (x, y) for every channel.
 *
 * The four input samples are read at (x0, y0), (x1, y0), (x0, y1) and (x1, y1). The patch
 * receives the top-left sample unchanged, the horizontal and vertical two-sample averages,
 * and the average of the left and right vertical averages in the bottom-right slot.
 *
 * Neighbouring elements are reached by adding `depth` (one pixel to the right) or
 * `depth * width` (one row down) to the offset returned by Offset().
 *
 * @param x0,y0        input coordinates of the top-left sample
 * @param x1,y1        input coordinates of the right / lower neighbour
 * @param x,y          output coordinates of the top-left corner of the patch
 * @param depth        number of channels processed
 * @param batch        batch index passed to Offset()
 * @param input_shape  shape used to index @p input_data
 * @param input_data   source buffer
 * @param output_shape shape used to index @p output_data
 * @param output_data  destination buffer
 */
inline void ResizeBilinearKernel2x2(int32_t x0, int32_t x1, int32_t y0, int32_t y1, int32_t x,
                                    int32_t y, int32_t depth, int32_t batch,
                                    const Shape &input_shape, const float *input_data,
                                    const Shape &output_shape, float *output_data)
{
  const int32_t in_width = input_shape.Dims(2);
  const int32_t out_width = output_shape.Dims(2);

  // Element distances from the top-left sample to its right / lower neighbour.
  const int32_t in_step_right = (x1 - x0) * depth;
  const int32_t in_step_down = (y1 - y0) * depth * in_width;
  const int32_t out_step_right = depth;
  const int32_t out_step_down = depth * out_width;

  for (int c = 0; c < depth; ++c)
  {
    const float *src = input_data + Offset(input_shape, batch, y0, x0, c);
    const float top_left = src[0];
    const float top_right = src[in_step_right];
    const float bottom_left = src[in_step_down];
    const float bottom_right = src[in_step_right + in_step_down];

    float *dst = output_data + Offset(output_shape, batch, y, x, c);

    // Top left corner: the input sample itself.
    dst[0] = top_left;

    // Top right corner: midpoint of the two upper samples.
    dst[out_step_right] = (top_left + top_right) / 2;

    // Bottom left corner: midpoint of the two left samples.
    const float left_mid = (top_left + bottom_left) / 2;
    dst[out_step_down] = left_mid;

    // Bottom right corner: midpoint of the left and right column midpoints.
    dst[out_step_right + out_step_down] = (left_mid + ((top_right + bottom_right) / 2)) / 2;
  }
}


/**
 * @brief Upsamples a float tensor by walking the output in 2x2 patches.
 *
 * Each input pixel (x0, y0) produces the output patch whose top-left corner is
 * (2 * x0, 2 * y0). The right / lower neighbours are clamped to the last input
 * column / row, so patches on the border reuse the edge sample.
 *
 * @param batches       number of batch entries to process
 * @param input_height  input row count, used to clamp the lower neighbour
 * @param input_width   input column count, used to clamp the right neighbour
 * @param depth         number of channels
 * @param output_height output row count
 * @param output_width  output column count
 * @param input_shape   shape used to index @p input_data
 * @param input_data    source buffer
 * @param output_shape  shape used to index @p output_data
 * @param output_data   destination buffer
 */
inline void ResizeBilinear2x2(int32_t batches, int32_t input_height, int32_t input_width,
                              int32_t depth, int32_t output_height, int32_t output_width,
                              const Shape &input_shape, const float *input_data,
                              const Shape &output_shape, float *output_data)
{
  for (int batch = 0; batch < batches; ++batch)
  {
    int in_y = 0;
    for (int out_y = 0; out_y + 2 <= output_height; out_y += 2)
    {
      // The lower neighbour only depends on the current input row.
      const int32_t in_y_next = std::min(in_y + 1, input_height - 1);

      int in_x = 0;
      for (int out_x = 0; out_x + 2 <= output_width; out_x += 2)
      {
        const int32_t in_x_next = std::min(in_x + 1, input_width - 1);
        ResizeBilinearKernel2x2(in_x, in_x_next, in_y, in_y_next, out_x, out_y, depth, batch,
                                input_shape, input_data, output_shape, output_data);
        ++in_x;
      }
      ++in_y;
    }
  }
}


/**
 * @brief Accumulates a scaled copy of one pixel's channels into the output.
 *
 * For each of the first @p depth elements: output_ptr[i] += input_ptr[i] * scale.
 * The output is added to, not overwritten, so the caller must initialise it.
 *
 * @param input_ptr  first channel of the source pixel
 * @param depth      number of channels to accumulate
 * @param scale      weight applied to every source channel
 * @param output_ptr first channel of the destination pixel
 */
inline void ResizeBilinearKernel(const float *input_ptr, int32_t depth, float scale,
                                 float *output_ptr)
{
  for (int32_t ch = 0; ch < depth; ++ch)
  {
    output_ptr[ch] += input_ptr[ch] * scale;
  }
}


/**
 * @brief Maps an output coordinate to an input coordinate and its two neighbouring indices.
 *
 * The source position is `value * scale`, or `(value + 0.5) * scale - 0.5` when
 * @p half_pixel_centers is set. The lower index is the floor of that position clamped
 * to be at least 0; the upper index is its ceiling clamped to at most `input_size - 1`.
 *
 * @param value              output coordinate
 * @param scale              input/output size ratio
 * @param half_pixel_centers selects the half-pixel mapping
 * @param input_size         extent of the input along this axis
 * @param[out] scaled_value  unclamped (possibly negative) source position
 * @param[out] lower_bound   clamped lower neighbour index
 * @param[out] upper_bound   clamped upper neighbour index
 */
inline void ComputeInterpolationValues(const float value, const float scale,
                                       const bool half_pixel_centers, int32_t input_size,
                                       float *scaled_value, int32_t *lower_bound,
                                       int32_t *upper_bound)
{
  *scaled_value = half_pixel_centers ? (value + 0.5f) * scale - 0.5f : value * scale;

  const float position = *scaled_value;
  const int32_t floor_index = static_cast<int32_t>(std::floor(position));
  const int32_t ceil_index = static_cast<int32_t>(std::ceil(position));

  *lower_bound = std::max(floor_index, static_cast<int32_t>(0));
  *upper_bound = std::min(ceil_index, input_size - 1);
}


/**
 * @brief General float bilinear resize: every output pixel is a weighted sum of up to
 *        four input pixels.
 *
 * The output buffer is zeroed first because ResizeBilinearKernel() accumulates into it.
 * The output is written contiguously in (batch, y, x, channel) order.
 *
 * The element count is computed in std::size_t so that the product of the four
 * dimensions is not evaluated in 32-bit signed arithmetic, and the write position is
 * tracked with a pointer instead of an int32_t offset for the same reason.
 *
 * @param batches            number of batch entries
 * @param input_height       input row count
 * @param input_width        input column count
 * @param depth              number of channels
 * @param output_height      output row count
 * @param output_width       output column count
 * @param height_scale       input/output ratio along the vertical axis
 * @param width_scale        input/output ratio along the horizontal axis
 * @param input_shape        shape used to index @p input_data
 * @param input_data         source buffer
 * @param output_data        destination buffer holding
 *                           batches * output_height * output_width * depth floats
 * @param half_pixel_centers forwarded to ComputeInterpolationValues()
 */
inline void ResizeBilinearGeneric(int32_t batches, int32_t input_height, int32_t input_width,
                                  int32_t depth, int32_t output_height, int32_t output_width,
                                  float height_scale, float width_scale, const Shape &input_shape,
                                  const float *input_data, float *output_data,
                                  const bool half_pixel_centers)
{
  // Widen before multiplying: the int32_t product may exceed INT32_MAX for large tensors.
  const std::size_t output_count = static_cast<std::size_t>(batches) *
                                   static_cast<std::size_t>(output_height) *
                                   static_cast<std::size_t>(output_width) *
                                   static_cast<std::size_t>(depth);
  std::memset(output_data, 0, output_count * sizeof(float));

  float *output_ptr = output_data;
  for (int b = 0; b < batches; ++b)
  {
    for (int y = 0; y < output_height; ++y)
    {
      float input_y;
      int32_t y0, y1;
      ComputeInterpolationValues(y, height_scale, half_pixel_centers, input_height, &input_y, &y0,
                                 &y1);
      // Vertical interpolation weight of the lower row (y1); the upper row gets 1 - dy.
      const float dy = input_y - y0;

      for (int x = 0; x < output_width; ++x)
      {
        float input_x;
        int32_t x0, x1;
        ComputeInterpolationValues(x, width_scale, half_pixel_centers, input_width, &input_x, &x0,
                                   &x1);
        // Horizontal interpolation weight of the right column (x1).
        const float dx = input_x - x0;

        // Run kernel on the 4 corners of the bilinear resize algorithm.
        // The accumulation order (y0x0, y0x1, y1x0, y1x1) is kept fixed so that the
        // floating-point result does not depend on the traversal.
        ResizeBilinearKernel(&input_data[Offset(input_shape, b, y0, x0, 0)], depth,
                             (1 - dy) * (1 - dx), output_ptr);
        ResizeBilinearKernel(&input_data[Offset(input_shape, b, y0, x1, 0)], depth,
                             (1 - dy) * dx, output_ptr);
        ResizeBilinearKernel(&input_data[Offset(input_shape, b, y1, x0, 0)], depth,
                             dy * (1 - dx), output_ptr);
        ResizeBilinearKernel(&input_data[Offset(input_shape, b, y1, x1, 0)], depth, dy * dx,
                             output_ptr);

        output_ptr += depth;
      }
    }
  }
}


/**
 * @brief Bilinear resize that computes each output element directly instead of
 *        accumulating into a zeroed buffer.
 *
 * For every output pixel the four source offsets and their weights are computed once,
 * then each channel is produced as a float weighted sum and converted to @p T with
 * static_cast. Output elements are written contiguously in (batch, y, x, channel) order.
 *
 * @tparam T element type of the input and output buffers
 * @param batches            number of batch entries
 * @param input_height       input row count
 * @param input_width        input column count
 * @param depth              number of channels
 * @param output_height      output row count
 * @param output_width       output column count
 * @param height_scale       input/output ratio along the vertical axis
 * @param width_scale        input/output ratio along the horizontal axis
 * @param input_shape        shape used to index @p input_data
 * @param input_data         source buffer
 * @param output_data        destination buffer
 * @param half_pixel_centers forwarded to ComputeInterpolationValues()
 */
template <typename T>
inline void ResizeBilinearGenericSmallChannel(int32_t batches, int32_t input_height,
                                              int32_t input_width, int32_t depth,
                                              int32_t output_height, int32_t output_width,
                                              float height_scale, float width_scale,
                                              const Shape &input_shape, const T *input_data,
                                              T *output_data, const bool half_pixel_centers)
{
  T *dst = output_data;
  for (int batch = 0; batch < batches; ++batch)
  {
    for (int out_y = 0; out_y < output_height; ++out_y)
    {
      float src_y;
      int32_t top, bottom;
      ComputeInterpolationValues(out_y, height_scale, half_pixel_centers, input_height, &src_y,
                                 &top, &bottom);
      for (int out_x = 0; out_x < output_width; ++out_x)
      {
        float src_x;
        int32_t left, right;
        ComputeInterpolationValues(out_x, width_scale, half_pixel_centers, input_width, &src_x,
                                   &left, &right);

        // Offsets of channel 0 of the four neighbouring input pixels.
        const int32_t off_tl = Offset(input_shape, batch, top, left, 0);
        const int32_t off_tr = Offset(input_shape, batch, top, right, 0);
        const int32_t off_bl = Offset(input_shape, batch, bottom, left, 0);
        const int32_t off_br = Offset(input_shape, batch, bottom, right, 0);

        // Matching bilinear weights.
        const float w_tl = (1 - (src_y - top)) * (1 - (src_x - left));
        const float w_tr = (1 - (src_y - top)) * (src_x - left);
        const float w_bl = (src_y - top) * (1 - (src_x - left));
        const float w_br = (src_y - top) * (src_x - left);

        for (int ch = 0; ch < depth; ++ch)
        {
          const T *src = input_data + ch;
          *dst = static_cast<T>(src[off_tl] * w_tl + src[off_tr] * w_tr + src[off_bl] * w_bl +
                                src[off_br] * w_br);
          ++dst;
        }
      }
    }
  }
}


/**
 * @brief Float bilinear resize entry point.
 *
 * Declared `inline` because this header defines the function body: without it, including
 * the header from more than one translation unit produces multiple definitions.
 *
 * When neither align_corners nor half_pixel_centers is set and the requested output is
 * exactly twice the input in both dimensions, the dedicated ResizeBilinear2x2() path is
 * used. Otherwise the scales are derived (using the `(in - 1) / (out - 1)` form per axis
 * when align_corners is set and that output extent is greater than 1) and
 * ResizeBilinearGeneric() is called.
 *
 * @param params       output size plus align_corners / half_pixel_centers flags
 * @param input_shape  4-D shape; dims 0 and 3 must match @p output_shape (MatchingDim)
 * @param input_data   source buffer
 * @param output_shape 4-D shape of the destination
 * @param output_data  destination buffer
 */
inline void ResizeBilinear(ResizeBilinearParams &params, const Shape &input_shape,
                           const float *input_data, const Shape &output_shape, float *output_data)
{
  int32_t batches = static_cast<int32_t>(MatchingDim(input_shape, 0, output_shape, 0));
  int32_t input_height = input_shape.Dims(1);
  int32_t input_width = input_shape.Dims(2);
  int32_t depth = static_cast<int32_t>(MatchingDim(input_shape, 3, output_shape, 3));

  // Specialize for 2x2 upsample.
  if (!params.align_corners && !params.half_pixel_centers &&
      params.output_height == 2 * input_height && params.output_width == 2 * input_width)
  {
    ResizeBilinear2x2(batches, input_height, input_width, depth, params.output_height,
                      params.output_width, input_shape, input_data, output_shape, output_data);
  }
  else
  {
    float height_scale = static_cast<float>(input_height) / params.output_height;
    float width_scale = static_cast<float>(input_width) / params.output_width;
    // With align_corners the first and last samples of input and output coincide.
    if (params.align_corners && params.output_height > 1)
    {
      height_scale = static_cast<float>(input_height - 1) / (params.output_height - 1);
    }
    if (params.align_corners && params.output_width > 1)
    {
      width_scale = static_cast<float>(input_width - 1) / (params.output_width - 1);
    }

    ResizeBilinearGeneric(batches, input_height, input_width, depth, params.output_height,
                          params.output_width, height_scale, width_scale, input_shape, input_data,
                          output_data, params.half_pixel_centers);
  }
}


/**
 * @brief uint8 bilinear resize entry point.
 *
 * Declared `inline` because this header defines the function body: without it, including
 * the header from more than one translation unit produces multiple definitions.
 *
 * Derives the per-axis scale (using the `(in - 1) / (out - 1)` form when align_corners is
 * set and that output extent is greater than 1) and forwards to
 * ResizeBilinearGenericSmallChannel<uint8_t>().
 *
 * @param params       output size plus align_corners / half_pixel_centers flags
 * @param input_shape  4-D shape; dims 0 and 3 must match @p output_shape (MatchingDim)
 * @param input_data   source buffer
 * @param output_shape 4-D shape of the destination
 * @param output_data  destination buffer
 */
inline void ResizeBilinear(ResizeBilinearParams &params, const Shape &input_shape,
                           const uint8_t *input_data, const Shape &output_shape,
                           uint8_t *output_data)
{
  int32_t batches = MatchingDim(input_shape, 0, output_shape, 0);
  int32_t input_height = input_shape.Dims(1);
  int32_t input_width = input_shape.Dims(2);
  int32_t depth = MatchingDim(input_shape, 3, output_shape, 3);

  float height_scale = (params.align_corners && params.output_height > 1)
                         ? (static_cast<float>(input_height - 1) / (params.output_height - 1))
                         : (static_cast<float>(input_height) / params.output_height);

  float width_scale = (params.align_corners && params.output_width > 1)
                        ? (static_cast<float>(input_width - 1) / (params.output_width - 1))
                        : (static_cast<float>(input_width) / params.output_width);

  ResizeBilinearGenericSmallChannel<uint8_t>(
    batches, input_height, input_width, depth, params.output_height, params.output_width,
    height_scale, width_scale, input_shape, input_data, output_data, params.half_pixel_centers);
}


/**
 * @brief Fixed-point variant: maps an output coordinate to a source position with
 *        10 fractional bits and returns its two neighbouring indices.
 *
 * The position is `value * scale_10`, or `value * scale_10 + scale_10 / 2 - 512` when
 * @p half_pixel_centers is set. The integer part is obtained by dividing by 1024
 * (truncating toward zero for negative positions); the lower index is that value clamped
 * to at least 0 and the upper index is that value plus one, clamped to at most
 * `input_size - 1`.
 *
 * @param value              output coordinate
 * @param scale_10           input/output ratio with 10 fractional bits
 * @param half_pixel_centers selects the half-pixel mapping
 * @param input_size         extent of the input along this axis
 * @param[out] scaled_value  unclamped source position with 10 fractional bits
 * @param[out] lower_bound   clamped lower neighbour index
 * @param[out] upper_bound   clamped upper neighbour index
 */
inline void ComputeInterpolationValues(const int32_t value, const int32_t scale_10,
                                       const bool half_pixel_centers, int32_t input_size,
                                       int32_t *scaled_value, int32_t *lower_bound,
                                       int32_t *upper_bound)
{
  // 1.0 and 0.5 expressed with 10 fractional bits.
  const int32_t one_q10 = 1 << 10;
  const int32_t half_q10 = 1 << 9;

  *scaled_value =
    half_pixel_centers ? value * scale_10 + scale_10 / 2 - half_q10 : value * scale_10;

  // Division (not a shift) so that negative positions truncate toward zero.
  const int32_t whole = *scaled_value / one_q10;
  *lower_bound = std::max<int32_t>(whole, 0);
  *upper_bound = std::min<int32_t>(whole + 1, input_size - 1);
}


/**
 * @brief int8 bilinear resize implemented in integer fixed-point arithmetic.
 *
 * Scales and source positions carry 10 fractional bits; the product of a vertical and a
 * horizontal weight therefore carries 20, and the weighted sum is rounded half away from
 * zero before being divided by 2^20 and stored as int8_t.
 *
 * Shapes with fewer than four dimensions are extended to four with
 * Shape::ExtendedShape().
 *
 * @param op_params               output size plus align_corners / half_pixel_centers flags
 * @param unextended_input_shape  input shape, at most 4-D
 * @param input_data              source buffer
 * @param unextended_output_shape output shape, at most 4-D
 * @param output_data             destination buffer
 */
inline void ResizeBilinear(const ResizeBilinearParams &op_params,
                           const Shape &unextended_input_shape, const int8_t *input_data,
                           const Shape &unextended_output_shape, int8_t *output_data)
{
  // If half_pixel_centers is True, align_corners must be False.
  assert(!op_params.half_pixel_centers || !op_params.align_corners);
  assert(unextended_input_shape.DimensionsCount() <= 4);
  assert(unextended_output_shape.DimensionsCount() <= 4);
  const Shape input_shape = Shape::ExtendedShape(4, unextended_input_shape);
  const Shape output_shape = Shape::ExtendedShape(4, unextended_output_shape);

  const int32_t batches = MatchingDim(input_shape, 0, output_shape, 0);
  const int32_t input_height = input_shape.Dims(1);
  const int32_t input_width = input_shape.Dims(2);
  const int32_t depth = MatchingDim(input_shape, 3, output_shape, 3);

  const int32_t output_height = op_params.output_height;
  const int32_t output_width = op_params.output_width;

  // 1.0 with 10 fractional bits.
  const int32_t one_q10 = 1 << 10;

  // Rounded input/output ratios; align_corners uses the (in - 1) / (out - 1) form
  // whenever the corresponding output extent is greater than 1.
  const int32_t height_scale_10 =
    (op_params.align_corners && output_height > 1)
      ? (one_q10 * (input_height - 1) + (output_height - 1) / 2) / (output_height - 1)
      : (one_q10 * input_height + output_height / 2) / output_height;
  const int32_t width_scale_10 =
    (op_params.align_corners && output_width > 1)
      ? (one_q10 * (input_width - 1) + (output_width - 1) / 2) / (output_width - 1)
      : (one_q10 * input_width + output_width / 2) / output_width;

  for (int b = 0; b < batches; ++b)
  {
    for (int y = 0; y < output_height; ++y)
    {
      int32_t input_y, y0, y1;
      ComputeInterpolationValues(y, height_scale_10, op_params.half_pixel_centers, input_height,
                                 &input_y, &y0, &y1);
      // Weight of row y1 and of row y0, each with 10 fractional bits.
      const int32_t w_y1 = input_y - one_q10 * y0;
      const int32_t w_y0 = one_q10 - w_y1;

      for (int x = 0; x < output_width; ++x)
      {
        int32_t input_x, x0, x1;
        ComputeInterpolationValues(x, width_scale_10, op_params.half_pixel_centers, input_width,
                                   &input_x, &x0, &x1);
        // Weight of column x1 and of column x0, each with 10 fractional bits.
        const int32_t w_x1 = input_x - one_q10 * x0;
        const int32_t w_x0 = one_q10 - w_x1;

        for (int c = 0; c < depth; ++c)
        {
          // Samples are widened to 64 bits before being multiplied by the two weights.
          const int64_t v_y0x0 = input_data[Offset(input_shape, b, y0, x0, c)];
          const int64_t v_y1x0 = input_data[Offset(input_shape, b, y1, x0, c)];
          const int64_t v_y0x1 = input_data[Offset(input_shape, b, y0, x1, c)];
          const int64_t v_y1x1 = input_data[Offset(input_shape, b, y1, x1, c)];

          const int64_t sum_q20 = v_y0x0 * w_y0 * w_x0 + v_y1x0 * w_y1 * w_x0 +
                                  v_y0x1 * w_y0 * w_x1 + v_y1x1 * w_y1 * w_x1;

          // Add +/- 0.5 (in Q20) so that the truncating division rounds to nearest.
          const int64_t rounding = (sum_q20 > 0) ? (1 << 19) : -(1 << 19);
          output_data[Offset(output_shape, b, y, x, c)] =
            static_cast<int8_t>((sum_q20 + rounding) / (1 << 20));
        }
      }
    }
  }
}


} // namespace cker

} // namespace nnfw


#endif // __NNFW_CKER_RESIZEBILINEAR_H__

nnfw::cker::Shape
Definition Shape.h:32

nnfw::cker::Shape::DimensionsCount
int32_t DimensionsCount() const
Definition Shape.h:91

nnfw::cker::Shape::Dims
int32_t Dims(int i) const
Definition Shape.h:92

Shape.h

Types.h

output_shape
const luci_interpreter::RuntimeShape output_shape
Definition PALComparisons.h:32

nnfw::cker::MatchingDim
int MatchingDim(const Shape &shape1, int index1, const Shape &shape2, int index2)
Definition Shape.h:220

nnfw::cker::ResizeBilinear2x2
void ResizeBilinear2x2(int32_t batches, int32_t input_height, int32_t input_width, int32_t depth, int32_t output_height, int32_t output_width, const Shape &input_shape, const float *input_data, const Shape &output_shape, float *output_data)
Definition ResizeBilinear.h:69

nnfw::cker::ResizeBilinearGeneric
void ResizeBilinearGeneric(int32_t batches, int32_t input_height, int32_t input_width, int32_t depth, int32_t output_height, int32_t output_width, float height_scale, float width_scale, const Shape &input_shape, const float *input_data, float *output_data, const bool half_pixel_centers)
Definition ResizeBilinear.h:118

nnfw::cker::Offset
int Offset(const Shape &shape, int i0, int i1, int i2, int i3)
Definition Shape.h:237

nnfw::cker::ResizeBilinearKernel
void ResizeBilinearKernel(const float *input_ptr, int32_t depth, float scale, float *output_ptr)
Definition ResizeBilinear.h:89

nnfw::cker::ResizeBilinearGenericSmallChannel
void ResizeBilinearGenericSmallChannel(int32_t batches, int32_t input_height, int32_t input_width, int32_t depth, int32_t output_height, int32_t output_width, float height_scale, float width_scale, const Shape &input_shape, const T *input_data, T *output_data, const bool half_pixel_centers)
Definition ResizeBilinear.h:171

nnfw::cker::ResizeBilinear
void ResizeBilinear(ResizeBilinearParams &params, const Shape &input_shape, const float *input_data, const Shape &output_shape, float *output_data)
Definition ResizeBilinear.h:213

nnfw::cker::ResizeBilinearKernel2x2
void ResizeBilinearKernel2x2(int32_t x0, int32_t x1, int32_t y0, int32_t y1, int32_t x, int32_t y, int32_t depth, int32_t batch, const Shape &input_shape, const float *input_data, const Shape &output_shape, float *output_data)
Definition ResizeBilinear.h:30

nnfw::cker::ComputeInterpolationValues
void ComputeInterpolationValues(const float value, const float scale, const bool half_pixel_centers, int32_t input_size, float *scaled_value, int32_t *lower_bound, int32_t *upper_bound)
Definition ResizeBilinear.h:100

nnfw
Definition topk_v2.h:30

nnfw::cker::ResizeBilinearParams
Definition Types.h:318

nnfw::cker::ResizeBilinearParams::align_corners
bool align_corners
Definition Types.h:321

nnfw::cker::ResizeBilinearParams::output_width
int32_t output_width
Definition Types.h:320

nnfw::cker::ResizeBilinearParams::output_height
int32_t output_height
Definition Types.h:319

nnfw::cker::ResizeBilinearParams::half_pixel_centers
bool half_pixel_centers
Definition Types.h:322