ONE - On-device Neural Engine
Loading...
Searching...
No Matches
BatchToSpaceND.h
Go to the documentation of this file.
1/*
2 * Copyright (c) 2020 Samsung Electronics Co., Ltd. All Rights Reserved
3 * Copyright 2017 The TensorFlow Authors. All Rights Reserved.
4 *
5 * Licensed under the Apache License, Version 2.0 (the "License");
6 * you may not use this file except in compliance with the License.
7 * You may obtain a copy of the License at
8 *
9 * http://www.apache.org/licenses/LICENSE-2.0
10 *
11 * Unless required by applicable law or agreed to in writing, software
12 * distributed under the License is distributed on an "AS IS" BASIS,
13 * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
14 * See the License for the specific language governing permissions and
15 * limitations under the License.
16 */
17
18#ifndef __NNFW_CKER_BATCH_TO_SPACE_ND_H__
19#define __NNFW_CKER_BATCH_TO_SPACE_ND_H__
20
#include "cker/Shape.h"

#include <algorithm> // std::max, std::min
#include <cassert>   // assert
#include <cstdint>   // int32_t
#include <cstring>   // memcpy
22
23#define UNUSED(x) ((void)(x))
24
25namespace nnfw
26{
27namespace cker
28{
29
// Helper for BatchToSpaceND.
//
// Computes the [start, end) range of input indices, in the current spatial
// dimension, that land on valid output positions. `spatial_index_dim` is the
// post-crop offset for this dimension (the spatial offset introduced by
// folding batch into this dimension, minus the leading crop).
// `block_shape_dim` is the block size in this dimension; `input_dim` and
// `output_dim` are the input/output extents of the op in this dimension.
// The start index is inclusive, the end index exclusive.
inline void GetIndexRange(int spatial_index_dim, int block_shape_dim, int input_dim, int output_dim,
                          int *start_index, int *end_index)
{
  // Rounds the quotient up via the classic (n + d - 1) / d form; this is the
  // exact expression the bounds below need, including its truncation behavior
  // for negative numerators.
  const auto ceil_div = [block_shape_dim](int numerator) {
    return (numerator + block_shape_dim - 1) / block_shape_dim;
  };
  // Smallest input index whose output position (index * block + offset) >= 0.
  *start_index = std::max(0, ceil_div(-spatial_index_dim));
  // One past the largest input index whose output position < output_dim
  // (end index is exclusive), clamped to the input extent.
  *end_index = std::min(input_dim, ceil_div(output_dim - spatial_index_dim));
}
48
49template <typename T>
50inline void BatchToSpaceND(const Shape &unextended_input1_shape, const T *input1_data,
51 const int32_t *block_shape_data, const int32_t *crops_data,
52 const Shape &unextended_output_shape, T *output_data)
53{
54 auto input_dim = unextended_input1_shape.DimensionsCount();
55 auto output_dim = unextended_output_shape.DimensionsCount();
56
57 assert(input_dim == 3 || input_dim == 4);
58 assert(input_dim == output_dim);
59
60 UNUSED(input_dim);
61 UNUSED(output_dim);
62
63 // Extends the input/output shape from 3D to 4D if needed, NHC -> NH1C.
64 auto extend_shape = [](const Shape &shape) {
65 if (shape.DimensionsCount() == 4)
66 {
67 return shape;
68 }
69 Shape new_shape(4, 1);
70 new_shape.SetDim(0, shape.Dims(0));
71 new_shape.SetDim(1, shape.Dims(1));
72 new_shape.SetDim(3, shape.Dims(2));
73 return new_shape;
74 };
75 const Shape input1_shape = extend_shape(unextended_input1_shape);
76 const Shape output_shape = extend_shape(unextended_output_shape);
77
78 const int32_t output_width = output_shape.Dims(2);
79 const int32_t output_height = output_shape.Dims(1);
80 const int32_t output_batch_size = output_shape.Dims(0);
81
82 const int32_t depth = input1_shape.Dims(3);
83 const int32_t input_width = input1_shape.Dims(2);
84 const int32_t input_height = input1_shape.Dims(1);
85 const int32_t input_batch_size = input1_shape.Dims(0);
86
87 const int32_t block_shape_height = block_shape_data[0];
88 const int32_t block_shape_width = block_shape_data[1];
89
90 const int32_t crops_top = crops_data[0];
91 const int32_t crops_left = crops_data[2];
92
93 for (int in_batch = 0; in_batch < input_batch_size; ++in_batch)
94 {
95 const int out_batch = in_batch % output_batch_size;
96 const int spatial_offset = in_batch / output_batch_size;
97
98 int in_h_start = 0;
99 int in_h_end = 0;
100 // GetIndexRange ensures start and end indices are in [0, output_height).
101 GetIndexRange(spatial_offset / block_shape_width - crops_top, block_shape_height, input_height,
102 output_height, &in_h_start, &in_h_end);
103
104 for (int in_h = in_h_start; in_h < in_h_end; ++in_h)
105 {
106 const int out_h = in_h * block_shape_height + spatial_offset / block_shape_width - crops_top;
107 assert(out_h >= 0);
108 assert(out_h < output_height);
109
110 int in_w_start = 0;
111 int in_w_end = 0;
112 // GetIndexRange ensures start and end indices are in [0, output_width).
113 GetIndexRange(spatial_offset % block_shape_width - crops_left, block_shape_width, input_width,
114 output_width, &in_w_start, &in_w_end);
115
116 for (int in_w = in_w_start; in_w < in_w_end; ++in_w)
117 {
118 const int out_w =
119 in_w * block_shape_width + spatial_offset % block_shape_width - crops_left;
120 assert(out_w >= 0);
121 assert(out_w < output_width);
122 T *out = output_data + Offset(output_shape, out_batch, out_h, out_w, 0);
123 const T *in = input1_data + Offset(input1_shape, in_batch, in_h, in_w, 0);
124 memcpy(out, in, depth * sizeof(T));
125 }
126 }
127 }
128}
129
130} // namespace cker
131} // namespace nnfw
132
133#endif // __NNFW_CKER_BATCH_TO_SPACE_ND_H__
int32_t DimensionsCount() const
Definition Shape.h:91
int32_t Dims(int i) const
Definition Shape.h:92
void SetDim(int i, int32_t val)
Definition Shape.h:98
#define UNUSED(x)
const luci_interpreter::RuntimeShape output_shape
void GetIndexRange(int spatial_index_dim, int block_shape_dim, int input_dim, int output_dim, int *start_index, int *end_index)
int Offset(const Shape &shape, int i0, int i1, int i2, int i3)
Definition Shape.h:237
void BatchToSpaceND(const Shape &unextended_input1_shape, const T *input1_data, const int32_t *block_shape_data, const int32_t *crops_data, const Shape &unextended_output_shape, T *output_data)
Definition BatchToSpaceND.h:50