ONE/service_2src_2_nodes_2_circle_strided_slice_8cpp_source.html

/*

 * Copyright (c) 2021 Samsung Electronics Co., Ltd. All Rights Reserved

 * Copyright 2018 The TensorFlow Authors. All Rights Reserved.

 *

 * Licensed under the Apache License, Version 2.0 (the "License");

 * you may not use this file except in compliance with the License.

 * You may obtain a copy of the License at

 *

 *      http://www.apache.org/licenses/LICENSE-2.0

 *

 * Unless required by applicable law or agreed to in writing, software

 * distributed under the License is distributed on an "AS IS" BASIS,

 * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.

 * See the License for the specific language governing permissions and

 * limitations under the License.

 */

#include "luci/Service/CircleShapeInference.h"


#include "Check.h"

#include "CircleCloneNode.h"

#include "CircleShapeInferenceHelper.h"


#include <luci/IR/CircleNode.h>

#include <loco/IR/DataType.h>

#include <loco/IR/NodeShape.h>

#include <oops/InternalExn.h>


#include <algorithm>

#include <cmath>

#include <cstdint>

#include <limits>


namespace luci

{


// Creates a new CircleStridedSlice in the target graph and copies the five
// mask attributes of the source node onto it. Only the mask attributes are
// copied by this function.
luci::CircleNode *CloneNodeLet<CN::STUV>::visit(const luci::CircleStridedSlice *node)
{
  auto *copy = _graph->nodes()->create<luci::CircleStridedSlice>();

  copy->begin_mask(node->begin_mask());
  copy->end_mask(node->end_mask());
  copy->ellipsis_mask(node->ellipsis_mask());
  copy->new_axis_mask(node->new_axis_mask());
  copy->shrink_axis_mask(node->shrink_axis_mask());

  return copy;
}

luci::CircleNode *CloneNodeLet<CN::STUV>::visit(const luci::CircleStridedSlice *node) {…}


// code referenced from

// https://github.com/tensorflow/tensorflow/blob/3f878cff5b698b82eea85db2b60d65a2e320850e/

//    tensorflow/lite/kernels/strided_slice.cc

//    tensorflow/lite/kernels/internal/strided_slice_logic.h

namespace sinf

{


// Upper bound on the tensor rank handled by this op (1-5D cases). It also

// sizes the fixed-length start/stop/stride arrays in StridedSliceParams.

// NOTE(review): the comment inherited from the TensorFlow Lite kernel also said

// that 1-3D tensors are mapped onto a reference 4D implementation; no such

// mapping is visible in this file - confirm whether that remark still applies.

const int kMaxDim = 5;


// Shorthand for the signed 32-bit element type; used to check and read the

// begin/end/strides operands.

const loco::DataType S32 = loco::DataType::S32;


// Per-axis slice description: start/stop/stride values for up to kMaxDim axes
// together with the bit masks that modify them. Everything defaults to zero.
struct StridedSliceParams
{
  // Number of valid entries, followed by the entries themselves.
  int8_t start_indices_count{0};
  int32_t start_indices[kMaxDim]{};
  int8_t stop_indices_count{0};
  int32_t stop_indices[kMaxDim]{};
  int8_t strides_count{0};
  int32_t strides[kMaxDim]{};

  // One bit per axis (bit i corresponds to axis i).
  int16_t begin_mask{0};
  int16_t ellipsis_mask{0};
  int16_t end_mask{0};
  int16_t new_axis_mask{0};
  int16_t shrink_axis_mask{0};
};

struct StridedSliceParams {…};


// Gathers what shape inference needs from a CircleStridedSlice node: its mask
// attributes, its operand nodes and the rank of its input.
struct StridedSliceContext
{
  // Reads the masks and operands of `node`. begin/end/strides are cast to
  // CircleConst with loco::must_cast, so the caller has to make sure they
  // really are constants before constructing the context.
  StridedSliceContext(const luci::CircleStridedSlice *node)
  {
    // The node exposes its masks as int32_t while StridedSliceParams stores
    // int16_t; check that the narrowing below does not lose any bit.
    assert(static_cast<int16_t>(node->begin_mask()) == node->begin_mask());
    assert(static_cast<int16_t>(node->ellipsis_mask()) == node->ellipsis_mask());
    assert(static_cast<int16_t>(node->end_mask()) == node->end_mask());
    assert(static_cast<int16_t>(node->new_axis_mask()) == node->new_axis_mask());
    assert(static_cast<int16_t>(node->shrink_axis_mask()) == node->shrink_axis_mask());

    // Mask attributes, as given on the node.
    params.begin_mask = node->begin_mask();
    params.ellipsis_mask = node->ellipsis_mask();
    params.end_mask = node->end_mask();
    params.new_axis_mask = node->new_axis_mask();
    params.shrink_axis_mask = node->shrink_axis_mask();

    // Operand nodes.
    input = loco::must_cast<luci::CircleNode *>(node->input());
    begin = loco::must_cast<luci::CircleConst *>(node->begin());
    end = loco::must_cast<luci::CircleConst *>(node->end());
    strides = loco::must_cast<luci::CircleConst *>(node->strides());

    // Rank of the input tensor, before any new axis is added.
    input_dims = static_cast<int64_t>(circle_shape(input).rank());
  }

  StridedSliceParams params;
  luci::CircleNode *input = nullptr;
  luci::CircleConst *begin = nullptr;
  luci::CircleConst *end = nullptr;
  luci::CircleConst *strides = nullptr;

  // Equivalent input shape after adding axis according to new_axis_mask.
  loco::TensorShape effective_input_shape;
  int64_t input_dims = 0;
};

struct StridedSliceContext {…};


// Stand-in for std::clamp(), to be used until C++17 is available.
//
// Returns `v` limited to the closed range [lo, hi]:
//   - `hi` when v is above hi,
//   - `lo` when v is below lo,
//   - `v` otherwise.
// The range must be well-formed (lo <= hi); this is checked with LUCI_ASSERT.
//
// The arguments and the result are 64-bit on purpose: the callers in this
// file pass int64_t indices and axis sizes, and a 32-bit signature would
// silently narrow them (an axis size above INT32_MAX would wrap negative).
inline int64_t Clamp(const int64_t v, const int64_t lo, const int64_t hi)
{
  LUCI_ASSERT(!(hi < lo), "Clamp hi < lo");
  if (hi < v)
    return hi;
  if (v < lo)
    return lo;
  return v;
}

inline int Clamp(const int32_t v, const int32_t lo, const int32_t hi) {…}


// Computes the index of the first element to take along `axis`.
//
// The start index stored in `params` is used unless the begin_mask bit of the
// axis is set, in which case the most extreme value in the direction opposite
// to the stride is taken and left to the clamping step. Negative values are
// shifted by the axis size once, and the result is clamped to [0, axis_size]
// for a positive stride or to [-1, axis_size - 1] otherwise. An axis of size
// zero always yields 0.
inline int64_t StartForAxis(const StridedSliceParams &params, const loco::TensorShape &input_shape,
                            int64_t axis)
{
  const int64_t extent = static_cast<int64_t>(input_shape.dim(axis).value());
  if (extent == 0)
    return 0;

  const bool forward = params.strides[axis] > 0;
  const bool begin_masked = (params.begin_mask & (1LL << axis)) != 0;

  int64_t first = params.start_indices[axis];
  if (begin_masked)
  {
    // Forward iteration starts from the first element, backward iteration
    // from the last one. lowest()/max() mirror what StopForAxis() does and
    // are brought into range by the clamping below.
    first = forward ? std::numeric_limits<int32_t>::lowest() : std::numeric_limits<int32_t>::max();
  }

  // Negative indices count from the end of the axis.
  if (first < 0)
    first += extent;

  if (forward)
    return Clamp(first, 0, extent);
  return Clamp(first, -1, extent - 1);
}

inline int64_t StartForAxis(const StridedSliceParams &params, const loco::TensorShape &input_shape, {…}


// Computes the end of iteration along `axis` in the usual C sense, i.e. one
// step past the last element taken: iterating over a whole 1D array of size 4
// with a positive stride gives 4, one past the valid indices 0, 1, 2 and 3.
//
// `start_for_axis` is the value StartForAxis() produced for the same axis; it
// is only used when the shrink_axis_mask bit of the axis is set. An axis of
// size zero always yields 0.
inline int64_t StopForAxis(const StridedSliceParams &params, const loco::TensorShape &input_shape,
                           int64_t axis, int64_t start_for_axis)
{
  const int64_t extent = static_cast<int64_t>(input_shape.dim(axis).value());
  if (extent == 0)
    return 0;

  // A shrunk axis keeps exactly one element, so the requested end is ignored
  // (it can be wrong when negative indexing is used, see Issue #19260).
  // start_for_axis has already been adjusted for negative indices.
  if (params.shrink_axis_mask & (1LL << axis))
    return start_for_axis + 1;

  const bool forward = params.strides[axis] > 0;

  int64_t last = params.stop_indices[axis];
  if (params.end_mask & (1LL << axis))
  {
    // end_mask override: run to the last element when iterating forward and
    // to the first one when iterating backward. Clamped below.
    last = forward ? std::numeric_limits<int32_t>::max() : std::numeric_limits<int32_t>::lowest();
  }

  // Negative indices count from the end of the axis.
  if (last < 0)
    last += extent;

  // The end points one past the last element, hence the clamping range
  // depends on the direction of iteration.
  if (forward)
    return Clamp(last, 0, extent);
  return Clamp(last, -1, extent - 1);
}

inline int64_t StopForAxis(const StridedSliceParams &params, const loco::TensorShape &input_shape, {…}


// Expands the ellipsis_mask and new_axis_mask of a StridedSlice into explicit
// per-axis begin/end/stride values and begin/end/shrink masks.
//
// Input:
//   op_context - masks, operands (begin/end/strides constants) and input rank
//                of the node being processed.
// Output:
//   - the returned StridedSliceParams, holding one start/stop/stride entry per
//     effective axis; its ellipsis_mask and new_axis_mask are left at zero
//     because they have been folded into the other fields;
//   - op_context->effective_input_shape, set to the input shape with a
//     dimension of 1 inserted for every axis added through new_axis_mask.
//
// The effective rank (input rank + added axes) must not exceed kMaxDim, which
// is the capacity of the arrays in StridedSliceParams; this is checked with
// LUCI_ASSERT before anything is written to them.
StridedSliceParams BuildStridedSliceParams(StridedSliceContext *op_context)
{
  StridedSliceParams op_params;

  // The ellipsis_mask and new_axis_mask in op_params are not used. Those masks
  // are processed here to update begin_mask, end_mask and the index range.
  op_params.begin_mask = 0;
  op_params.ellipsis_mask = 0;
  op_params.end_mask = 0;
  op_params.new_axis_mask = 0;
  op_params.shrink_axis_mask = 0;

  // Count indexes where the new_axis_mask is set but the ellipsis_mask is not.
  loco::TensorShape begin_shape = circle_shape(op_context->begin);
  const int64_t begin_count = static_cast<int64_t>(begin_shape.dim(0).value());
  int64_t num_add_axis = 0;
  for (int64_t i = 0; i < begin_count; ++i)
  {
    if (!((1LL << i) & op_context->params.ellipsis_mask) &&
        ((1LL << i) & op_context->params.new_axis_mask))
    {
      num_add_axis++;
    }
  }

  // Calculate the dims of input after adding new axises.
  const int64_t effective_dims = op_context->input_dims + num_add_axis;

  // start_indices/stop_indices/strides only have room for kMaxDim entries and
  // the loops below index them (and the 16-bit masks) with every value in
  // [0, effective_dims). Refuse larger ranks instead of writing out of bounds.
  LUCI_ASSERT(effective_dims <= kMaxDim, "StridedSlice effective rank exceeds kMaxDim");

  // If begin, end and strides are not fully provided, it means Ellipsis should
  // be expanded to multiple dimensions (Ex: for spec [Ellipsis, 2] on a 3D
  // input, the Ellipsis should be applied for the first 2 dimensions). Besides,
  // If the new_axis_mask and the ellipsis_mask are set at the same index, the
  // new_axis_mask will have no effect.
  int64_t effective_ellipsis_mask = 0, effective_new_axis_mask = 0;
  int64_t ellipsis_start_idx = effective_dims, expanded_ellipsis = 0;
  for (int64_t i = 0; i < effective_dims;)
  {
    if ((1LL << i) & op_context->params.ellipsis_mask)
    {
      ellipsis_start_idx = i;
      int64_t ellipsis_end_idx =
        std::max(i + 1, std::min(i + 1 + num_add_axis + op_context->input_dims - begin_count,
                                 effective_dims));
      expanded_ellipsis = ellipsis_end_idx - ellipsis_start_idx - 1;

      // Set bit for effective_ellipsis_mask.
      for (; i < ellipsis_end_idx; ++i)
      {
        effective_ellipsis_mask |= (1LL << i);
      }
      continue;
    }

    // Axes after the ellipsis are shifted by the number of extra axes the
    // ellipsis expanded to, so look up the original mask bit accordingly.
    if ((1LL << (i - expanded_ellipsis)) & op_context->params.new_axis_mask)
    {
      effective_new_axis_mask |= (1LL << i);
    }
    ++i;
  }

  // Calculate effective_input_shape and its corresponding begin, end, strides.
  loco::TensorShape input_shape = circle_shape(op_context->input);
  int64_t added_ellipsis = 0, added_axises = 0;
  // make sure no overflow
  assert(static_cast<uint32_t>(effective_dims) == effective_dims);
  op_context->effective_input_shape.rank(effective_dims);

  // Note: i < effective_dims <= kMaxDim holds for every iteration, so all
  // array accesses and mask shifts below stay in range.
  for (int64_t i = 0; i < effective_dims; ++i)
  {
    if ((1LL << i) & effective_ellipsis_mask)
    {
      // If ellipsis_mask, set the begin_mask and end_mask at that index.
      added_ellipsis = std::max(int64_t(0), i - ellipsis_start_idx);
      op_params.begin_mask |= (1LL << i);
      op_params.end_mask |= (1LL << i);
      op_params.strides[i] = 1;
      op_context->effective_input_shape.dim(i) = input_shape.dim(i - added_axises);
    }
    else if ((1LL << i) & effective_new_axis_mask)
    {
      // If new_axis_mask is set, it is equivalent to adding a new dim of 1 to
      // input tensor. Store added shape to effective_input_shape.
      op_params.start_indices[i] = 0;
      op_params.stop_indices[i] = 1;
      op_params.strides[i] = 1;
      op_context->effective_input_shape.dim(i) = loco::Dimension(1);
      added_axises++;
    }
    else if (i >= begin_count + expanded_ellipsis)
    {
      // No begin/end/strides entry was given for this axis: take it whole.
      op_params.start_indices[i] = 0;
      op_params.stop_indices[i] = 0;
      op_params.strides[i] = 1;
      op_params.begin_mask |= (1LL << i);
      op_params.end_mask |= (1LL << i);
      op_context->effective_input_shape.dim(i) = input_shape.dim(i - added_axises);
    }
    else
    {
      // Regular axis: copy the values and mask bits of the original entry.
      const int64_t orig_idx = i - added_ellipsis;
      op_params.start_indices[i] = op_context->begin->at<S32>(orig_idx);
      op_params.stop_indices[i] = op_context->end->at<S32>(orig_idx);
      op_params.strides[i] = op_context->strides->at<S32>(orig_idx);
      if (op_context->params.begin_mask & (1LL << orig_idx))
      {
        op_params.begin_mask |= (1LL << i);
      }
      if (op_context->params.end_mask & (1LL << orig_idx))
      {
        op_params.end_mask |= (1LL << i);
      }
      if (op_context->params.shrink_axis_mask & (1LL << orig_idx))
      {
        op_params.shrink_axis_mask |= (1LL << i);
      }
      op_context->effective_input_shape.dim(i) = input_shape.dim(i - added_axises);
    }
  }

  // make sure no overflow
  assert(static_cast<int8_t>(effective_dims) == static_cast<int32_t>(effective_dims));

  op_params.start_indices_count = static_cast<int8_t>(effective_dims);
  op_params.stop_indices_count = static_cast<int8_t>(effective_dims);
  op_params.strides_count = static_cast<int8_t>(effective_dims);

  return op_params;
}

StridedSliceParams BuildStridedSliceParams(StridedSliceContext *op_context) {…}


// Infers the output shape of a CircleStridedSlice node.
//
// Requirements on the operands (checked with LUCI_ASSERT): begin, end and
// strides have dtype S32 and rank 1. strides has to be a constant, otherwise
// an internal exception is raised through INTERNAL_EXN.
//
// Result:
//   - if begin or end is not a constant, a shape with the rank of the input
//     and every dimension left unset;
//   - otherwise one dimension per effective axis whose shrink_axis bit is not
//     set, holding the number of elements selected on that axis. A dimension
//     is left unset when the corresponding effective input dimension is not
//     known.
loco::TensorShape Algorithm::visit(const luci::CircleStridedSlice *node)
{
  loco::TensorShape output_shape;

  auto input_node = loco::must_cast<luci::CircleNode *>(node->input());

  auto begin_node = loco::must_cast<luci::CircleNode *>(node->begin());
  auto end_node = loco::must_cast<luci::CircleNode *>(node->end());
  auto strides_node = loco::must_cast<luci::CircleNode *>(node->strides());

  LUCI_ASSERT(begin_node->dtype() == S32, "Only support S32 for begin_node");
  LUCI_ASSERT(end_node->dtype() == S32, "Only support S32 for end_node");
  LUCI_ASSERT(strides_node->dtype() == S32, "Only support S32 for strides_node");

  LUCI_ASSERT(begin_node->rank() == 1, "Only support rank 1 for begin_node");
  LUCI_ASSERT(end_node->rank() == 1, "Only support rank 1 for end_node");
  LUCI_ASSERT(strides_node->rank() == 1, "Only support rank 1 for strides_node");

  auto begin_const = dynamic_cast<luci::CircleConst *>(node->begin());
  auto end_const = dynamic_cast<luci::CircleConst *>(node->end());
  auto strides_const = dynamic_cast<luci::CircleConst *>(node->strides());
  // TODO support non-const strides_node
  if (strides_const == nullptr)
  {
    INTERNAL_EXN("StridedSlice strides node is not Constant");
  }
  if (begin_const == nullptr || end_const == nullptr)
  {
    // The dimensions of the output shape are all set to unknown.
    output_shape.rank(input_node->rank());
    return output_shape;
  }

  loco::TensorShape input_shape = circle_shape(input_node);

  assert(begin_const->size<S32>() <= input_shape.rank());
  assert(end_const->size<S32>() <= input_shape.rank());
  assert(strides_const->size<S32>() <= input_shape.rank());

  StridedSliceContext op_context(node);
  auto op_params = BuildStridedSliceParams(&op_context);
  auto &effective_input_shape = op_context.effective_input_shape;

  // Filled from the last axis to the first one; copied back in reverse below.
  std::vector<int64_t> output_shape_vector;
  std::vector<bool> output_known_vector;

  for (int32_t idx = effective_input_shape.rank() - 1; idx >= 0; --idx)
  {
    int32_t stride = op_params.strides[idx];
    LUCI_ASSERT(stride != 0, "stride value has to be non-zero");

    int64_t begin = StartForAxis(op_params, effective_input_shape, idx);
    int64_t end = StopForAxis(op_params, effective_input_shape, idx, begin);

    // When shrinking an axis, the end position does not matter (and can be
    // incorrect when negative indexing is used, see Issue #19260). Always use
    // begin + 1 to generate a length 1 slice, since begin has
    // already been adjusted for negative indices by GetBeginValueAtIndex.
    const bool shrink_axis = op_params.shrink_axis_mask & (1 << idx);
    if (shrink_axis)
    {
      end = begin + 1;
    }

    // Number of selected elements: ceil((end - begin) / stride), valid for
    // both positive and negative strides. It is computed with integers
    // because a float cannot represent spans above 2^24 exactly, which would
    // give a wrong extent for large dimensions. Integer division truncates
    // toward zero, so one is added only when the exact quotient is positive
    // (both operands have the same sign) and not an integer.
    const int64_t span = end - begin;
    int64_t dim_shape = span / stride;
    if ((span % stride != 0) && ((span < 0) == (stride < 0)))
    {
      ++dim_shape;
    }
    // An empty or inverted range selects nothing.
    dim_shape = dim_shape < 0 ? 0 : dim_shape;
    if (!shrink_axis)
    {
      output_shape_vector.push_back(dim_shape);
      output_known_vector.push_back(effective_input_shape.dim(idx).known());
    }
  }

  auto shape_size = output_shape_vector.size();
  output_shape.rank(shape_size);
  for (uint32_t idx = 0; idx < shape_size; ++idx)
  {
    // Dimensions derived from an unknown input dimension are not set.
    bool known = output_known_vector[shape_size - 1u - idx];
    if (not known)
      continue;
    int64_t dim = output_shape_vector.at(shape_size - 1u - idx);
    LUCI_ASSERT(0 <= dim && dim < 0xfffffffL, "Dimension size exceeds limit");
    // reverse copy
    output_shape.dim(idx) = static_cast<uint32_t>(dim);
  }

  return output_shape;
}

loco::TensorShape Algorithm::visit(const luci::CircleStridedSlice *node) {…}


} // namespace sinf

} // namespace luci

CircleCloneNode.h

CircleShapeInference.h

CircleShapeInferenceHelper.h

InternalExn.h

INTERNAL_EXN
#define INTERNAL_EXN(msg)
@brief Throw an internal exception with a message
Definition InternalExn.h:25

NodeShape.h

loco::Dimension
The value of one dimension in a tensor shape.
Definition Dimension.h:30

loco::Dimension::value
uint32_t value(void) const
Return the value.
Definition Dimension.h:51

loco::TensorShape
Definition TensorShape.h:29

loco::TensorShape::dim
const Dimension & dim(uint32_t axis) const
Definition TensorShape.h:38

loco::TensorShape::rank
uint32_t rank(void) const
Definition TensorShape.h:35

luci::CircleConst
Class to build tensor data.
Definition CircleConst.h:35

luci::CircleConst::at
const loco::DataTypeImpl< DT >::Type & at(uint32_t n) const
Definition CircleConst.cpp:38

luci::CircleStridedSlice
STRIDED_SLICE in Circle.
Definition CircleStridedSlice.h:33

luci::CircleStridedSlice::input
loco::Node * input(void) const
Definition CircleStridedSlice.h:35

luci::CircleStridedSlice::begin_mask
int32_t begin_mask() const
Definition CircleStridedSlice.h:48

luci::CircleStridedSlice::shrink_axis_mask
int32_t shrink_axis_mask() const
Definition CircleStridedSlice.h:60

luci::CircleStridedSlice::end_mask
int32_t end_mask() const
Definition CircleStridedSlice.h:51

luci::CircleStridedSlice::begin
loco::Node * begin(void) const
Definition CircleStridedSlice.h:38

luci::CircleStridedSlice::ellipsis_mask
int32_t ellipsis_mask() const
Definition CircleStridedSlice.h:54

luci::CircleStridedSlice::new_axis_mask
int32_t new_axis_mask() const
Definition CircleStridedSlice.h:57

luci::CircleStridedSlice::strides
loco::Node * strides(void) const
Definition CircleStridedSlice.h:44

luci::CircleStridedSlice::end
loco::Node * end(void) const
Definition CircleStridedSlice.h:41

luci::CloneNodeLet
Definition CircleCloneNode.h:39

luci::sinf::Algorithm::visit
loco::TensorShape visit(const luci::CircleNode *node) final
Default fallback.
Definition CircleShapeInference.h:42

DataType.h

output_shape
const luci_interpreter::RuntimeShape output_shape
Definition PALComparisons.h:32

LUCI_ASSERT
#define LUCI_ASSERT(condition, msg)
Definition Check.h:26

CircleNode.h

loco::DataType
DataType
"scalar" value type
Definition DataType.h:27

luci::sinf::StopForAxis
int64_t StopForAxis(const StridedSliceParams &params, const loco::TensorShape &input_shape, int64_t axis, int64_t start_for_axis)
Definition CircleStridedSlice.cpp:185

luci::sinf::S32
const loco::DataType S32
Definition CircleStridedSlice.cpp:60

luci::sinf::Clamp
int Clamp(const int32_t v, const int32_t lo, const int32_t hi)
Definition CircleStridedSlice.cpp:115

luci::sinf::circle_shape
loco::TensorShape circle_shape(const luci::CircleNode *node)
Definition CircleShapeInferenceHelper.cpp:143

luci::sinf::StartForAxis
int64_t StartForAxis(const StridedSliceParams &params, const loco::TensorShape &input_shape, int64_t axis)
Definition CircleStridedSlice.cpp:128

luci::sinf::BuildStridedSliceParams
StridedSliceParams BuildStridedSliceParams(StridedSliceContext *op_context)
Definition CircleStridedSlice.cpp:250

luci::sinf::kMaxDim
const int kMaxDim
Definition CircleStridedSlice.cpp:58

luci
Definition DepthwiseConv2D.h:24

luci::input_node
CircleInput * input_node(loco::Graph *g, const loco::GraphInputIndex &index)
Find a Pull node with a given input index.
Definition CircleNodes.cpp:45

begin_count
int8_t begin_count
Definition Slice.cpp:32

begin
int32_t begin[5]
Definition Slice.cpp:33

luci::CircleNode
Definition CircleNodeDecl.h:40

luci::sinf::StridedSliceContext
Definition CircleStridedSlice.cpp:79

luci::sinf::StridedSliceContext::input_dims
int64_t input_dims
Definition CircleStridedSlice.cpp:111

luci::sinf::StridedSliceContext::strides
luci::CircleConst * strides
Definition CircleStridedSlice.cpp:107

luci::sinf::StridedSliceContext::params
StridedSliceParams params
Definition CircleStridedSlice.cpp:103

luci::sinf::StridedSliceContext::begin
luci::CircleConst * begin
Definition CircleStridedSlice.cpp:105

luci::sinf::StridedSliceContext::input
luci::CircleNode * input
Definition CircleStridedSlice.cpp:104

luci::sinf::StridedSliceContext::end
luci::CircleConst * end
Definition CircleStridedSlice.cpp:106

luci::sinf::StridedSliceContext::StridedSliceContext
StridedSliceContext(const luci::CircleStridedSlice *node)
Definition CircleStridedSlice.cpp:80

luci::sinf::StridedSliceContext::effective_input_shape
loco::TensorShape effective_input_shape
Definition CircleStridedSlice.cpp:110

luci::sinf::StridedSliceParams
Definition CircleStridedSlice.cpp:63

luci::sinf::StridedSliceParams::begin_mask
int16_t begin_mask
Definition CircleStridedSlice.cpp:71

luci::sinf::StridedSliceParams::strides_count
int8_t strides_count
Definition CircleStridedSlice.cpp:68

luci::sinf::StridedSliceParams::end_mask
int16_t end_mask
Definition CircleStridedSlice.cpp:73

luci::sinf::StridedSliceParams::shrink_axis_mask
int16_t shrink_axis_mask
Definition CircleStridedSlice.cpp:75

luci::sinf::StridedSliceParams::stop_indices
int32_t stop_indices[kMaxDim]
Definition CircleStridedSlice.cpp:67

luci::sinf::StridedSliceParams::new_axis_mask
int16_t new_axis_mask
Definition CircleStridedSlice.cpp:74

luci::sinf::StridedSliceParams::start_indices
int32_t start_indices[kMaxDim]
Definition CircleStridedSlice.cpp:65

luci::sinf::StridedSliceParams::ellipsis_mask
int16_t ellipsis_mask
Definition CircleStridedSlice.cpp:72

luci::sinf::StridedSliceParams::start_indices_count
int8_t start_indices_count
Definition CircleStridedSlice.cpp:64

luci::sinf::StridedSliceParams::strides
int32_t strides[kMaxDim]
Definition CircleStridedSlice.cpp:69

luci::sinf::StridedSliceParams::stop_indices_count
int8_t stop_indices_count
Definition CircleStridedSlice.cpp:66