ONE/onert-micro_2luci-interpreter_2src_2kernels_2_depthwise_conv2_d_8cpp_source.html

/*

 * Copyright (c) 2020 Samsung Electronics Co., Ltd. All Rights Reserved

 * Copyright 2019 The TensorFlow Authors. All Rights Reserved.

 *

 * Licensed under the Apache License, Version 2.0 (the "License");

 * you may not use this file except in compliance with the License.

 * You may obtain a copy of the License at

 *

 *    http://www.apache.org/licenses/LICENSE-2.0

 *

 * Unless required by applicable law or agreed to in writing, software

 * distributed under the License is distributed on an "AS IS" BASIS,

 * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.

 * See the License for the specific language governing permissions and

 * limitations under the License.

 */


#include "ConvolutionCommon.h"

#include "kernels/Utils.h"


#include "PALDepthwiseConv2D.h"


namespace luci_interpreter

{


namespace

{


#ifndef DIS_FLOAT


/**
 * @brief Runs the float depthwise convolution for one operator via the PAL implementation.
 *
 * Builds the convolution parameters from @p options, fetches the tensor buffers and
 * dimensions from @p runtime_graph and forwards everything to
 * luci_interpreter_pal::DepthwiseConv2D.
 *
 * @param input          Input tensor description.
 * @param filter         Filter tensor description; its data is read as constant data.
 * @param bias           Bias tensor description; its data is read as constant data.
 *                       NOTE(review): configure accepts a null bias, so this relies on
 *                       getConstDataByTensor tolerating nullptr - confirm.
 * @param output         Output tensor description.
 * @param options        DepthwiseConv2D attributes (padding, strides, dilations,
 *                       depth multiplier, fused activation).
 * @param runtime_graph  Graph used to resolve tensor data and dimensions.
 */
void evalFloat(const circle::Tensor *input, const circle::Tensor *filter,
               const circle::Tensor *bias, const circle::Tensor *output,
               const circle::DepthwiseConv2DOptions *options, BaseRuntimeGraph *runtime_graph)
{
  // Clamp range implied by the fused activation function.
  float act_min{};
  float act_max{};
  kernels::calculateActivationRange(luci_actfunc(options->fused_activation_function()), &act_min,
                                    &act_max);

  // Read the operator attributes once; they feed both the padding computation and the params.
  const auto padding_type = options->padding();
  const auto stride_h = options->stride_h();
  const auto stride_w = options->stride_w();
  const auto dilation_h = options->dilation_h_factor();
  const auto dilation_w = options->dilation_w_factor();

  luci_interpreter_pal::ConvParams conv_params{};
  // Height padding is computed along axis 1, width padding along axis 2.
  conv_params.padding_values.height =
    computeConvPadding(input, filter, padding_type, stride_h, dilation_h, 1);
  conv_params.padding_values.width =
    computeConvPadding(input, filter, padding_type, stride_w, dilation_w, 2);
  conv_params.stride_height = stride_h;
  conv_params.stride_width = stride_w;
  conv_params.dilation_height_factor = dilation_h;
  conv_params.dilation_width_factor = dilation_w;
  conv_params.float_activation_min = act_min;
  conv_params.float_activation_max = act_max;
  conv_params.depth_multiplier = options->depth_multiplier();

  // Raw buffers: activations come from the regular lookup, weights/bias from constant data.
  auto *input_raw = runtime_graph->getDataByTensor(input);
  auto *output_raw = runtime_graph->getDataByTensor(output);
  auto *filter_raw = runtime_graph->getConstDataByTensor(filter);
  auto *bias_raw = runtime_graph->getConstDataByTensor(bias);

  // Tensor dimensions, in input / filter / output order.
  int32_t input_dims[kMaxSmallSize];
  kernels::getTensorDims(input, runtime_graph, input_dims);

  int32_t filter_dims[kMaxSmallSize];
  kernels::getTensorDims(filter, runtime_graph, filter_dims);

  int32_t output_dims[kMaxSmallSize];
  kernels::getTensorDims(output, runtime_graph, output_dims);

  // Reinterpret the raw buffers as float arrays for the PAL call.
  const auto input_values = kernels::getTensorData<float>(input_raw);
  const auto filter_values = kernels::getTensorData<float>(filter_raw);
  const auto bias_values = kernels::getTensorData<float>(bias_raw);
  const auto output_values = kernels::getTensorData<float>(output_raw);

  luci_interpreter_pal::DepthwiseConv2D(conv_params, input_dims, input_values, filter_dims,
                                        filter_values, bias_values, output_dims, output_values);
}


#endif // DIS_FLOAT


} // namespace


/**
 * @brief Validates a DepthwiseConv2D operator before it is executed.
 *
 * Checks performed:
 *  - the filter has constant data available;
 *  - the operator carries DepthwiseConv2D options;
 *  - input and filter are FLOAT32 (any other combination is rejected), and the bias,
 *    when present, is FLOAT32 too;
 *  - output element type equals the input element type;
 *  - input, filter and output are rank-4 tensors;
 *  - the bias, when present, is rank-1 with as many elements as output dimension 3;
 *  - the fused activation is NONE, RELU, RELU6 or RELU_N1_TO_1.
 *
 * Violations are reported through LUCI_INTERPRETER_CHECK / assert, matching the rest of
 * this file.
 *
 * @param cur_op         Operator to validate.
 * @param runtime_graph  Graph used to resolve the operator's tensors and constant data.
 */
void configure_kernel_CircleDepthwiseConv2D(const circle::Operator *cur_op,
                                            BaseRuntimeGraph *runtime_graph)
{
  kernels::DownsamplingConv2DKernel kernel(cur_op, runtime_graph);

  const auto input = kernel.input();
  const auto filter = kernel.filter();
  const auto bias = kernel.bias();
  const auto output = kernel.output();

  auto filter_data = runtime_graph->getConstDataByTensor(filter);

  assert(filter_data != nullptr);

  const auto *options = cur_op->builtin_options_as_DepthwiseConv2DOptions();
  // The union accessor yields nullptr when the operator stores a different options table;
  // reject that here instead of dereferencing it in the activation switch below.
  LUCI_INTERPRETER_CHECK(options != nullptr);

  if (Tensor::element_type(input) == DataType::FLOAT32 &&
      Tensor::element_type(filter) == DataType::FLOAT32)
  {
    LUCI_INTERPRETER_CHECK(bias == nullptr || Tensor::element_type(bias) == DataType::FLOAT32);
  }
  else
  {
    assert(false && "Unsupported type.");
  }
  LUCI_INTERPRETER_CHECK(Tensor::element_type(output) == Tensor::element_type(input));
  LUCI_INTERPRETER_CHECK(Tensor::num_dims(input) == 4 && Tensor::num_dims(filter) == 4);
  // Dimension 3 of the output is read next, so its rank has to be validated first.
  LUCI_INTERPRETER_CHECK(Tensor::num_dims(output) == 4);

  const int32_t output_depth = Tensor::dim(output, 3);
  LUCI_INTERPRETER_CHECK(bias == nullptr ||
                         (Tensor::num_dims(bias) == 1 && Tensor::dim(bias, 0) == output_depth));

  switch (options->fused_activation_function())
  {
    case circle::ActivationFunctionType_NONE:
    case circle::ActivationFunctionType_RELU:
    case circle::ActivationFunctionType_RELU6:
    case circle::ActivationFunctionType_RELU_N1_TO_1:
      break;
    default:
      assert(false && "Unsupported fused activation");
  }
}

// end of configure_kernel_CircleDepthwiseConv2D


/**
 * @brief Executes a DepthwiseConv2D operator.
 *
 * Dispatches to the float implementation when both the input and the filter are FLOAT32
 * (and float support is not compiled out with DIS_FLOAT). Every other type combination
 * ends in the "Unsupported type." assertion.
 *
 * @param cur_op         Operator to execute.
 * @param runtime_graph  Graph used to resolve the operator's tensors and their data.
 */
void execute_kernel_CircleDepthwiseConv2D(const circle::Operator *cur_op,
                                          BaseRuntimeGraph *runtime_graph)
{
  kernels::DownsamplingConv2DKernel conv_kernel(cur_op, runtime_graph);

  const auto input_tensor = conv_kernel.input();
  const auto filter_tensor = conv_kernel.filter();
  const auto bias_tensor = conv_kernel.bias();
  const auto output_tensor = conv_kernel.output();

  const auto *conv_options = cur_op->builtin_options_as_DepthwiseConv2DOptions();

  // The input type is always queried; the filter type only when the input is FLOAT32.
  const auto input_type = Tensor::element_type(input_tensor);
  (void)input_type; // unused when float support is compiled out and asserts are disabled

#ifndef DIS_FLOAT
  if (input_type == DataType::FLOAT32 && Tensor::element_type(filter_tensor) == DataType::FLOAT32)
  {
    evalFloat(input_tensor, filter_tensor, bias_tensor, output_tensor, conv_options,
              runtime_graph);
    return;
  }
#endif // DIS_FLOAT

  // Reached for any input/filter type pair that has no implementation.
  assert(false && "Unsupported type.");
}

// end of execute_kernel_CircleDepthwiseConv2D


} // namespace luci_interpreter

luci_interpreter::RuntimeGraph
Definition RuntimeGraph.h:33

luci_interpreter::RuntimeGraph::getConstDataByTensor
uint8_t * getConstDataByTensor(const circle::Tensor *raw_tensor)
Definition RuntimeGraph.cpp:398

luci_interpreter::kernels::DownsamplingConv2DKernel
Definition ConvolutionCommon.h:39

luci_interpreter::kernels::DownsamplingConv2DKernel::output
const circle::Tensor * output() const
Definition ConvolutionCommon.h:67

luci_interpreter::kernels::DownsamplingConv2DKernel::input
const circle::Tensor * input() const
Definition ConvolutionCommon.h:64

luci_interpreter::kernels::DownsamplingConv2DKernel::filter
const circle::Tensor * filter() const
Definition ConvolutionCommon.h:65

luci_interpreter::kernels::DownsamplingConv2DKernel::bias
const circle::Tensor * bias() const
Definition ConvolutionCommon.h:66

LUCI_INTERPRETER_CHECK
#define LUCI_INTERPRETER_CHECK(cond)
Definition Utils.h:36

output_shape
const luci_interpreter::RuntimeShape output_shape
Definition PALComparisons.h:32

infer.input_data
list input_data
Definition infer.py:29

luci_interpreter::kernels::calculateActivationRange
void calculateActivationRange(Activation activation, T *activation_min, T *activation_max)
Definition Utils.cpp:52

luci_interpreter::kernels::getTensorDims
void getTensorDims(const circle::Tensor *tensor, BaseRuntimeGraph *runtime_graph, int32_t *dims)
Definition Utils.h:121

luci_interpreter
Definition BuddyMemoryManager.h:22

luci_interpreter::configure_kernel_CircleDepthwiseConv2D
void configure_kernel_CircleDepthwiseConv2D(const circle::Operator *cur_op, BaseRuntimeGraph *runtime_graph)
Definition DepthwiseConv2D.cpp:78

luci_interpreter::BaseRuntimeGraph
RuntimeGraph BaseRuntimeGraph
Definition RuntimeModule.h:39

luci_interpreter::computeConvPadding
int32_t computeConvPadding(const circle::Tensor *input, const circle::Tensor *filter, circle::Padding padding_type, int32_t stride, int32_t dilation, int axis)
Definition ConvolutionCommon.cpp:41

luci_interpreter::execute_kernel_CircleDepthwiseConv2D
void execute_kernel_CircleDepthwiseConv2D(const circle::Operator *cur_op, BaseRuntimeGraph *runtime_graph)
Definition DepthwiseConv2D.cpp:122

luci::luci_actfunc
FusedActFunc luci_actfunc(const circle::ActivationFunctionType type)
Definition CircleReader.cpp:84

onnx_legalizer.options
options
Definition onnx_legalizer.py:1070

part_eval_one.output_data
output_data
Definition part_eval_one.py:112

ConvolutionCommon.h

circle_eval_diff::TensorShape::dim
const loco::Dimension & dim(uint32_t axis) const
Definition Tensor.h:44

luci_interpreter_pal::ConvParams
Definition Params.h:84

luci_interpreter_pal::ConvParams::padding_values
PaddingValues padding_values
Definition Params.h:86

luci_interpreter_pal::PaddingValues::height
int16_t height
Definition Params.h:74