ONE/backend_2xnnpack_2_kernel_generator_8cc_source.html

/*

 * Copyright (c) 2020 Samsung Electronics Co., Ltd. All Rights Reserved

 *

 * Licensed under the Apache License, Version 2.0 (the "License");

 * you may not use this file except in compliance with the License.

 * You may obtain a copy of the License at

 *

 *      http://www.apache.org/licenses/LICENSE-2.0

 *

 * Unless required by applicable law or agreed to in writing, software

 * distributed under the License is distributed on an "AS IS" BASIS,

 * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.

 * See the License for the specific language governing permissions and

 * limitations under the License.

 */


#include "KernelGenerator.h"


#include "ops/ConvolutionLayer.h"

#include "ops/DepthwiseConvolutionLayer.h"

#include "ops/FullyConnectedLayer.h"


#include <backend/Backend.h>

#include <backend/IConfig.h>

#include <memory>

#include <util/Utils.h>

#include <util/logging.h>

#include <exec/DynamicShapeInferer.h>


#include <stdexcept>


namespace onert

{

namespace backend

{

namespace xnnpack

{


// Builds a kernel generator for the XNNPACK backend.
// The constructor only stores what it is given: views of the graph's operands
// and operations, plus the shared tensor builder, tensor registry, custom
// kernel builder and external context. No other work is performed here.
KernelGenerator::KernelGenerator(
  const ir::Graph &graph, const std::shared_ptr<TensorBuilder> &tensor_builder,
  const std::shared_ptr<basic::TensorRegistry> &tensor_reg,
  const std::shared_ptr<backend::custom::IKernelBuilder> &kernel_builder,
  const std::shared_ptr<ExternalContext> &external_context)
  : basic::KernelGeneratorBase{graph},
    _ctx(graph.operands()),
    _operations_ctx{graph.operations()},
    _tensor_builder(tensor_builder),
    _tensor_reg{tensor_reg},
    _kernel_builder(kernel_builder),
    _external_context(external_context)
{
  // Nothing to do: all state is set up in the member initializer list.
}


// Generates the function sequence that executes the operation at `ind`.
//
// Steps:
//   1. Create an empty FunctionSequence and attach a DynamicTensorCtx that
//      points at the operation and carries a DynamicShapeInferer built on the
//      tensor registry.
//   2. Let the operation accept this generator; the matching visit() overload
//      is expected to store the generated kernel in _return_fn.
//   3. Append that kernel to the sequence.
//   4. Call increase_ref() on every native tensor registered for the
//      operation's defined inputs and its outputs.
//
// @param ind  Index of the operation to generate a kernel for.
// @return     The function sequence owning the generated kernel.
std::unique_ptr<exec::FunctionSequence> KernelGenerator::generate(ir::OperationIndex ind)
{
  auto ret = std::make_unique<exec::FunctionSequence>();

  assert(_tensor_builder->dynamicTensorManager());
  assert(_tensor_reg);

  // Prepare to handle dynamic tensors later
  auto dyn_ctx = std::make_shared<exec::FunctionSequence::DynamicTensorCtx>();
  {
    dyn_ctx->op = &_operations_ctx.at(ind);
    dyn_ctx->dynamic_shape_inferer = std::make_shared<exec::DynamicShapeInferer>(_tensor_reg);
  }
  ret->dynamic_tensor_ctx(dyn_ctx);

  auto &op = _graph.operations().at(ind);
  op.accept(*this);
  assert(_return_fn); // _return_fn must have been generated
  ret->append(std::move(_return_fn));

  // The loop variable is deliberately NOT called `ind`: it is an operand
  // index, and reusing the name would shadow the operation-index parameter.
  for (auto &&operand_ind : (op.getInputs() | ir::Remove::UNDEFINED) + op.getOutputs())
  {
    // Only tensors known to the registry as native tensors are touched;
    // a null result is skipped.
    auto tensor = _tensor_reg->getNativeTensor(operand_ind);
    if (tensor)
    {
      tensor->increase_ref();
    }
  }
  return ret;
}


// Creates an ops::ConvolutionLayer for a Conv2D node and stores it in
// _return_fn.
//
// The explicit padding values are computed from the node's padding parameter,
// the input/output feature shapes, the stride, the kernel size and the
// dilation factors, then handed to the layer together with the tensors.
void KernelGenerator::visit(const ir::operation::Conv2D &node)
{
  using ir::operation::Conv2D;

  // Operand indices of the single output and the three inputs.
  const auto &inputs = node.getInputs();
  const auto ifm_index = inputs.at(Conv2D::Input::INPUT);
  const auto ker_index = inputs.at(Conv2D::Input::KERNEL);
  const auto bias_index = inputs.at(Conv2D::Input::BIAS);
  const auto ofm_index = node.getOutputs().at(0);

  // Operation parameters, read through a single reference.
  const auto &param = node.param();
  const auto &param_padding = param.padding;
  const auto stride = param.stride;
  const auto dilation = param.dilation;
  const auto activation = param.activation;

  // Shapes needed for the padding calculation.
  const auto ifm_shape = _ctx.at(ifm_index).shape().asFeature();
  const auto ofm_shape = _ctx.at(ofm_index).shape().asFeature();
  // Kernel format is [depth_out, kernel_height, kernel_width, depth_in].
  const auto &ker_shape = _ctx.at(ker_index).shape();
  const auto ker_height = ker_shape.dim(1);
  const auto ker_width = ker_shape.dim(2);

  const auto padding =
    ir::calculatePadding(param_padding, ifm_shape, ofm_shape, stride, ker_width, ker_height,
                         dilation.width_factor, dilation.height_factor);

  // Tensors backing the operands.
  auto ifm_tensor = _tensor_reg->getPortableTensor(ifm_index);
  auto ker_tensor = _tensor_reg->getPortableTensor(ker_index);
  auto bias_tensor = _tensor_reg->getPortableTensor(bias_index);
  auto ofm_tensor = _tensor_reg->getPortableTensor(ofm_index);

  auto layer = std::make_unique<ops::ConvolutionLayer>(_external_context);
  layer->configure(ifm_tensor, ker_tensor, bias_tensor, param_padding.type, padding.left,
                   padding.right, padding.top, padding.bottom, stride.horizontal,
                   stride.vertical, dilation.width_factor, dilation.height_factor, activation,
                   ofm_tensor);

  _return_fn = std::move(layer);
}


// Creates an ops::DepthwiseConvolutionLayer for a DepthwiseConv2D node and
// stores it in _return_fn.
//
// Explicit padding is derived from the node's padding parameter, the
// input/output feature shapes, the stride, the kernel size and the dilation
// factors before the layer is configured.
void KernelGenerator::visit(const ir::operation::DepthwiseConv2D &node)
{
  using ir::operation::DepthwiseConv2D;

  // Operand indices of the single output and the three inputs.
  const auto &inputs = node.getInputs();
  const auto ifm_index = inputs.at(DepthwiseConv2D::Input::INPUT);
  const auto ker_index = inputs.at(DepthwiseConv2D::Input::KERNEL);
  const auto bias_index = inputs.at(DepthwiseConv2D::Input::BIAS);
  const auto ofm_index = node.getOutputs().at(0);

  // Operation parameters, read through a single reference.
  const auto &param = node.param();
  const auto &param_padding = param.padding;
  const auto stride = param.stride;
  const auto dilation_width = param.dilation.width_factor;
  const auto dilation_height = param.dilation.height_factor;
  const auto multiplier = param.multiplier;
  const auto activation = param.activation;

  // Shapes needed for the padding calculation.
  const auto ifm_shape = _ctx.at(ifm_index).shape().asFeature();
  const auto ofm_shape = _ctx.at(ofm_index).shape().asFeature();
  // Kernel format is [1, kernel_height, kernel_width, depth_out].
  const auto &ker_shape = _ctx.at(ker_index).shape();
  const auto ker_height = ker_shape.dim(1);
  const auto ker_width = ker_shape.dim(2);

  const auto padding = ir::calculatePadding(param_padding, ifm_shape, ofm_shape, stride, ker_width,
                                            ker_height, dilation_width, dilation_height);

  // Tensors backing the operands.
  auto ifm_tensor = _tensor_reg->getPortableTensor(ifm_index);
  auto ker_tensor = _tensor_reg->getPortableTensor(ker_index);
  auto bias_tensor = _tensor_reg->getPortableTensor(bias_index);
  auto ofm_tensor = _tensor_reg->getPortableTensor(ofm_index);

  auto layer = std::make_unique<ops::DepthwiseConvolutionLayer>(_external_context);
  layer->configure(ifm_tensor, ker_tensor, bias_tensor, param_padding.type, padding.left,
                   padding.right, padding.top, padding.bottom, stride.horizontal,
                   stride.vertical, multiplier, dilation_width, dilation_height, activation,
                   ofm_tensor);

  _return_fn = std::move(layer);
}


// Creates an ops::FullyConnectedLayer for a FullyConnected node and stores it
// in _return_fn.
//
// The bias operand is optional: when its index is undefined, a null bias
// tensor is passed to the layer instead of a registry lookup result.
void KernelGenerator::visit(const ir::operation::FullyConnected &node)
{
  using ir::operation::FullyConnected;

  // Operand indices of the single output and the three inputs.
  const auto &inputs = node.getInputs();
  const auto input_index = inputs.at(FullyConnected::Input::INPUT);
  const auto weight_index = inputs.at(FullyConnected::Input::WEIGHT);
  const auto bias_index = inputs.at(FullyConnected::Input::BIAS);
  const auto output_index = node.getOutputs().at(0);

  const auto activation = node.param().activation;

  // Tensors backing the operands.
  auto input_tensor = _tensor_reg->getPortableTensor(input_index);
  auto weight_tensor = _tensor_reg->getPortableTensor(weight_index);
  // Skip the registry lookup entirely when no bias operand is present.
  auto bias_tensor = bias_index.undefined() ? nullptr : _tensor_reg->getPortableTensor(bias_index);
  auto output_tensor = _tensor_reg->getPortableTensor(output_index);

  auto layer = std::make_unique<ops::FullyConnectedLayer>(_external_context);
  layer->configure(input_tensor, weight_tensor, bias_tensor, activation, output_tensor);

  _return_fn = std::move(layer);
}


} // namespace xnnpack

} // namespace backend

} // namespace onert

DynamicShapeInferer.h

IConfig.h

onert::backend::xnnpack::KernelGenerator::KernelGenerator
KernelGenerator(const ir::Graph &graph, const std::shared_ptr< TensorBuilder > &tensor_builder, const std::shared_ptr< basic::TensorRegistry > &tensor_reg, const std::shared_ptr< custom::IKernelBuilder > &kernel_builder, const std::shared_ptr< ExternalContext > &external_context)

onert::ir::OperandIndexSequence::at
const OperandIndex & at(IOIndex set_index) const
Definition OperandIndexSequence.h:50

onert::ir::Operation::getOutputs
const OperandIndexSequence & getOutputs() const override
Definition Operation.h:55

onert::ir::Operation::getInputs
OperandIndexSequence & getInputs()
Definition Operation.h:53

onert::ir::operation::Conv2D
Definition Conv2D.h:34

onert::ir::operation::Conv2D::param
const Param & param() const
Definition Conv2D.h:60

onert::util::Index< uint32_t, OperationIndexTag >

KernelGenerator.h

GenH5RandomInputs.graph
graph
Definition GenH5RandomInputs.py:48

GenH5RandomInputs.input_index
input_index
Definition GenH5RandomInputs.py:60

onert
Definition CustomKernel.cc:20

part_eval_one.output_tensor
output_tensor
Definition part_eval_one.py:116

Backend.h

logging.h

Utils.h
This file contains utility macro.

onert::ir::operation::Conv2D::Param::padding
Padding padding
Definition Conv2D.h:46

onert::ir::operation::Conv2D::Param::dilation
Dilation dilation
Definition Conv2D.h:48

onert::ir::operation::Conv2D::Param::activation
Activation activation
Definition Conv2D.h:47

onert::ir::operation::Conv2D::Param::stride
Stride stride
Definition Conv2D.h:45