ONE/backend_2train_2_kernel_generator_8cc_source.html

/*

 * Copyright (c) 2023 Samsung Electronics Co., Ltd. All Rights Reserved

 *

 * Licensed under the Apache License, Version 2.0 (the "License");

 * you may not use this file except in compliance with the License.

 * You may obtain a copy of the License at

 *

 *      http://www.apache.org/licenses/LICENSE-2.0

 *

 * Unless required by applicable law or agreed to in writing, software

 * distributed under the License is distributed on an "AS IS" BASIS,

 * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.

 * See the License for the specific language governing permissions and

 * limitations under the License.

 */


#include "KernelGenerator.h"


#include "ops/BackPropAccumulator.h"

#include "ops/BinaryArithmeticLayer.h"

#include "ops/ConvolutionLayer.h"

#include "ops/DepthwiseConvolutionLayer.h"

#include "ops/ElementwiseActivationLayer.h"

#include "ops/FullyConnectedLayer.h"

#include "ops/LossMeanSquaredErrorLayer.h"

#include "ops/LossCategoricalCrossentropyLayer.h"

#include "ops/MeanLayer.h"

#include "ops/GradientApplier.h"

#include "ops/PadLayer.h"

#include "ops/PoolLayer.h"

#include "ops/ReshapeLayer.h"

#include "ops/SoftMaxLayer.h"


#include <backend/Backend.h>

#include <backend/IConfig.h>

#include <memory>

#include <util/logging.h>

#include <exec/DynamicShapeInferer.h>


#include <stdexcept>


namespace onert::backend::train

{


namespace

{

// Translates an IR elementwise-activation type into the activation type used by the train
// backend ops. Only RELU is translated; every other value raises std::runtime_error.
ops::ElementwiseActivationType
convertElementwiseActivationType(ir::operation::ElementwiseActivation::Type type_ir)
{
  using IrType = ir::operation::ElementwiseActivation::Type;

  if (type_ir == IrType::RELU)
    return ops::ElementwiseActivationType::kReLU;

  throw std::runtime_error("train KernelGenerator : Not supported operation yet");
}


// Translates an IR pooling type into the pooling type used by the train backend ops.
// MAX and AVG are translated; every other value raises std::runtime_error.
ops::PoolType convertPoolType(ir::operation::Pool2D::PoolType type_ir)
{
  using IrPoolType = ir::operation::Pool2D::PoolType;

  if (type_ir == IrPoolType::MAX)
    return ops::PoolType::kMax;

  if (type_ir == IrPoolType::AVG)
    return ops::PoolType::kAvg;

  throw std::runtime_error("train KernelGenerator : Not supported operation yet");
}


// Creates a BackPropAccumulator constructed from the given disposable tensor and the
// back-prop (gradient) tensor, and hands ownership of it to the caller.
std::unique_ptr<ops::BackPropAccumulator>
generateBackPropAccumulator(const IPortableTensor *disposable, BackPropTensor *gradient)
{
  return std::make_unique<ops::BackPropAccumulator>(disposable, gradient);
}


// Appends one BackPropAccumulator to `seq` for every defined input of `op` that has a
// disposable back-prop tensor registered in `tensor_reg` for the (op_index, input) pair.
// Nothing is appended when `op` is not required for backward.
void appendBackPropAccumulators(const ir::train::ITrainableOperation &op,
                                const ir::OperationIndex &op_index, TensorRegistry *tensor_reg,
                                exec::train::TrainableFnSequence *seq)
{
  if (op.isRequiredForBackward())
  {
    for (const auto &operand : (op.getInputs() | ir::Remove::UNDEFINED))
    {
      const auto disposable_tensor =
        tensor_reg->getDisposableBackPropTensor(DisposableTensorIndex{op_index, operand});

      // Inputs without a disposable tensor need no accumulation step
      if (disposable_tensor == nullptr)
        continue;

      auto back_prop_tensor = tensor_reg->getBackPropTensor(operand);
      assert(back_prop_tensor);
      seq->append(generateBackPropAccumulator(disposable_tensor, back_prop_tensor));
    }
  }
}


// Creates a GradientApplier and configures it with the optimizer, the gradient tensor and the
// trainable tensor. Ownership of the applier is handed to the caller.
std::unique_ptr<ops::GradientApplier>
generateGradientApplier(const exec::train::optimizer::Optimizer *optimizer,
                        const IPortableTensor *gradient, ITrainableTensor *trainable)
{
  auto applier = std::make_unique<ops::GradientApplier>();
  applier->configure(optimizer, gradient, trainable);

  return applier;
}

} // namespace


// Builds the TrainableFnSequence for the operation at `idx`.
//
// The sequence is filled in this order:
//   1. back-prop accumulators for the operation's inputs,
//   2. the kernel produced by visiting the operation (_return_fn),
//   3. the update functions collected in _update_funcs while visiting.
// Finally, increase_ref() is called on every non-const tensor found among the operation's
// defined inputs and its outputs.
std::unique_ptr<exec::train::TrainableFnSequence> KernelGenerator::generate(ir::OperationIndex idx)
{
  // NOTE This function is related to planning tensors. If you change this function, you should
  //      also consider to change planning tensors.

  const auto &op = _tgraph.operation(idx);
  auto fn_seq = std::make_unique<exec::train::TrainableFnSequence>();

  // NOTE appendBackPropAccumulators() must be called before appending _return_fn to
  //      TrainableFnSequence as long as both are appended to the same TrainableFnSequence.
  appendBackPropAccumulators(op, idx, _tensor_reg.get(), fn_seq.get());

  // Visiting the operation stores its kernel in _return_fn
  op.accept(*this);
  assert(_return_fn);
  fn_seq->append(std::move(_return_fn));

  // Hand over the update functions gathered during the visit, then reset the list
  for (auto &&pending_update : _update_funcs)
  {
    fn_seq->append(std::move(pending_update));
  }
  _update_funcs.clear();

  for (auto &&operand : (op.getInputs() | ir::Remove::UNDEFINED) + op.getOutputs())
  {
    if (auto tensor = _tensor_reg->getNonConstTensor(operand); tensor)
      tensor->increase_ref();
  }

  return fn_seq;
}

std::unique_ptr<exec::train::TrainableFnSequence> KernelGenerator::generate(ir::OperationIndex idx) {…}


// Stores the tensor registry, external context and optimizer, and records the operation index
// of every operation in `tgraph`, keyed by the operation's address, in _node_to_idx.
KernelGenerator::KernelGenerator(const ir::train::TrainableGraph &tgraph,
                                 const std::shared_ptr<TensorRegistry> &tensor_reg,
                                 const std::shared_ptr<ExternalContext> &external_context,
                                 const exec::train::optimizer::Optimizer *optimizer)
  : backend::train::KernelGeneratorBase{tgraph}, _tensor_reg{tensor_reg},
    _external_context(external_context), _optimizer{optimizer}, _update_funcs{}, _node_to_idx{}
{
  const auto register_node = [this](const onert::ir::OperationIndex &index,
                                    const onert::ir::IOperation &operation) {
    // Each operation is expected to be seen only once
    assert(_node_to_idx.find(&operation) == _node_to_idx.end());
    _node_to_idx[&operation] = index;
  };

  tgraph.operations().iterate(register_node);
}

KernelGenerator::KernelGenerator(const ir::train::TrainableGraph &tgraph, {…}


// Generates the kernel for a BinaryArithmetic node and stores it in _return_fn.
// The forward computation is always configured; the backward computation is configured only
// when the node is required for backward.
void KernelGenerator::visit(const ir::train::operation::BinaryArithmetic &node)
{
  using ir::train::operation::BinaryArithmetic;

  const auto &inputs = node.getInputs();
  const auto lhs_index = inputs.at(BinaryArithmetic::Input::LHS);
  const auto rhs_index = inputs.at(BinaryArithmetic::Input::RHS);
  const auto output_index = node.getOutputs().at(0);

  const auto &param = node.param();
  const auto activation = param.activation;
  const auto arithmetic_type = param.arithmetic_type;

  auto lhs_tensor = _tensor_reg->getPortableTensor(lhs_index);
  auto rhs_tensor = _tensor_reg->getPortableTensor(rhs_index);
  auto output_tensor = _tensor_reg->getPortableTensor(output_index);

  auto layer = std::make_unique<ops::BinaryArithmeticLayer>();

  // The forward pass takes the cpu backend's arithmetic type
  layer->configure(lhs_tensor, rhs_tensor, output_tensor, activation,
                   static_cast<cpu::ops::ArithmeticType>(arithmetic_type));

  if (node.isRequiredForBackward())
  {
    auto back_prop_output_tensor = getBackPropOut(output_index);
    auto back_prop_lhs_tensor = getBackPropIn(node, lhs_index);
    auto back_prop_rhs_tensor = getBackPropIn(node, rhs_index);

    // The backward pass takes the train backend's arithmetic type
    layer->configureBackward(back_prop_lhs_tensor, back_prop_rhs_tensor, back_prop_output_tensor,
                             activation, static_cast<train::ops::ArithmeticType>(arithmetic_type));
  }

  _return_fn = std::move(layer);
}

void KernelGenerator::visit(const ir::train::operation::BinaryArithmetic &node) {…}


// Generates the kernel for a Conv2D node and stores it in _return_fn.
//
// The forward convolution is always configured. When the node is required for backward, the
// backward pass is configured as well and GradientAppliers are queued in _update_funcs: one for
// the bias (only if a bias tensor exists) followed by one for the kernel.
void KernelGenerator::visit(const ir::train::operation::Conv2D &node)
{
  using ir::train::operation::Conv2D;

  const auto out_index{node.getOutputs().at(0)};
  const auto in_index{node.getInputs().at(Conv2D::Input::INPUT)};
  const auto ker_index{node.getInputs().at(Conv2D::Input::KERNEL)};
  const auto bias_index{node.getInputs().at(Conv2D::Input::BIAS)};

  auto out_tensor = _tensor_reg->getPortableTensor(out_index);
  auto in_tensor = _tensor_reg->getPortableTensor(in_index);
  auto ker_tensor = _tensor_reg->getTrainableTensor(ker_index);
  auto bias_tensor = _tensor_reg->getTrainableTensor(bias_index);

  // Generate kernel
  const auto stride = node.param().stride;
  const auto activation = node.param().activation;
  const auto &param_padding = node.param().padding;
  const auto dilation = node.param().dilation;
  auto fn = std::make_unique<ops::ConvolutionLayer>();

  const auto &operands = _tgraph.operands();
  const auto ifm_shape = operands.at(in_index).shape().asFeature();
  const auto ofm_shape = operands.at(out_index).shape().asFeature();
  // Kernel format is [depth_out, kernel_height, kernel_width, depth_in].
  const auto &ker_shape = operands.at(ker_index).shape();
  const auto ker_height = ker_shape.dim(1);
  const auto ker_width = ker_shape.dim(2);

  const auto padding =
    ir::calculatePadding(param_padding, ifm_shape, ofm_shape, stride, ker_width, ker_height,
                         dilation.width_factor, dilation.height_factor);

  const bool is_cacheable_weights = false;
  fn->configure(in_tensor, ker_tensor, bias_tensor, param_padding.type, padding.left, padding.right,
                padding.top, padding.bottom, stride.horizontal, stride.vertical,
                dilation.width_factor, dilation.height_factor, activation, out_tensor,
                is_cacheable_weights);

  if (node.isRequiredForBackward())
  {
    // Gradient tensors are consumed only by the backward pass, so they are looked up here,
    // in the same way as the DepthwiseConv2D and FullyConnected visitors do.
    auto ker_grad_tensor = _tensor_reg->getGradientTensor(ker_index);
    auto bias_grad_tensor = _tensor_reg->getGradientTensor(bias_index);

    auto out_back_prop_tensor = getBackPropOut(out_index);
    auto in_back_prop_tensor = getBackPropIn(node, in_index);

    fn->configureBackward(ker_tensor, in_back_prop_tensor, ker_grad_tensor, bias_grad_tensor,
                          out_back_prop_tensor, activation);

    // Generate GradientApplier
    if (bias_tensor)
      _update_funcs.emplace_back(
        generateGradientApplier(_optimizer, bias_grad_tensor, bias_tensor));
    _update_funcs.emplace_back(generateGradientApplier(_optimizer, ker_grad_tensor, ker_tensor));
  }

  _return_fn = std::move(fn);
}

void KernelGenerator::visit(const ir::train::operation::Conv2D &node) {…}


// Generates the kernel for a DepthwiseConv2D node and stores it in _return_fn.
//
// The forward pass is always configured. When the node is required for backward, the backward
// pass is configured too and GradientAppliers are queued in _update_funcs: one for the bias
// (only if a bias tensor exists) followed by one for the kernel.
void KernelGenerator::visit(const ir::train::operation::DepthwiseConv2D &node)
{
  using ir::train::operation::DepthwiseConv2D;

  const auto &inputs = node.getInputs();
  const auto ifm_index = inputs.at(DepthwiseConv2D::Input::INPUT);
  const auto ker_index = inputs.at(DepthwiseConv2D::Input::KERNEL);
  const auto bias_index = inputs.at(DepthwiseConv2D::Input::BIAS);
  const auto ofm_index = node.getOutputs().at(0);

  auto ifm_tensor = _tensor_reg->getPortableTensor(ifm_index);
  auto ofm_tensor = _tensor_reg->getPortableTensor(ofm_index);
  auto ker_tensor = _tensor_reg->getTrainableTensor(ker_index);
  auto bias_tensor = _tensor_reg->getTrainableTensor(bias_index);

  const auto &param = node.param();
  const auto stride = param.stride;
  const auto multiplier = param.multiplier;
  const auto activation = param.activation;
  const auto dilation_width = param.dilation.width_factor;
  const auto dilation_height = param.dilation.height_factor;

  const auto &operands = _tgraph.operands();
  const auto ifm_shape = operands.at(ifm_index).shape().asFeature();
  const auto ofm_shape = operands.at(ofm_index).shape().asFeature();
  // Kernel format is [1, kernel_height, kernel_width, depth_out].
  const auto &ker_shape = operands.at(ker_index).shape();
  const auto ker_height = ker_shape.dim(1);
  const auto ker_width = ker_shape.dim(2);

  const auto padding = ir::calculatePadding(param.padding, ifm_shape, ofm_shape, stride, ker_width,
                                            ker_height, dilation_width, dilation_height);

  auto layer = std::make_unique<ops::DepthwiseConvolutionLayer>();

  layer->configure(ifm_tensor, ker_tensor, bias_tensor, padding.left, padding.right, padding.top,
                   padding.bottom, stride.horizontal, stride.vertical, multiplier, dilation_width,
                   dilation_height, activation, ofm_tensor, _external_context);

  if (node.isRequiredForBackward())
  {
    auto ker_grad_tensor = _tensor_reg->getGradientTensor(ker_index);
    auto bias_grad_tensor = _tensor_reg->getGradientTensor(bias_index);

    auto ofm_back_prop_tensor = getBackPropOut(ofm_index);
    auto ifm_back_prop_tensor = getBackPropIn(node, ifm_index);

    layer->configureBackward(ifm_back_prop_tensor, ker_grad_tensor, bias_grad_tensor,
                             ofm_back_prop_tensor, activation);

    // Queue the GradientAppliers: bias first (when present), then kernel
    if (bias_tensor)
    {
      _update_funcs.emplace_back(
        generateGradientApplier(_optimizer, bias_grad_tensor, bias_tensor));
    }
    _update_funcs.emplace_back(generateGradientApplier(_optimizer, ker_grad_tensor, ker_tensor));
  }

  _return_fn = std::move(layer);
}

void KernelGenerator::visit(const ir::train::operation::DepthwiseConv2D &node) {…}


// Generates the kernel for an ElementwiseActivation node and stores it in _return_fn.
// Only the RELU activation type is accepted; other types raise std::invalid_argument while
// configuring the forward pass. The backward pass is configured only when the node is required
// for backward.
void KernelGenerator::visit(const ir::train::operation::ElementwiseActivation &node)
{
  using ir::train::operation::ElementwiseActivation;

  const auto input_index = node.getInputs().at(ElementwiseActivation::Input::INPUT);
  const auto output_index = node.getOutputs().at(0);

  auto input_tensor = _tensor_reg->getPortableTensor(input_index);
  auto output_tensor = _tensor_reg->getPortableTensor(output_index);

  auto layer = std::make_unique<ops::ElementwiseActivationLayer>();

  // Translates the IR activation type into the cpu backend's activation type for the forward pass
  const auto toInferActivationType = [](const ir::operation::ElementwiseActivation::Type &type) {
    if (type == ir::operation::ElementwiseActivation::Type::RELU)
      return cpu::ops::ElementwiseActivationType::kReLU;

    throw std::invalid_argument("Unsupported ElementwiseActivation::Type");
  };

  const auto &param = node.param();

  layer->configure(input_tensor, output_tensor, param.alpha, param.beta,
                   toInferActivationType(param.op_type));

  if (node.isRequiredForBackward())
  {
    auto back_prop_input_tensor = getBackPropIn(node, input_index);
    auto back_prop_output_tensor = getBackPropOut(output_index);

    layer->configureBackward(input_tensor, back_prop_input_tensor, back_prop_output_tensor,
                             param.alpha, param.beta,
                             convertElementwiseActivationType(param.op_type));
  }

  _return_fn = std::move(layer);
}

void KernelGenerator::visit(const ir::train::operation::ElementwiseActivation &node) {…}


// Generates the kernel for a FullyConnected node and stores it in _return_fn.
//
// The forward pass is always configured. When the node is required for backward, the backward
// pass is configured too and GradientAppliers are queued in _update_funcs: one for the bias
// (only if a bias tensor exists) followed by one for the weights.
void KernelGenerator::visit(const ir::train::operation::FullyConnected &node)
{
  using ir::train::operation::FullyConnected;

  const auto &inputs = node.getInputs();
  const auto in_index = inputs.at(FullyConnected::Input::INPUT);
  const auto weights_index = inputs.at(FullyConnected::Input::WEIGHT);
  const auto bias_index = inputs.at(FullyConnected::Input::BIAS);
  const auto out_index = node.getOutputs().at(0);

  auto in_tensor = _tensor_reg->getPortableTensor(in_index);
  auto out_tensor = _tensor_reg->getPortableTensor(out_index);
  auto weights_tensor = _tensor_reg->getTrainableTensor(weights_index);
  auto bias_tensor = _tensor_reg->getTrainableTensor(bias_index);

  const auto &param = node.param();
  const auto activation = param.activation;
  const auto weights_format = param.weights_format;

  // Generate kernel
  auto layer = std::make_unique<ops::FullyConnectedLayer>();

  layer->configure(in_tensor, weights_tensor, bias_tensor, activation, weights_format, out_tensor,
                   _external_context);

  if (node.isRequiredForBackward())
  {
    auto weights_grad_tensor = _tensor_reg->getGradientTensor(weights_index);
    auto bias_grad_tensor = _tensor_reg->getGradientTensor(bias_index);
    auto out_back_prop_tensor = getBackPropOut(out_index);
    auto in_back_prop_tensor = getBackPropIn(node, in_index);

    layer->configureBackward(in_tensor, weights_tensor, out_tensor, in_back_prop_tensor,
                             weights_grad_tensor, bias_grad_tensor, out_back_prop_tensor,
                             activation, weights_format);

    // Queue the GradientAppliers: bias first (when present), then weights
    if (bias_tensor)
    {
      _update_funcs.emplace_back(
        generateGradientApplier(_optimizer, bias_grad_tensor, bias_tensor));
    }
    _update_funcs.emplace_back(
      generateGradientApplier(_optimizer, weights_grad_tensor, weights_tensor));
  }

  _return_fn = std::move(layer);
}

void KernelGenerator::visit(const ir::train::operation::FullyConnected &node) {…}


// Generates the kernel for a Loss node and stores it in _return_fn.
//
// MeanSquaredError and CategoricalCrossentropy are handled; any other loss code raises
// std::runtime_error. For CategoricalCrossentropy the loss parameter must hold a
// CategoricalCrossentropyParam, otherwise std::runtime_error is raised.
void KernelGenerator::visit(const ir::train::operation::Loss &node)
{
  using ir::train::operation::Loss;

  const auto y_pred_index = node.getInputs().at(Loss::Y_PRED);
  const auto y_true_index = node.getInputs().at(Loss::Y_TRUE);
  const auto output_index = node.getOutputs().at(0);

  auto output_tensor = _tensor_reg->getPortableTensor(output_index);
  auto y_pred_tensor = _tensor_reg->getPortableTensor(y_pred_index);
  auto y_true_tensor = _tensor_reg->getPortableTensor(y_true_index);

  // TODO Use BackPropTensor directly instead of DisposableTensor if y_pred is always used by only
  //      loss
  auto back_prop_y_pred_tensor = getBackPropIn(node, y_pred_index);

  const auto &loss_info = node.param();
  const auto reduction_type = loss_info.reduction_type;

  if (loss_info.loss_code == ir::train::LossCode::MeanSquaredError)
  {
    auto mse_layer = std::make_unique<ops::LossMeanSquaredErrorLayer>();
    mse_layer->configure(y_pred_tensor, y_true_tensor, output_tensor, back_prop_y_pred_tensor,
                         reduction_type);
    _return_fn = std::move(mse_layer);
    return;
  }

  if (loss_info.loss_code == ir::train::LossCode::CategoricalCrossentropy)
  {
    // Normalization is requested unless y_pred is produced by a Softmax operation
    const bool is_normalization_required = (node.y_pred_op_code() != ir::OpCode::Softmax);

    const auto cce_params =
      std::get_if<ir::train::CategoricalCrossentropyParam>(&loss_info.loss_param);
    if (cce_params == nullptr)
    {
      throw std::runtime_error("LossLayer: Expected loss_param to be "
                               "CategoricalCrossentropyParam but found a different type.");
    }

    auto cce_layer = std::make_unique<ops::LossCategoricalCrossentropyLayer>();
    cce_layer->configure(y_pred_tensor, y_true_tensor, output_tensor, back_prop_y_pred_tensor,
                         reduction_type, cce_params->axis, cce_params->label_smoothing,
                         is_normalization_required);
    _return_fn = std::move(cce_layer);
    return;
  }

  throw std::runtime_error("LossLayer: unsupported loss type");
}

void KernelGenerator::visit(const ir::train::operation::Loss &node) {…}


// Generates the kernel for a Pad node and stores it in _return_fn.
// A value tensor is passed to the layer only when the node has three inputs (PadV2); otherwise
// a null value tensor is passed. The backward pass is configured only when the node is required
// for backward.
void KernelGenerator::visit(const ir::train::operation::Pad &node)
{
  using IrPad = ir::operation::Pad;

  const auto &inputs = node.getInputs();
  const auto input_index = inputs.at(IrPad::Input::INPUT);
  const auto pad_index = inputs.at(IrPad::Input::PAD);
  const auto output_index = node.getOutputs().at(0);

  auto input = _tensor_reg->getPortableTensor(input_index);
  auto pad = _tensor_reg->getPortableTensor(pad_index);
  auto output = _tensor_reg->getPortableTensor(output_index);

  const bool is_pad_v2 = (inputs.size() == 3);
  IPortableTensor *value =
    is_pad_v2 ? _tensor_reg->getPortableTensor(inputs.at(IrPad::Input::VALUE)) : nullptr;

  auto layer = std::make_unique<ops::PadLayer>();
  layer->configure(input, pad, value, output);

  if (node.isRequiredForBackward())
  {
    auto out_back_prop_tensor = getBackPropOut(output_index);
    auto in_back_prop_tensor = getBackPropIn(node, input_index);
    layer->configureBackward(in_back_prop_tensor, out_back_prop_tensor);
  }

  _return_fn = std::move(layer);
}

void KernelGenerator::visit(const ir::train::operation::Pad &node) {…}


// Generates the kernel for a Pool2D node and stores it in _return_fn.
// Raises std::runtime_error when the input is not a 4D tensor or when the pooling type is not
// supported. The backward pass is configured only when the node is required for backward.
void KernelGenerator::visit(const ir::train::operation::Pool2D &node)
{
  using ir::train::operation::Pool2D;

  const auto input_index = node.getInputs().at(0);
  const auto output_index = node.getOutputs().at(0);

  const auto &operands = _tgraph.operands();
  const auto &ifm_shape = operands.at(input_index).shape();
  const auto &ofm_shape = operands.at(output_index).shape();

  if (ifm_shape.rank() != 4)
  {
    throw std::runtime_error(node.name() + " only supports 4D tensor as input");
  }

  // calculate padding
  const auto &param = node.param();
  const auto stride = param.stride;
  const auto kh = param.kh;
  const auto kw = param.kw;
  const auto padding = ir::calculatePadding(param.padding, ifm_shape.asFeature(),
                                            ofm_shape.asFeature(), stride, kw, kh);

  auto in_tensor = _tensor_reg->getPortableTensor(input_index);
  auto out_tensor = _tensor_reg->getPortableTensor(output_index);

  const auto activation = param.activation;
  const auto pool_type = convertPoolType(param.op_type);

  auto layer = std::make_unique<ops::PoolLayer>();

  // Translates the train backend's pool type into the cpu backend's pool type used by the
  // forward pass
  const auto toInferPoolType = [](const train::ops::PoolType &train_pool_type) {
    if (train_pool_type == train::ops::PoolType::kMax)
      return cpu::ops::PoolType::kMax;

    if (train_pool_type == train::ops::PoolType::kAvg)
      return cpu::ops::PoolType::kAvg;

    throw std::runtime_error("PoolLayer: Unsupported pool type yet");
  };

  layer->configure(in_tensor, padding.left, padding.right, padding.top, padding.bottom,
                   stride.horizontal, stride.vertical, kw, kh, activation, out_tensor,
                   toInferPoolType(pool_type));

  if (node.isRequiredForBackward())
  {
    auto out_back_prop_tensor = getBackPropOut(output_index);
    auto in_back_prop_tensor = getBackPropIn(node, input_index);
    layer->configureBackward(padding.left, padding.right, padding.top, padding.bottom,
                             stride.horizontal, stride.vertical, kw, kh, activation, pool_type,
                             out_tensor, in_back_prop_tensor, out_back_prop_tensor);
  }

  _return_fn = std::move(layer);
}

void KernelGenerator::visit(const ir::train::operation::Pool2D &node) {…}


// Generates the kernel for a Reduce node and stores it in _return_fn.
// Only the MEAN reduce type is handled; any other reduce type raises std::runtime_error.
// The backward pass is configured only when the node is required for backward.
void KernelGenerator::visit(const ir::train::operation::Reduce &node)
{
  using ir::train::operation::Reduce;

  const auto input_index = node.getInputs().at(Reduce::Input::INPUT);
  const auto axes_index = node.getInputs().at(Reduce::Input::AXES);
  const auto output_index = node.getOutputs().at(0);

  const auto keep_dims = node.param().keep_dims;

  auto output_tensor = _tensor_reg->getPortableTensor(output_index);
  auto input_tensor = _tensor_reg->getPortableTensor(input_index);
  auto axes_tensor = _tensor_reg->getPortableTensor(axes_index);

  if (node.param().reduce_type != ir::operation::Reduce::ReduceType::MEAN)
  {
    throw std::runtime_error("ReduceLayer: unsupported reduce type");
  }

  auto mean_layer = std::make_unique<ops::MeanLayer>();
  mean_layer->configure(input_tensor, axes_tensor, output_tensor, keep_dims);

  if (node.isRequiredForBackward())
  {
    auto back_prop_output_tensor = getBackPropOut(output_index);
    auto back_prop_input_tensor = getBackPropIn(node, input_index);
    mean_layer->configureBackward(back_prop_input_tensor, back_prop_output_tensor);
  }

  _return_fn = std::move(mean_layer);
}

void KernelGenerator::visit(const ir::train::operation::Reduce &node) {…}


// Generates the kernel for a Reshape node and stores it in _return_fn.
// The shape tensor is passed to the layer only when the node has two inputs; otherwise a null
// shape tensor is passed. The backward pass is configured only when the node is required for
// backward.
void KernelGenerator::visit(const ir::train::operation::Reshape &node)
{
  using ir::train::operation::Reshape;

  const auto &inputs = node.getInputs();
  const auto input_index = inputs.at(ir::operation::Reshape::Input::INPUT);
  const auto output_index = node.getOutputs().at(0);

  auto input_tensor = _tensor_reg->getPortableTensor(input_index);
  auto output_tensor = _tensor_reg->getPortableTensor(output_index);

  // optional 2nd input
  const bool has_shape_input = (inputs.size() == 2);
  IPortableTensor *shape_tensor =
    has_shape_input
      ? _tensor_reg->getPortableTensor(inputs.at(ir::operation::Reshape::Input::SHAPE))
      : nullptr;

  auto layer = std::make_unique<ops::ReshapeLayer>();
  layer->configure(input_tensor, shape_tensor, output_tensor);

  if (node.isRequiredForBackward())
  {
    auto output_back_prop_tensor = getBackPropOut(output_index);
    auto input_back_prop_tensor = getBackPropIn(node, input_index);
    layer->configureBackward(input_back_prop_tensor, output_back_prop_tensor);
  }

  _return_fn = std::move(layer);
}

void KernelGenerator::visit(const ir::train::operation::Reshape &node) {…}


// Generates the kernel for a Softmax node and stores it in _return_fn.
// The forward pass is configured with the node's beta parameter; the backward pass is
// configured only when the node is required for backward.
void KernelGenerator::visit(const ir::train::operation::Softmax &node)
{
  using ir::train::operation::Softmax;

  const auto input_index = node.getInputs().at(ir::operation::Softmax::Input::INPUT);
  const auto output_index = node.getOutputs().at(0);

  auto input_tensor = _tensor_reg->getPortableTensor(input_index);
  auto output_tensor = _tensor_reg->getPortableTensor(output_index);

  const auto beta = node.param().beta;

  auto layer = std::make_unique<ops::SoftMaxLayer>();
  layer->configure(input_tensor, beta, output_tensor);

  if (node.isRequiredForBackward())
  {
    auto output_back_prop_tensor = getBackPropOut(output_index);
    auto input_back_prop_tensor = getBackPropIn(node, input_index);
    layer->configureBackward(input_back_prop_tensor, output_back_prop_tensor);
  }

  _return_fn = std::move(layer);
}

void KernelGenerator::visit(const ir::train::operation::Softmax &node) {…}


// Returns the back-prop tensor that `node` should use for its input operand `operand_index`.
//
// If the tensor registry holds a disposable back-prop tensor for the (operation, operand) pair,
// that tensor is returned; otherwise the operand's regular back-prop tensor is returned.
//
// Throws std::runtime_error when `node` is not one of the operations recorded in _node_to_idx
// by the constructor.
IPortableTensor *KernelGenerator::getBackPropIn(const ir::IOperation &node,
                                                const ir::OperandIndex &operand_index)
{
  // Use find() rather than operator[]: operator[] would silently insert a default-constructed
  // index for an unknown node and continue with it.
  const auto found = _node_to_idx.find(&node);
  if (found == _node_to_idx.end())
    throw std::runtime_error("train KernelGenerator : Operation is not registered");

  const auto &op_index = found->second;

  const auto disposable_tensor =
    _tensor_reg->getDisposableBackPropTensor(DisposableTensorIndex{op_index, operand_index});
  if (disposable_tensor == nullptr)
    return _tensor_reg->getBackPropTensor(operand_index);

  const auto backwarding_operand_index = ir::train::TrainingOperandIndex{operand_index, false};
  [[maybe_unused]] const auto &training_usedefs =
    _tgraph.trainingUseDefs().at(backwarding_operand_index);

  // Sanity check: when a disposable tensor exists, more than one of the operand's training defs
  // is expected to belong to an operation that is required for backward.
  assert(std::count_if(training_usedefs.getTrainingDefs().begin(),
                       training_usedefs.getTrainingDefs().end(),
                       [&](const ir::train::TrainingOperationIndex &def_index) {
                         return _tgraph.operation(def_index.index()).isRequiredForBackward();
                       }) > 1);

  return disposable_tensor;
}


// Returns the back-prop tensor registered in the tensor registry for `output_index`.
IPortableTensor *KernelGenerator::getBackPropOut(const ir::OperandIndex &output_index)
{
  auto back_prop_tensor = _tensor_reg->getBackPropTensor(output_index);
  return back_prop_tensor;
}


} // namespace onert::backend::train

BackPropAccumulator.h

DynamicShapeInferer.h

GradientApplier.h

IConfig.h

LossCategoricalCrossentropyLayer.h

LossMeanSquaredErrorLayer.h

onert::backend::IPortableTensor
A tensor class that is portable for other backends.
Definition IPortableTensor.h:37

onert::backend::train::KernelGeneratorBase
Definition KernelGeneratorBase.h:31

onert::backend::train::KernelGeneratorBase::_return_fn
std::unique_ptr< exec::train::ITrainableFunction > _return_fn
Definition KernelGeneratorBase.h:49

onert::backend::train::KernelGeneratorBase::_tgraph
const ir::train::TrainableGraph & _tgraph
Definition KernelGeneratorBase.h:48

onert::backend::train::KernelGenerator::generate
std::unique_ptr< exec::train::TrainableFnSequence > generate(ir::OperationIndex op_ind) override
Definition KernelGenerator.cc:110

onert::backend::train::KernelGenerator::KernelGenerator
KernelGenerator(const ir::train::TrainableGraph &tgraph, const std::shared_ptr< TensorRegistry > &tensor_reg, const std::shared_ptr< ExternalContext > &external_context, const exec::train::optimizer::Optimizer *optimizer)
Definition KernelGenerator.cc:142

onert::backend::train::KernelGenerator::visit
void visit(const ir::train::operation::BinaryArithmetic &) override
Definition KernelGenerator.cc:156

onert::exec::train::optimizer::Optimizer
Base class for all optimizers.
Definition Optimizer.h:37

onert::ir::OperandIndexSequence::size
uint32_t size() const
Definition OperandIndexSequence.h:47

onert::ir::OperandIndexSequence::at
const OperandIndex & at(IOIndex set_index) const
Definition OperandIndexSequence.h:48

onert::ir::Operation::getOutputs
const OperandIndexSequence & getOutputs() const override
Definition Operation.h:53

onert::ir::Operation::getInputs
OperandIndexSequence & getInputs()
Definition Operation.h:51

onert::ir::operation::BinaryArithmetic::param
const Param & param() const
Definition BinaryArithmetic.h:59

onert::ir::operation::Conv2D::param
const Param & param() const
Definition Conv2D.h:56

onert::ir::operation::DepthwiseConv2D::param
const Param & param() const
Definition DepthwiseConv2D.h:57

onert::ir::operation::ElementwiseActivation::Type
Type
Definition ElementwiseActivation.h:34

onert::ir::operation::ElementwiseActivation::Type::RELU
@ RELU

onert::ir::operation::ElementwiseActivation::param
const Param & param() const
Definition ElementwiseActivation.h:60

onert::ir::operation::FullyConnected::param
const Param & param() const
Definition FullyConnected.h:53

onert::ir::operation::Pad::VALUE
@ VALUE
Definition Pad.h:32

onert::ir::operation::Pad::INPUT
@ INPUT
Definition Pad.h:30

onert::ir::operation::Pad::PAD
@ PAD
Definition Pad.h:31

onert::ir::operation::Pool2D::PoolType
PoolType
Definition Pool2D.h:38

onert::ir::operation::Pool2D::PoolType::MAX
@ MAX

onert::ir::operation::Pool2D::PoolType::AVG
@ AVG

onert::ir::operation::Pool2D::param
const Param & param() const
Definition Pool2D.h:64

onert::ir::operation::Pool2D::name
std::string name() const override
Definition Pool2D.cc:33

onert::ir::operation::Reduce::ReduceType::MEAN
@ MEAN

onert::ir::operation::Reduce::param
const Param & param() const
Definition Reduce.h:63

onert::ir::operation::Reshape::SHAPE
@ SHAPE
Definition Reshape.h:33

onert::ir::operation::Reshape::INPUT
@ INPUT
Definition Reshape.h:32

onert::ir::operation::Softmax::INPUT
@ INPUT
Definition Softmax.h:32

onert::ir::operation::Softmax::param
const Param & param() const
Definition Softmax.h:49

onert::ir::train::TrainableGraph
Definition TrainableGraph.h:32

onert::ir::train::TrainableGraph::operation
const ITrainableOperation & operation(OperationIndex index) const
Definition TrainableGraph.cc:171

onert::ir::train::TrainableGraph::operations
const Operations & operations() const override
Definition TrainableGraph.h:121

onert::ir::train::TrainableGraph::operands
const Operands & operands() const override
Definition TrainableGraph.h:119

onert::ir::train::TrainableGraph::trainingUseDefs
const UseDefChains & trainingUseDefs() const
Definition TrainableGraph.h:128

onert::ir::train::TrainableOperation::isRequiredForBackward
virtual bool isRequiredForBackward() const final
Definition TrainableOperation.h:39

onert::ir::train::TrainingIndex
Class that provides index of tensor for training.
Definition Index.h:34

onert::ir::train::operation::BinaryArithmetic
Definition BinaryArithmetic.h:27

onert::ir::train::operation::Conv2D
Definition Conv2D.h:27

onert::ir::train::operation::DepthwiseConv2D
Definition DepthwiseConv2D.h:27

onert::ir::train::operation::ElementwiseActivation
Definition ElementwiseActivation.h:27

onert::ir::train::operation::FullyConnected
Definition FullyConnected.h:27

onert::ir::train::operation::Loss
Definition Loss.h:30

onert::ir::train::operation::Loss::param
const LossInfo & param() const
Definition Loss.h:45

onert::ir::train::operation::Loss::y_pred_op_code
ir::OpCode y_pred_op_code() const
Definition Loss.h:46

onert::ir::train::operation::Pad
Definition Pad.h:27

onert::ir::train::operation::Pool2D
Definition Pool2D.h:27

onert::ir::train::operation::Reduce
Definition Reduce.h:27

onert::ir::train::operation::Reshape
Definition Reshape.h:27

onert::ir::train::operation::Softmax
Definition Softmax.h:27

onert::util::Index< uint32_t, OperationIndexTag >

onert::util::ObjectManager::iterate
void iterate(const std::function< void(const Index &, const Object &)> &fn) const
Iterate over the container with given function.
Definition ObjectManager.h:184

onert::util::ObjectManager::at
const Object & at(const Index &index) const
Get the object that is associated with the given index.
Definition ObjectManager.h:119

KernelGenerator.h

GenH5RandomInputs.input_index
input_index
Definition GenH5RandomInputs.py:60

locoex::FusedActFunc::UNDEFINED
@ UNDEFINED

onert::backend::acl_common::convertPoolType
arm_compute::PoolingType convertPoolType(ir::operation::Pool2D::PoolType pool_type_ir)
Definition Convert.cc:279

onert::backend::cpu::ops::ElementwiseActivationType::kReLU
@ kReLU

onert::backend::cpu::ops::ArithmeticType
ArithmeticType
Definition BinaryArithmeticLayer.h:29

onert::backend::cpu::ops::PoolType::kMax
@ kMax

onert::backend::cpu::ops::PoolType::kAvg
@ kAvg

onert::backend::train::ops::ElementwiseActivationType::kReLU
@ kReLU

onert::backend::train::ops::PoolType
PoolType
Definition PoolLayer.h:40

onert::backend::train::ops::PoolType::kMax
@ kMax

onert::backend::train::ops::PoolType::kAvg
@ kAvg

onert::backend::train::ops::ArithmeticType
ArithmeticType
Definition BinaryArithmeticLayer.h:30

onert::backend::train
Definition Backend.h:31

onert::backend::train::BackPropTensor
Tensor BackPropTensor
Definition Tensor.h:43

onert::ir::train::LossCode::MeanSquaredError
@ MeanSquaredError

onert::ir::train::LossCode::CategoricalCrossentropy
@ CategoricalCrossentropy

onert::ir::calculatePadding
const ExplicitPadding calculatePadding(const Padding &padding, const FeatureShape &ifm_shape, const FeatureShape &ofm_shape, const Stride &stride, uint32_t kw, uint32_t kh, uint32_t dwf=1, uint32_t dhf=1)
Definition Padding.cc:131

onert::ir::Remove
Remove
Definition OperandIndexSequence.h:29

onert::ir::Remove::UNDEFINED
@ UNDEFINED

onert::ir::OperationIndex
::onert::util::Index< uint32_t, OperationIndexTag > OperationIndex
Definition Index.h:30

onert::ir::OperandIndex
::onert::util::Index< uint32_t, OperandIndexTag > OperandIndex
Definition Index.h:33

optimizer
Definition __init__.py:1

Backend.h

logging.h

ker_tensor
CLTensor ker_tensor
Definition Convolution.cpp:293

bias_tensor
CLTensor bias_tensor
Definition Convolution.cpp:294

onert::ir::Dilation::height_factor
uint32_t height_factor
Definition InternalType.h:44

onert::ir::Dilation::width_factor
uint32_t width_factor
Definition InternalType.h:43

onert::ir::IOperation
Definition IOperation.h:32

onert::ir::operation::BinaryArithmetic::Param::arithmetic_type
ArithmeticType arithmetic_type
Definition BinaryArithmetic.h:45

onert::ir::operation::BinaryArithmetic::Param::activation
Activation activation
Definition BinaryArithmetic.h:46

onert::ir::operation::Conv2D::Param::padding
Padding padding
Definition Conv2D.h:42

onert::ir::operation::Conv2D::Param::dilation
Dilation dilation
Definition Conv2D.h:44

onert::ir::operation::Conv2D::Param::activation
Activation activation
Definition Conv2D.h:43

onert::ir::operation::Conv2D::Param::stride
Stride stride
Definition Conv2D.h:41

onert::ir::operation::DepthwiseConv2D::Param::padding
Padding padding
Definition DepthwiseConv2D.h:42

onert::ir::operation::DepthwiseConv2D::Param::stride
Stride stride
Definition DepthwiseConv2D.h:41

onert::ir::operation::DepthwiseConv2D::Param::dilation
Dilation dilation
Definition DepthwiseConv2D.h:45

onert::ir::operation::DepthwiseConv2D::Param::activation
Activation activation
Definition DepthwiseConv2D.h:44

onert::ir::operation::DepthwiseConv2D::Param::multiplier
uint32_t multiplier
Definition DepthwiseConv2D.h:43

onert::ir::operation::ElementwiseActivation::Param::op_type
Type op_type
Definition ElementwiseActivation.h:44

onert::ir::operation::ElementwiseActivation::Param::alpha
float alpha
Definition ElementwiseActivation.h:45

onert::ir::operation::ElementwiseActivation::Param::beta
float beta
Definition ElementwiseActivation.h:46

onert::ir::operation::FullyConnected::Param::activation
Activation activation
Definition FullyConnected.h:40

onert::ir::operation::FullyConnected::Param::weights_format
FullyConnectedWeightsFormat weights_format
Definition FullyConnected.h:41

onert::ir::operation::Pool2D::Param::padding
Padding padding
Definition Pool2D.h:50

onert::ir::operation::Pool2D::Param::kw
uint32_t kw
Definition Pool2D.h:48

onert::ir::operation::Pool2D::Param::stride
Stride stride
Definition Pool2D.h:49

onert::ir::operation::Pool2D::Param::kh
uint32_t kh
Definition Pool2D.h:47

onert::ir::operation::Pool2D::Param::activation
Activation activation
Definition Pool2D.h:51

onert::ir::operation::Pool2D::Param::op_type
PoolType op_type
Definition Pool2D.h:46

onert::ir::operation::Reduce::Param::reduce_type
ReduceType reduce_type
Definition Reduce.h:49

onert::ir::operation::Reduce::Param::keep_dims
bool keep_dims
Definition Reduce.h:50

onert::ir::operation::Softmax::Param::beta
float beta
Definition Softmax.h:37

onert::ir::train::LossInfo::loss_code
LossCode loss_code
Definition LossInfo.h:43

onert::ir::train::LossInfo::reduction_type
LossReductionType reduction_type
Definition LossInfo.h:44

onert::ir::train::LossInfo::loss_param
std::variant< std::monostate, CategoricalCrossentropyParam > loss_param
Definition LossInfo.h:45