ONE/backend_2acl__neon_2ops_2_split_8cc_source.html

/*

 * Copyright (c) 2025 Samsung Electronics Co., Ltd. All Rights Reserved

 *

 * Licensed under the Apache License, Version 2.0 (the "License");

 * you may not use this file except in compliance with the License.

 * You may obtain a copy of the License at

 *

 *      http://www.apache.org/licenses/LICENSE-2.0

 *

 * Unless required by applicable law or agreed to in writing, software

 * distributed under the License is distributed on an "AS IS" BASIS,

 * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.

 * See the License for the specific language governing permissions and

 * limitations under the License.

 */


#include "../KernelGenerator.h"

#include "../Validator.h"


#include <AclKernelGen.h>


namespace onert::backend::acl_neon

{


// Validation hook for Split: the node itself is not inspected, the operation
// is unconditionally flagged as supported by setting _supported.
void Validator::visit(const ir::operation::Split &)
{
  _supported = true;
}


// Builds the NESplit kernel for a Split node and stores it in _return_fn.
//
// The split axis must be a constant operand; it is read as an int32 scalar,
// negative values are wrapped by the input rank, and the result is converted
// with acl_common::ToARMComputeAxis before being handed to NESplit.
//
// Throws std::runtime_error when
//  - the axis operand is not constant (not yet implemented), or
//  - the axis lies outside [-rank, rank) of the input tensor.
void KernelGenerator::visit(const ir::operation::Split &node)
{
  // TODO Support this op by SubTensor
  const auto ifm_index{node.getInputs().at(ir::operation::Split::Input::INPUT)};
  const auto axis_index{node.getInputs().at(ir::operation::Split::Input::AXIS)};

  assert(node.param().num_splits == static_cast<int>(node.getOutputs().size()));
  if (!_ctx.at(axis_index).isConstant())
  {
    throw std::runtime_error("Non-constant axis_index NYI for acl_neon backend");
  }

  // Keep the rank signed so that it can be compared with the signed axis below.
  const auto ifm_rank = static_cast<int32_t>(_ctx.at(ifm_index).shape().rank());

  // Normalize a negative axis (counted from the last dimension) and validate it.
  // ToARMComputeAxis takes unsigned arguments, so an out-of-range axis would be
  // implicitly converted to a huge unsigned value instead of being rejected.
  auto axis = _ctx.at(axis_index).asScalar<int32_t>();
  if (axis < 0)
    axis += ifm_rank;
  if (axis < 0 || axis >= ifm_rank)
  {
    throw std::runtime_error("Split: axis is out of range of the input rank for acl_neon backend");
  }
  const uint32_t acl_axis = acl_common::ToARMComputeAxis(ifm_rank, axis).value();

  auto ifm_tensor = _tensor_reg->getAclTensor(ifm_index);

  // Collect the ACL handle of every output operand, in the node's output order.
  std::vector<arm_compute::ITensor *> output_tensors;
  output_tensors.reserve(node.getOutputs().size());
  for (const auto &output : node.getOutputs())
  {
    const ir::OperandIndex ofm_index(output);
    output_tensors.emplace_back(_tensor_reg->getAclTensor(ofm_index)->handle());
  }

  auto fn =
    acl_common::generateLayer<arm_compute::NESplit>(ifm_tensor->handle(), output_tensors, acl_axis);

  _return_fn = acl_common::asAclFunction(std::move(fn));
}


} // namespace onert::backend::acl_neon

AclKernelGen.h

onert::backend::ValidatorBase::_supported
bool _supported
Definition ValidatorBase.h:50

onert::backend::acl_common::ARMComputeAxis::value
uint32_t value(void) const
Definition Swizzle.h:38

onert::backend::basic::KernelGeneratorBase::_return_fn
std::unique_ptr< exec::IFunction > _return_fn
Definition KernelGeneratorBase.h:60

onert::ir::operation::Split::INPUT
@ INPUT
Definition Split.h:29

onert::ir::operation::Split::AXIS
@ AXIS
Definition Split.h:28

onert::util::ObjectManager::at
const Object & at(const Index &index) const
Get the object that is associated with the given index.
Definition ObjectManager.h:119

gen_h5_explicit_inputs_all.output
output
Definition gen_h5_explicit_inputs_all.py:96

onert::backend::acl_common::ToARMComputeAxis
ARMComputeAxis ToARMComputeAxis(uint32_t rank, uint32_t axis)
Definition Swizzle.h:45

onert::backend::acl_common::asAclFunction
std::unique_ptr< AclFunction > asAclFunction(std::unique_ptr<::arm_compute::IFunction > &&layer)
Definition Convert.cc:246

onert::backend::acl_neon
Definition Backend.h:33