ONE - On-device Neural Engine
ComparisonCommon.h
/*
 * Copyright (c) 2024 Samsung Electronics Co., Ltd. All Rights Reserved
 *
 * Licensed under the Apache License, Version 2.0 (the "License");
 * you may not use this file except in compliance with the License.
 * You may obtain a copy of the License at
 *
 *    http://www.apache.org/licenses/LICENSE-2.0
 *
 * Unless required by applicable law or agreed to in writing, software
 * distributed under the License is distributed on an "AS IS" BASIS,
 * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
 * See the License for the specific language governing permissions and
 * limitations under the License.
 */

#ifndef ONERT_MICRO_EXECUTE_KERNELS_COMPARISONCOMMON_H
#define ONERT_MICRO_EXECUTE_KERNELS_COMPARISONCOMMON_H

#include "OMStatus.h"

#include "core/OMUtils.h"
#include "execute/OMUtils.h"
#include "core/OMKernelData.h"
#include "execute/OMRuntimeKernel.h"

#include "PALComparisons.h"

namespace onert_micro
{
namespace execute
{

namespace
{

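// Positions of the operands in the kernel's input/output tensor lists.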
constexpr uint32_t input1TensorIdx = 0;
constexpr uint32_t input2TensorIdx = 1;
constexpr uint32_t outputTensorIdx = 0;

} // namespace

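// Reads the two inputs and single output of a comparison kernel: casts the raw
// input buffers to T and the output buffer to bool, and fills in the runtime shapes.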
template <typename T>
void readDataKernel(OMRuntimeKernel *runtime_kernel, const T *&cast_input_data1,
                    const T *&cast_input_data2, bool *&cast_output_data,
                    core::OMRuntimeShape &input1_shape_ref, core::OMRuntimeShape &input2_shape_ref,
                    core::OMRuntimeShape &output_shape_ref)
{
  const circle::Tensor *input1 = nullptr;
  const circle::Tensor *input2 = nullptr;
  const circle::Tensor *output = nullptr;

  uint8_t *input_data1 = nullptr;
  uint8_t *input_data2 = nullptr;
  uint8_t *output_data = nullptr;

  input1 = runtime_kernel->inputs[input1TensorIdx];
  input2 = runtime_kernel->inputs[input2TensorIdx];
  output = runtime_kernel->outputs[outputTensorIdx];

  assert(input1 != nullptr);
  assert(input2 != nullptr);
  assert(output != nullptr);

  input_data1 = runtime_kernel->inputs_data[input1TensorIdx];
  input_data2 = runtime_kernel->inputs_data[input2TensorIdx];
  output_data = runtime_kernel->outputs_data[outputTensorIdx];

  assert(input_data1 != nullptr);
  assert(input_data2 != nullptr);
  assert(output_data != nullptr);

  cast_input_data1 = core::utils::castInputData<T>(input_data1);
  cast_input_data2 = core::utils::castInputData<T>(input_data2);
  cast_output_data = core::utils::castOutputData<bool>(output_data);

  // The constructed temporaries are already rvalues, so plain assignment
  // suffices (the original std::move was redundant).
  input1_shape_ref = core::OMRuntimeShape(input1);
  input2_shape_ref = core::OMRuntimeShape(input2);
  output_shape_ref = core::OMRuntimeShape(output);
}

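// Applies the element-wise predicate F to two tensors of type T, dispatching to
// the broadcasting path when the input shapes differ in flat size.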
template <typename T> void evalComparisonGeneric(OMRuntimeKernel *runtime_kernel, bool F(T, T))
{
  const T *cast_input_data1 = nullptr;
  const T *cast_input_data2 = nullptr;
  bool *cast_output_data = nullptr;

  core::OMRuntimeShape input1_shape;
  core::OMRuntimeShape input2_shape;
  core::OMRuntimeShape output_shape;

  readDataKernel(runtime_kernel, cast_input_data1, cast_input_data2, cast_output_data, input1_shape,
                 input2_shape, output_shape);

  core::ComparisonParams op_params;
  op_params.is_broadcast = input1_shape.flatSize() != input2_shape.flatSize();

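  // A flat-size mismatch means the inputs must be broadcast against each other;
  // matching sizes take the straight element-wise path.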
  if (op_params.is_broadcast)
  {
    onert_micro::execute::pal::BroadcastComparison4DSlowNoScaling<T>(
      op_params, input1_shape, cast_input_data1, input2_shape, cast_input_data2, output_shape,
      cast_output_data, F);
  }
  else
  {
    const int64_t flat_size = input1_shape.flatSize();
    onert_micro::execute::pal::ComparisonNoScaling<T>(flat_size, cast_input_data1, cast_input_data2,
                                                      cast_output_data, F);
  }
}

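// Quantized variant: both inputs are rescaled into a common fixed-point domain
// (AccType, typically int32_t) before the predicate F is applied.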
template <typename T, typename AccType>
void evalQuantizedComparisonGeneric(OMRuntimeKernel *runtime_kernel, bool F(AccType, AccType))
{
  const circle::Tensor *input1 = nullptr;
  const circle::Tensor *input2 = nullptr;
  const circle::Tensor *output = nullptr;

  input1 = runtime_kernel->inputs[input1TensorIdx];
  input2 = runtime_kernel->inputs[input2TensorIdx];
  output = runtime_kernel->outputs[outputTensorIdx];

  assert(input1 != nullptr);
  assert(input2 != nullptr);
  assert(output != nullptr);

  const T *cast_input_data1 = nullptr;
  const T *cast_input_data2 = nullptr;
  bool *cast_output_data = nullptr;

  core::OMRuntimeShape input1_shape;
  core::OMRuntimeShape input2_shape;
  core::OMRuntimeShape output_shape;

  readDataKernel(runtime_kernel, cast_input_data1, cast_input_data2, cast_output_data, input1_shape,
                 input2_shape, output_shape);

  // Both inputs must carry per-tensor quantization: a single scale/zero-point pair each.
  assert(input1->quantization() != nullptr);
  assert(input1->quantization()->scale() != nullptr);
  assert(input1->quantization()->scale()->size() == 1);
  assert(input1->quantization()->zero_point() != nullptr);
  assert(input1->quantization()->zero_point()->size() == 1);
  assert(input2->quantization() != nullptr);
  assert(input2->quantization()->scale() != nullptr);
  assert(input2->quantization()->scale()->size() == 1);
  assert(input2->quantization()->zero_point() != nullptr);
  assert(input2->quantization()->zero_point()->size() == 1);

  auto input1_scale = *input1->quantization()->scale()->begin();
  auto input2_scale = *input2->quantization()->scale()->begin();

  auto input1_zero_point = *input1->quantization()->zero_point()->begin();
  auto input2_zero_point = *input2->quantization()->zero_point()->begin();

  int32_t x_multiplier;
  int x_shift;

  int32_t y_multiplier;
  int y_shift;

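  // Convert each input's float scale into an integer multiplier plus a shift so
  // the rescaling below can run in pure fixed-point arithmetic.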
  onert_micro::execute::quantizeMultiplierSmallerThanOneExp(input1_scale, &x_multiplier, &x_shift);
  onert_micro::execute::quantizeMultiplierSmallerThanOneExp(input2_scale, &y_multiplier, &y_shift);

  core::ComparisonParams op_params;
  op_params.left_shift = 8;
  op_params.input1_offset = -input1_zero_point; // Note the '-'
  op_params.input1_shift = x_shift;
  op_params.input1_multiplier = x_multiplier;
  op_params.input2_offset = -input2_zero_point; // Note the '-'
  op_params.input2_shift = y_shift;
  op_params.input2_multiplier = y_multiplier;
  op_params.is_broadcast = input1_shape.flatSize() != input2_shape.flatSize();

  if (op_params.is_broadcast)
  {
    onert_micro::execute::pal::BroadcastComparison4DSlowWithScaling<T>(
      op_params, input1_shape, cast_input_data1, input2_shape, cast_input_data2, output_shape,
      cast_output_data, F);
  }
  else
  {
    const int64_t flat_size = input1_shape.flatSize();
    onert_micro::execute::pal::ComparisonWithScaling<T>(op_params, flat_size, cast_input_data1,
                                                        cast_input_data2, cast_output_data, F);
  }
}

} // namespace execute
} // namespace onert_micro

#endif // ONERT_MICRO_EXECUTE_KERNELS_COMPARISONCOMMON_H
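
For context, a concrete comparison kernel wires these helpers up by switching on the element type of its first input. The following is a minimal sketch, not the repository's kernel source: the function name executeEqualSketch is hypothetical, the include path is inferred from the header guard, and the pal::EqualFn-style predicate is assumed to be provided by PALComparisons.h as in comparable runtimes.

// Hypothetical dispatch sketch for an Equal kernel; names marked above are
// assumptions, not the repository's exact code.
#include "execute/kernels/ComparisonCommon.h"

#include <cassert>

namespace onert_micro
{
namespace execute
{

OMStatus executeEqualSketch(OMRuntimeKernel &runtime_kernel)
{
  const circle::Tensor *input1 = runtime_kernel.inputs[input1TensorIdx];
  assert(input1 != nullptr);

  switch (input1->type())
  {
    case circle::TensorType_FLOAT32:
      evalComparisonGeneric<float>(&runtime_kernel, pal::EqualFn<float>);
      break;
    case circle::TensorType_INT64:
      evalComparisonGeneric<int64_t>(&runtime_kernel, pal::EqualFn<int64_t>);
      break;
    case circle::TensorType_UINT8:
      // Quantized inputs are compared in the widened int32_t domain after rescaling.
      evalQuantizedComparisonGeneric<uint8_t, int32_t>(&runtime_kernel, pal::EqualFn<int32_t>);
      break;
    default:
      return UnsupportedType;
  }
  return Ok;
}

} // namespace execute
} // namespace onert_micro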