ONE/compute_2cker_2include_2cker_2operation_2optimized_2_batch_mat_mul_8h_source.html

/*

 * Copyright (c) 2024 Samsung Electronics Co., Ltd. All Rights Reserved

 *

 * Licensed under the Apache License, Version 2.0 (the "License");

 * you may not use this file except in compliance with the License.

 * You may obtain a copy of the License at

 *

 *      http://www.apache.org/licenses/LICENSE-2.0

 *

 * Unless required by applicable law or agreed to in writing, software

 * distributed under the License is distributed on an "AS IS" BASIS,

 * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.

 * See the License for the specific language governing permissions and

 * limitations under the License.

 */


#ifndef __NNFW_CKER_OPTIMIZED_BATCH_MATMUL_H__

#define __NNFW_CKER_OPTIMIZED_BATCH_MATMUL_H__


#include "cker/Shape.h"

#include "cker/operation/Helper/BatchMatMulParams.h"

#include "cker/operation/optimized/Gemm.h"


namespace nnfw

{

namespace cker

{


namespace optimized

{

#if defined(CKER_X86_PLATFORM)


/**
 * @brief Float batched matrix multiplication built on optimized::Gemm
 *
 * Walks the three batch dimensions described by params and issues one optimized::Gemm call per
 * batch element, multiplying an (lhs_rows x lhs_cols) matrix by an (rhs_rows x rhs_cols) matrix
 * into an (lhs_rows x rhs_cols) result.
 *
 * @param[in]  params      Matrix sizes, batch dimensions and the per-batch-dimension element
 *                         offsets (lhs_ext0..2, rhs_ext0..2) applied to the input pointers
 * @param[in]  lhs_data    Base pointer of the left-hand side data
 * @param[in]  rhs_data    Base pointer of the right-hand side data
 * @param[out] output_data Base pointer of the output; the result of batch element (b0, b1, b2)
 *                         is written at offset
 *                         ((b0 * batch_dim1 + b1) * batch_dim2 + b2) * lhs_rows * rhs_cols
 */
inline void BatchMatMul(const BatchMatMulParams &params, const float *lhs_data,
                        const float *rhs_data, float *output_data)
{
  MatrixParams<float> lhs_params;
  lhs_params.order = Order::kRowMajor; // ignored by GemmImplUsingEigen
  lhs_params.rows = params.lhs_rows;
  lhs_params.cols = params.lhs_cols;

  // NOTE(review): this function used to re-assign lhs_params.order while setting up rhs_params
  // and dst_params (copy-paste slip), so the order of those two has always been whatever
  // MatrixParams default-initializes it to. The dead stores are removed here without changing
  // that behavior; confirm the storage order Gemm expects before setting these explicitly.
  MatrixParams<float> rhs_params;
  rhs_params.rows = params.rhs_rows;
  rhs_params.cols = params.rhs_cols;

  MatrixParams<float> dst_params;
  dst_params.rows = params.lhs_rows;
  dst_params.cols = params.rhs_cols;

  // Number of floats in one output matrix; invariant across all batch elements.
  const int out_matrix_size = params.lhs_rows * params.rhs_cols;

  for (int b0 = 0; b0 < params.batch_dim0; ++b0)
  {
    for (int b1 = 0; b1 < params.batch_dim1; ++b1)
    {
      for (int b2 = 0; b2 < params.batch_dim2; ++b2)
      {
        // Inputs are addressed through the per-dimension offsets supplied by the caller.
        const float *lhs_ptr =
          lhs_data + b0 * params.lhs_ext0 + b1 * params.lhs_ext1 + b2 * params.lhs_ext2;
        const float *rhs_ptr =
          rhs_data + b0 * params.rhs_ext0 + b1 * params.rhs_ext1 + b2 * params.rhs_ext2;

        // The output is densely packed: flatten (b0, b1, b2) into a single batch index.
        const int batch_index =
          (b0 * params.batch_dim1 * params.batch_dim2) + b1 * params.batch_dim2 + b2;
        float *out_ptr = output_data + batch_index * out_matrix_size;

        optimized::Gemm(lhs_params, lhs_ptr, rhs_params, rhs_ptr, dst_params, out_ptr,
                        GemmParams<float, float>{});
      }
    }
  }
}

#endif

} // namespace optimized


} // namespace cker

} // namespace nnfw


#endif // __NNFW_CKER_OPTIMIZED_BATCH_MATMUL_H__

BatchMatMulParams.h

nnfw::cker::BatchMatMul
Definition BatchMatMul.h:37

Shape.h

Gemm.h

nnfw::cker::Order::kRowMajor
@ kRowMajor

nnfw
Definition topk_v2.h:30

nnfw::cker::BatchMatMulParams
Definition BatchMatMulParams.h:27

nnfw::cker::BatchMatMulParams::lhs_rows
int lhs_rows
Definition BatchMatMulParams.h:61

nnfw::cker::BatchMatMulParams::rhs_rows
int rhs_rows
Definition BatchMatMulParams.h:63

nnfw::cker::BatchMatMulParams::rhs_ext2
int rhs_ext2
Definition BatchMatMulParams.h:60

nnfw::cker::BatchMatMulParams::rhs_ext1
int rhs_ext1
Definition BatchMatMulParams.h:59

nnfw::cker::BatchMatMulParams::batch_dim0
int batch_dim0
Definition BatchMatMulParams.h:52

nnfw::cker::BatchMatMulParams::batch_dim2
int batch_dim2
Definition BatchMatMulParams.h:54

nnfw::cker::BatchMatMulParams::rhs_cols
int rhs_cols
Definition BatchMatMulParams.h:64

nnfw::cker::BatchMatMulParams::lhs_ext1
int lhs_ext1
Definition BatchMatMulParams.h:56

nnfw::cker::BatchMatMulParams::lhs_cols
int lhs_cols
Definition BatchMatMulParams.h:62

nnfw::cker::BatchMatMulParams::lhs_ext2
int lhs_ext2
Definition BatchMatMulParams.h:57

nnfw::cker::BatchMatMulParams::rhs_ext0
int rhs_ext0
Definition BatchMatMulParams.h:58

nnfw::cker::BatchMatMulParams::batch_dim1
int batch_dim1
Definition BatchMatMulParams.h:53

nnfw::cker::BatchMatMulParams::lhs_ext0
int lhs_ext0
Definition BatchMatMulParams.h:55

nnfw::cker::GemmParams
Definition Types.h:509

nnfw::cker::MatrixParams
Definition Types.h:439

nnfw::cker::MatrixParams::cols
int cols
Definition Types.h:446

nnfw::cker::MatrixParams::rows
int rows
Definition Types.h:444

nnfw::cker::MatrixParams::order
Order order
Definition Types.h:442