ONE - On-device Neural Engine
Loading...
Searching...
No Matches
BroadcastTo.h
Go to the documentation of this file.
/*
 * Copyright (c) 2020 Samsung Electronics Co., Ltd. All Rights Reserved
 * Copyright 2018 The TensorFlow Authors. All Rights Reserved.
 *
 * Licensed under the Apache License, Version 2.0 (the "License");
 * you may not use this file except in compliance with the License.
 * You may obtain a copy of the License at
 *
 *      http://www.apache.org/licenses/LICENSE-2.0
 *
 * Unless required by applicable law or agreed to in writing, software
 * distributed under the License is distributed on an "AS IS" BASIS,
 * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
 * See the License for the specific language governing permissions and
 * limitations under the License.
 */
17
18#ifndef __NNFW_CKER_BROADCAST_TO_H__
19#define __NNFW_CKER_BROADCAST_TO_H__
20
21#include "cker/Types.h"
22#include "cker/Shape.h"
23#include "cker/Utils.h"
24
26
29
30#include <vector>
31
32#define UNUSED(x) (void)(x)
33
34namespace nnfw
35{
36namespace cker
37{
38namespace functor
39{
40static const int32_t kint32max = ((int32_t)0x7FFFFFFF);
41
42template <typename Device, typename T> struct FillFunctor
43{
44 // Computes on device "d": out = out.constant(in(0)),
45 void operator()(const Device &d, typename TTypes<T>::Flat out,
46 typename TTypes<T>::ConstScalar in);
47};
48
49template <typename T> struct FillFunctor<Eigen::ThreadPoolDevice, T>
50{
51 void operator()(const Eigen::ThreadPoolDevice &d, typename TTypes<T>::Flat out,
52 typename TTypes<T>::ConstScalar in)
53 {
54 out.device(d) = out.constant(in());
55 }
56};
57
58template <typename Device, typename T> struct BroadcastTo
59{
60 template <int NDIMS>
61 void DoBCast32Bit(const Device &device, typename TTypes<T, NDIMS>::Tensor out,
63 const typename Eigen::array<int, NDIMS> &bcast) const
64 {
65 To32Bit(out).device(device) = To32Bit(in).broadcast(bcast);
66 }
67
68 template <int NDIMS>
69 void DoBCast(const Device &device, typename TTypes<T, NDIMS>::Tensor out,
71 const typename Eigen::array<Eigen::DenseIndex, NDIMS> &bcast) const
72 {
73 out.device(device) = in.broadcast(bcast);
74 }
75
76 template <int NDIMS>
77 void ReshapeAndBCast(const Device &device, Tensor &output_tensor, const Tensor &input_tensor,
78 const BCast &bcast) const
79 {
80 const bool can_use_32bit = std::is_same<Eigen::GpuDevice, Device>::value &&
81 output_tensor.shape.FlatSize() < kint32max &&
82 input_tensor.shape.FlatSize() < kint32max;
83 if (can_use_32bit)
84 {
85 DoBCast32Bit<NDIMS>(device, output_tensor.template shaped<T, NDIMS>(bcast.result_shape()),
86 input_tensor.template shaped<T, NDIMS>(bcast.x_reshape()),
87 BCast::ToIndexArrayType<int, NDIMS>(bcast.x_bcast()));
88 }
89 else
90 {
91 DoBCast<NDIMS>(device, output_tensor.template shaped<T, NDIMS>(bcast.result_shape()),
92 input_tensor.template shaped<T, NDIMS>(bcast.x_reshape()),
93 BCast::ToIndexArrayType<Eigen::DenseIndex, NDIMS>(bcast.x_bcast()));
94 }
95 }
96
97 // PRECONDITION: rank(input_shape) > 0 &&
98 // rank(input_shape) <= rank(output_shape) &&
99 // output_shape.num_elements() > 0.
100 void operator()(const Device &device, Tensor &output_tensor, const Shape &output_shape,
101 const Tensor &input_tensor, const Shape &input_shape, const BCast &bcast) const
102 {
103 const int ndims = bcast.y_reshape().size();
104 switch (ndims)
105 {
106 case 1:
107 ReshapeAndBCast<1>(device, output_tensor, input_tensor, bcast);
108 break;
109 case 2:
110 ReshapeAndBCast<2>(device, output_tensor, input_tensor, bcast);
111 break;
112 case 3:
113 ReshapeAndBCast<3>(device, output_tensor, input_tensor, bcast);
114 break;
115 case 4:
116 ReshapeAndBCast<4>(device, output_tensor, input_tensor, bcast);
117 break;
118 case 5:
119 ReshapeAndBCast<5>(device, output_tensor, input_tensor, bcast);
120 break;
121 default:
122 // NOTE : UNUSED leaves for maintenance purposes.
124 UNUSED(input_shape);
125 break;
126 }
127 }
128};
129} // namespace functor
130
131template <typename T>
132inline void BroadcastTo(const Shape &input_shape, T *input_data, const Shape &output_shape,
133 T *output_data)
134{
135 const int input_flatsize = input_shape.FlatSize();
136
137 if (input_shape == output_shape)
138 {
139 memcpy(output_data, input_data, input_flatsize * sizeof(T));
140 return;
141 }
142
143 // Input shape's rank must be no greater than rank of output shape.
144 assert(input_shape.DimensionsCount() <= output_shape.DimensionsCount());
145
146 // It shouldn't be 0.
147 assert(output_shape.DimensionsCount());
148
149 Tensor output_tensor;
150 Tensor input_tensor;
151
152 input_tensor.shape.ReplaceWith(input_shape.DimensionsCount(), input_shape.DimsData());
153 input_tensor.buffer = input_data;
154
155 output_tensor.shape.ReplaceWith(output_shape.DimensionsCount(), output_shape.DimsData());
156 output_tensor.buffer = output_data;
157
158 const Eigen::ThreadPoolDevice &device = *eigen_support::GetThreadPoolDevice();
159
160 // Handle broadcast from Scalar.
161 if (input_flatsize == 0)
162 {
163 functor::FillFunctor<Eigen::ThreadPoolDevice, T>()(device, output_tensor.flat<T>(),
164 input_tensor.scalar<T>());
165 }
166
168 /*fewer_dims_optimization=*/true);
169
170 // Predict TRUE.
171 assert(bcast.IsValid());
172 // should be same.
173 assert(BCast::ToShape(bcast.output_shape()) == output_shape);
174
176 input_tensor, input_shape, bcast);
177}
178
179} // namespace cker
180} // namespace nnfw
181
182#endif // __NNFW_CKER_BROADCAST_TO_H__
static Vec FromShape(const Shape &shape)
Definition BCast.h:444
static Shape ToShape(const BCastList::Vec &vec)
Definition BCast.h:455
const Vec & result_shape() const
Definition BCast.h:409
const Vec & x_reshape() const
Definition BCast.h:405
const Vec & y_reshape() const
Definition BCast.h:407
const Vec & output_shape() const
Definition BCast.h:410
const Vec & x_bcast() const
Definition BCast.h:406
bool IsValid() const
Definition BCast.h:96
int32_t DimensionsCount() const
Definition Shape.h:91
void ReplaceWith(int dimensions_count, const int32_t *dims_data)
Definition Shape.h:130
int FlatSize() const
Definition Shape.h:181
int32_t * DimsData()
Definition Shape.h:112
#define UNUSED(x)
const luci_interpreter::RuntimeShape output_shape
const Eigen::ThreadPoolDevice * GetThreadPoolDevice()
void BroadcastTo(const Shape &input_shape, T *input_data, const Shape &output_shape, T *output_data)
TTypes< typenameTensorType::Scalar, TensorType::NumIndices >::Tensor32Bit To32Bit(TensorType in)
Definition Tensor.h:178
Definition topk_v2.h:30
Eigen::TensorMap< Eigen::TensorFixedSize< const T, Eigen::Sizes<>, Eigen::RowMajor, IndexType >, Eigen::Aligned > ConstScalar
Definition Tensor.h:51
Eigen::TensorMap< Eigen::Tensor< const T, NDIMS, Eigen::RowMajor, IndexType >, Eigen::Aligned > ConstTensor
Definition Tensor.h:35
Eigen::TensorMap< Eigen::Tensor< T, 1, Eigen::RowMajor, IndexType >, Eigen::Aligned > Flat
Definition Tensor.h:61
Eigen::TensorMap< Eigen::Tensor< T, NDIMS, Eigen::RowMajor, IndexType >, Eigen::Aligned > Tensor
Definition Tensor.h:32
TTypes< T >::ConstScalar scalar() const
Definition Tensor.h:156
void DoBCast32Bit(const Device &device, typename TTypes< T, NDIMS >::Tensor out, typename TTypes< T, NDIMS >::ConstTensor in, const typename Eigen::array< int, NDIMS > &bcast) const
Definition BroadcastTo.h:61
void operator()(const Device &device, Tensor &output_tensor, const Shape &output_shape, const Tensor &input_tensor, const Shape &input_shape, const BCast &bcast) const
void ReshapeAndBCast(const Device &device, Tensor &output_tensor, const Tensor &input_tensor, const BCast &bcast) const
Definition BroadcastTo.h:77
void DoBCast(const Device &device, typename TTypes< T, NDIMS >::Tensor out, typename TTypes< T, NDIMS >::ConstTensor in, const typename Eigen::array< Eigen::DenseIndex, NDIMS > &bcast) const
Definition BroadcastTo.h:69
void operator()(const Eigen::ThreadPoolDevice &d, typename TTypes< T >::Flat out, typename TTypes< T >::ConstScalar in)
Definition BroadcastTo.h:51
void operator()(const Device &d, typename TTypes< T >::Flat out, typename TTypes< T >::ConstScalar in)