ONE - On-device Neural Engine
FuseArithmeticOps.cpp
/*
 * Copyright (c) 2019 Samsung Electronics Co., Ltd. All Rights Reserved
 *
 * Licensed under the Apache License, Version 2.0 (the "License");
 * you may not use this file except in compliance with the License.
 * You may obtain a copy of the License at
 *
 *    http://www.apache.org/licenses/LICENSE-2.0
 *
 * Unless required by applicable law or agreed to in writing, software
 * distributed under the License is distributed on an "AS IS" BASIS,
 * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
 * See the License for the specific language governing permissions and
 * limitations under the License.
 */

// Pass declaration and shared optimization helpers (header paths assumed from the nnc layout)
#include "passes/optimizations/FuseArithmeticOps.h"
#include "passes/optimizations/OptimizationUtils.h"

#include "mir/ops/AddOp.h"
#include "mir/ops/ConstantOp.h"
#include "mir/ops/Conv2DOp.h"
#include "mir/ops/MulOp.h"
#include "mir/Graph.h"
#include "mir/Tensor.h"
#include "mir/Index.h"
#include "mir/TensorVariant.h"
#include "mir/ShapeRange.h"

#include <algorithm>
#include <unordered_set>
#include <utility>
#include <vector>

namespace nnc
{

namespace
{

using namespace mir;
using namespace std;
using namespace opt_util;

using OpType = Operation::Type;
using Edge = pair<Operation *, Operation *>;

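// Returns the second input of 'op' as a ConstantOp if it is one, otherwise nullptr.
// Only Add, Mul and Conv2D operations are expected here.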
ops::ConstantOp *getSecondInputAsConst(Operation *op)
{
  assert(op->getType() == OpType::add || op->getType() == OpType::mul ||
         op->getType() == OpType::conv2D);
  return dynamic_cast<ops::ConstantOp *>(op->getInput(1)->getNode());
}

// Finds successive operations of the given types, each with a ConstantOp as its second input
vector<Edge> findSuccessiveOpsWithConstWeights(Graph *g, OpType first_op_type,
                                               OpType second_op_type)
{
  vector<Edge> matches;
  unordered_set<Operation *> matched_nodes;
  for (auto *first_op : g->getNodes())
  {
    if (first_op->getType() == first_op_type && getSecondInputAsConst(first_op))
    {
      for (auto &out : first_op->getOutputs())
      {
        for (Operation::Use use : out.getUses())
        {
          Operation *second_op = use.getNode();
          if (second_op->getType() == second_op_type && getSecondInputAsConst(second_op))
          {
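            // Record each operation in at most one match per pass; overlapping chains
            // are picked up again on the next iteration of the pass loop.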
            if (matched_nodes.find(first_op) == matched_nodes.end() &&
                matched_nodes.find(second_op) == matched_nodes.end())
            {
              matched_nodes.emplace(first_op);
              matched_nodes.emplace(second_op);
              matches.emplace_back(first_op, second_op);
            }
          }
        }
      }
    }
  }
  return matches;
}

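// Element-wise merges two constants into a new ConstantOp. The second constant must be
// rank-1 and is broadcast along dimension 0 of the first one; 'merge_type' selects
// whether the values are multiplied or added.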
Operation *mergeConstantOps(Graph *g, const ops::ConstantOp *const1_op,
                            const ops::ConstantOp *const2_op, OpType merge_type)
{
  const auto &const1_val = const1_op->getValue();
  const auto &const2_val = const2_op->getValue();
  assert(const1_val.getShape().rank() >= const2_val.getShape().rank());
  assert(const2_val.getShape().rank() == 1);
  assert(const1_val.getShape().dim(0) == const2_val.getShape().dim(0));

  // Create and fill TensorVariant for new ConstantOp
  TensorVariant new_const_val(DataType::FLOAT32, const1_val.getShape());
  Tensor<float> const1_accessor(const1_val);
  Tensor<float> const2_accessor(const2_val);
  Tensor<float> new_const_accessor(new_const_val);
  ShapeRange const1_range(const1_val.getShape());
  for (auto &idx : const1_range)
  {
    float operand1 = const1_accessor.at(idx);
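    // The rank-1 constant is indexed only by the first coordinate of 'idx',
    // i.e. it is broadcast across all remaining dimensions.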
    float operand2 = const2_accessor.at(Index{idx.at(0)});
    switch (merge_type)
    {
      case OpType::mul:
        new_const_accessor.at(idx) = operand1 * operand2;
        break;
      case OpType::add:
        new_const_accessor.at(idx) = operand1 + operand2;
        break;
      default:
        assert(false && "only 'mul' and 'add' constant merge types are supported");
    }
  }

  return g->create<ops::ConstantOp>(new_const_val);
}


// TODO: support 'DepthwiseConv'->'Mul'
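// Fuses a chain of two operations that both take a constant second input into a single
// operation with a pre-computed constant. Handled patterns: Mul->Mul, Add->Add and
// Conv2D->Mul. Returns true if the graph was changed.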
bool fuseSuccessiveOps(Graph *g)
{
  // Find all successive ops
  vector<Edge> successive_ops;
  auto mul_mul_vec = findSuccessiveOpsWithConstWeights(g, OpType::mul, OpType::mul);
  successive_ops.insert(successive_ops.end(), mul_mul_vec.begin(), mul_mul_vec.end());
  auto add_add_vec = findSuccessiveOpsWithConstWeights(g, OpType::add, OpType::add);
  successive_ops.insert(successive_ops.end(), add_add_vec.begin(), add_add_vec.end());
  auto conv_mul_vec = findSuccessiveOpsWithConstWeights(g, OpType::conv2D, OpType::mul);
  successive_ops.insert(successive_ops.end(), conv_mul_vec.begin(), conv_mul_vec.end());

  for (auto &edge : successive_ops)
  {
    auto const1_op = getSecondInputAsConst(edge.first);
    auto const2_op = getSecondInputAsConst(edge.second);
    assert(const1_op && const2_op);

    // Create a new constant operation and copy the first successive operation
    auto new_const_op = mergeConstantOps(g, const1_op, const2_op, edge.second->getType());
    auto first_op_input = edge.first->getInput(0);
    auto new_op = g->copyOpWithInputs(edge.first, {first_op_input, new_const_op->getOutput(0)});

    // Replace the second successive operation with the new one and remove the old nodes
    g->replaceNode(edge.second, new_op);
    removeNodeIfUnused(g, edge.first);
    removeNodeIfUnused(g, const1_op);
    removeNodeIfUnused(g, const2_op);
  }

  // If there were no successive operations to fuse, the graph was not changed
  return !successive_ops.empty();
}

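// Rewrites an Add->Mul chain (both with constant second inputs) into Mul->Add with an
// updated additive constant, so that the Mul can later be fused into a preceding
// operation (e.g. Conv2D) by fuseSuccessiveOps. Returns true if the graph was changed.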
bool sinkAddThroughMul(Graph *g)
{
  auto add_mul_edges = findSuccessiveOpsWithConstWeights(g, OpType::add, OpType::mul);

  for (auto &edge : add_mul_edges)
  {
    auto old_add_op = edge.first;
    auto old_mul_op = edge.second;
    auto old_add_const_op = getSecondInputAsConst(old_add_op);
    auto old_mul_const_op = getSecondInputAsConst(old_mul_op);
    assert(old_add_const_op && old_mul_const_op);

    // Create new operations
    auto old_add_input = old_add_op->getInput(0);
    auto new_mul_op =
        g->copyOpWithInputs(old_mul_op, {old_add_input, old_mul_const_op->getOutput(0)});
    auto new_add_const_op = mergeConstantOps(g, old_add_const_op, old_mul_const_op, OpType::mul);
    auto new_add_op =
        g->copyOpWithInputs(old_add_op, {new_mul_op->getOutput(0), new_add_const_op->getOutput(0)});

    // Replace the old Mul with the new Add and remove the old nodes
    g->replaceNode(old_mul_op, new_add_op);
    removeNodeIfUnused(g, old_add_op);
    removeNodeIfUnused(g, old_add_const_op);
  }

  // If there were no Add->Mul edges, the graph was not changed
  return !add_mul_edges.empty();
}

} // unnamed namespace

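// Entry point of the pass: repeatedly fuses successive arithmetic operations and sinks
// Add through Mul until the graph stops changing.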
PassData FuseArithmeticOps::run(PassData data)
{
  auto g = static_cast<Graph *>(data);

  bool graph_changed = true;
  while (graph_changed)
  {
    graph_changed = false;
    graph_changed |= fuseSuccessiveOps(g);
    graph_changed |= sinkAddThroughMul(g);
  }

  return g;
}

} // namespace nnc