/* Copyright (c) 2018 PaddlePaddle Authors. All Rights Reserved.

Licensed under the Apache License, Version 2.0 (the "License");
you may not use this file except in compliance with the License.
You may obtain a copy of the License at

    http://www.apache.org/licenses/LICENSE-2.0

Unless required by applicable law or agreed to in writing, software
distributed under the License is distributed on an "AS IS" BASIS,
WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
See the License for the specific language governing permissions and
limitations under the License. */

#ifdef FUSION_CONVADDRELU_OP

#pragma once

#include <string>
#include <vector>
#include "framework/operator.h"
#include "framework/program/program-optimize/fusion_op_register.h"
#include "operators/kernel/conv_add_relu_kernel.h"
#include "operators/op_param.h"

namespace paddle_mobile {
namespace operators {

class FusionConvAddReluOpMatcher : public framework::FusionOpMatcher {
L
liuruilong 已提交
30
 public:
L
liuruilong 已提交
31
  FusionConvAddReluOpMatcher() {
L
liuruilong 已提交
32 33 34
    node_ = framework::Node(G_OP_TYPE_CONV);
    node_ > std::make_shared<framework::Node>(G_OP_TYPE_ELEMENTWISE_ADD) >
        std::make_shared<framework::Node>(G_OP_TYPE_RELU);
L
liuruilong 已提交
35 36
  }

L
liuruilong 已提交
37 38 39
  void FolderNodes(
      framework::Node *node,
      std::vector<std::shared_ptr<framework::Node>> *removed_nodes) {
L
liuruilong 已提交
40
    node->Folder(node_.Depth(), Type(),
E
eclipsess 已提交
41
                 {{G_OP_TYPE_ELEMENTWISE_ADD, {{"Y", "Y"}}}}, removed_nodes);
L
liuruilong 已提交
42
  }
L
liuruilong 已提交
43
  std::string Type() { return G_OP_TYPE_FUSION_CONV_ADD_RELU; }
L
liuruilong 已提交
44 45
};

template <typename DeviceType, typename T>
L
liuruilong 已提交
47
class FusionConvAddReluOp : public framework::OperatorWithKernel<
L
liuruilong 已提交
48
                                DeviceType, FusionConvAddReluParam,
L
liuruilong 已提交
49
                                operators::ConvAddReluKernel<DeviceType, T>> {
L
liuruilong 已提交
50
 public:
L
liuruilong 已提交
51
  FusionConvAddReluOp(const string &type, const VariableNameMap &inputs,
L
liuruilong 已提交
52 53 54 55
                      const VariableNameMap &outputs,
                      const framework::AttributeMap &attrs,
                      std::shared_ptr<framework::Scope> scope)
      : framework::OperatorWithKernel<
L
liuruilong 已提交
56
            DeviceType, FusionConvAddReluParam,
L
liuruilong 已提交
57 58
            operators::ConvAddReluKernel<DeviceType, T>>(type, inputs, outputs,
                                                         attrs, scope) {}
L
liuruilong 已提交
59 60

  using framework::OperatorWithKernel<
L
liuruilong 已提交
61
      DeviceType, FusionConvAddReluParam,
L
liuruilong 已提交
62
      operators::ConvAddReluKernel<DeviceType, T>>::OperatorWithKernel;
L
liuruilong 已提交
63
  void InferShape() const override;
L
liuruilong 已提交
64

L
liuruilong 已提交
65
 protected:
L
liuruilong 已提交
66 67
};

// Fusion-matcher registration, per backend. The CPU and FPGA branches are
// identical; the CONV_ADD_RELU_REGISTER guard ensures the registrar is defined
// at most once per translation unit even when both backends are enabled (or
// when the macro has already been defined before this point).
#ifdef PADDLE_MOBILE_CPU

#ifndef CONV_ADD_RELU_REGISTER
#define CONV_ADD_RELU_REGISTER
// The matcher is allocated with `new` and handed to the registrar;
// presumably framework::FusionOpRegistrar takes ownership -- TODO confirm.
static framework::FusionOpRegistrar fusion_conv_add_relu_registrar(
    new FusionConvAddReluOpMatcher());
#endif  // CONV_ADD_RELU_REGISTER

#endif  // PADDLE_MOBILE_CPU
#ifdef PADDLE_MOBILE_MALI_GPU
// Intentionally empty: nothing is registered for the Mali GPU backend here.
#endif  // PADDLE_MOBILE_MALI_GPU
#ifdef PADDLE_MOBILE_FPGA

#ifndef CONV_ADD_RELU_REGISTER
#define CONV_ADD_RELU_REGISTER
static framework::FusionOpRegistrar fusion_conv_add_relu_registrar(
    new FusionConvAddReluOpMatcher());
#endif  // CONV_ADD_RELU_REGISTER

#endif  // PADDLE_MOBILE_FPGA

}  // namespace operators
}  // namespace paddle_mobile

// Per-backend USE_OP_* invocations for fusion_conv_add_relu. The macros are
// defined elsewhere; presumably they reference the op's registration so it is
// linked into the final binary -- TODO confirm against the macro definitions.
#ifdef PADDLE_MOBILE_CPU
USE_OP_CPU(fusion_conv_add_relu);
#endif  // PADDLE_MOBILE_CPU
#ifdef PADDLE_MOBILE_MALI_GPU
// Intentionally empty: no Mali GPU variant is referenced here.
#endif  // PADDLE_MOBILE_MALI_GPU
#ifdef PADDLE_MOBILE_FPGA
USE_OP_FPGA(fusion_conv_add_relu);
#endif  // PADDLE_MOBILE_FPGA

#endif