batch_norm.cpp 2.6 KB
Newer Older
1 2 3 4
/**
 * \file imperative/src/impl/ops/batch_norm.cpp
 * MegEngine is Licensed under the Apache License, Version 2.0 (the "License")
 *
 * Copyright (c) 2014-2021 Megvii Inc. All rights reserved.
 *
 * Unless required by applicable law or agreed to in writing,
 * software distributed under the License is distributed on an
 * "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
 */

12 13
#include "megbrain/imperative/ops/autogen.h"
#include "megbrain/opr/dnn/batch_norm.h"
14 15 16 17 18 19 20 21 22
#include "../op_trait.h"

namespace mgb {
namespace imperative {

namespace {

/*!
 * \brief Create the imperative BatchNorm op definition from a graph operator.
 *
 * \param node_ graph operator; it is cast to opr::BatchNorm via
 *      cast_final_safe
 * \return op definition built by BatchNorm::make from the operator's param
 */
std::shared_ptr<OpDef> make_from_op_node(cg::OperatorNodeBase* node_) {
    auto&& bn_node = node_->cast_final_safe<opr::BatchNorm>();
    return BatchNorm::make(bn_node.param());
}

/*!
 * \brief Build the graph operator for a BatchNorm op definition.
 *
 * \param def op definition; it is cast to BatchNorm via cast_final_safe
 * \param inputs input vars; exactly 3 or 5 are accepted and are forwarded,
 *      in order, to opr::BatchNorm::make.
 *      NOTE(review): the 2 extra inputs are presumably the running
 *      mean/variance -- confirm against opr::BatchNorm::make
 * \return owner operator of the first output var returned by
 *      opr::BatchNorm::make
 */
cg::OperatorNodeBase* apply_on_var_node(
        const OpDef& def,
        const VarNodeArray& inputs) {
    auto&& bn_opr = def.cast_final_safe<BatchNorm>();
    size_t nr_inp = inputs.size();
    // %zu is the portable conversion for size_t; %lu mismatches the argument
    // type on targets where size_t is not unsigned long (e.g. 64-bit Windows)
    mgb_assert(nr_inp == 3 || nr_inp == 5,
              "BatchNorm expects 3 or 5 inputs; got %zu actually", nr_inp);
    if (nr_inp == 3) {
        return opr::BatchNorm::make(
            inputs[0], inputs[1], inputs[2], bn_opr.param())[0]
            .node()->owner_opr();
    }
    return opr::BatchNorm::make(
        inputs[0], inputs[1], inputs[2], inputs[3], inputs[4], bn_opr.param())[0]
        .node()->owner_opr();
}

44
/*!
 * \brief Infer the output descriptors of BatchNorm from its input descriptors.
 *
 * Produces 5 outputs when there are 5 inputs and the op is in TRAINING
 * forward mode, and 3 outputs otherwise. All outputs except the last copy
 * the layout and comp node of inputs[1]; the last output copies those of
 * inputs[0].
 *
 * \param def op definition; it is cast to BatchNorm via cast_final_safe
 * \param inputs input descriptors; exactly 3 or 5 are accepted
 * \return the output descriptors, plus a flag that is true iff the layout of
 *      the last output has a non-zero ndim.
 *      NOTE(review): presumably ndim == 0 means the shape is not yet known --
 *      confirm against the op_trait contract
 */
std::tuple<SmallVector<LogicalTensorDesc>, bool> infer_output_attrs_fallible(
        const OpDef& def,
        const SmallVector<LogicalTensorDesc>& inputs) {
    auto&& op_def = def.cast_final_safe<BatchNorm>();
    size_t nr_inp = inputs.size();
    // %zu is the portable conversion for size_t; %lu mismatches the argument
    // type on targets where size_t is not unsigned long (e.g. 64-bit Windows)
    mgb_assert(nr_inp == 3 || nr_inp == 5,
              "BatchNorm expects 3 or 5 inputs; got %zu actually", nr_inp);
    // need running mean/variance
    bool need_stat = (nr_inp == 5) && op_def.fwd_mode == BatchNorm::FwdMode::TRAINING;
    size_t nr_out = need_stat ? 5 : 3;
    SmallVector<LogicalTensorDesc> out_shapes(nr_out);
    auto&& i0 = inputs[0];
    auto&& i1 = inputs[1];
    // [running_mean, running_var,] save_mean, save_var
    for (size_t i = 0; i < nr_out - 1; ++i) {
        out_shapes[i] = {i1.layout, i1.comp_node};
    }
    // output tensor
    out_shapes[nr_out - 1] = {i0.layout, i0.comp_node};
    return {out_shapes, out_shapes[nr_out - 1].layout.ndim != 0};
}

// Register the op trait for BatchNorm, wiring in the three functions defined
// above in this file.
// NOTE(review): .fallback() presumably supplies default implementations for
// the trait entries not set here -- confirm in ../op_trait.h
OP_TRAIT_REG(BatchNorm, BatchNorm, opr::BatchNorm)
    .make_from_op_node(make_from_op_node)
    .apply_on_var_node(apply_on_var_node)
    .infer_output_attrs_fallible(infer_output_attrs_fallible)
    .fallback();
} // anonymous namespace

}  // namespace imperative
}  // namespace mgb

// vim: syntax=cpp.doxygen foldmethod=marker foldmarker=f{{{,f}}}