algo.cpp 3.4 KB
Newer Older
1 2 3 4
/**
 * \file dnn/src/cuda/convolution3d/forward/algo.cpp
 * MegEngine is Licensed under the Apache License, Version 2.0 (the "License")
 *
5
 * Copyright (c) 2014-2021 Megvii Inc. All rights reserved.
6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23
 *
 * Unless required by applicable law or agreed to in writing,
 * software distributed under the License is distributed on an
 * "AS IS" BASIS, WITHOUT ARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
 */

#include "./algo.h"
#include "src/cuda/utils.h"

using namespace megdnn;
using namespace cuda;

Convolution3DForwardImpl::AlgoPack::AlgoPack() {
    non_cudnn_algos.push_back(&chanwise);
    non_cudnn_algos.push_back(&inplace_matmul);
    non_cudnn_algos.push_back(&a1x1x1);

    all_algos.push_back(&chanwise);
24

25 26
    fill_cudnn_algos();
    for (auto &&i: cudnn) {
27
       all_algos.push_back(&i);
28 29
    }
    all_algos.push_back(&inplace_matmul);
30
    all_algos.push_back(&a1x1x1);
31
    all_algos.push_back(&group);
32 33 34 35

    for (auto&& algo : all_algos) {
        m_all_algos_map.emplace(algo->info().desc, algo);
    }
36 37
}

38 39
MEGDNN_DEF_GET_ALGO_FROM_DESC(Convolution3DForwardImpl)

40 41 42 43 44 45 46
Convolution3DForwardImpl::AlgoCUDNN*
Convolution3DForwardImpl::AlgoPack::cudnn_from_enum(
        cudnnConvolutionFwdAlgo_t algo) {
    for (auto &&i: cudnn) {
        if (i.cudnn_enum() == algo)
            return &i;
    }
M
Megvii Engine Team 已提交
47 48
    megdnn_throw(ssprintf("can not find cudnn fwd algorithm %d",
                          static_cast<int>(algo)));
49 50 51 52 53
}

Convolution3DForwardImpl::AlgoPack Convolution3DForwardImpl::sm_algo_pack;

Convolution3DForwardImpl::AlgoBase::SizeArgs::SizeArgs(
54 55 56 57
        const Convolution3DForwardImpl* o, const TensorLayout& src,
        const TensorLayout& filter, const TensorLayout& dst)
        : SizeArgs(o, src, filter,
                   o->make_canonized_filter_meta(src.ndim, filter), dst) {}
58 59

Convolution3DForwardImpl::AlgoBase::SizeArgs::SizeArgs(
60 61 62 63 64 65 66 67 68 69
        const Convolution3DForwardImpl* o, const TensorLayout& src,
        const TensorLayout& filter, const CanonizedFilterMeta& filter_meta,
        const TensorLayout& dst)
        : ForwardSizeArgs{concrete_handle(o->handle()),
                          &src,
                          &filter,
                          filter_meta,
                          &dst,
                          o->param().data_type},
          opr{o} {}
70 71

Convolution3DForwardImpl::AlgoBase::ExecArgs::ExecArgs(
72
        const Convolution3DForwardImpl *opr,
73 74 75 76 77 78 79 80 81 82 83 84 85
        _megdnn_tensor_in src,
        _megdnn_tensor_in filter,
        _megdnn_tensor_out dst,
        _megdnn_workspace workspace):
    SizeArgs(opr, src.layout, filter.layout, dst.layout),
    src_tensor{&src}, filter_tensor{&filter}, dst_tensor{&dst},
    workspace{workspace}
{
}

std::string Convolution3DForwardImpl::AlgoBase::SizeArgs::to_string() const {
    auto &&fm = filter_meta;
    MEGDNN_MARK_USED_VAR(fm);
M
Megvii Engine Team 已提交
86 87 88 89 90 91 92 93 94 95
    return ssprintf(
            "src=%s, filter=%u{%u,%u,%u,%u,%u}, dst=%s, "
            "pad=%ux%ux%u, stride=%ux%ux%u, dilate=%ux%ux%u, xcorr=%d, "
            "dtype=%s,%s",
            src_layout->to_string().c_str(), fm.group, fm.ocpg, fm.icpg,
            fm.spatial[0], fm.spatial[1], fm.spatial[2],
            dst_layout->to_string().c_str(), fm.padding[0], fm.padding[1],
            fm.padding[2], fm.stride[0], fm.stride[1], fm.stride[2],
            fm.dilation[0], fm.dilation[1], fm.dilation[2], !fm.should_flip,
            src_layout->dtype.name(), dst_layout->dtype.name());
96 97 98
}

// vim: syntax=cpp.doxygen