addn_benchmark.cc 3.3 KB
Newer Older
L
Liangliang He 已提交
1
// Copyright 2018 Xiaomi, Inc.  All rights reserved.
李寅 已提交
2
//
L
Liangliang He 已提交
3 4 5
// Licensed under the Apache License, Version 2.0 (the "License");
// you may not use this file except in compliance with the License.
// You may obtain a copy of the License at
李寅 已提交
6
//
L
Liangliang He 已提交
7 8 9 10 11 12 13
//     http://www.apache.org/licenses/LICENSE-2.0
//
// Unless required by applicable law or agreed to in writing, software
// distributed under the License is distributed on an "AS IS" BASIS,
// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
// See the License for the specific language governing permissions and
// limitations under the License.
李寅 已提交
14 15

#include <string>
L
liutuo 已提交
16

李寅 已提交
17 18 19 20 21
#include "mace/core/operator.h"
#include "mace/core/testing/test_benchmark.h"
#include "mace/ops/ops_test_util.h"

namespace mace {
L
liutuo 已提交
22 23 24
namespace ops {
namespace test {

25
namespace {
李寅 已提交
26
template <DeviceType D, typename T>
27
void AddNBenchmark(int iters, int inputs, int n, int h, int w, int c) {
李寅 已提交
28 29 30
  mace::testing::StopTiming();

  OpsTestNet net;
L
Liangliang He 已提交
31 32
  // Add input data
  for (int i = 0; i < inputs; ++i) {
33
    net.AddRandomInput<D, float>(MakeString("Input", i).c_str(), {n, h, w, c});
李寅 已提交
34 35
  }

L
Liangliang He 已提交
36 37
  if (D == DeviceType::OPENCL) {
    for (int i = 0; i < inputs; ++i) {
Y
yejianwu 已提交
38
      BufferToImage<D, T>(&net, MakeString("Input", i).c_str(),
39
                          MakeString("InputImage", i).c_str(),
40
                          kernels::BufferType::IN_OUT_CHANNEL);
L
Liangliang He 已提交
41 42 43
    }
    OpDefBuilder op_def_builder("AddN", "AddNBM");
    for (int i = 0; i < inputs; ++i) {
44
      op_def_builder.Input(MakeString("InputImage", i).c_str());
L
Liangliang He 已提交
45
    }
L
Liangliang He 已提交
46
    op_def_builder.Output("OutputImage")
47 48
        .AddIntArg("T", static_cast<int>(DataTypeToEnum<T>::value))
        .Finalize(net.NewOperatorDef());
L
Liangliang He 已提交
49 50 51
  } else {
    OpDefBuilder op_def_builder("AddN", "AddNBM");
    for (int i = 0; i < inputs; ++i) {
52
      op_def_builder.Input(MakeString("Input", i).c_str());
L
Liangliang He 已提交
53
    }
L
Liangliang He 已提交
54
    op_def_builder.Output("Output")
55 56
        .AddIntArg("T", static_cast<int>(DataTypeToEnum<T>::value))
        .Finalize(net.NewOperatorDef());
李寅 已提交
57 58 59 60 61
  }

  // Warm-up
  for (int i = 0; i < 5; ++i) {
    net.RunOp(D);
L
Liangliang He 已提交
62
    net.Sync();
李寅 已提交
63 64 65
  }

  mace::testing::StartTiming();
L
Liangliang He 已提交
66
  while (iters--) {
李寅 已提交
67
    net.RunOp(D);
L
Liangliang He 已提交
68
    net.Sync();
李寅 已提交
69 70
  }
}
71
}  // namespace
李寅 已提交
72

L
Liangliang He 已提交
73 74 75 76 77 78 79 80
#define BM_ADDN_MACRO(INPUTS, N, H, W, C, TYPE, DEVICE)                       \
  static void BM_ADDN_##INPUTS##_##N##_##H##_##W##_##C##_##TYPE##_##DEVICE(   \
      int iters) {                                                            \
    const int64_t tot = static_cast<int64_t>(iters) * INPUTS * N * H * W * C; \
    mace::testing::MaccProcessed(tot);                                        \
    mace::testing::BytesProcessed(tot *(sizeof(TYPE)));                       \
    AddNBenchmark<DEVICE, TYPE>(iters, INPUTS, N, H, W, C);                   \
  }                                                                           \
L
Liangliang He 已提交
81 82
  BENCHMARK(BM_ADDN_##INPUTS##_##N##_##H##_##W##_##C##_##TYPE##_##DEVICE)

L
Liangliang He 已提交
83 84
#define BM_ADDN(INPUTS, N, H, W, C)                 \
  BM_ADDN_MACRO(INPUTS, N, H, W, C, float, CPU);    \
85 86
  BM_ADDN_MACRO(INPUTS, N, H, W, C, float, OPENCL); \
  BM_ADDN_MACRO(INPUTS, N, H, W, C, half, OPENCL);
L
Liangliang He 已提交
87

88 89 90 91 92
BM_ADDN(2, 1, 256, 256, 32);
BM_ADDN(2, 1, 128, 128, 32);
BM_ADDN(4, 1, 128, 128, 3);
BM_ADDN(2, 1, 256, 256, 3);
BM_ADDN(2, 1, 512, 512, 3);
L
Liangliang He 已提交
93

L
liutuo 已提交
94 95
}  // namespace test
}  // namespace ops
96
}  // namespace mace