addn_benchmark.cc 2.6 KB
Newer Older
李寅 已提交
1 2 3 4 5 6 7 8 9 10 11
//
// Copyright (c) 2017 XiaoMi All rights reserved.
//

#include <string>
#include "mace/core/operator.h"
#include "mace/core/testing/test_benchmark.h"
#include "mace/ops/ops_test_util.h"

namespace mace {
template <DeviceType D, typename T>
L
Liangliang He 已提交
12
static void AddNBenchmark(int iters, int inputs, int n, int h, int w, int c) {
李寅 已提交
13 14 15
  mace::testing::StopTiming();

  OpsTestNet net;
L
Liangliang He 已提交
16 17
  // Add input data
  for (int i = 0; i < inputs; ++i) {
18
    net.AddRandomInput<D, float>(MakeString("Input", i).c_str(), {n, h, w, c});
李寅 已提交
19 20
  }

L
Liangliang He 已提交
21 22
  if (D == DeviceType::OPENCL) {
    for (int i = 0; i < inputs; ++i) {
23 24
      BufferToImage<D, T>(net, MakeString("Input", i).c_str(),
                          MakeString("InputImage", i).c_str(),
25
                          kernels::BufferType::IN_OUT_CHANNEL);
L
Liangliang He 已提交
26 27 28
    }
    OpDefBuilder op_def_builder("AddN", "AddNBM");
    for (int i = 0; i < inputs; ++i) {
29
      op_def_builder.Input(MakeString("InputImage", i).c_str());
L
Liangliang He 已提交
30
    }
L
Liangliang He 已提交
31
    op_def_builder.Output("OutputImage")
32 33
        .AddIntArg("T", static_cast<int>(DataTypeToEnum<T>::value))
        .Finalize(net.NewOperatorDef());
L
Liangliang He 已提交
34 35 36
  } else {
    OpDefBuilder op_def_builder("AddN", "AddNBM");
    for (int i = 0; i < inputs; ++i) {
37
      op_def_builder.Input(MakeString("Input", i).c_str());
L
Liangliang He 已提交
38
    }
L
Liangliang He 已提交
39
    op_def_builder.Output("Output")
40 41
        .AddIntArg("T", static_cast<int>(DataTypeToEnum<T>::value))
        .Finalize(net.NewOperatorDef());
李寅 已提交
42 43 44 45 46
  }

  // Warm-up
  for (int i = 0; i < 5; ++i) {
    net.RunOp(D);
L
Liangliang He 已提交
47
    net.Sync();
李寅 已提交
48 49 50
  }

  mace::testing::StartTiming();
L
Liangliang He 已提交
51
  while (iters--) {
李寅 已提交
52
    net.RunOp(D);
L
Liangliang He 已提交
53
    net.Sync();
李寅 已提交
54 55 56
  }
}

L
Liangliang He 已提交
57 58 59 60 61 62 63 64
#define BM_ADDN_MACRO(INPUTS, N, H, W, C, TYPE, DEVICE)                       \
  static void BM_ADDN_##INPUTS##_##N##_##H##_##W##_##C##_##TYPE##_##DEVICE(   \
      int iters) {                                                            \
    const int64_t tot = static_cast<int64_t>(iters) * INPUTS * N * H * W * C; \
    mace::testing::MaccProcessed(tot);                                        \
    mace::testing::BytesProcessed(tot *(sizeof(TYPE)));                       \
    AddNBenchmark<DEVICE, TYPE>(iters, INPUTS, N, H, W, C);                   \
  }                                                                           \
L
Liangliang He 已提交
65 66
  BENCHMARK(BM_ADDN_##INPUTS##_##N##_##H##_##W##_##C##_##TYPE##_##DEVICE)

L
Liangliang He 已提交
67 68
#define BM_ADDN(INPUTS, N, H, W, C)                 \
  BM_ADDN_MACRO(INPUTS, N, H, W, C, float, CPU);    \
69 70
  BM_ADDN_MACRO(INPUTS, N, H, W, C, float, OPENCL); \
  BM_ADDN_MACRO(INPUTS, N, H, W, C, half, OPENCL);
L
Liangliang He 已提交
71

72 73 74 75 76
BM_ADDN(2, 1, 256, 256, 32);
BM_ADDN(2, 1, 128, 128, 32);
BM_ADDN(4, 1, 128, 128, 3);
BM_ADDN(2, 1, 256, 256, 3);
BM_ADDN(2, 1, 512, 512, 3);
L
Liangliang He 已提交
77

78
}  // namespace mace