addn_benchmark.cc 2.6 KB
Newer Older
李寅 已提交
1 2 3 4 5 6 7 8 9 10 11
//
// Copyright (c) 2017 XiaoMi All rights reserved.
//

#include <string>
#include "mace/core/operator.h"
#include "mace/core/testing/test_benchmark.h"
#include "mace/ops/ops_test_util.h"

namespace mace {
template <DeviceType D, typename T>
L
Liangliang He 已提交
12
static void AddNBenchmark(int iters, int inputs, int n, int h, int w, int c) {
李寅 已提交
13 14 15
  mace::testing::StopTiming();

  OpsTestNet net;
L
Liangliang He 已提交
16 17
  // Add input data
  for (int i = 0; i < inputs; ++i) {
18
    net.AddRandomInput<D, float>(MakeString("Input", i).c_str(),
19
                                 {n, h, w, c});
李寅 已提交
20 21
  }

L
Liangliang He 已提交
22 23
  if (D == DeviceType::OPENCL) {
    for (int i = 0; i < inputs; ++i) {
24 25
      BufferToImage<D, T>(net, MakeString("Input", i).c_str(),
                          MakeString("InputImage", i).c_str(),
26
                          kernels::BufferType::IN_OUT_CHANNEL);
L
Liangliang He 已提交
27 28 29
    }
    OpDefBuilder op_def_builder("AddN", "AddNBM");
    for (int i = 0; i < inputs; ++i) {
30
      op_def_builder.Input(MakeString("InputImage", i).c_str());
L
Liangliang He 已提交
31
    }
L
Liangliang He 已提交
32
    op_def_builder.Output("OutputImage")
33 34
        .AddIntArg("T", static_cast<int>(DataTypeToEnum<T>::value))
        .Finalize(net.NewOperatorDef());
L
Liangliang He 已提交
35 36 37
  } else {
    OpDefBuilder op_def_builder("AddN", "AddNBM");
    for (int i = 0; i < inputs; ++i) {
38
      op_def_builder.Input(MakeString("Input", i).c_str());
L
Liangliang He 已提交
39
    }
L
Liangliang He 已提交
40
    op_def_builder.Output("Output")
41 42
        .AddIntArg("T", static_cast<int>(DataTypeToEnum<T>::value))
        .Finalize(net.NewOperatorDef());
李寅 已提交
43 44 45 46 47
  }

  // Warm-up
  for (int i = 0; i < 5; ++i) {
    net.RunOp(D);
L
Liangliang He 已提交
48
    net.Sync();
李寅 已提交
49 50 51
  }

  mace::testing::StartTiming();
L
Liangliang He 已提交
52
  while (iters--) {
李寅 已提交
53
    net.RunOp(D);
L
Liangliang He 已提交
54
    net.Sync();
李寅 已提交
55 56 57
  }
}

L
Liangliang He 已提交
58 59 60 61 62 63 64 65
#define BM_ADDN_MACRO(INPUTS, N, H, W, C, TYPE, DEVICE)                       \
  static void BM_ADDN_##INPUTS##_##N##_##H##_##W##_##C##_##TYPE##_##DEVICE(   \
      int iters) {                                                            \
    const int64_t tot = static_cast<int64_t>(iters) * INPUTS * N * H * W * C; \
    mace::testing::MaccProcessed(tot);                                        \
    mace::testing::BytesProcessed(tot *(sizeof(TYPE)));                       \
    AddNBenchmark<DEVICE, TYPE>(iters, INPUTS, N, H, W, C);                   \
  }                                                                           \
L
Liangliang He 已提交
66 67
  BENCHMARK(BM_ADDN_##INPUTS##_##N##_##H##_##W##_##C##_##TYPE##_##DEVICE)

L
Liangliang He 已提交
68 69
#define BM_ADDN(INPUTS, N, H, W, C)                 \
  BM_ADDN_MACRO(INPUTS, N, H, W, C, float, CPU);    \
70 71
  BM_ADDN_MACRO(INPUTS, N, H, W, C, float, OPENCL); \
  BM_ADDN_MACRO(INPUTS, N, H, W, C, half, OPENCL);
L
Liangliang He 已提交
72

73 74 75 76 77
BM_ADDN(2, 1, 256, 256, 32);
BM_ADDN(2, 1, 128, 128, 32);
BM_ADDN(4, 1, 128, 128, 3);
BM_ADDN(2, 1, 256, 256, 3);
BM_ADDN(2, 1, 512, 512, 3);
L
Liangliang He 已提交
78

79
}  // namespace mace