Skip to content
体验新版
项目
组织
正在加载...
登录
切换导航
打开侧边栏
慢慢CG
Mace
提交
12139efe
Mace
项目概览
慢慢CG
/
Mace
与 Fork 源项目一致
Fork自
Xiaomi / Mace
通知
1
Star
0
Fork
0
代码
文件
提交
分支
Tags
贡献者
分支图
Diff
Issue
0
列表
看板
标记
里程碑
合并请求
0
DevOps
流水线
流水线任务
计划
Wiki
0
Wiki
分析
仓库
DevOps
项目成员
Pages
Mace
项目概览
项目概览
详情
发布
仓库
仓库
文件
提交
分支
标签
贡献者
分支图
比较
Issue
0
Issue
0
列表
看板
标记
里程碑
合并请求
0
合并请求
0
Pages
DevOps
DevOps
流水线
流水线任务
计划
分析
分析
仓库分析
DevOps
Wiki
0
Wiki
成员
成员
收起侧边栏
关闭侧边栏
动态
分支图
创建新Issue
流水线任务
提交
Issue看板
提交
12139efe
编写于
9月 11, 2018
作者:
Y
yejianwu
浏览文件
操作
浏览文件
下载
电子邮件补丁
差异文件
update memory optimize for expand_dims, add reverse benchmark
上级
f3de19de
变更
7
隐藏空白更改
内联
并排
Showing
7 changed file
with
93 addition
and
15 deletion
+93
-15
mace/kernels/expand_dims.h
mace/kernels/expand_dims.h
+6
-8
mace/kernels/reverse.h
mace/kernels/reverse.h
+3
-1
mace/ops/expand_dims.cc
mace/ops/expand_dims.cc
+5
-0
mace/ops/expand_dims.h
mace/ops/expand_dims.h
+3
-3
mace/ops/reverse.h
mace/ops/reverse.h
+2
-2
mace/ops/reverse_benchmark.cc
mace/ops/reverse_benchmark.cc
+73
-0
mace/python/tools/memory_optimizer.py
mace/python/tools/memory_optimizer.py
+1
-1
未找到文件。
mace/kernels/expand_dims.h
浏览文件 @
12139efe
...
...
@@ -19,6 +19,7 @@
#include "mace/core/future.h"
#include "mace/core/tensor.h"
#include "mace/kernels/kernel.h"
#ifdef MACE_ENABLE_OPENCL
#include "mace/core/runtime/opencl/cl2_header.h"
...
...
@@ -27,18 +28,13 @@
namespace
mace
{
namespace
kernels
{
struct
ExpandDimsBase
{
explicit
ExpandDimsBase
(
int
axis
)
:
axis_
(
axis
)
{}
int
axis_
;
};
template
<
DeviceType
D
,
typename
T
>
struct
ExpandDimsFunctor
;
template
<
typename
T
>
struct
ExpandDimsFunctor
<
DeviceType
::
CPU
,
T
>
:
ExpandDimsBase
{
explicit
ExpandDimsFunctor
(
int
axis
)
:
ExpandDimsBase
(
axis
)
{}
struct
ExpandDimsFunctor
<
DeviceType
::
CPU
,
T
>
:
OpKernel
{
explicit
ExpandDimsFunctor
(
OpKernelContext
*
context
,
int
axis
)
:
OpKernel
(
context
),
axis_
(
axis
)
{}
MaceStatus
operator
()(
const
Tensor
*
input
,
Tensor
*
output
,
...
...
@@ -64,6 +60,8 @@ struct ExpandDimsFunctor<DeviceType::CPU, T> : ExpandDimsBase {
return
MACE_SUCCESS
;
}
int
axis_
;
};
}
// namespace kernels
...
...
mace/kernels/reverse.h
浏览文件 @
12139efe
...
...
@@ -20,6 +20,7 @@
#include "mace/core/future.h"
#include "mace/core/tensor.h"
#include "mace/kernels/kernel.h"
#ifdef MACE_ENABLE_OPENCL
#include "mace/core/runtime/opencl/cl2_header.h"
...
...
@@ -32,7 +33,8 @@ template <DeviceType D, typename T>
struct
ReverseFunctor
;
template
<
typename
T
>
struct
ReverseFunctor
<
DeviceType
::
CPU
,
T
>
{
struct
ReverseFunctor
<
DeviceType
::
CPU
,
T
>
:
OpKernel
{
explicit
ReverseFunctor
(
OpKernelContext
*
context
)
:
OpKernel
(
context
)
{}
MaceStatus
operator
()(
const
Tensor
*
input
,
const
Tensor
*
axis
,
Tensor
*
output
,
...
...
mace/ops/expand_dims.cc
浏览文件 @
12139efe
...
...
@@ -28,6 +28,11 @@ void Register_ExpandDims(OperatorRegistryBase *op_registry) {
.
TypeConstraint
<
int32_t
>
(
"T"
)
.
Build
(),
ExpandDimsOp
<
DeviceType
::
CPU
,
int32_t
>
);
MACE_REGISTER_OPERATOR
(
op_registry
,
OpKeyBuilder
(
"ExpandDims"
)
.
Device
(
DeviceType
::
CPU
)
.
TypeConstraint
<
uint8_t
>
(
"T"
)
.
Build
(),
ExpandDimsOp
<
DeviceType
::
CPU
,
uint8_t
>
);
}
}
// namespace ops
...
...
mace/ops/expand_dims.h
浏览文件 @
12139efe
...
...
@@ -26,9 +26,9 @@ namespace ops {
template
<
DeviceType
D
,
typename
T
>
class
ExpandDimsOp
:
public
Operator
<
D
,
T
>
{
public:
ExpandDimsOp
(
const
OperatorDef
&
op_def
,
Workspace
*
ws
)
:
Operator
<
D
,
T
>
(
op_def
,
ws
),
functor_
(
OperatorBase
::
GetOptionalArg
<
int
>
(
"axis"
,
0
))
{}
ExpandDimsOp
(
const
OperatorDef
&
op_def
,
OpKernelContext
*
context
)
:
Operator
<
D
,
T
>
(
op_def
,
context
),
functor_
(
context
,
OperatorBase
::
GetOptionalArg
<
int
>
(
"axis"
,
0
))
{}
MaceStatus
Run
(
StatsFuture
*
future
)
override
{
const
Tensor
*
input
=
this
->
Input
(
INPUT
);
...
...
mace/ops/reverse.h
浏览文件 @
12139efe
...
...
@@ -26,8 +26,8 @@ namespace ops {
template
<
DeviceType
D
,
class
T
>
class
ReverseOp
:
public
Operator
<
D
,
T
>
{
public:
ReverseOp
(
const
OperatorDef
&
operator_def
,
Workspace
*
ws
)
:
Operator
<
D
,
T
>
(
operator_def
,
ws
)
{}
ReverseOp
(
const
OperatorDef
&
operator_def
,
OpKernelContext
*
context
)
:
Operator
<
D
,
T
>
(
operator_def
,
context
),
functor_
(
context
)
{}
MaceStatus
Run
(
StatsFuture
*
future
)
override
{
const
Tensor
*
input
=
this
->
Input
(
INPUT
);
...
...
mace/ops/reverse_benchmark.cc
0 → 100644
浏览文件 @
12139efe
// Copyright 2018 Xiaomi, Inc. All rights reserved.
//
// Licensed under the Apache License, Version 2.0 (the "License");
// you may not use this file except in compliance with the License.
// You may obtain a copy of the License at
//
// http://www.apache.org/licenses/LICENSE-2.0
//
// Unless required by applicable law or agreed to in writing, software
// distributed under the License is distributed on an "AS IS" BASIS,
// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
// See the License for the specific language governing permissions and
// limitations under the License.
#include "mace/core/operator.h"
#include "mace/core/runtime/opencl/opencl_runtime.h"
#include "mace/core/testing/test_benchmark.h"
#include "mace/ops/ops_test_util.h"
namespace
mace
{
namespace
ops
{
namespace
test
{
namespace
{
template
<
DeviceType
D
,
typename
T
>
void
Reverse
(
int
iters
,
int
batch
,
int
channels
,
int
height
,
int
width
)
{
mace
::
testing
::
StopTiming
();
OpsTestNet
net
;
net
.
AddRandomInput
<
D
,
T
>
(
"Input"
,
{
batch
,
channels
,
height
,
width
});
net
.
AddRandomInput
<
D
,
int32_t
>
(
"Axis"
,
{
1
});
OpDefBuilder
(
"Reverse"
,
"ReverseOpTest"
)
.
Input
(
"Input"
)
.
Input
(
"Axis"
)
.
Output
(
"Output"
)
.
Finalize
(
net
.
NewOperatorDef
());
// Warm-up
for
(
int
i
=
0
;
i
<
5
;
++
i
)
{
net
.
RunOp
(
D
);
}
net
.
Sync
();
mace
::
testing
::
StartTiming
();
while
(
iters
--
)
{
net
.
RunOp
(
D
);
}
net
.
Sync
();
}
}
// namespace
#define MACE_BM_REVERSE_MACRO(N, C, H, W, TYPE, DEVICE) \
static void MACE_BM_REVERSE_##N##_##C##_##H##_##W##_##TYPE##_##DEVICE( \
int iters) { \
const int64_t macc = \
static_cast<int64_t>(iters) * N * C * H * W; \
const int64_t tot = static_cast<int64_t>(iters) * N * C * H * W; \
mace::testing::MaccProcessed(macc); \
mace::testing::BytesProcessed(tot *(sizeof(TYPE))); \
Reverse<DEVICE, TYPE>(iters, N, C, H, W); \
} \
MACE_BENCHMARK(MACE_BM_REVERSE_##N##_##C##_##H##_##W##_##TYPE##_##DEVICE)
#define MACE_BM_REVERSE(N, C, H, W) \
MACE_BM_REVERSE_MACRO(N, C, H, W, float, CPU);
MACE_BM_REVERSE
(
1
,
1
,
99
,
256
);
MACE_BM_REVERSE
(
1
,
30
,
99
,
256
);
MACE_BM_REVERSE
(
1
,
50
,
99
,
256
);
}
// namespace test
}
// namespace ops
}
// namespace mace
mace/python/tools/memory_optimizer.py
浏览文件 @
12139efe
...
...
@@ -124,7 +124,7 @@ class MemoryOptimizer(object):
@
staticmethod
def
is_memory_reuse_op
(
op
):
return
op
.
type
==
'Reshape'
or
op
.
type
==
'Identity'
\
or
op
.
type
==
'Squeeze'
or
op
.
type
==
'Squeeze'
or
op
.
type
==
'ExpandDims'
def
optimize
(
self
):
for
op
in
self
.
net_def
.
op
:
...
...
编辑
预览
Markdown
is supported
0%
请重试
或
添加新附件
.
添加附件
取消
You are about to add
0
people
to the discussion. Proceed with caution.
先完成此消息的编辑!
取消
想要评论请
注册
或
登录