Skip to content
体验新版
项目
组织
正在加载...
登录
切换导航
打开侧边栏
PaddlePaddle
Paddle-Lite
提交
7c26bc2e
P
Paddle-Lite
项目概览
PaddlePaddle
/
Paddle-Lite
通知
332
Star
4
Fork
1
代码
文件
提交
分支
Tags
贡献者
分支图
Diff
Issue
271
列表
看板
标记
里程碑
合并请求
78
Wiki
0
Wiki
分析
仓库
DevOps
项目成员
Pages
P
Paddle-Lite
项目概览
项目概览
详情
发布
仓库
仓库
文件
提交
分支
标签
贡献者
分支图
比较
Issue
271
Issue
271
列表
看板
标记
里程碑
合并请求
78
合并请求
78
Pages
分析
分析
仓库分析
DevOps
Wiki
0
Wiki
成员
成员
收起侧边栏
关闭侧边栏
动态
分支图
创建新Issue
提交
Issue看板
未验证
提交
7c26bc2e
编写于
4月 14, 2020
作者:
Z
zhangshijin
提交者:
GitHub
4月 14, 2020
浏览文件
操作
浏览文件
下载
差异文件
Merge pull request
#55
from Cambricon/Deviceinfo2Backends
move sth from device_info to backends/mlu
上级
0b2dad2b
27d55e61
变更
8
隐藏空白更改
内联
并排
Showing
8 changed file
with
79 addition
and
84 deletion
+79
-84
lite/api/cxx_api_impl.cc
lite/api/cxx_api_impl.cc
+6
-6
lite/backends/mlu/target_wrapper.cc
lite/backends/mlu/target_wrapper.cc
+44
-0
lite/backends/mlu/target_wrapper.h
lite/backends/mlu/target_wrapper.h
+20
-0
lite/core/context.h
lite/core/context.h
+4
-2
lite/core/device_info.cc
lite/core/device_info.cc
+0
-48
lite/core/device_info.h
lite/core/device_info.h
+0
-23
lite/core/mir/mlu_postprocess_pass.cc
lite/core/mir/mlu_postprocess_pass.cc
+2
-2
lite/kernels/mlu/bridges/conv_op.cc
lite/kernels/mlu/bridges/conv_op.cc
+3
-3
未找到文件。
lite/api/cxx_api_impl.cc
浏览文件 @
7c26bc2e
...
@@ -36,12 +36,12 @@ void CxxPaddleApiImpl::Init(const lite_api::CxxConfig &config) {
...
@@ -36,12 +36,12 @@ void CxxPaddleApiImpl::Init(const lite_api::CxxConfig &config) {
#endif
#endif
#ifdef LITE_WITH_MLU
#ifdef LITE_WITH_MLU
Env
<
TARGET
(
kMLU
)
>::
Init
();
Env
<
TARGET
(
kMLU
)
>::
Init
();
lite
::
DeviceInfo
::
Global
().
SetMLURunMode
(
config
.
mlu_core_version
(),
lite
::
TargetWrapperMlu
::
SetMLURunMode
(
config
.
mlu_core_version
(),
config
.
mlu_core_number
(),
config
.
mlu_core_number
(),
config
.
mlu_use_first_conv
(),
config
.
mlu_use_first_conv
(),
config
.
mlu_first_conv_mean
(),
config
.
mlu_first_conv_mean
(),
config
.
mlu_first_conv_std
(),
config
.
mlu_first_conv_std
(),
config
.
mlu_input_layout
());
config
.
mlu_input_layout
());
#endif // LITE_WITH_MLU
#endif // LITE_WITH_MLU
auto
places
=
config
.
valid_places
();
auto
places
=
config
.
valid_places
();
std
::
vector
<
std
::
string
>
passes
{};
std
::
vector
<
std
::
string
>
passes
{};
...
...
lite/backends/mlu/target_wrapper.cc
浏览文件 @
7c26bc2e
...
@@ -36,6 +36,13 @@ void cnrtMemcpyDtoH(void* dst, const void* src, size_t size) {
...
@@ -36,6 +36,13 @@ void cnrtMemcpyDtoH(void* dst, const void* src, size_t size) {
}
// namespace mlu
}
// namespace mlu
thread_local
cnmlCoreVersion_t
TargetWrapperMlu
::
mlu_core_version_
{
CNML_MLU270
};
thread_local
int
TargetWrapperMlu
::
mlu_core_number_
{
1
};
thread_local
bool
TargetWrapperMlu
::
use_first_conv_
{
false
};
thread_local
std
::
vector
<
float
>
TargetWrapperMlu
::
mean_vec_
;
thread_local
std
::
vector
<
float
>
TargetWrapperMlu
::
std_vec_
;
thread_local
DataLayoutType
TargetWrapperMlu
::
input_layout_
{
DATALAYOUT
(
kNCHW
)};
size_t
TargetWrapperMlu
::
num_devices
()
{
size_t
TargetWrapperMlu
::
num_devices
()
{
uint32_t
dev_count
=
0
;
uint32_t
dev_count
=
0
;
CNRT_CALL
(
cnrtGetDeviceCount
(
&
dev_count
))
<<
" cnrt get device count failed"
;
CNRT_CALL
(
cnrtGetDeviceCount
(
&
dev_count
))
<<
" cnrt get device count failed"
;
...
@@ -77,6 +84,43 @@ void TargetWrapperMlu::MemcpySync(void* dst,
...
@@ -77,6 +84,43 @@ void TargetWrapperMlu::MemcpySync(void* dst,
LOG
(
FATAL
)
<<
"Unsupported IoDirection"
<<
static_cast
<
int
>
(
dir
);
LOG
(
FATAL
)
<<
"Unsupported IoDirection"
<<
static_cast
<
int
>
(
dir
);
}
}
}
}
void
TargetWrapperMlu
::
SetMLURunMode
(
lite_api
::
MLUCoreVersion
core_version
,
int
core_number
,
bool
use_first_conv
,
const
std
::
vector
<
float
>&
mean_vec
,
const
std
::
vector
<
float
>&
std_vec
,
DataLayoutType
input_layout
)
{
switch
(
core_version
)
{
case
(
lite_api
::
MLUCoreVersion
::
MLU_220
):
mlu_core_version_
=
CNML_MLU220
;
break
;
case
(
lite_api
::
MLUCoreVersion
::
MLU_270
):
mlu_core_version_
=
CNML_MLU270
;
break
;
default:
mlu_core_version_
=
CNML_MLU270
;
break
;
}
mlu_core_number_
=
core_number
;
use_first_conv_
=
use_first_conv
;
mean_vec_
=
mean_vec
;
std_vec_
=
std_vec
;
input_layout_
=
input_layout
;
}
cnmlCoreVersion_t
TargetWrapperMlu
::
MLUCoreVersion
()
{
return
mlu_core_version_
;
}
int
TargetWrapperMlu
::
MLUCoreNumber
()
{
return
mlu_core_number_
;
}
bool
TargetWrapperMlu
::
UseFirstConv
()
{
return
use_first_conv_
;
}
const
std
::
vector
<
float
>&
TargetWrapperMlu
::
MeanVec
()
{
return
mean_vec_
;
}
const
std
::
vector
<
float
>&
TargetWrapperMlu
::
StdVec
()
{
return
std_vec_
;
}
DataLayoutType
TargetWrapperMlu
::
InputLayout
()
{
return
input_layout_
;
}
// void TargetWrapperMlu::MemcpyAsync(void* dst,
// void TargetWrapperMlu::MemcpyAsync(void* dst,
// const void* src,
// const void* src,
...
...
lite/backends/mlu/target_wrapper.h
浏览文件 @
7c26bc2e
...
@@ -13,6 +13,7 @@
...
@@ -13,6 +13,7 @@
// limitations under the License.
// limitations under the License.
#pragma once
#pragma once
#include <vector>
#include "lite/backends/mlu/mlu_utils.h"
#include "lite/backends/mlu/mlu_utils.h"
#include "lite/core/target_wrapper.h"
#include "lite/core/target_wrapper.h"
...
@@ -43,11 +44,30 @@ class TargetWrapper<TARGET(kMLU)> {
...
@@ -43,11 +44,30 @@ class TargetWrapper<TARGET(kMLU)> {
const
void
*
src
,
const
void
*
src
,
size_t
size
,
size_t
size
,
IoDirection
dir
);
IoDirection
dir
);
static
void
SetMLURunMode
(
lite_api
::
MLUCoreVersion
core_version
,
int
core_number
,
bool
use_first_conv
,
const
std
::
vector
<
float
>&
mean_vec
,
const
std
::
vector
<
float
>&
std_vec
,
DataLayoutType
input_layout
);
static
cnmlCoreVersion_t
MLUCoreVersion
();
static
int
MLUCoreNumber
();
static
bool
UseFirstConv
();
static
const
std
::
vector
<
float
>&
MeanVec
();
static
const
std
::
vector
<
float
>&
StdVec
();
static
DataLayoutType
InputLayout
();
// static void MemcpyAsync(void* dst,
// static void MemcpyAsync(void* dst,
// const void* src,
// const void* src,
// size_t size,
// size_t size,
// IoDirection dir,
// IoDirection dir,
// const queue_t& queue);
// const queue_t& queue);
private:
static
thread_local
cnmlCoreVersion_t
mlu_core_version_
;
static
thread_local
int
mlu_core_number_
;
static
thread_local
bool
use_first_conv_
;
static
thread_local
std
::
vector
<
float
>
mean_vec_
;
static
thread_local
std
::
vector
<
float
>
std_vec_
;
static
thread_local
DataLayoutType
input_layout_
;
};
};
}
// namespace lite
}
// namespace lite
...
...
lite/core/context.h
浏览文件 @
7c26bc2e
...
@@ -227,10 +227,12 @@ class Context<TargetType::kMLU> {
...
@@ -227,10 +227,12 @@ class Context<TargetType::kMLU> {
void
SetIoQueue
(
cnrtQueue_t
queue
)
{
io_queue_
=
queue
;
}
void
SetIoQueue
(
cnrtQueue_t
queue
)
{
io_queue_
=
queue
;
}
cnmlCoreVersion_t
MLUCoreVersion
()
{
cnmlCoreVersion_t
MLUCoreVersion
()
{
return
DeviceInfo
::
Global
().
MLUCoreVersion
();
return
paddle
::
lite
::
TargetWrapperMlu
::
MLUCoreVersion
();
}
}
int
MLUCoreNumber
()
{
return
DeviceInfo
::
Global
().
MLUCoreNumber
();
}
int
MLUCoreNumber
()
{
return
paddle
::
lite
::
TargetWrapperMlu
::
MLUCoreNumber
();
}
u32_t
affinity
()
{
return
affinity_
;
}
u32_t
affinity
()
{
return
affinity_
;
}
...
...
lite/core/device_info.cc
浏览文件 @
7c26bc2e
...
@@ -66,15 +66,6 @@ thread_local std::vector<int> DeviceInfo::active_ids_;
...
@@ -66,15 +66,6 @@ thread_local std::vector<int> DeviceInfo::active_ids_;
thread_local
TensorLite
DeviceInfo
::
workspace_
;
thread_local
TensorLite
DeviceInfo
::
workspace_
;
thread_local
int64_t
DeviceInfo
::
count_
=
0
;
thread_local
int64_t
DeviceInfo
::
count_
=
0
;
#ifdef LITE_WITH_MLU
thread_local
cnmlCoreVersion_t
DeviceInfo
::
mlu_core_version_
{
CNML_MLU270
};
thread_local
int
DeviceInfo
::
mlu_core_number_
{
1
};
thread_local
bool
DeviceInfo
::
use_first_conv_
{
false
};
thread_local
std
::
vector
<
float
>
DeviceInfo
::
mean_vec_
;
thread_local
std
::
vector
<
float
>
DeviceInfo
::
std_vec_
;
thread_local
DataLayoutType
DeviceInfo
::
input_layout_
{
DATALAYOUT
(
kNCHW
)};
#endif
#ifdef TARGET_IOS
#ifdef TARGET_IOS
const
int
DEFAULT_L1_CACHE_SIZE
=
64
*
1024
;
const
int
DEFAULT_L1_CACHE_SIZE
=
64
*
1024
;
const
int
DEFAULT_L2_CACHE_SIZE
=
2048
*
1024
;
const
int
DEFAULT_L2_CACHE_SIZE
=
2048
*
1024
;
...
@@ -1089,45 +1080,6 @@ int DeviceInfo::Setup() {
...
@@ -1089,45 +1080,6 @@ int DeviceInfo::Setup() {
return
0
;
return
0
;
}
}
#ifdef LITE_WITH_MLU
void
DeviceInfo
::
SetMLURunMode
(
lite_api
::
MLUCoreVersion
core_version
,
int
core_number
,
bool
use_first_conv
,
const
std
::
vector
<
float
>&
mean_vec
,
const
std
::
vector
<
float
>&
std_vec
,
DataLayoutType
input_layout
)
{
switch
(
core_version
)
{
case
(
lite_api
::
MLUCoreVersion
::
MLU_220
):
mlu_core_version_
=
CNML_MLU220
;
break
;
case
(
lite_api
::
MLUCoreVersion
::
MLU_270
):
mlu_core_version_
=
CNML_MLU270
;
break
;
default:
mlu_core_version_
=
CNML_MLU270
;
break
;
}
mlu_core_number_
=
core_number
;
use_first_conv_
=
use_first_conv
;
mean_vec_
=
mean_vec
;
std_vec_
=
std_vec
;
input_layout_
=
input_layout
;
}
cnmlCoreVersion_t
DeviceInfo
::
MLUCoreVersion
()
{
return
mlu_core_version_
;
}
int
DeviceInfo
::
MLUCoreNumber
()
{
return
mlu_core_number_
;
}
bool
DeviceInfo
::
UseFirstConv
()
{
return
use_first_conv_
;
}
const
std
::
vector
<
float
>&
DeviceInfo
::
MeanVec
()
const
{
return
mean_vec_
;
}
const
std
::
vector
<
float
>&
DeviceInfo
::
StdVec
()
const
{
return
std_vec_
;
}
DataLayoutType
DeviceInfo
::
InputLayout
()
const
{
return
input_layout_
;
}
#endif // LITE_WITH_MLU
void
DeviceInfo
::
SetRunMode
(
lite_api
::
PowerMode
mode
,
int
thread_num
)
{
void
DeviceInfo
::
SetRunMode
(
lite_api
::
PowerMode
mode
,
int
thread_num
)
{
#ifdef ARM_WITH_OMP
#ifdef ARM_WITH_OMP
thread_num
=
std
::
min
(
thread_num
,
core_num_
);
thread_num
=
std
::
min
(
thread_num
,
core_num_
);
...
...
lite/core/device_info.h
浏览文件 @
7c26bc2e
...
@@ -55,20 +55,6 @@ class DeviceInfo {
...
@@ -55,20 +55,6 @@ class DeviceInfo {
int
Setup
();
int
Setup
();
void
SetRunMode
(
lite_api
::
PowerMode
mode
,
int
thread_num
);
void
SetRunMode
(
lite_api
::
PowerMode
mode
,
int
thread_num
);
#ifdef LITE_WITH_MLU
void
SetMLURunMode
(
lite_api
::
MLUCoreVersion
core_version
,
int
core_number
,
bool
use_first_conv
,
const
std
::
vector
<
float
>&
mean_vec
,
const
std
::
vector
<
float
>&
std_vec
,
DataLayoutType
input_layout
);
cnmlCoreVersion_t
MLUCoreVersion
();
int
MLUCoreNumber
();
bool
UseFirstConv
();
const
std
::
vector
<
float
>&
MeanVec
()
const
;
const
std
::
vector
<
float
>&
StdVec
()
const
;
DataLayoutType
InputLayout
()
const
;
#endif
void
SetCache
(
int
l1size
,
int
l2size
,
int
l3size
);
void
SetCache
(
int
l1size
,
int
l2size
,
int
l3size
);
void
SetArch
(
ARMArch
arch
)
{
arch_
=
arch
;
}
void
SetArch
(
ARMArch
arch
)
{
arch_
=
arch
;
}
...
@@ -120,15 +106,6 @@ class DeviceInfo {
...
@@ -120,15 +106,6 @@ class DeviceInfo {
static
thread_local
TensorLite
workspace_
;
static
thread_local
TensorLite
workspace_
;
static
thread_local
int64_t
count_
;
static
thread_local
int64_t
count_
;
#ifdef LITE_WITH_MLU
static
thread_local
cnmlCoreVersion_t
mlu_core_version_
;
static
thread_local
int
mlu_core_number_
;
static
thread_local
bool
use_first_conv_
;
static
thread_local
std
::
vector
<
float
>
mean_vec_
;
static
thread_local
std
::
vector
<
float
>
std_vec_
;
static
thread_local
DataLayoutType
input_layout_
;
#endif
void
SetDotInfo
(
int
argc
,
...);
void
SetDotInfo
(
int
argc
,
...);
void
SetFP16Info
(
int
argc
,
...);
void
SetFP16Info
(
int
argc
,
...);
void
SetFP32Info
(
int
argc
,
...);
void
SetFP32Info
(
int
argc
,
...);
...
...
lite/core/mir/mlu_postprocess_pass.cc
浏览文件 @
7c26bc2e
...
@@ -569,11 +569,11 @@ void MLUPostprocessPass::Apply(const std::unique_ptr<SSAGraph>& graph) {
...
@@ -569,11 +569,11 @@ void MLUPostprocessPass::Apply(const std::unique_ptr<SSAGraph>& graph) {
// 1: feed->arg_in->subgraph->... 2: ...->subgraph->arg_out->fetch;
// 1: feed->arg_in->subgraph->... 2: ...->subgraph->arg_out->fetch;
// arg_in and arg_out are assumed to be NHWC which user should be aware of.
// arg_in and arg_out are assumed to be NHWC which user should be aware of.
// Thus here we change these args' layout to NHWC
// Thus here we change these args' layout to NHWC
if
(
lite
::
DeviceInfo
::
Global
().
InputLayout
()
==
DATALAYOUT
(
kNHWC
))
{
if
(
lite
::
TargetWrapperMlu
::
InputLayout
()
==
DATALAYOUT
(
kNHWC
))
{
ModifyLayout
(
graph
.
get
());
ModifyLayout
(
graph
.
get
());
}
}
if
(
lite
::
DeviceInfo
::
Global
().
UseFirstConv
())
{
if
(
lite
::
TargetWrapperMlu
::
UseFirstConv
())
{
GatherAndModifyFirstConvNodes
(
graph
.
get
());
GatherAndModifyFirstConvNodes
(
graph
.
get
());
}
}
...
...
lite/kernels/mlu/bridges/conv_op.cc
浏览文件 @
7c26bc2e
...
@@ -164,7 +164,7 @@ int ConvConverter(void* ctx, OpLite* op, KernelBase* kernel) {
...
@@ -164,7 +164,7 @@ int ConvConverter(void* ctx, OpLite* op, KernelBase* kernel) {
const
auto
input_scale
=
op_info
->
GetAttr
<
float
>
(
"input_scale"
);
const
auto
input_scale
=
op_info
->
GetAttr
<
float
>
(
"input_scale"
);
bool
use_first_conv
=
false
;
bool
use_first_conv
=
false
;
if
(
lite
::
DeviceInfo
::
Global
().
UseFirstConv
()
&&
input_dims
[
1
]
==
3
)
{
if
(
lite
::
TargetWrapperMlu
::
UseFirstConv
()
&&
input_dims
[
1
]
==
3
)
{
use_first_conv
=
true
;
use_first_conv
=
true
;
}
}
...
@@ -192,11 +192,11 @@ int ConvConverter(void* ctx, OpLite* op, KernelBase* kernel) {
...
@@ -192,11 +192,11 @@ int ConvConverter(void* ctx, OpLite* op, KernelBase* kernel) {
graph
->
FPType
());
graph
->
FPType
());
graph
->
BindConstRawData
(
"first_conv_mean_tensor"
,
graph
->
BindConstRawData
(
"first_conv_mean_tensor"
,
lite
::
DeviceInfo
::
Global
().
MeanVec
().
data
(),
lite
::
TargetWrapperMlu
::
MeanVec
().
data
(),
3
,
3
,
false
);
false
);
graph
->
BindConstRawData
(
"first_conv_std_tensor"
,
graph
->
BindConstRawData
(
"first_conv_std_tensor"
,
lite
::
DeviceInfo
::
Global
().
StdVec
().
data
(),
lite
::
TargetWrapperMlu
::
StdVec
().
data
(),
3
,
3
,
false
);
false
);
...
...
编辑
预览
Markdown
is supported
0%
请重试
或
添加新附件
.
添加附件
取消
You are about to add
0
people
to the discussion. Proceed with caution.
先完成此消息的编辑!
取消
想要评论请
注册
或
登录