Skip to content
体验新版
项目
组织
正在加载...
登录
切换导航
打开侧边栏
PaddlePaddle
Paddle-Lite
提交
13072661
P
Paddle-Lite
项目概览
PaddlePaddle
/
Paddle-Lite
通知
332
Star
4
Fork
1
代码
文件
提交
分支
Tags
贡献者
分支图
Diff
Issue
271
列表
看板
标记
里程碑
合并请求
78
Wiki
0
Wiki
分析
仓库
DevOps
项目成员
Pages
P
Paddle-Lite
项目概览
项目概览
详情
发布
仓库
仓库
文件
提交
分支
标签
贡献者
分支图
比较
Issue
271
Issue
271
列表
看板
标记
里程碑
合并请求
78
合并请求
78
Pages
分析
分析
仓库分析
DevOps
Wiki
0
Wiki
成员
成员
收起侧边栏
关闭侧边栏
动态
分支图
创建新Issue
提交
Issue看板
未验证
提交
13072661
编写于
6月 25, 2020
作者:
H
hong19860320
提交者:
GitHub
6月 25, 2020
浏览文件
操作
浏览文件
下载
电子邮件补丁
差异文件
[Core] Fix the test framework for XPU (#3841)
上级
a8d75d20
变更
7
隐藏空白更改
内联
并排
Showing
7 changed file
with
152 addition
and
161 deletion
+152
-161
lite/core/arena/framework.cc
lite/core/arena/framework.cc
+81
-101
lite/core/arena/framework.h
lite/core/arena/framework.h
+36
-37
lite/core/scope.h
lite/core/scope.h
+20
-3
lite/tests/kernels/box_clip_compute_test.cc
lite/tests/kernels/box_clip_compute_test.cc
+1
-3
lite/tests/kernels/roi_align_compute_test.cc
lite/tests/kernels/roi_align_compute_test.cc
+1
-3
lite/tests/kernels/slice_compute_test.cc
lite/tests/kernels/slice_compute_test.cc
+6
-11
lite/tests/kernels/softmax_compute_test.cc
lite/tests/kernels/softmax_compute_test.cc
+7
-3
未找到文件。
lite/core/arena/framework.cc
浏览文件 @
13072661
...
...
@@ -55,7 +55,7 @@ void TestCase::CreateInstruction() {
op
=
LiteOpRegistry
::
Global
().
Create
(
op_desc
().
Type
());
}
CHECK
(
op
)
<<
"no op for "
<<
op_desc
().
Type
();
op
->
Attach
(
*
op_desc_
,
inst_scope_
);
op
->
Attach
(
*
op_desc_
,
inst_scope_
.
get
()
);
auto
kernels
=
op
->
CreateKernels
({
place_
});
// filter out the target kernel
CHECK
(
!
kernels
.
empty
())
<<
"No kernel found for place "
...
...
@@ -80,54 +80,35 @@ void TestCase::CreateInstruction() {
void
TestCase
::
PrepareInputsForInstruction
()
{
for
(
auto
&
arg
:
op_desc
().
InputArgumentNames
())
{
for
(
auto
&
var
:
op_desc
().
Input
(
arg
))
{
std
::
string
kernel_key
=
instruction_
->
kernel
()
->
key_with_alias
();
const
auto
*
param_type
=
ParamTypeRegistry
::
Global
().
RetrieveInArgument
(
place_
,
kernel_key
,
arg
);
const
Type
*
inst_type
=
nullptr
;
if
(
param_type
->
type
->
IsTensor
())
{
inst_type
=
Type
::
GetTensorTy
(
TARGET
(
kHost
));
}
else
if
(
param_type
->
type
->
IsTensorList
())
{
inst_type
=
Type
::
GetTensorListTy
(
TARGET
(
kHost
));
}
else
{
LOG
(
FATAL
)
<<
"unsupported param_type"
;
}
CHECK
(
scope_
->
FindVar
(
var
));
if
(
!
TargetCompatibleTo
(
*
inst_type
,
*
param_type
->
type
))
{
/// Create a tensor or tensor_array in the instruction's scope,
/// alloc memory and then copy data there.
if
(
param_type
->
type
->
IsTensor
())
{
const
auto
*
shared_tensor
=
scope_
->
FindTensor
(
var
);
auto
*
target_tensor
=
inst_scope_
->
LocalVar
(
var
)
->
GetMutable
<
Tensor
>
();
CHECK
(
!
shared_tensor
->
dims
().
empty
())
<<
"shared_tensor is empty yet"
;
target_tensor
->
Resize
(
shared_tensor
->
dims
());
TargetCopy
(
param_type
->
type
->
target
(),
target_tensor
->
mutable_data
(
param_type
->
type
->
target
(),
shared_tensor
->
memory_size
()),
shared_tensor
->
raw_data
(),
shared_tensor
->
memory_size
());
}
else
if
(
param_type
->
type
->
IsTensorList
())
{
const
auto
*
shared_tensor_array
=
scope_
->
FindVar
(
var
)
->
GetMutable
<
std
::
vector
<
Tensor
>>
();
auto
*
target_tensor_array
=
inst_scope_
->
LocalVar
(
var
)
->
GetMutable
<
std
::
vector
<
Tensor
>>
();
CHECK
(
!
shared_tensor_array
->
empty
())
<<
"shared_tensor_array is empty yet"
;
target_tensor_array
->
resize
(
shared_tensor_array
->
size
());
for
(
size_t
i
=
0
;
i
<
shared_tensor_array
->
size
();
i
++
)
{
target_tensor_array
->
at
(
i
).
Resize
(
shared_tensor_array
->
at
(
i
).
dims
());
TargetCopy
(
param_type
->
type
->
target
(),
target_tensor_array
->
at
(
i
).
mutable_data
(
param_type
->
type
->
target
(),
shared_tensor_array
->
at
(
i
).
memory_size
()),
shared_tensor_array
->
at
(
i
).
raw_data
(),
shared_tensor_array
->
at
(
i
).
memory_size
());
}
}
else
{
LOG
(
FATAL
)
<<
"not support"
;
const
auto
*
type
=
instruction_
->
kernel
()
->
GetInputDeclType
(
arg
);
CHECK
(
base_scope_
->
FindVar
(
var
));
/// Create a tensor or tensor_array in the instruction's scope,
/// alloc memory and then copy data there.
if
(
type
->
IsTensor
()
&&
!
TargetCompatibleTo
(
*
Type
::
GetTensorTy
(
TARGET
(
kHost
)),
*
type
))
{
const
auto
*
base_tensor
=
base_scope_
->
FindTensor
(
var
);
auto
*
inst_tensor
=
inst_scope_
->
FindMutableTensor
(
var
);
CHECK
(
!
base_tensor
->
dims
().
empty
())
<<
"The dims of input tensor is empty yet"
;
TargetCopy
(
type
->
target
(),
inst_tensor
->
mutable_data
(
type
->
target
(),
base_tensor
->
memory_size
()),
base_tensor
->
raw_data
(),
base_tensor
->
memory_size
());
}
else
if
(
type
->
IsTensorList
()
&&
!
TargetCompatibleTo
(
*
Type
::
GetTensorListTy
(
TARGET
(
kHost
)),
*
type
))
{
const
auto
*
base_tensor_list
=
base_scope_
->
FindTensorList
(
var
);
auto
*
inst_tensor_list
=
inst_scope_
->
FindMutableTensorList
(
var
);
CHECK_EQ
(
base_tensor_list
->
size
(),
inst_tensor_list
->
size
());
for
(
size_t
i
=
0
;
i
<
base_tensor_list
->
size
();
i
++
)
{
CHECK
(
!
base_tensor_list
->
at
(
i
).
dims
().
empty
())
<<
"The dims of input tensor["
<<
i
<<
"] is empty yet"
;
TargetCopy
(
type
->
target
(),
inst_tensor_list
->
at
(
i
).
mutable_data
(
type
->
target
(),
base_tensor_list
->
at
(
i
).
memory_size
()),
inst_tensor_list
->
at
(
i
).
raw_data
(),
inst_tensor_list
->
at
(
i
).
memory_size
());
}
}
}
...
...
@@ -135,37 +116,36 @@ void TestCase::PrepareInputsForInstruction() {
}
template
<
typename
T
>
bool
TestCase
::
CheckTensorPrecision
(
const
Tensor
*
a
_tensor
,
const
Tensor
*
b_tensor
,
bool
TestCase
::
CheckTensorPrecision
(
const
Tensor
*
inst
_tensor
,
const
Tensor
*
b
ase
_tensor
,
float
abs_error
)
{
CHECK
(
a
_tensor
);
CHECK
(
b_tensor
);
CHECK
(
inst
_tensor
);
CHECK
(
b
ase
_tensor
);
CHECK
(
ShapeEquals
(
a_tensor
->
dims
(),
b
_tensor
->
dims
()));
CHECK
(
ShapeEquals
(
inst_tensor
->
dims
(),
base
_tensor
->
dims
()));
CHECK
(
a_tensor
->
lod
()
==
b
_tensor
->
lod
())
<<
"lod not match"
;
CHECK
(
inst_tensor
->
lod
()
==
base
_tensor
->
lod
())
<<
"lod not match"
;
// The baseline should output in host devices.
CHECK
(
b_tensor
->
target
()
==
TARGET
(
kHost
)
||
b_tensor
->
target
()
==
TARGET
(
kX86
)
||
b_tensor
->
target
()
==
TARGET
(
kARM
));
const
T
*
a_data
{};
Tensor
a_host_tensor
;
a_host_tensor
.
Resize
(
a_tensor
->
dims
());
switch
(
a_tensor
->
target
())
{
CHECK
(
base_tensor
->
target
()
==
TARGET
(
kHost
)
||
base_tensor
->
target
()
==
TARGET
(
kX86
)
||
base_tensor
->
target
()
==
TARGET
(
kARM
));
const
T
*
inst_data
{};
Tensor
inst_host_tensor
;
inst_host_tensor
.
Resize
(
inst_tensor
->
dims
());
switch
(
inst_tensor
->
target
())
{
case
TARGET
(
kX86
):
case
TARGET
(
kHost
):
case
TARGET
(
kARM
):
a_data
=
static_cast
<
const
T
*>
(
a
_tensor
->
raw_data
());
inst_data
=
static_cast
<
const
T
*>
(
inst
_tensor
->
raw_data
());
break
;
#ifdef LITE_WITH_XPU
case
TARGET
(
kXPU
):
CopySync
<
TARGET
(
kXPU
)
>
(
a
_host_tensor
.
mutable_data
<
T
>
(),
a
_tensor
->
raw_data
(),
sizeof
(
T
)
*
a
_tensor
->
dims
().
production
(),
CopySync
<
TARGET
(
kXPU
)
>
(
inst
_host_tensor
.
mutable_data
<
T
>
(),
inst
_tensor
->
raw_data
(),
sizeof
(
T
)
*
inst
_tensor
->
dims
().
production
(),
IoDirection
::
DtoH
);
a_data
=
a
_host_tensor
.
data
<
T
>
();
inst_data
=
inst
_host_tensor
.
data
<
T
>
();
break
;
#endif
...
...
@@ -174,50 +154,50 @@ bool TestCase::CheckTensorPrecision(const Tensor* a_tensor,
LOG
(
FATAL
)
<<
"Not supported"
;
}
CHECK
(
a
_data
);
CHECK
(
inst
_data
);
const
T
*
b
_data
=
static_cast
<
const
T
*>
(
b
_tensor
->
raw_data
());
const
T
*
b
ase_data
=
static_cast
<
const
T
*>
(
base
_tensor
->
raw_data
());
bool
success
=
true
;
for
(
int
i
=
0
;
i
<
a
_tensor
->
dims
().
production
();
i
++
)
{
EXPECT_NEAR
(
a_data
[
i
],
b
_data
[
i
],
abs_error
);
if
(
fabsf
(
a_data
[
i
]
-
b
_data
[
i
])
>
abs_error
)
{
for
(
int
i
=
0
;
i
<
inst
_tensor
->
dims
().
production
();
i
++
)
{
EXPECT_NEAR
(
inst_data
[
i
],
base
_data
[
i
],
abs_error
);
if
(
fabsf
(
inst_data
[
i
]
-
base
_data
[
i
])
>
abs_error
)
{
success
=
false
;
}
}
return
success
;
}
bool
TestCase
::
CheckPrecision
(
const
Tensor
*
a
_tensor
,
const
Tensor
*
b_tensor
,
bool
TestCase
::
CheckPrecision
(
const
Tensor
*
inst
_tensor
,
const
Tensor
*
b
ase
_tensor
,
float
abs_error
,
PrecisionType
precision_type
)
{
PrecisionType
precision_type_t
=
precision_type
;
if
(
precision_type
==
PRECISION
(
kAny
))
{
precision_type_t
=
b_tensor
->
precision
();
precision_type_t
=
b
ase
_tensor
->
precision
();
}
CHECK
(
precision_type_t
==
b_tensor
->
precision
())
CHECK
(
precision_type_t
==
b
ase
_tensor
->
precision
())
<<
"arg precision type and base tensor precision type are not matched! "
"arg precision type is: "
<<
PrecisionToStr
(
precision_type
)
<<
", base tensor precision type is: "
<<
PrecisionToStr
(
b_tensor
->
precision
());
CHECK
(
a_tensor
->
precision
()
==
b
_tensor
->
precision
())
<<
PrecisionToStr
(
b
ase
_tensor
->
precision
());
CHECK
(
inst_tensor
->
precision
()
==
base
_tensor
->
precision
())
<<
"real tensor precision type and base tensor precision type are not "
"matched! real tensor precision type is: "
<<
PrecisionToStr
(
a
_tensor
->
precision
())
<<
PrecisionToStr
(
inst
_tensor
->
precision
())
<<
", base tensor precision type is: "
<<
PrecisionToStr
(
b_tensor
->
precision
());
<<
PrecisionToStr
(
b
ase
_tensor
->
precision
());
switch
(
precision_type_t
)
{
case
PRECISION
(
kFloat
):
return
CheckTensorPrecision
<
float
>
(
a_tensor
,
b
_tensor
,
abs_error
);
return
CheckTensorPrecision
<
float
>
(
inst_tensor
,
base
_tensor
,
abs_error
);
case
PRECISION
(
kInt8
):
return
CheckTensorPrecision
<
int8_t
>
(
a_tensor
,
b
_tensor
,
abs_error
);
return
CheckTensorPrecision
<
int8_t
>
(
inst_tensor
,
base
_tensor
,
abs_error
);
case
PRECISION
(
kInt32
):
return
CheckTensorPrecision
<
int32_t
>
(
a_tensor
,
b
_tensor
,
abs_error
);
return
CheckTensorPrecision
<
int32_t
>
(
inst_tensor
,
base
_tensor
,
abs_error
);
case
PRECISION
(
kInt64
):
return
CheckTensorPrecision
<
int64_t
>
(
a_tensor
,
b
_tensor
,
abs_error
);
return
CheckTensorPrecision
<
int64_t
>
(
inst_tensor
,
base
_tensor
,
abs_error
);
case
PRECISION
(
kBool
):
return
CheckTensorPrecision
<
bool
>
(
a_tensor
,
b
_tensor
,
abs_error
);
return
CheckTensorPrecision
<
bool
>
(
inst_tensor
,
base
_tensor
,
abs_error
);
default:
LOG
(
FATAL
)
<<
"not support type: "
<<
PrecisionToStr
(
precision_type
);
return
false
;
...
...
@@ -229,24 +209,24 @@ bool TestCase::CheckPrecision(const std::string& var_name,
PrecisionType
precision_type
)
{
bool
success
=
true
;
if
(
inst_scope_
->
FindVar
(
var_name
)
->
IsType
<
Tensor
>
())
{
auto
a_tensor
=
inst_scope_
->
FindTensor
(
var_name
);
auto
b_tensor
=
base_scope_
->
FindTensor
(
var_name
);
success
=
success
&&
CheckPrecision
(
a_tensor
,
b_tensor
,
abs_error
,
precision_type
);
auto
inst_tensor
=
inst_scope_
->
FindTensor
(
var_name
);
auto
base_tensor
=
base_scope_
->
FindTensor
(
var_name
);
success
=
success
&&
CheckPrecision
(
inst_tensor
,
base_tensor
,
abs_error
,
precision_type
);
}
else
if
(
inst_scope_
->
FindVar
(
var_name
)
->
IsType
<
std
::
vector
<
Tensor
>>
())
{
auto
a_tensor_array
=
inst_scope_
->
FindVar
(
var_name
)
->
GetMutable
<
std
::
vector
<
Tensor
>>
();
auto
b_tensor_array
=
base_scope_
->
FindVar
(
var_name
)
->
GetMutable
<
std
::
vector
<
Tensor
>>
();
CHECK_EQ
(
a_tensor_array
->
size
(),
b_tensor_array
->
size
());
for
(
size_t
i
=
0
;
i
<
a_tensor_array
->
size
();
i
++
)
{
Tensor
*
a_tensor
=
&
(
a_tensor_array
->
at
(
i
));
Tensor
*
b_tensor
=
&
(
b_tensor_array
->
at
(
i
));
if
(
a_tensor
->
dims
().
size
()
==
0
&&
b_tensor
->
dims
().
size
()
==
0
)
{
auto
inst_tensor_list
=
inst_scope_
->
FindMutableTensorList
(
var_name
);
auto
base_tensor_list
=
base_scope_
->
FindMutableTensorList
(
var_name
);
CHECK_EQ
(
inst_tensor_list
->
size
(),
base_tensor_list
->
size
());
for
(
size_t
i
=
0
;
i
<
inst_tensor_list
->
size
();
i
++
)
{
Tensor
*
inst_tensor
=
&
(
inst_tensor_list
->
at
(
i
));
Tensor
*
base_tensor
=
&
(
base_tensor_list
->
at
(
i
));
if
(
inst_tensor
->
dims
().
size
()
==
0
&&
base_tensor
->
dims
().
size
()
==
0
)
{
continue
;
}
success
=
success
&&
CheckPrecision
(
a_tensor
,
b_tensor
,
abs_error
,
precision_type
);
success
=
success
&&
CheckPrecision
(
inst_tensor
,
base_tensor
,
abs_error
,
precision_type
);
}
}
else
{
LOG
(
FATAL
)
<<
"unsupported var type"
;
...
...
lite/core/arena/framework.h
浏览文件 @
13072661
...
...
@@ -40,13 +40,15 @@ namespace arena {
class
TestCase
{
public:
explicit
TestCase
(
const
Place
&
place
,
const
std
::
string
&
alias
)
:
place_
(
place
),
scope_
(
new
Scope
),
alias_
(
alias
)
{
:
place_
(
place
),
alias_
(
alias
),
inst_scope_
(
new
Scope
),
base_scope_
(
new
Scope
)
{
ctx_
=
ContextScheduler
::
Global
().
NewContext
(
place_
.
target
);
}
virtual
~
TestCase
();
void
Prepare
()
{
PrepareScopes
();
PrepareData
();
op_desc_
.
reset
(
new
cpp
::
OpDesc
);
PrepareOpDesc
(
op_desc_
.
get
());
...
...
@@ -91,16 +93,15 @@ class TestCase {
// kernel registry.
void
CheckKernelConsistWithDefinition
()
{}
Scope
&
scope
()
{
return
*
scope_
;
}
Scope
*
baseline_scope
()
{
return
base_scope_
;
}
Scope
*
inst_scope
()
{
return
inst_scope_
;
}
Scope
*
baseline_scope
()
{
return
base_scope_
.
get
();
}
Scope
*
inst_scope
()
{
return
inst_scope_
.
get
();
}
protected:
// Prepare inputs in scope() for Tester.
virtual
void
PrepareData
()
=
0
;
/// Prepare a tensor in host. The tensors will be created in scope_.
/// Prepare a tensor in host. The tensors will be created both in base_scope_
/// and inst_scope_.
/// Need to specify the targets other than X86 or ARM.
template
<
typename
T
>
void
SetCommonTensor
(
const
std
::
string
&
var_name
,
...
...
@@ -108,42 +109,47 @@ class TestCase {
const
T
*
data
,
const
LoD
&
lod
=
{},
bool
is_persistable
=
false
)
{
auto
*
tensor
=
scope_
->
NewTensor
(
var_name
);
tensor
->
Resize
(
ddim
);
auto
*
d
=
tensor
->
mutable_data
<
T
>
(
);
memcpy
(
d
,
data
,
ddim
.
production
()
*
sizeof
(
T
));
// Create and fill a input tensor with the given data for baseline
auto
*
base_tensor
=
base_scope_
->
NewTensor
(
var_name
);
base_tensor
->
Resize
(
ddim
);
memcpy
(
base_tensor
->
mutable_data
<
T
>
()
,
data
,
ddim
.
production
()
*
sizeof
(
T
));
// set lod
if
(
!
lod
.
empty
())
*
tensor
->
mutable_lod
()
=
lod
;
if
(
!
lod
.
empty
())
*
base_
tensor
->
mutable_lod
()
=
lod
;
// set persistable
tensor
->
set_persistable
(
is_persistable
);
base_tensor
->
set_persistable
(
is_persistable
);
// Create a copy for instruction
auto
*
inst_tensor
=
inst_scope_
->
NewTensor
(
var_name
);
inst_tensor
->
CopyDataFrom
(
*
base_tensor
);
}
/// Prepare a tensor_array in host. The tensors will be created in scope_.
/// Need to specify the targets other than X86 or ARM.
template
<
typename
T
>
void
SetCommonTensorList
(
const
std
::
string
&
var_name
,
const
std
::
vector
<
DDim
>&
array_tensor_
dims
,
const
std
::
vector
<
DDim
>&
d
dims
,
const
std
::
vector
<
std
::
vector
<
T
>>&
datas
,
const
std
::
vector
<
LoD
>&
lods
=
{})
{
CHECK_EQ
(
array_tensor_dims
.
size
(),
datas
.
size
());
// Create a tensor array for baseline, and a copy for instruction
CHECK_EQ
(
ddims
.
size
(),
datas
.
size
());
if
(
!
lods
.
empty
())
{
CHECK_EQ
(
array_tensor_
dims
.
size
(),
lods
.
size
());
CHECK_EQ
(
d
dims
.
size
(),
lods
.
size
());
}
auto
*
tensor_array
=
scope_
->
Var
(
var_name
)
->
GetMutable
<
std
::
vector
<
Tensor
>>
();
for
(
int
i
=
0
;
i
<
array_tensor_dims
.
size
();
i
++
)
{
Tensor
tmp
;
tmp
.
Resize
(
array_tensor_dims
[
i
]);
auto
*
tmp_data
=
tmp
.
mutable_data
<
T
>
();
memcpy
(
tmp_data
,
auto
*
base_tensor_list
=
base_scope_
->
NewTensorList
(
var_name
);
auto
*
inst_tensor_list
=
inst_scope_
->
NewTensorList
(
var_name
);
for
(
int
i
=
0
;
i
<
ddims
.
size
();
i
++
)
{
Tensor
item
;
item
.
Resize
(
ddims
[
i
]);
memcpy
(
item
.
mutable_data
<
T
>
(),
datas
[
i
].
data
(),
array_tensor_
dims
[
i
].
production
()
*
sizeof
(
T
));
d
dims
[
i
].
production
()
*
sizeof
(
T
));
if
(
!
lods
.
empty
())
{
tmp
.
set_lod
(
lods
[
i
]);
item
.
set_lod
(
lods
[
i
]);
}
tensor_array
->
push_back
(
tmp
);
base_tensor_list
->
push_back
(
item
);
inst_tensor_list
->
push_back
(
item
);
}
}
...
...
@@ -157,11 +163,6 @@ class TestCase {
std
::
unique_ptr
<
KernelContext
>
ctx_
;
void
CreateInstruction
();
void
PrepareScopes
()
{
inst_scope_
=
&
scope_
->
NewScope
();
base_scope_
=
&
scope_
->
NewScope
();
}
// Check shape
// TODO(Superjomn) Move this method to utils or DDim?
bool
ShapeEquals
(
const
DDim
&
a
,
const
DDim
&
b
)
{
...
...
@@ -172,25 +173,23 @@ class TestCase {
return
true
;
}
//
/ Copy the input tensors to target devices
needed by the instruction.
//
Copy the host tensors to the device tensors if
needed by the instruction.
void
PrepareInputsForInstruction
();
// Create output tensors and variables.
void
PrepareOutputsForInstruction
()
{
for
(
auto
x
:
op_desc
().
output_vars
())
{
inst_scope_
->
NewTensor
(
x
);
base_scope_
->
NewTensor
(
x
);
inst_scope_
->
Var
(
x
);
}
}
private:
Place
place_
;
std
::
shared_ptr
<
Scope
>
scope_
;
std
::
string
alias_
;
// The workspace for the Instruction.
Scope
*
inst_scope_
{}
;
std
::
shared_ptr
<
Scope
>
inst_scope_
;
// The workspace for the baseline implementation.
Scope
*
base_scope_
{}
;
std
::
shared_ptr
<
Scope
>
base_scope_
;
std
::
unique_ptr
<
cpp
::
OpDesc
>
op_desc_
;
std
::
unique_ptr
<
Instruction
>
instruction_
;
};
...
...
lite/core/scope.h
浏览文件 @
13072661
...
...
@@ -62,19 +62,36 @@ class Scope final {
// Create a Tensor variable. This will create a new Variable called `name`.
Tensor
*
NewTensor
(
const
std
::
string
&
name
)
{
auto
*
var
=
Var
(
name
);
return
var
->
GetMutable
<
Tensor
Lite
>
();
return
var
->
GetMutable
<
Tensor
>
();
}
const
Tensor
*
FindTensor
(
const
std
::
string
&
name
)
{
auto
*
var
=
FindVar
(
name
);
if
(
!
var
)
return
nullptr
;
return
&
var
->
Get
<
Tensor
Lite
>
();
return
&
var
->
Get
<
Tensor
>
();
}
Tensor
*
FindMutableTensor
(
const
std
::
string
&
name
)
{
auto
*
var
=
FindVar
(
name
);
if
(
!
var
)
return
nullptr
;
return
var
->
GetMutable
<
TensorLite
>
();
return
var
->
GetMutable
<
Tensor
>
();
}
std
::
vector
<
Tensor
>*
NewTensorList
(
const
std
::
string
&
name
)
{
auto
*
var
=
Var
(
name
);
return
var
->
GetMutable
<
std
::
vector
<
Tensor
>>
();
}
const
std
::
vector
<
Tensor
>*
FindTensorList
(
const
std
::
string
&
name
)
{
auto
*
var
=
FindVar
(
name
);
if
(
!
var
)
return
nullptr
;
return
&
var
->
Get
<
std
::
vector
<
Tensor
>>
();
}
std
::
vector
<
Tensor
>*
FindMutableTensorList
(
const
std
::
string
&
name
)
{
auto
*
var
=
FindVar
(
name
);
if
(
!
var
)
return
nullptr
;
return
var
->
GetMutable
<
std
::
vector
<
Tensor
>>
();
}
private:
...
...
lite/tests/kernels/box_clip_compute_test.cc
浏览文件 @
13072661
...
...
@@ -70,9 +70,7 @@ class BoxClipComputeTester : public arena::TestCase {
float
sign
=
i
%
3
==
0
?
-
1.0
f
:
1.0
f
;
input_data
[
i
]
=
sign
*
static_cast
<
float
>
((
i
*
7
)
%
20
);
}
SetCommonTensor
(
input_
,
input_dims_
,
input_data
.
data
());
auto
input_tensor
=
baseline_scope
()
->
FindMutableTensor
(
input_
);
input_tensor
->
set_lod
(
input_lod_
);
SetCommonTensor
(
input_
,
input_dims_
,
input_data
.
data
(),
input_lod_
);
std
::
vector
<
float
>
im_info_data
{
10
,
10
,
1
,
15
,
15
,
1
};
SetCommonTensor
(
im_info_
,
im_info_dim_
,
im_info_data
.
data
());
...
...
lite/tests/kernels/roi_align_compute_test.cc
浏览文件 @
13072661
...
...
@@ -106,13 +106,11 @@ class RoiAlignComputeTester : public arena::TestCase {
}
LOG
(
INFO
)
<<
"Read rois data. "
<<
datas
[
0
]
<<
" "
<<
datas
.
back
();
reader
.
close
();
SetCommonTensor
(
rois_
,
dims
,
datas
.
data
());
auto
rois_tensor
=
baseline_scope
()
->
FindMutableTensor
(
rois_
);
std
::
vector
<
uint64_t
>
lod0
({
0
,
152
,
304
});
LoD
lod
;
lod
.
push_back
(
lod0
);
rois_tensor
->
set_lod
(
lod
);
SetCommonTensor
(
rois_
,
dims
,
datas
.
data
(),
lod
);
}
};
...
...
lite/tests/kernels/slice_compute_test.cc
浏览文件 @
13072661
...
...
@@ -202,20 +202,15 @@ class SliceComputeTester : public arena::TestCase {
DDim
({
static_cast
<
int64_t
>
(
ends_
.
size
())}),
ends_
.
data
());
}
else
if
(
use_tensor_list_
)
{
Scope
&
scope_
=
this
->
scope
();
for
(
int
i
=
0
;
i
<
starts_
.
size
();
++
i
)
{
auto
*
tensor
=
scope_
.
NewTensor
(
"starts_tensor_list_"
+
paddle
::
lite
::
to_string
(
i
));
tensor
->
Resize
(
DDim
({
1
}));
auto
*
d
=
tensor
->
mutable_data
<
int
>
();
d
[
0
]
=
starts_
[
i
];
SetCommonTensor
(
"starts_tensor_list_"
+
paddle
::
lite
::
to_string
(
i
),
DDim
({
1
}),
&
starts_
[
i
]);
}
for
(
int
i
=
0
;
i
<
ends_
.
size
();
++
i
)
{
auto
*
tensor
=
scope_
.
NewTensor
(
"ends_tensor_list_"
+
paddle
::
lite
::
to_string
(
i
));
tensor
->
Resize
(
DDim
({
1
}));
auto
*
d
=
tensor
->
mutable_data
<
int
>
();
d
[
0
]
=
ends_
[
i
];
SetCommonTensor
(
"ends_tensor_list_"
+
paddle
::
lite
::
to_string
(
i
),
DDim
({
1
}),
&
ends_
[
i
]);
}
}
}
...
...
lite/tests/kernels/softmax_compute_test.cc
浏览文件 @
13072661
...
...
@@ -103,7 +103,7 @@ TEST(Softmax, precision) {
#if defined(LITE_WITH_NPU)
place
=
TARGET
(
kNPU
);
abs_error
=
4e-3
;
// Using fp16 in NPU
#elif defined(LITE_WITH_XPU)
&& defined(LITE_WITH_XTCL)
#elif defined(LITE_WITH_XPU)
place
=
TARGET
(
kXPU
);
#else
return
;
...
...
@@ -111,8 +111,12 @@ TEST(Softmax, precision) {
for
(
auto
x_dims
:
std
::
vector
<
std
::
vector
<
int64_t
>>
{{
1
,
2
,
3
,
4
},
{
2
,
3
,
4
},
{
3
,
4
}})
{
for
(
auto
axis
:
{
-
1
,
0
,
1
,
2
,
3
})
{
if
(
axis
>=
x_dims
.
size
())
continue
;
int
ndims
=
x_dims
.
size
();
for
(
int
axis
=
-
1
;
axis
<
ndims
;
axis
++
)
{
#if defined(LITE_WITH_XPU)
if
(
axis
!=
-
1
&&
axis
!=
ndims
-
1
)
continue
;
// -1 and dims.size() - 1 are only supported by XPU
#endif
std
::
unique_ptr
<
arena
::
TestCase
>
tester
(
new
SoftmaxComputeTest
(
place
,
"def"
,
DDim
(
x_dims
),
axis
));
arena
::
Arena
arena
(
std
::
move
(
tester
),
place
,
abs_error
);
...
...
编辑
预览
Markdown
is supported
0%
请重试
或
添加新附件
.
添加附件
取消
You are about to add
0
people
to the discussion. Proceed with caution.
先完成此消息的编辑!
取消
想要评论请
注册
或
登录