Skip to content
体验新版
项目
组织
正在加载...
登录
切换导航
打开侧边栏
机器未来
Paddle
提交
46161679
P
Paddle
项目概览
机器未来
/
Paddle
与 Fork 源项目一致
Fork自
PaddlePaddle / Paddle
通知
1
Star
1
Fork
0
代码
文件
提交
分支
Tags
贡献者
分支图
Diff
Issue
1
列表
看板
标记
里程碑
合并请求
0
Wiki
0
Wiki
分析
仓库
DevOps
项目成员
Pages
P
Paddle
项目概览
项目概览
详情
发布
仓库
仓库
文件
提交
分支
标签
贡献者
分支图
比较
Issue
1
Issue
1
列表
看板
标记
里程碑
合并请求
0
合并请求
0
Pages
分析
分析
仓库分析
DevOps
Wiki
0
Wiki
成员
成员
收起侧边栏
关闭侧边栏
动态
分支图
创建新Issue
提交
Issue看板
未验证
提交
46161679
编写于
2月 18, 2022
作者:
A
Allen Guo
提交者:
GitHub
2月 18, 2022
浏览文件
操作
浏览文件
下载
电子邮件补丁
差异文件
[IPU] Update IpuStrategy (#39644)
* Update IpuStrategy * fix ci * rerun ci
上级
bc3ca678
变更
12
显示空白变更内容
内联
并排
Showing
12 changed file
with
599 addition
and
75 deletion
+599
-75
cmake/external/poplar.cmake
cmake/external/poplar.cmake
+20
-12
paddle/fluid/framework/ir/ipu/forward_graph_extract_pass.cc
paddle/fluid/framework/ir/ipu/forward_graph_extract_pass.cc
+13
-0
paddle/fluid/framework/ir/ipu/inference_process_pass.cc
paddle/fluid/framework/ir/ipu/inference_process_pass.cc
+2
-2
paddle/fluid/operators/ipu/ipu_runtime_op.cc
paddle/fluid/operators/ipu/ipu_runtime_op.cc
+1
-2
paddle/fluid/platform/device/ipu/ipu_backend.cc
paddle/fluid/platform/device/ipu/ipu_backend.cc
+1
-1
paddle/fluid/platform/device/ipu/ipu_backend.h
paddle/fluid/platform/device/ipu/ipu_backend.h
+1
-1
paddle/fluid/platform/device/ipu/ipu_compiler.cc
paddle/fluid/platform/device/ipu/ipu_compiler.cc
+3
-5
paddle/fluid/platform/device/ipu/ipu_executor.cc
paddle/fluid/platform/device/ipu/ipu_executor.cc
+8
-3
paddle/fluid/platform/device/ipu/ipu_strategy.cc
paddle/fluid/platform/device/ipu/ipu_strategy.cc
+432
-4
paddle/fluid/platform/device/ipu/ipu_strategy.h
paddle/fluid/platform/device/ipu/ipu_strategy.h
+79
-41
paddle/fluid/platform/device/ipu/ipu_utils.cc
paddle/fluid/platform/device/ipu/ipu_utils.cc
+35
-2
paddle/fluid/platform/device/ipu/ipu_utils.h
paddle/fluid/platform/device/ipu/ipu_utils.h
+4
-2
未找到文件。
cmake/external/poplar.cmake
浏览文件 @
46161679
...
@@ -11,31 +11,35 @@
...
@@ -11,31 +11,35 @@
# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
# See the License for the specific language governing permissions and
# See the License for the specific language governing permissions and
# limitations under the License.
# limitations under the License.
if
(
WITH_IPU
)
if
(
WITH_IPU
)
set
(
POPLAR_DIR CACHE PATH
"Path to a Poplar install"
)
set
(
POPLAR_DIR CACHE PATH
"Path to a Poplar install"
)
set
(
POPART_DIR CACHE PATH
"Path to a Popart install"
)
set
(
POPART_DIR CACHE PATH
"Path to a Popart install"
)
set
(
POPLAR_SDK_DIR CACHE PATH
"Path to an extracted SDK archive or to a Poplar & Popart install directory (Will populate POPLAR_DIR and POPART_DIR)"
)
set
(
POPLAR_SDK_DIR CACHE PATH
"Path to an extracted SDK archive or to a Poplar & Popart install directory (Will populate POPLAR_DIR and POPART_DIR)"
)
# support setting SDK both from environment variable or command line arguments
if
(
DEFINED ENV{POPLAR_SDK_DIR}
)
if
(
DEFINED ENV{POPLAR_SDK_DIR}
)
set
(
POPLAR_SDK_DIR $ENV{POPLAR_SDK_DIR}
)
set
(
POPLAR_SDK_DIR $ENV{POPLAR_SDK_DIR}
)
endif
()
if
(
EXISTS
${
POPLAR_SDK_DIR
}
)
execute_process
(
COMMAND find
${
POPLAR_SDK_DIR
}
/ -maxdepth 1 -type d -name
"popart*"
execute_process
(
COMMAND find
${
POPLAR_SDK_DIR
}
/ -maxdepth 1 -type d -name
"popart*"
OUTPUT_VARIABLE POPART_DIR OUTPUT_STRIP_TRAILING_WHITESPACE
)
OUTPUT_VARIABLE POPART_DIR OUTPUT_STRIP_TRAILING_WHITESPACE
)
execute_process
(
COMMAND find
${
POPLAR_SDK_DIR
}
/ -maxdepth 1 -type d -name
"poplar-*"
-o -name
"poplar"
execute_process
(
COMMAND find
${
POPLAR_SDK_DIR
}
/ -maxdepth 1 -type d -name
"poplar-*"
-o -name
"poplar"
OUTPUT_VARIABLE POPLAR_DIR OUTPUT_STRIP_TRAILING_WHITESPACE
)
OUTPUT_VARIABLE POPLAR_DIR OUTPUT_STRIP_TRAILING_WHITESPACE
)
if
(
NOT IS_DIRECTORY
"
${
POPLAR_DIR
}
"
)
message
(
FATAL_ERROR
"Couldn't find a
\"
poplar
\"
or
\"
poplar-*
\"
folder in '
${
POPLAR_SDK_DIR
}
'"
)
endif
()
endif
()
if
(
NOT IS_DIRECTORY
"
${
POPART_DIR
}
"
)
if
(
DEFINED ENV{POPLAR_DIR}
)
message
(
FATAL_ERROR
"Couldn't find a
\"
popart*
\"
folder in '
${
POPLAR_SDK_DIR
}
'"
)
set
(
POPLAR_DIR $ENV{POPLAR_DIR}
)
endif
()
endif
()
else
(
)
if
(
DEFINED ENV{POPART_DIR}
)
message
(
FATAL_ERROR
"You must provide a path to a Poplar install using export POPLAR_SDK_DIR=/path/to/poplar_sdk"
)
set
(
POPART_DIR $ENV{POPART_DIR}
)
endif
()
endif
()
message
(
"POPLAR_DIR is
${
POPLAR_DIR
}
"
)
message
(
"POPART_DIR is
${
POPART_DIR
}
"
)
if
(
EXISTS
${
POPLAR_DIR
}
)
if
(
EXISTS
${
POPLAR_DIR
}
)
message
(
"POPLAR_DIR is
${
POPLAR_DIR
}
"
)
if
(
NOT IS_DIRECTORY
"
${
POPLAR_DIR
}
"
)
message
(
FATAL_ERROR
"Couldn't find a
\"
poplar
\"
or
\"
poplar-*
\"
folder in '
${
POPLAR_SDK_DIR
}
'"
)
endif
()
list
(
APPEND CMAKE_PREFIX_PATH
${
POPLAR_DIR
}
)
list
(
APPEND CMAKE_PREFIX_PATH
${
POPLAR_DIR
}
)
set
(
ENABLE_POPLAR_CMD
"source
${
POPLAR_DIR
}
/enable.sh"
)
set
(
ENABLE_POPLAR_CMD
"source
${
POPLAR_DIR
}
/enable.sh"
)
find_package
(
poplar REQUIRED
)
find_package
(
poplar REQUIRED
)
...
@@ -45,8 +49,11 @@ if(WITH_IPU)
...
@@ -45,8 +49,11 @@ if(WITH_IPU)
if
(
NOT poplar_FOUND
)
if
(
NOT poplar_FOUND
)
message
(
FATAL_ERROR
"You must provide a path to a Poplar install using -DPOPLAR_DIR=/path/to/popart/build/install"
)
message
(
FATAL_ERROR
"You must provide a path to a Poplar install using -DPOPLAR_DIR=/path/to/popart/build/install"
)
endif
()
endif
()
if
(
EXISTS
${
POPART_DIR
}
)
if
(
EXISTS
${
POPART_DIR
}
)
message
(
"POPART_DIR is
${
POPART_DIR
}
"
)
if
(
NOT IS_DIRECTORY
"
${
POPART_DIR
}
"
)
message
(
FATAL_ERROR
"Couldn't find a
\"
popart*
\"
folder in '
${
POPLAR_SDK_DIR
}
'"
)
endif
()
list
(
APPEND CMAKE_PREFIX_PATH
${
POPART_DIR
}
)
list
(
APPEND CMAKE_PREFIX_PATH
${
POPART_DIR
}
)
set
(
ENABLE_POPART_CMD
"source
${
POPART_DIR
}
/enable.sh"
)
set
(
ENABLE_POPART_CMD
"source
${
POPART_DIR
}
/enable.sh"
)
find_package
(
popart REQUIRED COMPONENTS popart-only
)
find_package
(
popart REQUIRED COMPONENTS popart-only
)
...
@@ -56,6 +63,7 @@ if(WITH_IPU)
...
@@ -56,6 +63,7 @@ if(WITH_IPU)
if
(
NOT popart_FOUND
)
if
(
NOT popart_FOUND
)
message
(
FATAL_ERROR
"You must provide a path to a Popart build using -DPOPART_DIR=/path/to/popart/build"
)
message
(
FATAL_ERROR
"You must provide a path to a Popart build using -DPOPART_DIR=/path/to/popart/build"
)
endif
()
endif
()
add_definitions
(
-DONNX_NAMESPACE=onnx
)
add_definitions
(
-DONNX_NAMESPACE=onnx
)
add_custom_target
(
extern_poplar DEPENDS poplar popart-only
)
add_custom_target
(
extern_poplar DEPENDS poplar popart-only
)
endif
()
endif
()
paddle/fluid/framework/ir/ipu/forward_graph_extract_pass.cc
浏览文件 @
46161679
...
@@ -64,6 +64,19 @@ void ForwardGraphExtractPass::ApplyImpl(ir::Graph* graph) const {
...
@@ -64,6 +64,19 @@ void ForwardGraphExtractPass::ApplyImpl(ir::Graph* graph) const {
}
}
}
}
}
}
// learning_rate var
for
(
auto
*
node
:
all_ops
[
OpRole
::
kOptimize
])
{
if
(
node
->
Op
()
->
Inputs
().
count
(
"LearningRate"
)
&&
!
node
->
Op
()
->
Inputs
().
at
(
"LearningRate"
).
empty
())
{
auto
lr_var_name
=
node
->
Op
()
->
Inputs
().
at
(
"LearningRate"
).
front
();
for
(
auto
*
in_var
:
node
->
inputs
)
{
if
(
in_var
->
Name
()
==
lr_var_name
)
{
VLOG
(
10
)
<<
"found LearningRate var: "
<<
in_var
->
Name
();
forward_vars
.
insert
(
in_var
);
}
}
}
}
// control_vars & backward_vars
// control_vars & backward_vars
for
(
auto
*
node
:
graph
->
Nodes
())
{
for
(
auto
*
node
:
graph
->
Nodes
())
{
if
(
!
node
->
IsVar
())
{
if
(
!
node
->
IsVar
())
{
...
...
paddle/fluid/framework/ir/ipu/inference_process_pass.cc
浏览文件 @
46161679
...
@@ -51,11 +51,11 @@ void InferenceProcessPass::ApplyImpl(ir::Graph* graph) const {
...
@@ -51,11 +51,11 @@ void InferenceProcessPass::ApplyImpl(ir::Graph* graph) const {
if
(
num_ipus
>
1
)
{
if
(
num_ipus
>
1
)
{
ipu_strategy_instance_
->
need_avg_shard
=
true
;
ipu_strategy_instance_
->
need_avg_shard
=
true
;
ipu_strategy_instance_
->
popart_options
.
virtualGraphMode
=
ipu_strategy_instance_
->
popart_options
.
virtualGraphMode
=
p
latform
::
ipu
::
VirtualGraphMode
::
Manual
;
p
opart
::
VirtualGraphMode
::
Manual
;
}
else
{
}
else
{
ipu_strategy_instance_
->
need_avg_shard
=
false
;
ipu_strategy_instance_
->
need_avg_shard
=
false
;
ipu_strategy_instance_
->
popart_options
.
virtualGraphMode
=
ipu_strategy_instance_
->
popart_options
.
virtualGraphMode
=
p
latform
::
ipu
::
VirtualGraphMode
::
Off
;
p
opart
::
VirtualGraphMode
::
Off
;
}
}
// total num IPUs = num_ipus * replica_num
// total num IPUs = num_ipus * replica_num
ipu_strategy_instance_
->
num_ipus
=
num_ipus
*
replica_num
;
ipu_strategy_instance_
->
num_ipus
=
num_ipus
*
replica_num
;
...
...
paddle/fluid/operators/ipu/ipu_runtime_op.cc
浏览文件 @
46161679
...
@@ -46,8 +46,7 @@ class IpuRuntimeOp : public framework::OperatorBase {
...
@@ -46,8 +46,7 @@ class IpuRuntimeOp : public framework::OperatorBase {
for
(
size_t
i
=
0
;
i
<
outputs
.
size
();
++
i
)
{
for
(
size_t
i
=
0
;
i
<
outputs
.
size
();
++
i
)
{
auto
*
out
=
outputs
[
i
];
auto
*
out
=
outputs
[
i
];
if
(
out
->
dims
().
size
()
==
0
)
{
if
(
out
->
dims
().
size
()
==
0
)
{
auto
tensor_dtype
=
framework
::
TransToProtoVarType
(
out
->
dtype
());
auto
sizeof_dtype
=
framework
::
DataTypeSize
(
out
->
dtype
());
auto
sizeof_dtype
=
framework
::
SizeOfType
(
tensor_dtype
);
int64_t
dim
=
out
->
memory_size
()
/
sizeof_dtype
;
int64_t
dim
=
out
->
memory_size
()
/
sizeof_dtype
;
out
->
Resize
({
dim
});
out
->
Resize
({
dim
});
VLOG
(
10
)
<<
"set ipu_runtime_op output: "
<<
output_names
[
i
]
VLOG
(
10
)
<<
"set ipu_runtime_op output: "
<<
output_names
[
i
]
...
...
paddle/fluid/platform/device/ipu/ipu_backend.cc
浏览文件 @
46161679
...
@@ -102,7 +102,7 @@ void IpuBackend::SetCustomOps(
...
@@ -102,7 +102,7 @@ void IpuBackend::SetCustomOps(
compiler_
->
SetCustomOps
(
custom_ops
);
compiler_
->
SetCustomOps
(
custom_ops
);
}
}
void
IpuBackend
::
SaveMo
lde
Proto
(
const
std
::
string
&
path
)
{
void
IpuBackend
::
SaveMo
del
Proto
(
const
std
::
string
&
path
)
{
if
(
ipu_strategy_
->
is_training
&&
is_prepared_
)
{
if
(
ipu_strategy_
->
is_training
&&
is_prepared_
)
{
executor_
->
SaveModelToHost
(
path
);
executor_
->
SaveModelToHost
(
path
);
}
else
if
(
is_compiled_
)
{
}
else
if
(
is_compiled_
)
{
...
...
paddle/fluid/platform/device/ipu/ipu_backend.h
浏览文件 @
46161679
...
@@ -74,7 +74,7 @@ class IpuBackend {
...
@@ -74,7 +74,7 @@ class IpuBackend {
void
SetCustomOps
(
const
std
::
vector
<
IpuCustomOpIdentifier
>
&
custom_ops
);
void
SetCustomOps
(
const
std
::
vector
<
IpuCustomOpIdentifier
>
&
custom_ops
);
// save compiled model to onnx
// save compiled model to onnx
void
SaveMo
lde
Proto
(
const
std
::
string
&
path
);
void
SaveMo
del
Proto
(
const
std
::
string
&
path
);
private:
private:
void
Prepare
();
void
Prepare
();
...
...
paddle/fluid/platform/device/ipu/ipu_compiler.cc
浏览文件 @
46161679
...
@@ -297,8 +297,7 @@ void Compiler::LowerConstants(const Graph* graph, const Scope* scope) {
...
@@ -297,8 +297,7 @@ void Compiler::LowerConstants(const Graph* graph, const Scope* scope) {
tensor
->
Resize
(
ddim
);
tensor
->
Resize
(
ddim
);
auto
const_data
=
std
::
unique_ptr
<
popart
::
ConstVoidData
>
();
auto
const_data
=
std
::
unique_ptr
<
popart
::
ConstVoidData
>
();
popart
::
TensorInfo
tensor_info
(
popart
::
TensorInfo
tensor_info
(
PdDataType2PopartType
(
tensor
->
dtype
()),
VarType2PopartType
(
framework
::
TransToProtoVarType
(
tensor
->
dtype
())),
shape
);
shape
);
const_data
.
reset
(
new
popart
::
ConstVoidData
(
tensor
->
data
(),
tensor_info
));
const_data
.
reset
(
new
popart
::
ConstVoidData
(
tensor
->
data
(),
tensor_info
));
popart
::
TensorId
result
=
builder_
->
aiOnnxOpset11
().
constant
(
*
const_data
);
popart
::
TensorId
result
=
builder_
->
aiOnnxOpset11
().
constant
(
*
const_data
);
...
@@ -327,8 +326,7 @@ void Compiler::LowerWeights(const Graph* graph, const Scope* scope) {
...
@@ -327,8 +326,7 @@ void Compiler::LowerWeights(const Graph* graph, const Scope* scope) {
auto
var
=
scope
->
FindVar
(
var_name
);
auto
var
=
scope
->
FindVar
(
var_name
);
if
(
var
)
{
if
(
var
)
{
auto
tensor
=
var
->
Get
<
framework
::
LoDTensor
>
();
auto
tensor
=
var
->
Get
<
framework
::
LoDTensor
>
();
auto
dtype
=
VarType2PopartType
(
auto
dtype
=
PdDataType2PopartType
(
tensor
.
dtype
());
framework
::
TransToProtoVarType
(
tensor
.
dtype
()));
auto
shape
=
std
::
vector
<
int64_t
>
();
auto
shape
=
std
::
vector
<
int64_t
>
();
for
(
size_t
i
=
0
;
i
<
tensor
.
dims
().
size
();
++
i
)
{
for
(
size_t
i
=
0
;
i
<
tensor
.
dims
().
size
();
++
i
)
{
shape
.
push_back
(
tensor
.
dims
().
at
(
i
));
shape
.
push_back
(
tensor
.
dims
().
at
(
i
));
...
...
paddle/fluid/platform/device/ipu/ipu_executor.cc
浏览文件 @
46161679
...
@@ -154,7 +154,12 @@ void Executor::AcquireDevice() {
...
@@ -154,7 +154,12 @@ void Executor::AcquireDevice() {
bool
use_ipu_model
=
GetBoolEnv
(
"POPLAR_IPUMODEL"
);
bool
use_ipu_model
=
GetBoolEnv
(
"POPLAR_IPUMODEL"
);
if
(
use_ipu_model
)
{
if
(
use_ipu_model
)
{
std
::
map
<
std
::
string
,
std
::
string
>
deviceOpts
{{
"numIPUs"
,
"1 "
}};
std
::
map
<
std
::
string
,
std
::
string
>
deviceOpts
{
{
"numIPUs"
,
std
::
to_string
(
ipu_strategy_
->
num_ipus
),
},
{
"ipuVersion"
,
"ipu2"
},
};
device_
=
popart
::
DeviceManager
::
createDeviceManager
().
createIpuModelDevice
(
device_
=
popart
::
DeviceManager
::
createDeviceManager
().
createIpuModelDevice
(
deviceOpts
);
deviceOpts
);
}
else
{
}
else
{
...
@@ -210,8 +215,8 @@ void Executor::SetWeightsIO() {
...
@@ -210,8 +215,8 @@ void Executor::SetWeightsIO() {
void
Executor
::
ConvertWeights
(
bool
align_to_popart
)
{
void
Executor
::
ConvertWeights
(
bool
align_to_popart
)
{
for
(
auto
weight_pair
:
executor_resources_
->
weights_and_opt_state
)
{
for
(
auto
weight_pair
:
executor_resources_
->
weights_and_opt_state
)
{
auto
paddle_var
=
scope_
->
GetVar
(
weight_pair
.
second
);
auto
paddle_var
=
scope_
->
GetVar
(
weight_pair
.
second
);
auto
paddle_var_dtype
=
Var
Type2PopartType
(
auto
paddle_var_dtype
=
PdData
Type2PopartType
(
paddle_var
->
GetMutable
<
framework
::
LoDTensor
>
()
->
type
());
paddle_var
->
GetMutable
<
framework
::
LoDTensor
>
()
->
d
type
());
PADDLE_ENFORCE_EQ
((
paddle_var_dtype
==
popart
::
DataType
::
FLOAT
||
PADDLE_ENFORCE_EQ
((
paddle_var_dtype
==
popart
::
DataType
::
FLOAT
||
paddle_var_dtype
==
popart
::
DataType
::
FLOAT16
),
paddle_var_dtype
==
popart
::
DataType
::
FLOAT16
),
...
...
paddle/fluid/platform/device/ipu/ipu_strategy.cc
浏览文件 @
46161679
...
@@ -13,23 +13,451 @@ See the License for the specific language governing permissions and
...
@@ -13,23 +13,451 @@ See the License for the specific language governing permissions and
limitations under the License. */
limitations under the License. */
#include "paddle/fluid/platform/device/ipu/ipu_strategy.h"
#include "paddle/fluid/platform/device/ipu/ipu_strategy.h"
#include <glog/logging.h>
namespace
{
template
<
typename
Value
,
typename
Lambda
>
void
RegisterSetter
(
std
::
map
<
std
::
string
,
std
::
function
<
void
(
Value
)
>>&
options
,
// NOLINT
const
std
::
string
&
name
,
Lambda
setter
)
{
options
[
name
]
=
setter
;
}
template
<
typename
Value
,
typename
Lambda
>
void
RegisterGetter
(
std
::
map
<
std
::
string
,
std
::
function
<
Value
()
>>&
options
,
// NOLINT
std
::
map
<
std
::
string
,
std
::
string
>&
options_type
,
// NOLINT
const
std
::
string
&
name
,
const
std
::
string
&
type_str
,
Lambda
getter
)
{
options
[
name
]
=
getter
;
options_type
[
name
]
=
type_str
;
}
}
// namespace
namespace
paddle
{
namespace
paddle
{
namespace
platform
{
namespace
platform
{
namespace
ipu
{
namespace
ipu
{
void
IpuStrategy
::
enablePattern
(
const
std
::
string
&
t
)
{
IpuStrategy
::
IpuStrategy
()
{
#define ADD_BOOL_OPTION(name) \
RegisterSetter(bool_options, #name, [&](bool value) { name = value; }); \
RegisterGetter(options_getter, options_type, #name, "bool", \
[&]() { return std::to_string(name); })
#define ADD_UINT64_OPTION(name) \
RegisterSetter(uint64_options, #name, \
[&](std::uint64_t value) { name = value; }); \
RegisterGetter(options_getter, options_type, #name, "uint64", \
[&]() { return std::to_string(name); })
#define ADD_DOUBLE_OPTION(name) \
RegisterSetter(double_options, #name, [&](double value) { name = value; }); \
RegisterGetter(options_getter, options_type, #name, "double", \
[&]() { return std::to_string(name); })
#define ADD_STRING_OPTION(name) \
RegisterSetter(string_options, #name, \
[&](const std::string& value) { name = value; }); \
RegisterGetter(options_getter, options_type, #name, "string", \
[&]() { return name; })
ADD_BOOL_OPTION
(
is_training
);
ADD_BOOL_OPTION
(
save_init_onnx
);
ADD_BOOL_OPTION
(
save_onnx_checkpoint
);
ADD_BOOL_OPTION
(
need_avg_shard
);
ADD_BOOL_OPTION
(
enable_fp16
);
ADD_UINT64_OPTION
(
num_ipus
);
ADD_UINT64_OPTION
(
batches_per_step
);
ADD_UINT64_OPTION
(
micro_batch_size
);
ADD_UINT64_OPTION
(
save_per_n_step
);
ADD_DOUBLE_OPTION
(
available_memory_proportion
);
ADD_DOUBLE_OPTION
(
loss_scaling
);
ADD_DOUBLE_OPTION
(
max_weight_norm
);
#undef ADD_STRING_OPTION
#undef ADD_DOUBLE_OPTION
#undef ADD_UINT64_OPTION
#undef ADD_BOOL_OPTION
#define ADD_POPART_ENUM_OPTION_ALIAS(name, aliased_name, EnumType) \
RegisterSetter(uint64_options, #name, [&](std::uint64_t value) { \
PADDLE_ENFORCE_LT( \
value, static_cast<std::uint64_t>(popart::EnumType::N), \
errors::InvalidArgument("Value for %s out of range", #EnumType)); \
popart_options.aliased_name = static_cast<popart::EnumType>(value); \
}); \
RegisterGetter(options_getter, options_type, #name, "uint64", [&]() { \
return std::to_string( \
static_cast<std::uint64_t>(popart_options.aliased_name)); \
})
#define ADD_POPART_BOOL_OPTION_ALIAS(name, aliased_name) \
RegisterSetter(bool_options, #name, \
[&](bool value) { popart_options.aliased_name = value; }); \
RegisterGetter(options_getter, options_type, #name, "bool", [&]() { \
return std::to_string(popart_options.aliased_name); \
})
#define ADD_POPART_UINT64_OPTION_ALIAS(name, aliased_name) \
RegisterSetter(uint64_options, #name, [&](std::uint64_t value) { \
popart_options.aliased_name = value; \
}); \
RegisterGetter(options_getter, options_type, #name, "uint64", [&]() { \
return std::to_string(popart_options.aliased_name); \
})
#define ADD_POPART_DOUBLE_OPTION_ALIAS(name, aliased_name) \
RegisterSetter(double_options, #name, \
[&](double value) { popart_options.aliased_name = value; }); \
RegisterGetter(options_getter, options_type, #name, "double", [&]() { \
return std::to_string(popart_options.aliased_name); \
})
#define ADD_POPART_STRING_OPTION_ALIAS(name, aliased_name) \
RegisterSetter(string_options, #name, [&](const std::string& value) { \
popart_options.aliased_name = value; \
}); \
RegisterGetter(options_getter, options_type, #name, "string", \
[&]() { return popart_options.aliased_name; })
#define ADD_POPART_ENUM_OPTION(name, EnumType) \
ADD_POPART_ENUM_OPTION_ALIAS(name, name, EnumType)
#define ADD_POPART_BOOL_OPTION(name) ADD_POPART_BOOL_OPTION_ALIAS(name, name)
#define ADD_POPART_UINT64_OPTION(name) \
ADD_POPART_UINT64_OPTION_ALIAS(name, name)
#define ADD_POPART_DOUBLE_OPTION(name) \
ADD_POPART_DOUBLE_OPTION_ALIAS(name, name)
#define ADD_POPART_STRING_OPTION(name) \
ADD_POPART_STRING_OPTION_ALIAS(name, name)
ADD_POPART_ENUM_OPTION
(
autodiffSettings
.
stitchStrategy
,
AutodiffStitchStrategy
);
ADD_POPART_ENUM_OPTION
(
batchSerializationSettings
.
transformContext
,
BatchSerializationTransformContext
);
ADD_POPART_ENUM_OPTION
(
batchSerializationSettings
.
method
,
BatchSerializationMethod
);
ADD_POPART_ENUM_OPTION
(
batchSerializationSettings
.
batchSchedule
,
BatchSerializationBatchSchedule
);
ADD_POPART_ENUM_OPTION
(
autoRecomputation
,
RecomputationType
);
ADD_POPART_ENUM_OPTION
(
mergeVarUpdate
,
MergeVarUpdateType
);
ADD_POPART_ENUM_OPTION
(
virtualGraphMode
,
VirtualGraphMode
);
ADD_POPART_ENUM_OPTION
(
syntheticDataMode
,
SyntheticDataMode
);
ADD_POPART_ENUM_OPTION
(
subgraphCopyingStrategy
,
SubgraphCopyingStrategy
);
ADD_POPART_ENUM_OPTION
(
accumulationAndReplicationReductionType
,
ReductionType
);
ADD_POPART_ENUM_OPTION
(
meanAccumulationAndReplicationReductionStrategy
,
MeanReductionStrategy
);
ADD_POPART_STRING_OPTION
(
logDir
);
ADD_POPART_STRING_OPTION
(
cachePath
);
ADD_POPART_STRING_OPTION
(
partialsTypeMatMuls
);
ADD_POPART_STRING_OPTION
(
customCodeletCompileFlags
);
ADD_POPART_STRING_OPTION
(
serializedPoprithmsShiftGraphsDir
);
ADD_POPART_STRING_OPTION
(
kahnTieBreaker
);
ADD_POPART_UINT64_OPTION
(
executionPhaseSettings
.
phases
);
ADD_POPART_UINT64_OPTION
(
executionPhaseSettings
.
stages
);
ADD_POPART_UINT64_OPTION
(
batchSerializationSettings
.
factor
);
ADD_POPART_UINT64_OPTION
(
firstDotOp
);
ADD_POPART_UINT64_OPTION
(
finalDotOp
);
ADD_POPART_UINT64_OPTION
(
numIOTiles
);
ADD_POPART_UINT64_OPTION
(
mergeVarUpdateMemThreshold
);
ADD_POPART_UINT64_OPTION
(
looseThresholdAtPeak
);
ADD_POPART_UINT64_OPTION
(
accumulationFactor
);
ADD_POPART_UINT64_OPTION
(
swapLimitScheduler
);
ADD_POPART_UINT64_OPTION
(
globalReplicationFactor
);
ADD_POPART_UINT64_OPTION
(
globalReplicaOffset
);
ADD_POPART_UINT64_OPTION
(
defaultPrefetchBufferingDepth
);
ADD_POPART_UINT64_OPTION
(
compilationProgressTotal
);
ADD_POPART_UINT64_OPTION
(
transitiveClosureOptimizationThreshold
);
ADD_POPART_BOOL_OPTION
(
batchSerializationSettings
.
concatOnVirtualGraphChange
);
ADD_POPART_BOOL_OPTION
(
batchSerializationSettings
.
concatOnExecutionPhaseChange
);
ADD_POPART_BOOL_OPTION
(
batchSerializationSettings
.
concatOnPipelineStageChange
);
ADD_POPART_BOOL_OPTION
(
strictOpVersions
);
ADD_POPART_BOOL_OPTION
(
opxAliasChecking
);
ADD_POPART_BOOL_OPTION
(
opxModifyChecking
);
ADD_POPART_BOOL_OPTION
(
dotOpNames
);
ADD_POPART_BOOL_OPTION
(
exportPoplarComputationGraph
);
ADD_POPART_BOOL_OPTION
(
exportPoplarVertexGraph
);
ADD_POPART_BOOL_OPTION
(
separateCallOpPdfs
);
ADD_POPART_BOOL_OPTION
(
enableOutlining
);
ADD_POPART_BOOL_OPTION
(
enableOutliningCopyCostPruning
);
ADD_POPART_BOOL_OPTION
(
rearrangeAnchorsOnHost
);
ADD_POPART_BOOL_OPTION
(
enablePrefetchDatastreams
);
ADD_POPART_BOOL_OPTION
(
enableNonStableSoftmax
);
ADD_POPART_BOOL_OPTION
(
enableReplicatedGraphs
);
ADD_POPART_BOOL_OPTION
(
enableGradientAccumulation
);
ADD_POPART_BOOL_OPTION
(
instrumentWithHardwareCycleCounter
);
ADD_POPART_BOOL_OPTION
(
enablePipelining
);
ADD_POPART_BOOL_OPTION_ALIAS
(
enable_pipelining
,
enablePipelining
);
ADD_POPART_BOOL_OPTION
(
disableGradAccumulationTensorStreams
);
ADD_POPART_BOOL_OPTION
(
compileEngine
);
ADD_POPART_BOOL_OPTION
(
constantWeights
);
ADD_POPART_BOOL_OPTION
(
enableEngineCaching
);
ADD_POPART_BOOL_OPTION
(
enableMergeExchange
);
ADD_POPART_BOOL_OPTION
(
enableFloatingPointChecks
);
ADD_POPART_BOOL_OPTION
(
enableStochasticRounding
);
ADD_POPART_BOOL_OPTION_ALIAS
(
enable_stochastic_rounding
,
enableStochasticRounding
);
ADD_POPART_BOOL_OPTION
(
explicitRecomputation
);
ADD_POPART_BOOL_OPTION
(
enableExplicitMainLoops
);
ADD_POPART_BOOL_OPTION
(
useHostCopyOps
);
ADD_POPART_BOOL_OPTION
(
aliasZeroCopy
);
ADD_POPART_BOOL_OPTION
(
delayVarUpdates
);
ADD_POPART_BOOL_OPTION
(
enableFullyConnectedPass
);
ADD_POPART_BOOL_OPTION
(
enableSerializedMatmuls
);
ADD_POPART_BOOL_OPTION
(
enableStableNorm
);
ADD_POPART_BOOL_OPTION
(
decomposeGradSum
);
ADD_POPART_BOOL_OPTION
(
enableDistributedReplicatedGraphs
);
ADD_POPART_BOOL_OPTION
(
groupHostSync
);
ADD_POPART_BOOL_OPTION
(
automaticLossScalingSettings
.
enabled
);
ADD_POPART_BOOL_OPTION
(
instrumentWithHardwareCycleCounter
);
ADD_POPART_BOOL_OPTION
(
enableSupportedDataTypeCasting
);
ADD_POPART_BOOL_OPTION
(
groupNormStridedChannelGrouping
);
ADD_POPART_BOOL_OPTION
(
scheduleNonWeightUpdateGradientConsumersEarly
);
ADD_POPART_DOUBLE_OPTION
(
outlineSequenceBreakCost
);
ADD_POPART_DOUBLE_OPTION
(
outlineThreshold
);
ADD_POPART_DOUBLE_OPTION
(
timeLimitScheduler
);
ADD_POPART_DOUBLE_OPTION
(
automaticLossScalingSettings
.
binEdgeLocation
);
ADD_POPART_DOUBLE_OPTION
(
automaticLossScalingSettings
.
thresholdUpperCountProportion
);
#undef ADD_POPART_STRING_OPTION
#undef ADD_POPART_DOUBLE_OPTION
#undef ADD_POPART_UINT64_OPTION
#undef ADD_POPART_BOOL_OPTION
#undef ADD_POPART_ENUM_OPTION
#undef ADD_POPART_STRING_OPTION_ALIAS
#undef ADD_POPART_DOUBLE_OPTION_ALIAS
#undef ADD_POPART_UINT64_OPTION_ALIAS
#undef ADD_POPART_BOOL_OPTION_ALIAS
#undef ADD_POPART_ENUM_OPTION_ALIAS
RegisterSetter
(
bool_options
,
"enable_manual_shard"
,
[
&
](
bool
value
)
{
if
(
value
)
{
popart_options
.
virtualGraphMode
=
popart
::
VirtualGraphMode
::
Manual
;
}
else
{
popart_options
.
virtualGraphMode
=
popart
::
VirtualGraphMode
::
Off
;
}
});
RegisterGetter
(
options_getter
,
options_type
,
"enable_manual_shard"
,
"bool"
,
[
&
]()
{
return
std
::
to_string
(
popart_options
.
virtualGraphMode
==
popart
::
VirtualGraphMode
::
Manual
);
});
RegisterSetter
(
bool_options
,
"enable_half_partial"
,
[
&
](
bool
value
)
{
if
(
value
)
{
popart_options
.
partialsTypeMatMuls
=
"half"
;
}
else
{
popart_options
.
partialsTypeMatMuls
=
"float"
;
}
});
RegisterGetter
(
options_getter
,
options_type
,
"enable_half_partial"
,
"bool"
,
[
&
]()
{
return
std
::
to_string
(
popart_options
.
partialsTypeMatMuls
==
"half"
);
});
RegisterSetter
(
container_options
,
"dotChecks"
,
[
&
](
const
std
::
pair
<
std
::
string
,
std
::
string
>&
p
)
{
std
::
uint64_t
value
=
std
::
stoul
(
p
.
first
);
popart_options
.
dotChecks
.
insert
(
static_cast
<
popart
::
DotCheck
>
(
value
));
});
RegisterGetter
(
vector_options_getter
,
options_type
,
"dotChecks"
,
"vector"
,
[
&
]()
{
std
::
vector
<
std
::
string
>
res
;
for
(
auto
x
:
popart_options
.
dotChecks
)
{
res
.
push_back
(
std
::
to_string
(
static_cast
<
std
::
uint64_t
>
(
x
)));
}
return
res
;
});
RegisterSetter
(
container_options
,
"hardwareInstrumentations"
,
[
&
](
const
std
::
pair
<
std
::
string
,
std
::
string
>&
p
)
{
std
::
uint64_t
value
=
std
::
stoul
(
p
.
first
);
popart_options
.
hardwareInstrumentations
.
insert
(
static_cast
<
popart
::
Instrumentation
>
(
value
));
});
RegisterGetter
(
vector_options_getter
,
options_type
,
"hardwareInstrumentations"
,
"vector"
,
[
&
]()
{
std
::
vector
<
std
::
string
>
res
;
for
(
auto
x
:
popart_options
.
hardwareInstrumentations
)
{
res
.
push_back
(
std
::
to_string
(
static_cast
<
std
::
uint64_t
>
(
x
)));
}
return
res
;
});
RegisterSetter
(
container_options
,
"customCodelets"
,
[
&
](
const
std
::
pair
<
std
::
string
,
std
::
string
>&
p
)
{
popart_options
.
customCodelets
.
push_back
(
p
.
first
);
});
RegisterGetter
(
vector_options_getter
,
options_type
,
"customCodelets"
,
"vector"
,
[
&
]()
{
std
::
vector
<
std
::
string
>
res
;
for
(
auto
x
:
popart_options
.
customCodelets
)
{
res
.
push_back
(
x
);
}
return
res
;
});
RegisterSetter
(
container_options
,
"engineOptions"
,
[
&
](
const
std
::
pair
<
std
::
string
,
std
::
string
>&
p
)
{
popart_options
.
engineOptions
.
emplace
(
p
);
});
RegisterGetter
(
map_options_getter
,
options_type
,
"engineOptions"
,
"map"
,
[
&
]()
{
return
popart_options
.
engineOptions
;
});
RegisterSetter
(
container_options
,
"reportOptions"
,
[
&
](
const
std
::
pair
<
std
::
string
,
std
::
string
>&
p
)
{
popart_options
.
reportOptions
.
emplace
(
p
);
});
RegisterGetter
(
map_options_getter
,
options_type
,
"reportOptions"
,
"map"
,
[
&
]()
{
return
popart_options
.
reportOptions
;
});
RegisterSetter
(
container_options
,
"convolutionOptions"
,
[
&
](
const
std
::
pair
<
std
::
string
,
std
::
string
>&
p
)
{
popart_options
.
convolutionOptions
.
emplace
(
p
);
});
RegisterGetter
(
map_options_getter
,
options_type
,
"convolutionOptions"
,
"map"
,
[
&
]()
{
return
popart_options
.
convolutionOptions
;
});
RegisterSetter
(
container_options
,
"lstmOptions"
,
[
&
](
const
std
::
pair
<
std
::
string
,
std
::
string
>&
p
)
{
popart_options
.
lstmOptions
.
emplace
(
p
);
});
RegisterGetter
(
map_options_getter
,
options_type
,
"lstmOptions"
,
"map"
,
[
&
]()
{
return
popart_options
.
lstmOptions
;
});
RegisterSetter
(
container_options
,
"gclOptions"
,
[
&
](
const
std
::
pair
<
std
::
string
,
std
::
string
>&
p
)
{
popart_options
.
gclOptions
.
emplace
(
p
);
});
RegisterGetter
(
map_options_getter
,
options_type
,
"gclOptions"
,
"map"
,
[
&
]()
{
return
popart_options
.
gclOptions
;
});
}
void
IpuStrategy
::
AddBoolOption
(
const
std
::
string
&
option
,
bool
value
)
{
set
(
option
,
value
,
bool_options
,
"bool"
);
}
void
IpuStrategy
::
AddUint64Option
(
const
std
::
string
&
option
,
std
::
uint64_t
value
)
{
set
(
option
,
value
,
uint64_options
,
"uint64"
);
}
void
IpuStrategy
::
AddDoubleOption
(
const
std
::
string
&
option
,
double
value
)
{
set
(
option
,
value
,
double_options
,
"double"
);
}
void
IpuStrategy
::
AddStringOption
(
const
std
::
string
&
option
,
const
std
::
string
&
value
)
{
set
(
option
,
value
,
string_options
,
"string"
);
}
void
IpuStrategy
::
InsertStringOption
(
const
std
::
string
&
option
,
const
std
::
string
&
value
)
{
set
(
option
,
std
::
pair
<
std
::
string
,
std
::
string
>
(
value
,
""
),
container_options
,
"vector"
);
}
void
IpuStrategy
::
InsertStringPairOption
(
const
std
::
string
&
option
,
const
std
::
string
&
key
,
const
std
::
string
&
value
)
{
set
(
option
,
std
::
pair
<
std
::
string
,
std
::
string
>
(
key
,
value
),
container_options
,
"map"
);
}
void
IpuStrategy
::
SetTensorLocation
(
const
std
::
string
&
tensor
,
const
std
::
string
&
opt
,
std
::
uint64_t
value
)
{
VLOG
(
10
)
<<
"Setting "
<<
opt
<<
" to "
<<
value
<<
" for location "
<<
tensor
;
popart
::
TensorLocationSettings
*
settings
;
if
(
tensor
==
"location_activation"
)
{
settings
=
&
popart_options
.
activationTensorLocationSettings
;
}
else
if
(
tensor
==
"location_weight"
)
{
settings
=
&
popart_options
.
weightTensorLocationSettings
;
}
else
if
(
tensor
==
"location_optimizer"
)
{
settings
=
&
popart_options
.
optimizerStateTensorLocationSettings
;
}
else
if
(
tensor
==
"location_accumulator"
)
{
settings
=
&
popart_options
.
accumulatorTensorLocationSettings
;
}
else
{
PADDLE_THROW
(
platform
::
errors
::
InvalidArgument
(
"Unknown tensor location: %s"
,
tensor
));
}
if
(
opt
==
"minElementsForOffChip"
)
{
settings
->
minElementsForOffChip
=
value
;
}
else
if
(
opt
==
"minElementsForReplicatedTensorSharding"
)
{
settings
->
minElementsForReplicatedTensorSharding
=
value
;
}
else
if
(
opt
==
"onChip"
)
{
settings
->
location
.
storage
=
value
>
0
?
popart
::
TensorStorage
::
OnChip
:
popart
::
TensorStorage
::
OffChip
;
}
else
if
(
opt
==
"useReplicatedTensorSharding"
)
{
settings
->
location
.
replicatedTensorSharding
=
value
>
0
?
popart
::
ReplicatedTensorSharding
::
On
:
popart
::
ReplicatedTensorSharding
::
Off
;
}
else
if
(
opt
==
"useIOTilesToLoad"
)
{
settings
->
location
.
loadTileSet
=
value
>
0
?
popart
::
TileSet
::
IO
:
popart
::
TileSet
::
Compute
;
}
else
if
(
opt
==
"useIOTilesToStore"
)
{
settings
->
location
.
storageTileSet
=
value
>
0
?
popart
::
TileSet
::
IO
:
popart
::
TileSet
::
Compute
;
}
else
{
PADDLE_THROW
(
platform
::
errors
::
InvalidArgument
(
"Unknown option ' %s' for tensor location: %s"
,
opt
,
tensor
));
}
}
std
::
string
IpuStrategy
::
GetOption
(
const
std
::
string
&
option
)
{
return
get
(
option
,
options_getter
);
}
std
::
vector
<
std
::
string
>
IpuStrategy
::
GetVectorOption
(
const
std
::
string
&
option
)
{
return
get
(
option
,
vector_options_getter
);
}
std
::
map
<
std
::
string
,
std
::
string
>
IpuStrategy
::
GetMapOption
(
const
std
::
string
&
option
)
{
return
get
(
option
,
map_options_getter
);
}
std
::
string
IpuStrategy
::
GetOptionType
(
const
std
::
string
&
option
)
{
return
options_type
[
option
];
}
void
IpuStrategy
::
EnablePattern
(
const
std
::
string
&
t
)
{
VLOG
(
10
)
<<
"enable popart pattern: "
<<
t
;
VLOG
(
10
)
<<
"enable popart pattern: "
<<
t
;
popart_patterns
.
enablePattern
(
t
,
true
);
popart_patterns
.
enablePattern
(
t
,
true
);
}
}
void
IpuStrategy
::
d
isablePattern
(
const
std
::
string
&
t
)
{
void
IpuStrategy
::
D
isablePattern
(
const
std
::
string
&
t
)
{
VLOG
(
10
)
<<
"disable popart pattern: "
<<
t
;
VLOG
(
10
)
<<
"disable popart pattern: "
<<
t
;
popart_patterns
.
enablePattern
(
t
,
false
);
popart_patterns
.
enablePattern
(
t
,
false
);
}
}
const
bool
IpuStrategy
::
i
sPatternEnabled
(
const
std
::
string
&
t
)
{
const
bool
IpuStrategy
::
I
sPatternEnabled
(
const
std
::
string
&
t
)
{
return
popart_patterns
.
isPatternEnabled
(
t
);
return
popart_patterns
.
isPatternEnabled
(
t
);
}
}
...
...
paddle/fluid/platform/device/ipu/ipu_strategy.h
浏览文件 @
46161679
...
@@ -14,50 +14,19 @@ limitations under the License. */
...
@@ -14,50 +14,19 @@ limitations under the License. */
#pragma once
#pragma once
#include <popart/
op
.hpp>
#include <popart/
patterns/patterns
.hpp>
#include <popart/sessionoptions.hpp>
#include <popart/sessionoptions.hpp>
#include <popart/tensorlocation.hpp>
#include <popart/tensorlocation.hpp>
#include "p
opart/patterns/patterns.hpp
"
#include "p
addle/fluid/platform/enforce.h
"
namespace
paddle
{
namespace
paddle
{
namespace
platform
{
namespace
platform
{
namespace
ipu
{
namespace
ipu
{
using
VirtualGraphMode
=
popart
::
VirtualGraphMode
;
using
RecomputationType
=
popart
::
RecomputationType
;
struct
IpuStrategy
{
struct
IpuStrategy
{
IpuStrategy
()
{
IpuStrategy
();
// we always save optimizer state to OffChip and enable rts for saving
// memory
auto
storage
=
popart
::
TensorLocation
(
popart
::
TensorStorage
::
OffChip
,
popart
::
ReplicatedTensorSharding
::
On
);
popart_options
.
optimizerStateTensorLocationSettings
=
popart
::
TensorLocationSettings
(
storage
);
// We divide the accumulationFactor and replicatedGraphCount after all
// reduce
popart_options
.
accumulationAndReplicationReductionType
=
popart
::
ReductionType
::
Mean
;
popart_options
.
meanAccumulationAndReplicationReductionStrategy
=
popart
::
MeanReductionStrategy
::
Post
;
popart_options
.
enableFloatingPointChecks
=
false
;
// A directory for log traces to be written into.
popart_options
.
logDir
=
"popart_log"
;
}
~
IpuStrategy
()
{}
// Number ipus total needed, replica * ipu_per_replica
int
num_ipus
=
1
;
// batches per step
int
batches_per_step
=
1
;
// micro batch-size
int
micro_batch_size
=
1
;
// TODO(alleng) create PaddleOptions
// training flag, true for training
// training flag, true for training
bool
is_training
=
true
;
bool
is_training
=
true
;
...
@@ -67,15 +36,25 @@ struct IpuStrategy {
...
@@ -67,15 +36,25 @@ struct IpuStrategy {
// save the trained model
// save the trained model
bool
save_onnx_checkpoint
=
false
;
bool
save_onnx_checkpoint
=
false
;
// save paddle model per n steps
int
save_per_n_step
=
1
;
// average sharding, debugging used
// average sharding, debugging used
bool
need_avg_shard
=
false
;
bool
need_avg_shard
=
false
;
// flag for fp16, true for pure fp16
// flag for fp16, true for pure fp16
bool
enable_fp16
=
false
;
bool
enable_fp16
=
false
;
// Number ipus total needed, replica * ipu_per_replica
int
num_ipus
=
1
;
// batches per step
int
batches_per_step
=
1
;
// micro batch-size
int
micro_batch_size
=
1
;
// save paddle model per n steps
int
save_per_n_step
=
1
;
// TODO(alleng) remove this param
// available memory proportion, 0.0f for disable
// available memory proportion, 0.0f for disable
float
available_memory_proportion
=
0.0
f
;
float
available_memory_proportion
=
0.0
f
;
...
@@ -88,12 +67,71 @@ struct IpuStrategy {
...
@@ -88,12 +67,71 @@ struct IpuStrategy {
// popart session option
// popart session option
popart
::
SessionOptions
popart_options
;
popart
::
SessionOptions
popart_options
;
// popart pattern manager
popart
::
Patterns
popart_patterns
;
popart
::
Patterns
popart_patterns
;
private:
std
::
map
<
std
::
string
,
std
::
function
<
void
(
bool
)
>>
bool_options
;
std
::
map
<
std
::
string
,
std
::
function
<
void
(
std
::
uint64_t
)
>>
uint64_options
;
std
::
map
<
std
::
string
,
std
::
function
<
void
(
double
)
>>
double_options
;
std
::
map
<
std
::
string
,
std
::
function
<
void
(
std
::
string
)
>>
string_options
;
std
::
map
<
std
::
string
,
std
::
function
<
void
(
std
::
pair
<
std
::
string
,
std
::
string
>
)
>>
container_options
;
std
::
map
<
std
::
string
,
std
::
function
<
std
::
string
()
>>
options_getter
;
std
::
map
<
std
::
string
,
std
::
function
<
std
::
vector
<
std
::
string
>
()
>>
vector_options_getter
;
std
::
map
<
std
::
string
,
std
::
function
<
std
::
map
<
std
::
string
,
std
::
string
>
()
>>
map_options_getter
;
std
::
map
<
std
::
string
,
std
::
string
>
options_type
;
template
<
typename
ValueType
>
void
set
(
const
std
::
string
&
key
,
ValueType
value
,
std
::
map
<
std
::
string
,
std
::
function
<
void
(
ValueType
)
>>
&
options
,
// NOLINT
const
std
::
string
&
type_str
)
{
auto
it
=
options
.
find
(
key
);
PADDLE_ENFORCE_NE
(
it
,
options
.
end
(),
platform
::
errors
::
InvalidArgument
(
"Cannot find option: %s, type: %s "
"when setting IpuStrategy options"
,
key
,
type_str
));
it
->
second
(
value
);
}
template
<
typename
ValueType
>
ValueType
get
(
const
std
::
string
&
key
,
std
::
map
<
std
::
string
,
std
::
function
<
ValueType
()
>>
&
options
)
{
// NOLINT
auto
it
=
options
.
find
(
key
);
PADDLE_ENFORCE_NE
(
it
,
options
.
end
(),
platform
::
errors
::
InvalidArgument
(
"Cannot find option name: %s when trying to get IpuStrategy option"
,
key
));
return
it
->
second
();
}
public:
public:
void
enablePattern
(
const
std
::
string
&
t
);
void
AddBoolOption
(
const
std
::
string
&
option
,
bool
value
);
void
disablePattern
(
const
std
::
string
&
t
);
void
AddUint64Option
(
const
std
::
string
&
option
,
std
::
uint64_t
value
);
const
bool
isPatternEnabled
(
const
std
::
string
&
t
);
void
AddDoubleOption
(
const
std
::
string
&
option
,
double
value
);
void
AddStringOption
(
const
std
::
string
&
option
,
const
std
::
string
&
value
);
void
InsertStringOption
(
const
std
::
string
&
option
,
const
std
::
string
&
value
);
void
InsertStringPairOption
(
const
std
::
string
&
option
,
const
std
::
string
&
key
,
const
std
::
string
&
value
);
void
SetTensorLocation
(
const
std
::
string
&
tensor
,
const
std
::
string
&
option
,
std
::
uint64_t
value
);
std
::
string
GetOption
(
const
std
::
string
&
);
std
::
vector
<
std
::
string
>
GetVectorOption
(
const
std
::
string
&
);
std
::
map
<
std
::
string
,
std
::
string
>
GetMapOption
(
const
std
::
string
&
);
std
::
string
GetOptionType
(
const
std
::
string
&
);
void
EnablePattern
(
const
std
::
string
&
t
);
void
DisablePattern
(
const
std
::
string
&
t
);
const
bool
IsPatternEnabled
(
const
std
::
string
&
t
);
};
};
}
// namespace ipu
}
// namespace ipu
...
...
paddle/fluid/platform/device/ipu/ipu_utils.cc
浏览文件 @
46161679
...
@@ -22,7 +22,7 @@ namespace ipu {
...
@@ -22,7 +22,7 @@ namespace ipu {
void
*
PaddleIArray
::
data
()
{
return
tensor_
.
data
();
}
void
*
PaddleIArray
::
data
()
{
return
tensor_
.
data
();
}
popart
::
DataType
PaddleIArray
::
dataType
()
const
{
popart
::
DataType
PaddleIArray
::
dataType
()
const
{
return
VarType2PopartType
(
tensor_
.
type
());
return
PdDataType2PopartType
(
tensor_
.
d
type
());
}
}
std
::
size_t
PaddleIArray
::
rank
()
const
{
return
tensor_
.
dims
().
size
();
}
std
::
size_t
PaddleIArray
::
rank
()
const
{
return
tensor_
.
dims
().
size
();
}
...
@@ -66,11 +66,44 @@ popart::DataType VarType2PopartType(
...
@@ -66,11 +66,44 @@ popart::DataType VarType2PopartType(
case
framework
::
proto
::
VarType
::
COMPLEX128
:
case
framework
::
proto
::
VarType
::
COMPLEX128
:
return
popart
::
DataType
::
COMPLEX128
;
return
popart
::
DataType
::
COMPLEX128
;
default:
default:
PADDLE_THROW
(
paddle
::
platform
::
errors
::
Un
available
(
PADDLE_THROW
(
paddle
::
platform
::
errors
::
Un
implemented
(
"Unsupported Paddle var type."
));
"Unsupported Paddle var type."
));
}
}
}
}
popart
::
DataType
PdDataType2PopartType
(
const
paddle
::
experimental
::
DataType
type
)
{
switch
(
type
)
{
case
paddle
::
experimental
::
DataType
::
UINT8
:
return
popart
::
DataType
::
UINT8
;
case
paddle
::
experimental
::
DataType
::
INT8
:
return
popart
::
DataType
::
INT8
;
case
paddle
::
experimental
::
DataType
::
INT16
:
return
popart
::
DataType
::
INT16
;
case
paddle
::
experimental
::
DataType
::
INT32
:
return
popart
::
DataType
::
INT32
;
case
paddle
::
experimental
::
DataType
::
INT64
:
return
popart
::
DataType
::
INT64
;
case
paddle
::
experimental
::
DataType
::
BOOL
:
return
popart
::
DataType
::
BOOL
;
case
paddle
::
experimental
::
DataType
::
FLOAT64
:
return
popart
::
DataType
::
DOUBLE
;
case
paddle
::
experimental
::
DataType
::
FLOAT32
:
return
popart
::
DataType
::
FLOAT
;
case
paddle
::
experimental
::
DataType
::
FLOAT16
:
return
popart
::
DataType
::
FLOAT16
;
case
paddle
::
experimental
::
DataType
::
BFLOAT16
:
return
popart
::
DataType
::
BFLOAT16
;
case
paddle
::
experimental
::
DataType
::
COMPLEX64
:
return
popart
::
DataType
::
COMPLEX64
;
case
paddle
::
experimental
::
DataType
::
COMPLEX128
:
return
popart
::
DataType
::
COMPLEX128
;
default:
PADDLE_THROW
(
paddle
::
platform
::
errors
::
Unimplemented
(
"Unsupported Paddle data type."
));
}
}
framework
::
proto
::
VarType
::
Type
PopartType2VarType
(
framework
::
proto
::
VarType
::
Type
PopartType2VarType
(
const
popart
::
DataType
type
)
{
const
popart
::
DataType
type
)
{
switch
(
type
)
{
switch
(
type
)
{
...
...
paddle/fluid/platform/device/ipu/ipu_utils.h
浏览文件 @
46161679
...
@@ -19,6 +19,7 @@ limitations under the License. */
...
@@ -19,6 +19,7 @@ limitations under the License. */
#include <popart/tensorinfo.hpp>
#include <popart/tensorinfo.hpp>
#include <popart/vendored/any.hpp>
#include <popart/vendored/any.hpp>
#include "paddle/fluid/framework/convert_utils.h"
#include "paddle/fluid/framework/ir/graph.h"
#include "paddle/fluid/framework/ir/graph.h"
#include "paddle/fluid/framework/lod_tensor.h"
#include "paddle/fluid/framework/lod_tensor.h"
#include "paddle/fluid/framework/scope.h"
#include "paddle/fluid/framework/scope.h"
...
@@ -83,14 +84,15 @@ class PaddleIArray final : public popart::IArray {
...
@@ -83,14 +84,15 @@ class PaddleIArray final : public popart::IArray {
};
};
popart
::
DataType
VarType2PopartType
(
const
framework
::
proto
::
VarType
::
Type
type
);
popart
::
DataType
VarType2PopartType
(
const
framework
::
proto
::
VarType
::
Type
type
);
popart
::
DataType
PdDataType2PopartType
(
const
paddle
::
experimental
::
DataType
type
);
framework
::
proto
::
VarType
::
Type
PopartType2VarType
(
const
popart
::
DataType
type
);
framework
::
proto
::
VarType
::
Type
PopartType2VarType
(
const
popart
::
DataType
type
);
popart
::
DataType
OnnxDtype2PopartType
(
const
int
type
);
popart
::
DataType
OnnxDtype2PopartType
(
const
int
type
);
bool
GetBoolEnv
(
std
::
string
str
);
bool
GetBoolEnv
(
std
::
string
str
);
template
<
typename
T
>
template
<
typename
T
>
std
::
unique_ptr
<
popart
::
NDArrayWrapper
<
T
>>
Tensor2IArray
(
const
Tensor
&
tensor
)
{
std
::
unique_ptr
<
popart
::
NDArrayWrapper
<
T
>>
Tensor2IArray
(
const
Tensor
&
tensor
)
{
auto
dtype
=
auto
dtype
=
PdDataType2PopartType
(
tensor
.
dtype
());
VarType2PopartType
(
framework
::
TransToProtoVarType
(
tensor
.
dtype
()));
auto
shape
=
std
::
vector
<
int64_t
>
();
auto
shape
=
std
::
vector
<
int64_t
>
();
for
(
size_t
i
=
0
;
i
<
tensor
.
dims
().
size
();
++
i
)
{
for
(
size_t
i
=
0
;
i
<
tensor
.
dims
().
size
();
++
i
)
{
shape
.
push_back
(
tensor
.
dims
().
at
(
i
));
shape
.
push_back
(
tensor
.
dims
().
at
(
i
));
...
...
编辑
预览
Markdown
is supported
0%
请重试
或
添加新附件
.
添加附件
取消
You are about to add
0
people
to the discussion. Proceed with caution.
先完成此消息的编辑!
取消
想要评论请
注册
或
登录