Skip to content
体验新版
项目
组织
正在加载...
登录
切换导航
打开侧边栏
机器未来
Paddle
提交
9a3d8593
P
Paddle
项目概览
机器未来
/
Paddle
与 Fork 源项目一致
Fork自
PaddlePaddle / Paddle
通知
1
Star
1
Fork
0
代码
文件
提交
分支
Tags
贡献者
分支图
Diff
Issue
1
列表
看板
标记
里程碑
合并请求
0
Wiki
0
Wiki
分析
仓库
DevOps
项目成员
Pages
P
Paddle
项目概览
项目概览
详情
发布
仓库
仓库
文件
提交
分支
标签
贡献者
分支图
比较
Issue
1
Issue
1
列表
看板
标记
里程碑
合并请求
0
合并请求
0
Pages
分析
分析
仓库分析
DevOps
Wiki
0
Wiki
成员
成员
收起侧边栏
关闭侧边栏
动态
分支图
创建新Issue
提交
Issue看板
未验证
提交
9a3d8593
编写于
6月 18, 2021
作者:
W
Wilber
提交者:
GitHub
6月 18, 2021
浏览文件
操作
浏览文件
下载
电子邮件补丁
差异文件
cherry-pick .Align the code of trt under the develop and release/2.1 branch (#33631)
上级
bd3aa038
变更
5
显示空白变更内容
内联
并排
Showing
5 changed file
with
187 addition
and
201 deletion
+187
-201
paddle/fluid/inference/tensorrt/convert/elementwise_op.cc
paddle/fluid/inference/tensorrt/convert/elementwise_op.cc
+30
-1
paddle/fluid/inference/tensorrt/convert/fc_op.cc
paddle/fluid/inference/tensorrt/convert/fc_op.cc
+86
-161
paddle/fluid/inference/tensorrt/convert/flatten_op.cc
paddle/fluid/inference/tensorrt/convert/flatten_op.cc
+41
-14
paddle/fluid/inference/tensorrt/convert/reshape_op.cc
paddle/fluid/inference/tensorrt/convert/reshape_op.cc
+1
-1
paddle/fluid/inference/tensorrt/op_teller.cc
paddle/fluid/inference/tensorrt/op_teller.cc
+29
-24
未找到文件。
paddle/fluid/inference/tensorrt/convert/elementwise_op.cc
浏览文件 @
9a3d8593
...
@@ -62,6 +62,25 @@ class ElementwiseWeightOpConverter : public OpConverter {
...
@@ -62,6 +62,25 @@ class ElementwiseWeightOpConverter : public OpConverter {
0
};
0
};
TensorRTEngine
::
Weight
power_weights
{
nvinfer1
::
DataType
::
kFLOAT
,
nullptr
,
TensorRTEngine
::
Weight
power_weights
{
nvinfer1
::
DataType
::
kFLOAT
,
nullptr
,
0
};
0
};
nvinfer1
::
IShuffleLayer
*
expand_layer
=
nullptr
;
nvinfer1
::
IShuffleLayer
*
squeeze_layer
=
nullptr
;
int
dynamic_shape_offset
=
engine_
->
with_dynamic_shape
()
?
1
:
0
;
auto
input_dim
=
X
->
getDimensions
();
if
(
input_dim
.
nbDims
<
3
+
dynamic_shape_offset
)
{
nvinfer1
::
Dims
expand_shape
;
expand_shape
.
nbDims
=
3
+
dynamic_shape_offset
;
for
(
int
i
=
0
;
i
<
expand_shape
.
nbDims
;
i
++
)
{
if
(
i
<
input_dim
.
nbDims
)
{
expand_shape
.
d
[
i
]
=
input_dim
.
d
[
i
]
<
0
?
0
:
input_dim
.
d
[
i
];
}
else
{
expand_shape
.
d
[
i
]
=
1
;
}
}
expand_layer
=
TRT_ENGINE_ADD_LAYER
(
engine_
,
Shuffle
,
*
X
);
expand_layer
->
setReshapeDimensions
(
expand_shape
);
X
=
expand_layer
->
getOutput
(
0
);
}
if
(
op_type_
==
"add"
)
{
if
(
op_type_
==
"add"
)
{
nvinfer1
::
IScaleLayer
*
scale_layer
=
TRT_ENGINE_ADD_LAYER
(
nvinfer1
::
IScaleLayer
*
scale_layer
=
TRT_ENGINE_ADD_LAYER
(
engine_
,
Scale
,
*
X
,
scale_mode
,
shift_weights
.
get
(),
engine_
,
Scale
,
*
X
,
scale_mode
,
shift_weights
.
get
(),
...
@@ -73,7 +92,17 @@ class ElementwiseWeightOpConverter : public OpConverter {
...
@@ -73,7 +92,17 @@ class ElementwiseWeightOpConverter : public OpConverter {
shift_weights
.
get
(),
power_weights
.
get
());
shift_weights
.
get
(),
power_weights
.
get
());
layer
=
scale_layer
;
layer
=
scale_layer
;
}
}
if
(
input_dim
.
nbDims
<
3
+
dynamic_shape_offset
)
{
nvinfer1
::
Dims
squeeze_shape
;
squeeze_shape
.
nbDims
=
input_dim
.
nbDims
;
for
(
int
i
=
0
;
i
<
squeeze_shape
.
nbDims
;
i
++
)
{
squeeze_shape
.
d
[
i
]
=
input_dim
.
d
[
i
]
<
0
?
0
:
input_dim
.
d
[
i
];
}
squeeze_layer
=
TRT_ENGINE_ADD_LAYER
(
engine_
,
Shuffle
,
*
(
layer
->
getOutput
(
0
)));
squeeze_layer
->
setReshapeDimensions
(
squeeze_shape
);
layer
=
static_cast
<
nvinfer1
::
ILayer
*>
(
squeeze_layer
);
}
auto
output_name
=
op_desc
.
Output
(
"Out"
)[
0
];
auto
output_name
=
op_desc
.
Output
(
"Out"
)[
0
];
RreplenishLayerAndOutput
(
layer
,
"elementwise_"
+
op_type_
,
{
output_name
},
RreplenishLayerAndOutput
(
layer
,
"elementwise_"
+
op_type_
,
{
output_name
},
test_mode
);
test_mode
);
...
...
paddle/fluid/inference/tensorrt/convert/fc_op.cc
浏览文件 @
9a3d8593
...
@@ -37,7 +37,7 @@ class FcOpConverter : public OpConverter {
...
@@ -37,7 +37,7 @@ class FcOpConverter : public OpConverter {
const
framework
::
Scope
&
scope
,
bool
test_mode
)
override
{
const
framework
::
Scope
&
scope
,
bool
test_mode
)
override
{
VLOG
(
3
)
<<
"convert a fluid fc op to tensorrt fc layer without bias"
;
VLOG
(
3
)
<<
"convert a fluid fc op to tensorrt fc layer without bias"
;
framework
::
OpDesc
op_desc
(
op
,
nullptr
);
framework
::
OpDesc
op_desc
(
op
,
nullptr
);
auto
output_name
=
op_desc
.
Output
(
"Out"
).
front
();
auto
input_names
=
op_desc
.
InputNames
();
auto
input_names
=
op_desc
.
InputNames
();
bool
with_bias
=
input_names
.
size
()
>=
3
;
bool
with_bias
=
input_names
.
size
()
>=
3
;
std
::
string
w_name
=
"Y"
;
std
::
string
w_name
=
"Y"
;
...
@@ -48,13 +48,14 @@ class FcOpConverter : public OpConverter {
...
@@ -48,13 +48,14 @@ class FcOpConverter : public OpConverter {
}
}
// Declare inputs
// Declare inputs
auto
*
X
=
engine_
->
GetITensor
(
op_desc
.
Input
(
i_name
).
front
());
auto
*
X
=
engine_
->
GetITensor
(
op_desc
.
Input
(
i_name
).
front
());
auto
x_dim
=
X
->
getDimensions
();
// Declare weights
// Declare weights
auto
*
Y_v
=
scope
.
FindVar
(
op_desc
.
Input
(
w_name
).
front
());
auto
*
Y_v
=
scope
.
FindVar
(
op_desc
.
Input
(
w_name
).
front
());
PADDLE_ENFORCE_NOT_NULL
(
PADDLE_ENFORCE_NOT_NULL
(
Y_v
,
platform
::
errors
::
NotFound
(
Y_v
,
platform
::
errors
::
NotFound
(
"Can not find %s presistale var of fc in scope."
,
w_name
));
"Can not find %s presistale var of fc in scope."
,
w_name
));
auto
*
Y_t
=
Y_v
->
GetMutable
<
framework
::
LoDTensor
>
();
auto
*
Y_t
=
Y_v
->
GetMutable
<
framework
::
LoDTensor
>
();
const
int
x_num_col_dims
=
int
x_num_col_dims
=
op_desc
.
HasAttr
(
"x_num_col_dims"
)
op_desc
.
HasAttr
(
"x_num_col_dims"
)
?
BOOST_GET_CONST
(
int
,
op_desc
.
GetAttr
(
"x_num_col_dims"
))
?
BOOST_GET_CONST
(
int
,
op_desc
.
GetAttr
(
"x_num_col_dims"
))
:
(
op_desc
.
HasAttr
(
"in_num_col_dims"
)
:
(
op_desc
.
HasAttr
(
"in_num_col_dims"
)
...
@@ -106,8 +107,8 @@ class FcOpConverter : public OpConverter {
...
@@ -106,8 +107,8 @@ class FcOpConverter : public OpConverter {
auto
regist_fc
=
[
&
](
nvinfer1
::
ITensor
*
inputs
,
int
n_output
,
auto
regist_fc
=
[
&
](
nvinfer1
::
ITensor
*
inputs
,
int
n_output
,
TensorRTEngine
::
Weight
&
weight
,
TensorRTEngine
::
Weight
&
weight
,
TensorRTEngine
::
Weight
&
bias
)
{
TensorRTEngine
::
Weight
&
bias
)
{
nvinfer1
::
ILayer
*
fc_layer
=
nullptr
;
if
(
enable_int8
)
{
if
(
enable_int8
)
{
// add conv layer
PADDLE_ENFORCE_EQ
(
PADDLE_ENFORCE_EQ
(
op_desc
.
HasAttr
(
"out_threshold"
),
true
,
op_desc
.
HasAttr
(
"out_threshold"
),
true
,
platform
::
errors
::
InvalidArgument
(
platform
::
errors
::
InvalidArgument
(
...
@@ -115,22 +116,52 @@ class FcOpConverter : public OpConverter {
...
@@ -115,22 +116,52 @@ class FcOpConverter : public OpConverter {
float
out_scale
=
float
out_scale
=
BOOST_GET_CONST
(
float
,
op_desc
.
GetAttr
(
"out_threshold"
));
BOOST_GET_CONST
(
float
,
op_desc
.
GetAttr
(
"out_threshold"
));
nvinfer1
::
DimsHW
nv_ksize
(
1
,
1
);
nvinfer1
::
DimsHW
nv_ksize
(
1
,
1
);
fc_layer
=
TRT_ENGINE_ADD_LAYER
(
engine_
,
Convolution
,
*
inputs
,
n_output
,
auto
*
fc_layer_int8
=
TRT_ENGINE_ADD_LAYER
(
engine_
,
Convolution
,
*
inputs
,
n_output
,
nv_ksize
,
weight
.
get
(),
bias
.
get
());
nv_ksize
,
weight
.
get
(),
bias
.
get
());
engine_
->
SetTensorDynamicRange
(
fc_layer
->
getOutput
(
0
),
out_scale
);
engine_
->
SetTensorDynamicRange
(
fc_layer_int8
->
getOutput
(
0
),
out_scale
);
if
(
activation_type
==
"relu"
)
{
nvinfer1
::
IActivationLayer
*
relu_layer_int8
=
TRT_ENGINE_ADD_LAYER
(
engine_
,
Activation
,
*
(
fc_layer_int8
->
getOutput
(
0
)),
nvinfer1
::
ActivationType
::
kRELU
);
RreplenishLayerAndOutput
(
relu_layer_int8
,
"relu_after_fc_shuffle"
,
{
output_name
},
test_mode
);
}
else
{
}
else
{
fc_layer
=
TRT_ENGINE_ADD_LAYER
(
engine_
,
FullyConnected
,
*
inputs
,
RreplenishLayerAndOutput
(
fc_layer_int8
,
"shuffle_after_fc"
,
n_output
,
weight
.
get
(),
bias
.
get
()
);
{
output_name
},
test_mode
);
}
}
}
else
{
auto
output_name
=
op_desc
.
Output
(
"Out"
).
front
();
// add fc layer
auto
*
fc_layer_before
=
TRT_ENGINE_ADD_LAYER
(
engine_
,
FullyConnected
,
*
inputs
,
n_output
,
weight
.
get
(),
bias
.
get
());
fc_layer_before
->
setName
(
(
"fc_layer_before(Output: "
+
output_name
+
")"
).
c_str
());
// add shuffle after fc
nvinfer1
::
Dims
reshape_after_fc_dim
;
if
(
engine_
->
use_oss
()
&&
engine_
->
with_ernie
()
&&
x_dim
.
nbDims
==
4
&&
x_dim
.
d
[
2
]
==
1
&&
x_dim
.
d
[
3
]
==
1
&&
x_num_col_dims
==
1
)
{
// If use tensorrt'oss, the x_dim and x_num_col_dims need change
reshape_after_fc_dim
.
nbDims
=
4
;
}
else
{
reshape_after_fc_dim
.
nbDims
=
x_num_col_dims
+
1
;
}
for
(
int
i
=
0
;
i
<
reshape_after_fc_dim
.
nbDims
;
i
++
)
{
reshape_after_fc_dim
.
d
[
i
]
=
0
;
}
auto
*
fc_layer_float
=
TRT_ENGINE_ADD_LAYER
(
engine_
,
Shuffle
,
*
fc_layer_before
->
getOutput
(
0
));
fc_layer_float
->
setReshapeDimensions
(
reshape_after_fc_dim
);
if
(
activation_type
==
"relu"
)
{
if
(
activation_type
==
"relu"
)
{
nvinfer1
::
IActivationLayer
*
relu_layer
=
nvinfer1
::
IActivationLayer
*
relu_layer_float
=
TRT_ENGINE_ADD_LAYER
(
TRT_ENGINE_ADD_LAYER
(
engine_
,
Activation
,
*
(
fc_layer
->
getOutput
(
0
)),
engine_
,
Activation
,
*
(
fc_layer_float
->
getOutput
(
0
)),
nvinfer1
::
ActivationType
::
kRELU
);
nvinfer1
::
ActivationType
::
kRELU
);
RreplenishLayerAndOutput
(
relu_layer
,
"fc"
,
{
output_name
},
test_mode
);
RreplenishLayerAndOutput
(
relu_layer_float
,
"relu_after_fc_shuffle"
,
{
output_name
},
test_mode
);
}
else
{
}
else
{
RreplenishLayerAndOutput
(
fc_layer
,
"fc"
,
{
output_name
},
test_mode
);
RreplenishLayerAndOutput
(
fc_layer_float
,
"shuffle_after_fc"
,
{
output_name
},
test_mode
);
}
}
}
};
};
...
@@ -157,154 +188,48 @@ class FcOpConverter : public OpConverter {
...
@@ -157,154 +188,48 @@ class FcOpConverter : public OpConverter {
static_cast
<
void
*>
(
bias_data
),
static_cast
<
void
*>
(
bias_data
),
static_cast
<
size_t
>
(
bias_num
)};
static_cast
<
size_t
>
(
bias_num
)};
if
(
engine_
->
with_dynamic_shape
())
{
// Running the TRT Static Shape mode: x_num_col_dims-1
// not NCHW layout, but NLP layout with added 'x 1 x 1'
if
(
!
engine_
->
with_dynamic_shape
())
{
auto
x_dim
=
X
->
getDimensions
();
x_num_col_dims
--
;
}
// If use tensorrt'oss, the x_dim and x_num_col_dims need change
if
(
engine_
->
use_oss
()
&&
engine_
->
with_ernie
()
&&
x_dim
.
nbDims
==
4
&&
if
(
engine_
->
use_oss
()
&&
engine_
->
with_ernie
()
&&
x_dim
.
nbDims
==
4
&&
x_dim
.
d
[
2
]
==
1
&&
x_dim
.
d
[
3
]
==
1
&&
x_num_col_dims
==
2
)
{
x_dim
.
d
[
2
]
==
1
&&
x_dim
.
d
[
3
]
==
1
&&
x_num_col_dims
==
2
)
{
// fc which is just after self attention
x_num_col_dims
=
1
;
regist_fc
(
X
,
n_output
,
weight
,
bias
);
return
;
}
}
PADDLE_ENFORCE_LE
(
PADDLE_ENFORCE_GT
(
x_dim
.
nbDims
-
x_num_col_dims
,
3
,
x_dim
.
nbDims
,
x_num_col_dims
,
platform
::
errors
::
InvalidArgument
(
platform
::
errors
::
InvalidArgument
(
"Params and input dims mismatch. Paddle-TRT FC "
"Params and input dims mismatch. Paddle-TRT FC "
"converter expects x_dim.nbDims - x_num_col_dims <= 3
, but "
"converter expects x_dim.nbDims > x_num_col_dims
, but "
"x_dim.nbDims = %d, x_num_col_dims =
%d."
,
"x_dim.nbDims : %d, x_num_col_dims :
%d."
,
x_dim
.
nbDims
,
x_num_col_dims
));
x_dim
.
nbDims
,
x_num_col_dims
));
auto
output_name
=
op_desc
.
Output
(
"Out"
).
front
();
// add shuffle before fc
// add shuffle before fc
nvinfer1
::
Dims
reshape_before_fc_dim
;
nvinfer1
::
Dims
reshape_before_fc_dim
;
// padding shape "x 1 x 1"
reshape_before_fc_dim
.
nbDims
=
x_num_col_dims
+
3
;
int
padding_length
=
3
-
(
x_dim
.
nbDims
-
x_num_col_dims
);
// padding shape "* x q x 1 x 1"
reshape_before_fc_dim
.
nbDims
=
x_dim
.
nbDims
+
padding_length
;
for
(
int
i
=
0
;
i
<
reshape_before_fc_dim
.
nbDims
;
i
++
)
{
int
cur_dim_index
=
reshape_before_fc_dim
.
nbDims
-
1
;
reshape_before_fc_dim
.
d
[
i
]
=
1
;
while
(
padding_length
--
>
0
)
{
}
reshape_before_fc_dim
.
d
[
cur_dim_index
--
]
=
1
;
for
(
int
i
=
0
;
i
<
x_dim
.
nbDims
;
i
++
)
{
if
(
i
<
x_num_col_dims
)
{
reshape_before_fc_dim
.
d
[
i
]
=
0
;
}
else
{
if
(
x_dim
.
d
[
i
]
<
0
)
{
reshape_before_fc_dim
.
d
[
x_num_col_dims
]
=
-
1
;
break
;
}
}
while
(
cur_dim_index
>=
0
)
{
reshape_before_fc_dim
.
d
[
x_num_col_dims
]
*=
x_dim
.
d
[
i
];
reshape_before_fc_dim
.
d
[
cur_dim_index
--
]
=
0
;
}
}
}
auto
*
reshape_before_fc_layer
=
auto
*
reshape_before_fc_layer
=
TRT_ENGINE_ADD_LAYER
(
engine_
,
Shuffle
,
*
X
);
TRT_ENGINE_ADD_LAYER
(
engine_
,
Shuffle
,
*
X
);
reshape_before_fc_layer
->
setReshapeDimensions
(
reshape_before_fc_dim
);
reshape_before_fc_layer
->
setReshapeDimensions
(
reshape_before_fc_dim
);
reshape_before_fc_layer
->
setName
(
reshape_before_fc_layer
->
setName
(
(
"shuffle_before_fc(Output: "
+
output_name
+
")"
).
c_str
());
(
"shuffle_before_fc(Output: "
+
output_name
+
")"
).
c_str
());
auto
*
reshape_itensor
=
reshape_before_fc_layer
->
getOutput
(
0
);
// add fc layer
auto
*
fc_layer
=
TRT_ENGINE_ADD_LAYER
(
engine_
,
FullyConnected
,
*
reshape_before_fc_layer
->
getOutput
(
0
),
n_output
,
weight
.
get
(),
bias
.
get
());
fc_layer
->
setName
((
"fc_layer(Output: "
+
output_name
+
")"
).
c_str
());
// add shuffle after fc
nvinfer1
::
Dims
reshape_after_fc_dim
;
reshape_after_fc_dim
.
nbDims
=
x_num_col_dims
+
1
;
for
(
int
i
=
0
;
i
<
reshape_after_fc_dim
.
nbDims
;
i
++
)
{
reshape_after_fc_dim
.
d
[
i
]
=
0
;
}
auto
*
reshape_after_fc_layer
=
TRT_ENGINE_ADD_LAYER
(
engine_
,
Shuffle
,
*
fc_layer
->
getOutput
(
0
));
reshape_after_fc_layer
->
setReshapeDimensions
(
reshape_after_fc_dim
);
if
(
activation_type
==
"relu"
)
{
reshape_after_fc_layer
->
setName
(
(
"shuffle_after_fc(Output: "
+
output_name
+
")"
).
c_str
());
nvinfer1
::
IActivationLayer
*
relu_layer
=
TRT_ENGINE_ADD_LAYER
(
engine_
,
Activation
,
*
(
reshape_after_fc_layer
->
getOutput
(
0
)),
nvinfer1
::
ActivationType
::
kRELU
);
RreplenishLayerAndOutput
(
relu_layer
,
"relu_after_fc_shuffle"
,
{
output_name
},
test_mode
);
}
else
{
RreplenishLayerAndOutput
(
reshape_after_fc_layer
,
"shuffle_after_fc"
,
{
output_name
},
test_mode
);
}
return
;
}
// in order to handle situations in NLP models(input dims < 3,
// x_num_col_dims != 1, etc.), reshape input to perform FC correctly.
auto
*
reshape_itensor
=
X
;
int
input_dims
=
X
->
getDimensions
().
nbDims
;
auto
input_d
=
X
->
getDimensions
().
d
;
int
reshape_dim3
[
3
]
=
{
0
};
int
reshape_dim4
[
4
]
=
{
0
};
PADDLE_ENFORCE_LE
(
x_num_col_dims
,
input_dims
,
platform
::
errors
::
InvalidArgument
(
"Params and input dims mismatch. Paddle-TRT FC "
"converter expects x_num_col_dims <= input dims"
));
if
(
x_num_col_dims
==
1
)
{
if
(
input_dims
==
4
)
{
PADDLE_ENFORCE_EQ
(
input_d
[
3
],
1
,
platform
::
errors
::
InvalidArgument
(
"Invalid dimensions. When x_num_col_dims equals to 1 and input "
"dims equals to 4, the last dim of input must be 1, but got %d"
,
input_d
[
3
]));
}
if
(
enable_int8
)
{
reshape_dim3
[
0
]
=
1
;
for
(
int
i
=
0
;
i
<
3
;
i
++
)
{
reshape_dim3
[
0
]
*=
input_d
[
i
];
if
(
i
>
0
)
{
reshape_dim3
[
i
]
=
1
;
}
}
}
else
{
for
(
int
i
=
0
;
i
<
3
;
i
++
)
{
if
(
i
<
input_dims
)
{
reshape_dim3
[
i
]
=
input_d
[
i
];
}
else
{
reshape_dim3
[
i
]
=
1
;
}
}
}
nvinfer1
::
Dims3
reshape_dim
(
reshape_dim3
[
0
],
reshape_dim3
[
1
],
reshape_dim3
[
2
]);
auto
*
reshape_layer
=
TRT_ENGINE_ADD_LAYER
(
engine_
,
Shuffle
,
*
X
);
reshape_layer
->
setReshapeDimensions
(
reshape_dim
);
reshape_itensor
=
reshape_layer
->
getOutput
(
0
);
if
(
enable_int8
)
{
if
(
enable_int8
)
{
engine_
->
SetTensorDynamicRange
(
reshape_itensor
,
in_scale
);
engine_
->
SetTensorDynamicRange
(
reshape_itensor
,
in_scale
);
}
}
}
else
{
PADDLE_ENFORCE_NE
(
input_dims
,
1
,
platform
::
errors
::
InvalidArgument
(
"Invalid dimensions. When x_num_col_dims equals to "
"2, input_dims should not be 1"
));
if
(
enable_int8
)
{
for
(
int
i
=
0
;
i
<
4
;
i
++
)
{
if
(
i
==
0
)
{
reshape_dim4
[
i
]
=
input_d
[
i
];
}
else
{
reshape_dim4
[
i
]
=
1
;
if
(
i
<
input_dims
)
{
reshape_dim4
[
1
]
*=
input_d
[
i
];
}
}
}
}
else
{
for
(
int
i
=
0
;
i
<
4
;
i
++
)
{
if
(
i
<
input_dims
)
{
reshape_dim4
[
i
]
=
input_d
[
i
];
}
else
{
reshape_dim4
[
i
]
=
1
;
}
}
}
nvinfer1
::
Dims4
reshape_dim
(
reshape_dim4
[
0
],
reshape_dim4
[
1
],
reshape_dim4
[
2
],
reshape_dim4
[
3
]);
auto
*
reshape_layer
=
TRT_ENGINE_ADD_LAYER
(
engine_
,
Shuffle
,
*
X
);
reshape_layer
->
setReshapeDimensions
(
reshape_dim
);
reshape_itensor
=
reshape_layer
->
getOutput
(
0
);
if
(
enable_int8
)
{
engine_
->
SetTensorDynamicRange
(
reshape_itensor
,
in_scale
);
}
}
regist_fc
(
reshape_itensor
,
n_output
,
weight
,
bias
);
regist_fc
(
reshape_itensor
,
n_output
,
weight
,
bias
);
}
}
};
};
...
...
paddle/fluid/inference/tensorrt/convert/flatten_op.cc
浏览文件 @
9a3d8593
...
@@ -25,7 +25,7 @@ namespace inference {
...
@@ -25,7 +25,7 @@ namespace inference {
namespace
tensorrt
{
namespace
tensorrt
{
/*
/*
* FlattenOp
, only support static shape mode currently.
* FlattenOp
trt converter
*/
*/
class
FlattenOpConverter
:
public
OpConverter
{
class
FlattenOpConverter
:
public
OpConverter
{
public:
public:
...
@@ -35,21 +35,48 @@ class FlattenOpConverter : public OpConverter {
...
@@ -35,21 +35,48 @@ class FlattenOpConverter : public OpConverter {
// Declare inputs
// Declare inputs
auto
*
input
=
engine_
->
GetITensor
(
op_desc
.
Input
(
"X"
)[
0
]);
auto
*
input
=
engine_
->
GetITensor
(
op_desc
.
Input
(
"X"
)[
0
]);
int
dims
=
input
->
getDimensions
().
nbDims
;
int
dims
=
input
->
getDimensions
().
nbDims
;
nvinfer1
::
IShuffleLayer
*
layer
=
nullptr
;
if
(
!
engine_
->
with_dynamic_shape
())
{
int
dim_prod
=
1
;
int
dim_prod
=
1
;
for
(
int
i
=
0
;
i
<
dims
;
i
++
)
{
for
(
int
i
=
0
;
i
<
dims
;
i
++
)
{
int
dim_i
=
input
->
getDimensions
().
d
[
i
];
int
dim_i
=
input
->
getDimensions
().
d
[
i
];
PADDLE_ENFORCE_GT
(
PADDLE_ENFORCE_GT
(
dim_i
,
0
,
platform
::
errors
::
InvalidArgument
(
dim_i
,
0
,
platform
::
errors
::
InvalidArgument
(
"flatten input dim should be > 0, but got %d."
,
dim_i
));
"flatten input dim should be > 0, but got %d."
,
dim_i
));
dim_prod
*=
dim_i
;
dim_prod
*=
dim_i
;
}
}
nvinfer1
::
Dims
flatten_dim
;
nvinfer1
::
Dims
flatten_dim
;
flatten_dim
.
nbDims
=
1
;
flatten_dim
.
nbDims
=
1
;
flatten_dim
.
d
[
0
]
=
dim_prod
;
flatten_dim
.
d
[
0
]
=
dim_prod
;
auto
*
layer
=
TRT_ENGINE_ADD_LAYER
(
engine_
,
Shuffle
,
*
input
);
layer
=
TRT_ENGINE_ADD_LAYER
(
engine_
,
Shuffle
,
*
input
);
layer
->
setReshapeDimensions
(
flatten_dim
);
layer
->
setReshapeDimensions
(
flatten_dim
);
}
else
{
auto
*
shape_layer
=
TRT_ENGINE_ADD_LAYER
(
engine_
,
Shape
,
*
input
);
uint32_t
reduce_dim
=
1
;
auto
*
reduce_prod_layer
=
TRT_ENGINE_ADD_LAYER
(
engine_
,
Reduce
,
*
(
shape_layer
->
getOutput
(
0
)),
nvinfer1
::
ReduceOperation
::
kPROD
,
reduce_dim
,
true
);
int32_t
*
constant_weight_data
=
new
int32_t
[
1
];
constant_weight_data
[
0
]
=
-
1
;
TensorRTEngine
::
Weight
constant_weight
{
nvinfer1
::
DataType
::
kINT32
,
static_cast
<
void
*>
(
constant_weight_data
),
1
};
nvinfer1
::
Dims
constant_dims
;
constant_dims
.
nbDims
=
1
;
constant_dims
.
d
[
0
]
=
1
;
auto
*
constant_layer
=
TRT_ENGINE_ADD_LAYER
(
engine_
,
Constant
,
constant_dims
,
constant_weight
.
get
());
std
::
vector
<
nvinfer1
::
ITensor
*>
itensors
;
itensors
.
push_back
(
constant_layer
->
getOutput
(
0
));
itensors
.
push_back
(
reduce_prod_layer
->
getOutput
(
0
));
auto
*
concat_layer
=
TRT_ENGINE_ADD_LAYER
(
engine_
,
Concatenation
,
itensors
.
data
(),
2
);
concat_layer
->
setAxis
(
0
);
layer
=
TRT_ENGINE_ADD_LAYER
(
engine_
,
Shuffle
,
*
input
);
layer
->
setInput
(
1
,
*
(
concat_layer
->
getOutput
(
0
)));
}
auto
output_name
=
op_desc
.
Output
(
"Out"
)[
0
];
auto
output_name
=
op_desc
.
Output
(
"Out"
)[
0
];
RreplenishLayerAndOutput
(
layer
,
"flatten"
,
{
output_name
},
test_mode
);
RreplenishLayerAndOutput
(
layer
,
"flatten"
,
{
output_name
},
test_mode
);
}
}
...
...
paddle/fluid/inference/tensorrt/convert/reshape_op.cc
浏览文件 @
9a3d8593
...
@@ -34,7 +34,7 @@ class ReshapeOpConverter : public OpConverter {
...
@@ -34,7 +34,7 @@ class ReshapeOpConverter : public OpConverter {
framework
::
OpDesc
op_desc
(
op
,
nullptr
);
framework
::
OpDesc
op_desc
(
op
,
nullptr
);
// Declare inputs
// Declare inputs
auto
*
input
=
engine_
->
GetITensor
(
op_desc
.
Input
(
"X"
)[
0
]);
auto
*
input
=
engine_
->
GetITensor
(
op_desc
.
Input
(
"X"
)[
0
]);
const
std
::
vector
<
int
>&
shape
=
std
::
vector
<
int
>
shape
=
BOOST_GET_CONST
(
std
::
vector
<
int
>
,
op_desc
.
GetAttr
(
"shape"
));
BOOST_GET_CONST
(
std
::
vector
<
int
>
,
op_desc
.
GetAttr
(
"shape"
));
int
nbDims_num
=
shape
.
size
();
int
nbDims_num
=
shape
.
size
();
nvinfer1
::
Dims
reshape_dim
;
nvinfer1
::
Dims
reshape_dim
;
...
...
paddle/fluid/inference/tensorrt/op_teller.cc
浏览文件 @
9a3d8593
...
@@ -300,23 +300,14 @@ bool OpTeller::Tell(const framework::ir::Node* node, bool use_no_calib_int8,
...
@@ -300,23 +300,14 @@ bool OpTeller::Tell(const framework::ir::Node* node, bool use_no_calib_int8,
if
(
axis
.
size
()
>=
nvinfer1
::
Dims
::
MAX_DIMS
)
return
false
;
if
(
axis
.
size
()
>=
nvinfer1
::
Dims
::
MAX_DIMS
)
return
false
;
}
}
}
}
if
(
op_type
==
"flatten2"
)
{
if
(
op_type
==
"flatten2"
||
op_type
==
"flatten"
)
{
// flatten doesn't support dynamic shape currently
if
(
!
desc
.
HasAttr
(
"axis"
))
{
return
false
;
}
else
{
if
(
with_dynamic_shape
)
return
false
;
int
axis
=
BOOST_GET_CONST
(
int
,
desc
.
GetAttr
(
"axis"
));
if
(
axis
!=
1
)
return
false
;
}
}
if
(
op_type
==
"flatten"
)
{
// flatten doesn't support dynamic shape currently
if
(
!
desc
.
HasAttr
(
"axis"
))
{
if
(
!
desc
.
HasAttr
(
"axis"
))
{
return
false
;
return
false
;
}
else
{
}
else
{
#if IS_TRT_VERSION_GE(7130)
#else
if
(
with_dynamic_shape
)
return
false
;
if
(
with_dynamic_shape
)
return
false
;
#endif
int
axis
=
BOOST_GET_CONST
(
int
,
desc
.
GetAttr
(
"axis"
));
int
axis
=
BOOST_GET_CONST
(
int
,
desc
.
GetAttr
(
"axis"
));
if
(
axis
!=
1
)
return
false
;
if
(
axis
!=
1
)
return
false
;
}
}
...
@@ -685,20 +676,19 @@ bool OpTeller::Tell(const framework::ir::Node* node, bool use_no_calib_int8,
...
@@ -685,20 +676,19 @@ bool OpTeller::Tell(const framework::ir::Node* node, bool use_no_calib_int8,
}
}
}
}
if
(
op_type
==
"
reduce_sum
"
)
{
if
(
op_type
==
"
fc
"
)
{
i
f
(
!
with_dynamic_shape
)
{
i
nt
x_num_col_dims
=
VLOG
(
3
)
<<
"the reduce_sum does not support static shape yet"
;
desc
.
HasAttr
(
"x_num_col_dims"
)
return
false
;
?
BOOST_GET_CONST
(
int
,
desc
.
GetAttr
(
"x_num_col_dims"
))
}
:
(
desc
.
HasAttr
(
"in_num_col_dims"
)
?
BOOST_GET_CONST
(
int
,
desc
.
GetAttr
(
"in_num_col_dims"
))
if
(
!
(
desc
.
HasAttr
(
"keep_dim"
)
&&
desc
.
HasAttr
(
"dim"
)
&&
:
1
);
desc
.
HasAttr
(
"reduce_all"
))
)
{
if
(
x_num_col_dims
<
1
)
{
VLOG
(
3
)
<<
"
the reduce_sum does not have attr (keep_dim or dim or
"
VLOG
(
3
)
<<
"
converter expects x_num_col_dims >= 1,
"
"
reduce_all)
"
;
"
but x_num_col_dims = %d.
"
;
return
false
;
return
false
;
}
}
}
}
if
(
op_type
==
"reshape"
||
op_type
==
"reshape2"
)
{
if
(
op_type
==
"reshape"
||
op_type
==
"reshape2"
)
{
if
(
!
desc
.
HasAttr
(
"shape"
))
{
if
(
!
desc
.
HasAttr
(
"shape"
))
{
return
false
;
return
false
;
...
@@ -712,6 +702,21 @@ bool OpTeller::Tell(const framework::ir::Node* node, bool use_no_calib_int8,
...
@@ -712,6 +702,21 @@ bool OpTeller::Tell(const framework::ir::Node* node, bool use_no_calib_int8,
if
(
shape
.
size
()
>=
nvinfer1
::
Dims
::
MAX_DIMS
)
return
false
;
if
(
shape
.
size
()
>=
nvinfer1
::
Dims
::
MAX_DIMS
)
return
false
;
}
}
}
}
if
(
op_type
==
"reduce_sum"
)
{
if
(
!
with_dynamic_shape
)
{
VLOG
(
3
)
<<
"the reduce_sum does not support static shape yet"
;
return
false
;
}
if
(
!
(
desc
.
HasAttr
(
"keep_dim"
)
&&
desc
.
HasAttr
(
"dim"
)
&&
desc
.
HasAttr
(
"reduce_all"
)))
{
VLOG
(
3
)
<<
"the reduce_sum does not have attr (keep_dim or dim or "
"reduce_all)"
;
return
false
;
}
}
if
((
*
teller
)(
op_type
,
desc
,
use_no_calib_int8
))
return
true
;
if
((
*
teller
)(
op_type
,
desc
,
use_no_calib_int8
))
return
true
;
}
}
return
false
;
return
false
;
...
...
编辑
预览
Markdown
is supported
0%
请重试
或
添加新附件
.
添加附件
取消
You are about to add
0
people
to the discussion. Proceed with caution.
先完成此消息的编辑!
取消
想要评论请
注册
或
登录