Skip to content
体验新版
项目
组织
正在加载...
登录
切换导航
打开侧边栏
Crayon鑫
Paddle
提交
1b0c5ef2
P
Paddle
项目概览
Crayon鑫
/
Paddle
与 Fork 源项目一致
Fork自
PaddlePaddle / Paddle
通知
1
Star
1
Fork
0
代码
文件
提交
分支
Tags
贡献者
分支图
Diff
Issue
1
列表
看板
标记
里程碑
合并请求
0
Wiki
0
Wiki
分析
仓库
DevOps
项目成员
Pages
P
Paddle
项目概览
项目概览
详情
发布
仓库
仓库
文件
提交
分支
标签
贡献者
分支图
比较
Issue
1
Issue
1
列表
看板
标记
里程碑
合并请求
0
合并请求
0
Pages
分析
分析
仓库分析
DevOps
Wiki
0
Wiki
成员
成员
收起侧边栏
关闭侧边栏
动态
分支图
创建新Issue
提交
Issue看板
未验证
提交
1b0c5ef2
编写于
6月 21, 2021
作者:
P
Pei Yang
提交者:
GitHub
6月 21, 2021
浏览文件
操作
浏览文件
下载
电子邮件补丁
差异文件
fix emb_eltwise_ln gpu_id bug (#33701)
上级
773aabc7
变更
5
显示空白变更内容
内联
并排
Showing
5 changed file
with
4 addition
and
10 deletion
+4
-10
paddle/fluid/inference/api/analysis_config.cc
paddle/fluid/inference/api/analysis_config.cc
+0
-1
paddle/fluid/inference/api/analysis_predictor.cc
paddle/fluid/inference/api/analysis_predictor.cc
+2
-2
paddle/fluid/inference/api/paddle_analysis_config.h
paddle/fluid/inference/api/paddle_analysis_config.h
+1
-1
paddle/fluid/inference/tensorrt/plugin/emb_eltwise_layernorm_plugin.cu
...inference/tensorrt/plugin/emb_eltwise_layernorm_plugin.cu
+1
-1
paddle/fluid/inference/tests/api/trt_dynamic_shape_ernie_test.cc
...fluid/inference/tests/api/trt_dynamic_shape_ernie_test.cc
+0
-5
未找到文件。
paddle/fluid/inference/api/analysis_config.cc
浏览文件 @
1b0c5ef2
...
@@ -421,7 +421,6 @@ void AnalysisConfig::Update() {
...
@@ -421,7 +421,6 @@ void AnalysisConfig::Update() {
pass_builder
()
->
AppendPass
(
pass
);
pass_builder
()
->
AppendPass
(
pass
);
}
}
}
}
LOG
(
INFO
)
<<
"use_dlnne_:"
<<
use_dlnne_
<<
std
::
endl
;
if
(
use_dlnne_
)
{
if
(
use_dlnne_
)
{
pass_builder
()
->
ClearPasses
();
pass_builder
()
->
ClearPasses
();
for
(
const
auto
&
pass
:
kDlnneSubgraphPasses
)
{
for
(
const
auto
&
pass
:
kDlnneSubgraphPasses
)
{
...
...
paddle/fluid/inference/api/analysis_predictor.cc
浏览文件 @
1b0c5ef2
...
@@ -152,7 +152,7 @@ bool AnalysisPredictor::Init(
...
@@ -152,7 +152,7 @@ bool AnalysisPredictor::Init(
:
platform
::
ProfilerState
::
kCPU
;
:
platform
::
ProfilerState
::
kCPU
;
platform
::
EnableProfiler
(
tracking_device
);
platform
::
EnableProfiler
(
tracking_device
);
}
else
{
}
else
{
LOG
(
INFO
)
<<
"Profiler is deactivated, and no profiling report will be "
VLOG
(
2
)
<<
"Profiler is deactivated, and no profiling report will be "
"generated."
;
"generated."
;
}
}
...
...
paddle/fluid/inference/api/paddle_analysis_config.h
浏览文件 @
1b0c5ef2
...
@@ -315,7 +315,7 @@ struct PD_INFER_DECL AnalysisConfig {
...
@@ -315,7 +315,7 @@ struct PD_INFER_DECL AnalysisConfig {
/// workspace.
/// workspace.
/// \param max_batch_size The maximum batch size of this prediction task,
/// \param max_batch_size The maximum batch size of this prediction task,
/// better set as small as possible for less performance loss.
/// better set as small as possible for less performance loss.
/// \param min_subgr
pa
h_size The minimum TensorRT subgraph size needed, if a
/// \param min_subgr
ap
h_size The minimum TensorRT subgraph size needed, if a
/// subgraph is smaller than this, it will not be transferred to TensorRT
/// subgraph is smaller than this, it will not be transferred to TensorRT
/// engine.
/// engine.
/// \param precision The precision used in TensorRT.
/// \param precision The precision used in TensorRT.
...
...
paddle/fluid/inference/tensorrt/plugin/emb_eltwise_layernorm_plugin.cu
浏览文件 @
1b0c5ef2
...
@@ -134,7 +134,7 @@ int EmbEltwiseLayernormPluginDynamicImpl<T>::enqueue(
...
@@ -134,7 +134,7 @@ int EmbEltwiseLayernormPluginDynamicImpl<T>::enqueue(
int
batch
=
id_dims
.
d
[
0
];
int
batch
=
id_dims
.
d
[
0
];
int
seq_len
=
id_dims
.
d
[
1
];
int
seq_len
=
id_dims
.
d
[
1
];
int
input_num
=
embs_
.
size
();
int
input_num
=
embs_
.
size
();
cudaGetDevice
(
&
device_id_
);
auto
in_ptr_gpu_d
=
auto
in_ptr_gpu_d
=
in_ptr_tensor_
.
mutable_data
<
int64_t
>
(
platform
::
CUDAPlace
(
device_id_
));
in_ptr_tensor_
.
mutable_data
<
int64_t
>
(
platform
::
CUDAPlace
(
device_id_
));
auto
emb_ptr_gpu_d
=
auto
emb_ptr_gpu_d
=
...
...
paddle/fluid/inference/tests/api/trt_dynamic_shape_ernie_test.cc
浏览文件 @
1b0c5ef2
...
@@ -29,11 +29,6 @@ void run(const AnalysisConfig& config, std::vector<float>* out_data) {
...
@@ -29,11 +29,6 @@ void run(const AnalysisConfig& config, std::vector<float>* out_data) {
int
run_batch
=
1
;
int
run_batch
=
1
;
const
int
run_seq_len
=
128
;
const
int
run_seq_len
=
128
;
std
::
vector
<
int64_t
>
tmp_input
;
std
::
vector
<
float
>
tmp_four_input
;
tmp_input
.
reserve
(
run_batch
*
run_seq_len
);
tmp_four_input
.
reserve
(
run_batch
*
run_seq_len
);
int64_t
i0
[
run_seq_len
]
=
{
int64_t
i0
[
run_seq_len
]
=
{
1
,
3558
,
4
,
75
,
491
,
89
,
340
,
313
,
93
,
4
,
255
,
10
,
75
,
321
,
1
,
3558
,
4
,
75
,
491
,
89
,
340
,
313
,
93
,
4
,
255
,
10
,
75
,
321
,
4095
,
1902
,
4
,
134
,
49
,
75
,
311
,
14
,
44
,
178
,
543
,
15
,
12043
,
2
,
4095
,
1902
,
4
,
134
,
49
,
75
,
311
,
14
,
44
,
178
,
543
,
15
,
12043
,
2
,
...
...
编辑
预览
Markdown
is supported
0%
请重试
或
添加新附件
.
添加附件
取消
You are about to add
0
people
to the discussion. Proceed with caution.
先完成此消息的编辑!
取消
想要评论请
注册
或
登录