Skip to content
体验新版
项目
组织
正在加载...
登录
切换导航
打开侧边栏
PaddlePaddle
Paddle
提交
7ecbcc08
P
Paddle
项目概览
PaddlePaddle
/
Paddle
1 年多 前同步成功
通知
2302
Star
20931
Fork
5422
代码
文件
提交
分支
Tags
贡献者
分支图
Diff
Issue
1423
列表
看板
标记
里程碑
合并请求
543
Wiki
0
Wiki
分析
仓库
DevOps
项目成员
Pages
P
Paddle
项目概览
项目概览
详情
发布
仓库
仓库
文件
提交
分支
标签
贡献者
分支图
比较
Issue
1,423
Issue
1,423
列表
看板
标记
里程碑
合并请求
543
合并请求
543
Pages
分析
分析
仓库分析
DevOps
Wiki
0
Wiki
成员
成员
收起侧边栏
关闭侧边栏
动态
分支图
创建新Issue
提交
Issue看板
未验证
提交
7ecbcc08
编写于
4月 14, 2023
作者:
C
chenxujun
提交者:
GitHub
4月 14, 2023
浏览文件
操作
浏览文件
下载
电子邮件补丁
差异文件
【Hackathon No.62】digamma, dirichlet算子FP16/BF16单测完善 (#52604)
* Add digamma, dirichlet tests * Fix code
上级
eeb4d165
变更
10
隐藏空白更改
内联
并排
Showing
10 changed files
with
203 additions
and
27 deletions
+203
-27
paddle/phi/kernels/gpu/digamma_grad_kernel.cu
paddle/phi/kernels/gpu/digamma_grad_kernel.cu
+9
-2
paddle/phi/kernels/gpu/digamma_kernel.cu
paddle/phi/kernels/gpu/digamma_kernel.cu
+9
-2
paddle/phi/kernels/gpu/dirichlet_kernel.cu
paddle/phi/kernels/gpu/dirichlet_kernel.cu
+8
-2
paddle/phi/kernels/impl/digamma_grad_kernel_impl.h
paddle/phi/kernels/impl/digamma_grad_kernel_impl.h
+6
-1
paddle/phi/kernels/impl/digamma_kernel_impl.h
paddle/phi/kernels/impl/digamma_kernel_impl.h
+4
-1
paddle/phi/kernels/impl/dirichlet_kernel_impl.h
paddle/phi/kernels/impl/dirichlet_kernel_impl.h
+26
-15
python/paddle/distribution/dirichlet.py
python/paddle/distribution/dirichlet.py
+4
-1
python/paddle/fluid/tests/unittests/distribution/test_dirichlet_op.py
...e/fluid/tests/unittests/distribution/test_dirichlet_op.py
+95
-1
python/paddle/fluid/tests/unittests/test_digamma_op.py
python/paddle/fluid/tests/unittests/test_digamma_op.py
+39
-1
python/paddle/tensor/math.py
python/paddle/tensor/math.py
+3
-1
未找到文件。
paddle/phi/kernels/gpu/digamma_grad_kernel.cu
浏览文件 @
7ecbcc08
...
...
@@ -15,9 +15,16 @@
#include "paddle/phi/kernels/digamma_grad_kernel.h"
#include "paddle/phi/backends/gpu/gpu_context.h"
#include "paddle/phi/common/amp_type_traits.h"
#include "paddle/phi/core/dense_tensor.h"
#include "paddle/phi/core/kernel_registry.h"
#include "paddle/phi/kernels/impl/digamma_grad_kernel_impl.h"
PD_REGISTER_KERNEL
(
digamma_grad
,
GPU
,
ALL_LAYOUT
,
phi
::
DigammaGradKernel
,
float
,
double
)
{}
PD_REGISTER_KERNEL
(
digamma_grad
,
GPU
,
ALL_LAYOUT
,
phi
::
DigammaGradKernel
,
float
,
double
,
phi
::
dtype
::
float16
,
phi
::
dtype
::
bfloat16
)
{}
paddle/phi/kernels/gpu/digamma_kernel.cu
浏览文件 @
7ecbcc08
...
...
@@ -15,10 +15,17 @@
#include "paddle/phi/kernels/digamma_kernel.h"
#include "paddle/phi/backends/gpu/gpu_context.h"
#include "paddle/phi/common/amp_type_traits.h"
#include "paddle/phi/common/scalar.h"
#include "paddle/phi/core/dense_tensor.h"
#include "paddle/phi/core/kernel_registry.h"
#include "paddle/phi/kernels/impl/digamma_kernel_impl.h"
PD_REGISTER_KERNEL
(
digamma
,
GPU
,
ALL_LAYOUT
,
phi
::
DigammaKernel
,
float
,
double
)
{}
PD_REGISTER_KERNEL
(
digamma
,
GPU
,
ALL_LAYOUT
,
phi
::
DigammaKernel
,
float
,
double
,
phi
::
dtype
::
float16
,
phi
::
dtype
::
bfloat16
)
{}
paddle/phi/kernels/gpu/dirichlet_kernel.cu
浏览文件 @
7ecbcc08
...
...
@@ -112,5 +112,11 @@ struct DirichletSampler<GPUContext, T> {
};
}
// namespace phi
PD_REGISTER_KERNEL
(
dirichlet
,
GPU
,
ALL_LAYOUT
,
phi
::
Dirichletkernel
,
float
,
double
)
{}
PD_REGISTER_KERNEL
(
dirichlet
,
GPU
,
ALL_LAYOUT
,
phi
::
Dirichletkernel
,
float
,
double
,
phi
::
dtype
::
float16
,
phi
::
dtype
::
bfloat16
)
{}
paddle/phi/kernels/impl/digamma_grad_kernel_impl.h
浏览文件 @
7ecbcc08
...
...
@@ -16,6 +16,7 @@
#include <unsupported/Eigen/SpecialFunctions>
#include "paddle/phi/common/amp_type_traits.h"
#include "paddle/phi/core/dense_tensor.h"
#include "paddle/phi/kernels/funcs/for_range.h"
...
...
@@ -27,7 +28,11 @@ struct DigammaGradFunctor {
:
dout_
(
dout
),
x_
(
x
),
output_
(
output
),
numel_
(
numel
)
{}
HOSTDEVICE
void
operator
()(
int64_t
idx
)
const
{
output_
[
idx
]
=
dout_
[
idx
]
*
Eigen
::
numext
::
polygamma
(
T
(
1
),
x_
[
idx
]);
using
MPType
=
typename
phi
::
dtype
::
MPTypeTrait
<
T
>::
Type
;
const
MPType
mp_dout
=
static_cast
<
MPType
>
(
dout_
[
idx
]);
const
MPType
mp_x
=
static_cast
<
MPType
>
(
x_
[
idx
]);
output_
[
idx
]
=
static_cast
<
T
>
(
mp_dout
*
Eigen
::
numext
::
polygamma
(
MPType
(
1
),
mp_x
));
}
private:
...
...
paddle/phi/kernels/impl/digamma_kernel_impl.h
浏览文件 @
7ecbcc08
...
...
@@ -16,6 +16,7 @@
#include <unsupported/Eigen/SpecialFunctions>
#include "paddle/phi/common/amp_type_traits.h"
#include "paddle/phi/core/dense_tensor.h"
#include "paddle/phi/kernels/funcs/for_range.h"
...
...
@@ -27,7 +28,9 @@ struct DigammaFunctor {
:
input_
(
input
),
output_
(
output
),
numel_
(
numel
)
{}
HOSTDEVICE
void
operator
()(
int64_t
idx
)
const
{
output_
[
idx
]
=
Eigen
::
numext
::
digamma
(
input_
[
idx
]);
using
MPType
=
typename
phi
::
dtype
::
MPTypeTrait
<
T
>::
Type
;
const
MPType
mp_input
=
static_cast
<
MPType
>
(
input_
[
idx
]);
output_
[
idx
]
=
static_cast
<
T
>
(
Eigen
::
numext
::
digamma
(
mp_input
));
}
private:
...
...
paddle/phi/kernels/impl/dirichlet_kernel_impl.h
浏览文件 @
7ecbcc08
...
...
@@ -16,6 +16,7 @@
#include <cmath>
#include <random>
#include "paddle/phi/common/amp_type_traits.h"
#include "paddle/phi/kernels/dirichlet_kernel.h"
// ROCM hcc doesn't work well with using std:: in kernel functions
...
...
@@ -47,7 +48,10 @@ template <typename ScalarT, typename SamplerT>
struct
BaseSampler
{
SamplerT
sampler_
;
HOSTDEVICE
BaseSampler
(
const
SamplerT
&
sampler
)
:
sampler_
(
sampler
)
{}
HOSTDEVICE
ScalarT
sample
()
{
return
sampler_
();
}
HOSTDEVICE
ScalarT
sample
()
{
// Sometimes convert float to float16/bfloat16
return
static_cast
<
ScalarT
>
(
sampler_
());
}
};
// `sample_gamma` is adapted from Numpy's distributions.c, and adds support for
...
...
@@ -83,33 +87,40 @@ HOSTDEVICE ScalarT
sample_gamma
(
ScalarT
alpha
,
BaseSampler
<
AccscalarT
,
UniformSamplerT
>
standard_uniform
,
BaseSampler
<
AccscalarT
,
NormalSamplerT
>
standard_normal
)
{
AccscalarT
scale
=
1.0
f
;
using
MPTypeScalar
=
typename
phi
::
dtype
::
MPTypeTrait
<
ScalarT
>::
Type
;
using
MPTypeAccscalar
=
typename
phi
::
dtype
::
MPTypeTrait
<
AccscalarT
>::
Type
;
MPTypeAccscalar
mp_scale
=
static_cast
<
MPTypeAccscalar
>
(
1.0
f
);
MPTypeScalar
mp_alpha
=
static_cast
<
MPTypeScalar
>
(
alpha
);
// Boost alpha for higher acceptance probability.
if
(
alpha
<
1.0
f
)
{
if
(
alpha
==
0.
f
)
return
0.
f
;
scale
*=
COMPAT_POW
(
1
-
standard_uniform
.
sample
(),
1.0
f
/
alpha
);
alpha
+=
1.0
f
;
if
(
mp_alpha
<
1.0
f
)
{
if
(
mp_alpha
==
0.
f
)
return
static_cast
<
ScalarT
>
(
0.
f
);
MPTypeAccscalar
mp_sample
=
static_cast
<
MPTypeAccscalar
>
(
standard_uniform
.
sample
());
mp_scale
*=
COMPAT_POW
(
1
-
mp_sample
,
1.0
f
/
mp_alpha
);
mp_alpha
+=
1.0
f
;
}
// This implements the acceptance-rejection method of Marsaglia and Tsang
// (2000)
// doi:10.1145/358407.358414
const
AccscalarT
d
=
alpha
-
1.0
f
/
3.0
f
;
const
AccscalarT
c
=
1.0
f
/
COMPAT_SQRT
(
9.0
f
*
d
);
const
MPTypeAccscalar
d
=
mp_
alpha
-
1.0
f
/
3.0
f
;
const
MPTypeAccscalar
c
=
1.0
f
/
COMPAT_SQRT
(
9.0
f
*
d
);
for
(;;)
{
AccscalarT
x
,
y
;
MPTypeAccscalar
x
,
y
;
do
{
x
=
sta
ndard_normal
.
sample
(
);
x
=
sta
tic_cast
<
MPTypeAccscalar
>
(
standard_normal
.
sample
()
);
y
=
1.0
f
+
c
*
x
;
}
while
(
y
<=
0
);
const
AccscalarT
v
=
y
*
y
*
y
;
const
AccscalarT
u
=
1
-
standard_uniform
.
sample
();
const
AccscalarT
xx
=
x
*
x
;
const
MPTypeAccscalar
v
=
y
*
y
*
y
;
const
MPTypeAccscalar
u
=
1
-
static_cast
<
MPTypeAccscalar
>
(
standard_uniform
.
sample
());
const
MPTypeAccscalar
xx
=
x
*
x
;
if
(
u
<
1.0
f
-
0.0331
f
*
xx
*
xx
)
return
static_cast
<
ScalarT
>
(
scale
*
d
*
v
);
return
static_cast
<
ScalarT
>
(
mp_
scale
*
d
*
v
);
if
(
COMPAT_LOG
(
u
)
<
0.5
f
*
xx
+
d
*
(
1.0
f
-
v
+
COMPAT_LOG
(
v
)))
return
static_cast
<
ScalarT
>
(
scale
*
d
*
v
);
return
static_cast
<
ScalarT
>
(
mp_
scale
*
d
*
v
);
}
}
...
...
python/paddle/distribution/dirichlet.py
浏览文件 @
7ecbcc08
...
...
@@ -164,7 +164,10 @@ def _dirichlet(concentration, name=None):
else
:
op_type
=
'dirichlet'
check_variable_and_dtype
(
concentration
,
'concentration'
,
[
'float32'
,
'float64'
],
op_type
concentration
,
'concentration'
,
[
'float16'
,
'float32'
,
'float64'
,
'uint16'
],
op_type
,
)
helper
=
LayerHelper
(
op_type
,
**
locals
())
out
=
helper
.
create_variable_for_type_inference
(
...
...
python/paddle/fluid/tests/unittests/distribution/test_dirichlet_op.py
浏览文件 @
7ecbcc08
...
...
@@ -20,7 +20,15 @@ import scipy.stats
import
paddle
sys
.
path
.
append
(
"../"
)
from
eager_op_test
import
OpTest
import
unittest
from
eager_op_test
import
(
OpTest
,
convert_float_to_uint16
,
convert_uint16_to_float
,
)
from
paddle.fluid
import
core
paddle
.
enable_static
()
...
...
@@ -52,3 +60,89 @@ class TestDirichletOp(OpTest):
)[
0
],
0.01
,
)
class
TestDirichletFP16Op
(
OpTest
):
# Dirichlet random sampling has no gradient, so the gradient check is skipped.
no_need_check_grad
=
True
def
setUp
(
self
):
self
.
op_type
=
"dirichlet"
self
.
alpha
=
np
.
array
((
1.0
,
2.0
))
self
.
sample_shape
=
(
100000
,
2
)
self
.
dtype
=
np
.
float16
self
.
inputs
=
{
'Alpha'
:
np
.
broadcast_to
(
self
.
alpha
,
self
.
sample_shape
).
astype
(
self
.
dtype
)
}
self
.
attrs
=
{}
self
.
outputs
=
{
'Out'
:
np
.
zeros
(
self
.
sample_shape
).
astype
(
self
.
dtype
)}
def
test_check_output
(
self
):
self
.
check_output_customized
(
self
.
_hypothesis_testing
)
def
_hypothesis_testing
(
self
,
outs
):
self
.
assertEqual
(
outs
[
0
].
shape
,
self
.
sample_shape
)
self
.
assertTrue
(
np
.
all
(
outs
[
0
]
>
0.0
))
self
.
assertLess
(
scipy
.
stats
.
kstest
(
outs
[
0
][:,
0
],
# scipy's dirichlet has no cdf, so the equivalent beta distribution is used instead.
scipy
.
stats
.
beta
(
a
=
self
.
alpha
[
0
],
b
=
self
.
alpha
[
1
]).
cdf
,
)[
0
],
0.01
,
)
@
unittest
.
skipIf
(
not
core
.
is_compiled_with_cuda
()
or
not
core
.
is_bfloat16_supported
(
core
.
CUDAPlace
(
0
)),
"core is not complied with CUDA and not support the bfloat16"
,
)
class
TestDirichletBF16Op
(
OpTest
):
# Dirichlet random sampling has no gradient, so the gradient check is skipped.
no_need_check_grad
=
True
def
setUp
(
self
):
self
.
op_type
=
"dirichlet"
self
.
alpha
=
np
.
array
((
1.0
,
2.0
))
self
.
sample_shape
=
(
10000
,
2
)
self
.
dtype
=
np
.
uint16
self
.
np_dtype
=
np
.
float32
self
.
inputs
=
{
'Alpha'
:
np
.
broadcast_to
(
self
.
alpha
,
self
.
sample_shape
).
astype
(
self
.
np_dtype
)
}
self
.
attrs
=
{}
self
.
outputs
=
{
'Out'
:
np
.
zeros
(
self
.
sample_shape
).
astype
(
self
.
np_dtype
)
}
self
.
inputs
[
'Alpha'
]
=
convert_float_to_uint16
(
self
.
inputs
[
'Alpha'
])
self
.
outputs
[
'Out'
]
=
convert_float_to_uint16
(
self
.
outputs
[
'Out'
])
self
.
place
=
core
.
CUDAPlace
(
0
)
def
test_check_output
(
self
):
self
.
check_output_with_place_customized
(
self
.
_hypothesis_testing
,
place
=
core
.
CUDAPlace
(
0
)
)
def
_hypothesis_testing
(
self
,
outs
):
outs
=
convert_uint16_to_float
(
outs
)
self
.
assertEqual
(
outs
[
0
].
shape
,
self
.
sample_shape
)
self
.
assertTrue
(
np
.
all
(
outs
[
0
]
>
0.0
))
self
.
assertLess
(
scipy
.
stats
.
kstest
(
outs
[
0
][:,
0
],
# scipy's dirichlet has no cdf, so the equivalent beta distribution is used instead.
scipy
.
stats
.
beta
(
a
=
self
.
alpha
[
0
],
b
=
self
.
alpha
[
1
]).
cdf
,
)[
0
],
0.3
,
# The bfloat16 test difference is below 0.3
)
if
__name__
==
'__main__'
:
unittest
.
main
()
python/paddle/fluid/tests/unittests/test_digamma_op.py
浏览文件 @
7ecbcc08
...
...
@@ -15,11 +15,12 @@
import
unittest
import
numpy
as
np
from
eager_op_test
import
OpTest
from
eager_op_test
import
OpTest
,
convert_float_to_uint16
from
scipy.special
import
psi
import
paddle
from
paddle
import
fluid
,
static
from
paddle.fluid
import
core
class
TestDigammaOp
(
OpTest
):
...
...
@@ -55,6 +56,43 @@ class TestDigammaOpFp32(TestDigammaOp):
self
.
check_grad
([
'X'
],
'Out'
)
class
TestDigammaFP16Op
(
TestDigammaOp
):
def
init_dtype_type
(
self
):
self
.
dtype
=
np
.
float16
@
unittest
.
skipIf
(
not
core
.
is_compiled_with_cuda
()
or
not
core
.
is_bfloat16_supported
(
core
.
CUDAPlace
(
0
)),
"core is not compiled with CUDA or not support bfloat16"
,
)
class
TestDigammaBF16Op
(
OpTest
):
def
setUp
(
self
):
# switch to static
paddle
.
enable_static
()
self
.
op_type
=
'digamma'
self
.
python_api
=
paddle
.
digamma
self
.
init_dtype_type
()
shape
=
(
5
,
32
)
data
=
np
.
random
.
random
(
shape
).
astype
(
self
.
np_dtype
)
+
1
self
.
inputs
=
{
'X'
:
convert_float_to_uint16
(
data
)}
result
=
np
.
ones
(
shape
).
astype
(
self
.
np_dtype
)
result
=
psi
(
data
)
self
.
outputs
=
{
'Out'
:
convert_float_to_uint16
(
result
)}
def
init_dtype_type
(
self
):
self
.
dtype
=
np
.
uint16
self
.
np_dtype
=
np
.
float32
def
test_check_output
(
self
):
# bfloat16 needs to set the parameter place
self
.
check_output_with_place
(
core
.
CUDAPlace
(
0
))
def
test_check_grad_normal
(
self
):
self
.
check_grad_with_place
(
core
.
CUDAPlace
(
0
),
[
'X'
],
'Out'
)
class
TestDigammaAPI
(
unittest
.
TestCase
):
def
setUp
(
self
):
# switch to static
...
...
python/paddle/tensor/math.py
浏览文件 @
7ecbcc08
...
...
@@ -4041,7 +4041,9 @@ def digamma(x, name=None):
if
in_dygraph_mode
():
return
_C_ops
.
digamma
(
x
)
else
:
check_variable_and_dtype
(
x
,
'x'
,
[
'float32'
,
'float64'
],
'digamma'
)
check_variable_and_dtype
(
x
,
'x'
,
[
'float16'
,
'float32'
,
'float64'
,
'uint16'
],
'digamma'
)
helper
=
LayerHelper
(
'digamma'
,
**
locals
())
out
=
helper
.
create_variable_for_type_inference
(
x
.
dtype
)
helper
.
append_op
(
type
=
'digamma'
,
inputs
=
{
'X'
:
x
},
outputs
=
{
'Out'
:
out
})
...
...
编辑
预览
Markdown
is supported
0%
请重试
或
添加新附件
.
添加附件
取消
You are about to add
0
people
to the discussion. Proceed with caution.
先完成此消息的编辑!
取消
想要评论请
注册
或
登录