Skip to content
体验新版
项目
组织
正在加载...
登录
切换导航
打开侧边栏
PaddlePaddle
Paddle
提交
2aedd9db
P
Paddle
项目概览
PaddlePaddle
/
Paddle
1 年多 前同步成功
通知
2302
Star
20931
Fork
5422
代码
文件
提交
分支
Tags
贡献者
分支图
Diff
Issue
1423
列表
看板
标记
里程碑
合并请求
543
Wiki
0
Wiki
分析
仓库
DevOps
项目成员
Pages
P
Paddle
项目概览
项目概览
详情
发布
仓库
仓库
文件
提交
分支
标签
贡献者
分支图
比较
Issue
1,423
Issue
1,423
列表
看板
标记
里程碑
合并请求
543
合并请求
543
Pages
分析
分析
仓库分析
DevOps
Wiki
0
Wiki
成员
成员
收起侧边栏
关闭侧边栏
动态
分支图
创建新Issue
提交
Issue看板
未验证
提交
2aedd9db
编写于
5月 08, 2023
作者:
zhouweiwei2014
提交者:
GitHub
5月 08, 2023
浏览文件
操作
浏览文件
下载
电子邮件补丁
差异文件
[BUG] fix paddle.to_tensor/Tensor.item/Tensor.numpy BF16 bug (#53567)
上级
0a59825e
变更
7
显示空白变更内容
内联
并排
Showing
7 changed file
with
73 addition
and
37 deletion
+73
-37
paddle/fluid/pybind/eager_method.cc
paddle/fluid/pybind/eager_method.cc
+1
-3
python/paddle/fluid/data_feeder.py
python/paddle/fluid/data_feeder.py
+14
-9
python/paddle/fluid/dygraph/tensor_patch_methods.py
python/paddle/fluid/dygraph/tensor_patch_methods.py
+8
-2
python/paddle/fluid/tests/unittests/test_var_base.py
python/paddle/fluid/tests/unittests/test_var_base.py
+25
-1
python/paddle/framework/framework.py
python/paddle/framework/framework.py
+2
-2
python/paddle/hapi/progressbar.py
python/paddle/hapi/progressbar.py
+0
-2
python/paddle/tensor/creation.py
python/paddle/tensor/creation.py
+23
-18
未找到文件。
paddle/fluid/pybind/eager_method.cc
浏览文件 @
2aedd9db
...
@@ -1079,13 +1079,11 @@ static PyObject* tensor__getitem_from_offset(TensorObject* self,
...
@@ -1079,13 +1079,11 @@ static PyObject* tensor__getitem_from_offset(TensorObject* self,
T b = paddle::pybind::TensorGetElement<T>(tensor, offset); \
T b = paddle::pybind::TensorGetElement<T>(tensor, offset); \
Py_intptr_t py_dims[paddle::framework::DDim::kMaxRank]; \
Py_intptr_t py_dims[paddle::framework::DDim::kMaxRank]; \
Py_intptr_t py_strides[paddle::framework::DDim::kMaxRank]; \
Py_intptr_t py_strides[paddle::framework::DDim::kMaxRank]; \
py_dims[0] = 1; \
py_strides[0] = 1; \
auto& api = pybind11::detail::npy_api::get(); \
auto& api = pybind11::detail::npy_api::get(); \
PyObject* array = api.PyArray_NewFromDescr_( \
PyObject* array = api.PyArray_NewFromDescr_( \
api.PyArray_Type_, \
api.PyArray_Type_, \
api.PyArray_DescrFromType_(numpy_dtype), \
api.PyArray_DescrFromType_(numpy_dtype), \
1
, \
0
, \
py_dims, \
py_dims, \
py_strides, \
py_strides, \
nullptr, \
nullptr, \
...
...
python/paddle/fluid/data_feeder.py
浏览文件 @
2aedd9db
...
@@ -46,10 +46,6 @@ _PADDLE_DTYPE_2_NUMPY_DTYPE = {
...
@@ -46,10 +46,6 @@ _PADDLE_DTYPE_2_NUMPY_DTYPE = {
}
}
def
copy_bits_from_float_to_uint16
(
f
):
return
struct
.
unpack
(
'<I'
,
struct
.
pack
(
'<f'
,
f
))[
0
]
>>
16
def
convert_float_to_uint16
(
data
,
data_format
=
"NCHW"
):
def
convert_float_to_uint16
(
data
,
data_format
=
"NCHW"
):
if
data
.
size
==
0
:
if
data
.
size
==
0
:
return
data
.
view
(
np
.
uint16
)
return
data
.
view
(
np
.
uint16
)
...
@@ -57,16 +53,25 @@ def convert_float_to_uint16(data, data_format="NCHW"):
...
@@ -57,16 +53,25 @@ def convert_float_to_uint16(data, data_format="NCHW"):
if
data_format
==
"NHWC"
:
if
data_format
==
"NHWC"
:
data
=
np
.
transpose
(
data
,
[
0
,
3
,
1
,
2
])
data
=
np
.
transpose
(
data
,
[
0
,
3
,
1
,
2
])
new_data
=
[]
new_data
=
np
.
vectorize
(
for
x
in
np
.
nditer
(
data
):
lambda
x
:
struct
.
unpack
(
'<I'
,
struct
.
pack
(
'<f'
,
x
))[
0
]
>>
16
,
new_data
.
append
(
np
.
uint16
(
copy_bits_from_float_to_uint16
(
x
)))
otypes
=
[
np
.
uint16
],
new_data
=
np
.
reshape
(
new_data
,
data
.
shape
).
view
(
np
.
uint16
)
)(
data
.
flat
)
new_data
=
np
.
reshape
(
new_data
,
data
.
shape
)
if
data_format
==
"NHWC"
:
if
data_format
==
"NHWC"
:
new_data
=
np
.
transpose
(
new_
output
,
[
0
,
2
,
3
,
1
])
new_data
=
np
.
transpose
(
new_
data
,
[
0
,
2
,
3
,
1
])
return
new_data
return
new_data
def
convert_uint16_to_float
(
data
):
new_data
=
np
.
vectorize
(
lambda
x
:
struct
.
unpack
(
'<f'
,
struct
.
pack
(
'<I'
,
x
<<
16
))[
0
],
otypes
=
[
np
.
float32
],
)(
data
.
flat
)
return
np
.
reshape
(
new_data
,
data
.
shape
)
def
convert_dtype
(
dtype
):
def
convert_dtype
(
dtype
):
if
isinstance
(
dtype
,
core
.
VarDesc
.
VarType
):
if
isinstance
(
dtype
,
core
.
VarDesc
.
VarType
):
if
dtype
in
_PADDLE_DTYPE_2_NUMPY_DTYPE
:
if
dtype
in
_PADDLE_DTYPE_2_NUMPY_DTYPE
:
...
...
python/paddle/fluid/dygraph/tensor_patch_methods.py
浏览文件 @
2aedd9db
...
@@ -33,7 +33,10 @@ from ..framework import (
...
@@ -33,7 +33,10 @@ from ..framework import (
)
)
from
.base
import
switch_to_static_graph
from
.base
import
switch_to_static_graph
from
.math_op_patch
import
monkey_patch_math_tensor
from
.math_op_patch
import
monkey_patch_math_tensor
from
paddle.fluid.data_feeder
import
convert_dtype
,
_PADDLE_DTYPE_2_NUMPY_DTYPE
from
paddle.fluid.data_feeder
import
(
convert_uint16_to_float
,
_PADDLE_DTYPE_2_NUMPY_DTYPE
,
)
import
paddle.utils.deprecated
as
deprecated
import
paddle.utils.deprecated
as
deprecated
import
paddle.profiler
as
profiler
import
paddle.profiler
as
profiler
from
paddle.profiler.utils
import
in_profiler_mode
from
paddle.profiler.utils
import
in_profiler_mode
...
@@ -614,7 +617,10 @@ def monkey_patch_tensor():
...
@@ -614,7 +617,10 @@ def monkey_patch_tensor():
print(x.item(0, 2)) #3.3
print(x.item(0, 2)) #3.3
"""
"""
return
self
.
_getitem_from_offset
(
*
args
).
item
()
scalar
=
self
.
_getitem_from_offset
(
*
args
)
if
scalar
.
dtype
==
np
.
uint16
:
return
convert_uint16_to_float
(
scalar
).
item
()
return
scalar
.
item
()
@
property
@
property
def
inplace_version
(
self
):
def
inplace_version
(
self
):
...
...
python/paddle/fluid/tests/unittests/test_var_base.py
浏览文件 @
2aedd9db
...
@@ -246,10 +246,12 @@ class TestVarBase(unittest.TestCase):
...
@@ -246,10 +246,12 @@ class TestVarBase(unittest.TestCase):
np
.
testing
.
assert_array_equal
(
x
.
numpy
(),
numpy_array
)
np
.
testing
.
assert_array_equal
(
x
.
numpy
(),
numpy_array
)
self
.
assertEqual
(
x
.
type
,
core
.
VarDesc
.
VarType
.
LOD_TENSOR
)
self
.
assertEqual
(
x
.
type
,
core
.
VarDesc
.
VarType
.
LOD_TENSOR
)
# test dtype
bfloat16
# test dtype
=
bfloat16
x
=
paddle
.
to_tensor
(
-
1e6
,
dtype
=
paddle
.
bfloat16
)
x
=
paddle
.
to_tensor
(
-
1e6
,
dtype
=
paddle
.
bfloat16
)
self
.
assertEqual
(
x
.
dtype
,
core
.
VarDesc
.
VarType
.
BF16
)
self
.
assertEqual
(
x
.
dtype
,
core
.
VarDesc
.
VarType
.
BF16
)
self
.
assertTrue
(
x
==
-
999424.0
)
self
.
assertTrue
(
x
==
-
999424.0
)
self
.
assertTrue
(
x
.
item
()
==
-
999424.0
)
self
.
assertTrue
(
isinstance
(
x
.
item
(),
float
))
x
=
paddle
.
to_tensor
([
-
1e6
,
-
1e6
,
-
1e6
],
dtype
=
'bfloat16'
)
x
=
paddle
.
to_tensor
([
-
1e6
,
-
1e6
,
-
1e6
],
dtype
=
'bfloat16'
)
self
.
assertEqual
(
x
.
dtype
,
core
.
VarDesc
.
VarType
.
BF16
)
self
.
assertEqual
(
x
.
dtype
,
core
.
VarDesc
.
VarType
.
BF16
)
...
@@ -266,6 +268,28 @@ class TestVarBase(unittest.TestCase):
...
@@ -266,6 +268,28 @@ class TestVarBase(unittest.TestCase):
y
.
backward
()
y
.
backward
()
self
.
assertTrue
(
x
.
grad
==
-
999424.0
*
2
)
self
.
assertTrue
(
x
.
grad
==
-
999424.0
*
2
)
# test default_type=bfloat16
paddle
.
set_default_dtype
(
'bfloat16'
)
x
=
paddle
.
to_tensor
(
-
1e6
)
self
.
assertEqual
(
x
.
dtype
,
core
.
VarDesc
.
VarType
.
BF16
)
self
.
assertTrue
(
x
==
-
999424.0
)
self
.
assertTrue
(
x
.
item
()
==
-
999424.0
)
self
.
assertTrue
(
isinstance
(
x
.
item
(),
float
))
x
=
paddle
.
to_tensor
([
-
1e6
,
-
1e6
,
-
1e6
])
self
.
assertEqual
(
x
.
dtype
,
core
.
VarDesc
.
VarType
.
BF16
)
self
.
assertTrue
(
x
[
0
]
==
-
999424.0
)
self
.
assertTrue
(
x
[
1
]
==
-
999424.0
)
self
.
assertTrue
(
x
[
2
]
==
-
999424.0
)
x
=
paddle
.
to_tensor
(
-
1e6
,
stop_gradient
=
False
)
self
.
assertEqual
(
x
.
dtype
,
core
.
VarDesc
.
VarType
.
BF16
)
self
.
assertTrue
(
x
==
-
999424.0
)
y
=
x
*
x
y
.
backward
()
self
.
assertTrue
(
x
.
grad
==
-
999424.0
*
2
)
paddle
.
set_default_dtype
(
'float32'
)
with
self
.
assertRaises
(
ValueError
):
with
self
.
assertRaises
(
ValueError
):
paddle
.
randn
([
3
,
2
,
2
]).
item
()
paddle
.
randn
([
3
,
2
,
2
]).
item
()
with
self
.
assertRaises
(
ValueError
):
with
self
.
assertRaises
(
ValueError
):
...
...
python/paddle/framework/framework.py
浏览文件 @
2aedd9db
...
@@ -40,7 +40,7 @@ def set_default_dtype(d):
...
@@ -40,7 +40,7 @@ def set_default_dtype(d):
"""
"""
if
isinstance
(
d
,
type
):
if
isinstance
(
d
,
type
):
# This branch is for
NumPy scalar types
# This branch is for
np.dtype
if
d
in
[
np
.
float16
,
np
.
float32
,
np
.
float64
]:
if
d
in
[
np
.
float16
,
np
.
float32
,
np
.
float64
]:
d
=
d
.
__name__
d
=
d
.
__name__
else
:
else
:
...
@@ -49,7 +49,7 @@ def set_default_dtype(d):
...
@@ -49,7 +49,7 @@ def set_default_dtype(d):
", but received %s"
%
d
.
__name__
", but received %s"
%
d
.
__name__
)
)
else
:
else
:
# This branch is for
np.dtype and
str
# This branch is for str
if
d
in
[
'float16'
,
'float32'
,
'float64'
,
'bfloat16'
]:
if
d
in
[
'float16'
,
'float32'
,
'float64'
,
'bfloat16'
]:
# NOTE(SigureMo): Since the np.dtype object is not an instance of
# NOTE(SigureMo): Since the np.dtype object is not an instance of
# type, so it will not be handled by the previous branch. We need
# type, so it will not be handled by the previous branch. We need
...
...
python/paddle/hapi/progressbar.py
浏览文件 @
2aedd9db
...
@@ -83,8 +83,6 @@ class ProgressBar:
...
@@ -83,8 +83,6 @@ class ProgressBar:
if
k
==
"loss"
:
if
k
==
"loss"
:
if
isinstance
(
val
,
list
):
if
isinstance
(
val
,
list
):
scalar_val
=
val
[
0
]
scalar_val
=
val
[
0
]
elif
isinstance
(
val
,
np
.
ndarray
):
scalar_val
=
val
.
item
()
else
:
else
:
scalar_val
=
val
scalar_val
=
val
if
isinstance
(
scalar_val
,
np
.
uint16
):
if
isinstance
(
scalar_val
,
np
.
uint16
):
...
...
python/paddle/tensor/creation.py
浏览文件 @
2aedd9db
...
@@ -542,18 +542,28 @@ def logspace(start, stop, num, base=10.0, dtype=None, name=None):
...
@@ -542,18 +542,28 @@ def logspace(start, stop, num, base=10.0, dtype=None, name=None):
def
_to_tensor_non_static
(
data
,
dtype
=
None
,
place
=
None
,
stop_gradient
=
True
):
def
_to_tensor_non_static
(
data
,
dtype
=
None
,
place
=
None
,
stop_gradient
=
True
):
def
_handle_tensor_dtype
(
tensor
,
dtype
):
if
dtype
:
if
convert_dtype
(
dtype
)
!=
convert_dtype
(
tensor
.
dtype
):
return
tensor
.
astype
(
convert_dtype
(
dtype
))
return
tensor
def
_handle_np_dtype
(
ndarray
,
dtype
):
if
dtype
:
if
convert_dtype
(
dtype
)
!=
convert_dtype
(
ndarray
.
dtype
):
# should not ndarray.astype('uint16') directly, data bits is wrong
if
convert_dtype
(
dtype
)
in
[
'uint16'
]:
return
convert_float_to_uint16
(
ndarray
.
astype
(
'float32'
))
else
:
return
ndarray
.
astype
(
convert_dtype
(
dtype
))
return
ndarray
if
isinstance
(
data
,
np
.
number
):
# Special case for numpy scalars
if
isinstance
(
data
,
np
.
number
):
# Special case for numpy scalars
data
=
np
.
array
(
data
)
data
=
np
.
array
(
data
)
if
not
isinstance
(
data
,
np
.
ndarray
):
if
not
isinstance
(
data
,
np
.
ndarray
):
def
_handle_dtype
(
data
,
dtype
):
if
dtype
:
if
convert_dtype
(
dtype
)
!=
convert_dtype
(
data
.
dtype
):
return
data
.
astype
(
convert_dtype
(
dtype
))
return
data
if
np
.
isscalar
(
data
)
and
not
isinstance
(
data
,
str
):
if
np
.
isscalar
(
data
)
and
not
isinstance
(
data
,
str
):
data
=
np
.
array
(
data
)
data
=
np
.
array
(
data
)
elif
isinstance
(
data
,
(
list
,
tuple
)):
elif
isinstance
(
data
,
(
list
,
tuple
)):
...
@@ -565,12 +575,12 @@ def _to_tensor_non_static(data, dtype=None, place=None, stop_gradient=True):
...
@@ -565,12 +575,12 @@ def _to_tensor_non_static(data, dtype=None, place=None, stop_gradient=True):
)
)
elif
isinstance
(
data
,
paddle
.
Tensor
)
and
not
in_dygraph_mode
():
elif
isinstance
(
data
,
paddle
.
Tensor
)
and
not
in_dygraph_mode
():
data
=
data
.
_copy_to
(
place
,
False
)
data
=
data
.
_copy_to
(
place
,
False
)
data
=
_handle_dtype
(
data
,
dtype
)
data
=
_handle_
tensor_
dtype
(
data
,
dtype
)
data
.
stop_gradient
=
stop_gradient
data
.
stop_gradient
=
stop_gradient
return
data
return
data
elif
isinstance
(
data
,
core
.
eager
.
Tensor
)
and
in_dygraph_mode
():
elif
isinstance
(
data
,
core
.
eager
.
Tensor
)
and
in_dygraph_mode
():
data
=
data
.
_copy_to
(
place
,
False
)
data
=
data
.
_copy_to
(
place
,
False
)
data
=
_handle_dtype
(
data
,
dtype
)
data
=
_handle_
tensor_
dtype
(
data
,
dtype
)
data
.
stop_gradient
=
stop_gradient
data
.
stop_gradient
=
stop_gradient
return
data
return
data
elif
isinstance
(
data
,
(
core
.
LoDTensor
,
core
.
Tensor
)):
elif
isinstance
(
data
,
(
core
.
LoDTensor
,
core
.
Tensor
)):
...
@@ -583,7 +593,7 @@ def _to_tensor_non_static(data, dtype=None, place=None, stop_gradient=True):
...
@@ -583,7 +593,7 @@ def _to_tensor_non_static(data, dtype=None, place=None, stop_gradient=True):
data
=
paddle
.
Tensor
(
data
)
data
=
paddle
.
Tensor
(
data
)
if
not
data
.
place
.
_equals
(
place
):
if
not
data
.
place
.
_equals
(
place
):
data
=
data
.
_copy_to
(
place
,
False
)
data
=
data
.
_copy_to
(
place
,
False
)
data
=
_handle_dtype
(
data
,
dtype
)
data
=
_handle_
tensor_
dtype
(
data
,
dtype
)
data
.
stop_gradient
=
stop_gradient
data
.
stop_gradient
=
stop_gradient
return
data
return
data
else
:
else
:
...
@@ -607,18 +617,13 @@ def _to_tensor_non_static(data, dtype=None, place=None, stop_gradient=True):
...
@@ -607,18 +617,13 @@ def _to_tensor_non_static(data, dtype=None, place=None, stop_gradient=True):
if
default_type
in
[
'float16'
,
'float32'
]
if
default_type
in
[
'float16'
,
'float32'
]
else
'complex128'
else
'complex128'
)
)
data
=
data
.
astype
(
default_type
)
data
=
_handle_np_dtype
(
data
,
default_type
)
# Windows default type is 'int32', while Linux/Mac is 'int64'. Unify they.
# Windows default type is 'int32', while Linux/Mac is 'int64'. Unify they.
if
data
.
dtype
in
[
'int32'
]:
if
data
.
dtype
in
[
'int32'
]:
default_type
=
"int64"
data
=
data
.
astype
(
"int64"
)
data
=
data
.
astype
(
default_type
)
if
dtype
and
convert_dtype
(
dtype
)
!=
data
.
dtype
:
if
dtype
:
if
convert_dtype
(
dtype
)
in
[
'uint16'
]:
data
=
_handle_np_dtype
(
data
,
dtype
)
# should not ndarray.astype('uint16') directly, data bits is wrong
data
=
convert_float_to_uint16
(
data
.
astype
(
'float32'
))
else
:
data
=
data
.
astype
(
convert_dtype
(
dtype
))
if
_in_eager_without_dygraph_check
()
and
isinstance
(
data
,
np
.
ndarray
):
if
_in_eager_without_dygraph_check
()
and
isinstance
(
data
,
np
.
ndarray
):
return
core
.
eager
.
Tensor
(
return
core
.
eager
.
Tensor
(
...
...
编辑
预览
Markdown
is supported
0%
请重试
或
添加新附件
.
添加附件
取消
You are about to add
0
people
to the discussion. Proceed with caution.
先完成此消息的编辑!
取消
想要评论请
注册
或
登录