Skip to content
体验新版
项目
组织
正在加载...
登录
切换导航
打开侧边栏
Oneflow-Inc
oneflow
提交
e6ed2355
O
oneflow
项目概览
Oneflow-Inc
/
oneflow
上一次同步 接近 3 年
通知
13
Star
2733
Fork
0
代码
文件
提交
分支
Tags
贡献者
分支图
Diff
Issue
0
列表
看板
标记
里程碑
合并请求
0
DevOps
流水线
流水线任务
计划
Wiki
0
Wiki
分析
仓库
DevOps
项目成员
Pages
O
oneflow
项目概览
项目概览
详情
发布
仓库
仓库
文件
提交
分支
标签
贡献者
分支图
比较
Issue
0
Issue
0
列表
看板
标记
里程碑
合并请求
0
合并请求
0
Pages
DevOps
DevOps
流水线
流水线任务
计划
分析
分析
仓库分析
DevOps
Wiki
0
Wiki
成员
成员
收起侧边栏
关闭侧边栏
动态
分支图
创建新Issue
流水线任务
提交
Issue看板
体验新版 GitCode,发现更多精彩内容 >>
提交
e6ed2355
编写于
1月 15, 2021
作者:
S
simonJJJ
浏览文件
操作
浏览文件
下载
电子邮件补丁
差异文件
add testcase
Former-commit-id: b17a045f14c71870cbd31ad388e574bcec089c0f
上级
ecf7a7f8
变更
1
隐藏空白更改
内联
并排
Showing
1 changed file
with
73 addition
and
0 deletion
+73
-0
oneflow/python/test/ops/test_optimizers.py
oneflow/python/test/ops/test_optimizers.py
+73
-0
未找到文件。
oneflow/python/test/ops/test_optimizers.py
浏览文件 @
e6ed2355
...
...
@@ -473,6 +473,68 @@ def compare_with_tensorflow_sgd(
assert
np
.
allclose
(
x
.
flatten
(),
var
.
numpy
().
flatten
(),
rtol
=
1e-4
,
atol
=
1e-4
,)
def
compare_with_tensorflow_sgd_secondary_lr
(
device_type
,
x_shape
,
momentum
,
primary_lr
,
secondary_lr
,
train_iters
):
assert
device_type
in
[
"gpu"
,
"cpu"
]
flow
.
clear_default_session
()
func_config
=
flow
.
FunctionConfig
()
func_config
.
default_data_type
(
flow
.
float32
)
@
flow
.
global_function
(
type
=
"train"
,
function_config
=
func_config
)
def
testSGD
(
random_mask
:
flow
.
typing
.
Numpy
.
Placeholder
(
x_shape
,
dtype
=
flow
.
float32
)
)
->
flow
.
typing
.
Numpy
:
with
flow
.
scope
.
placement
(
device_type
,
"0:0-0"
):
x
=
flow
.
get_variable
(
name
=
"x"
,
shape
=
x_shape
,
dtype
=
flow
.
float32
,
initializer
=
flow
.
random_uniform_initializer
(
minval
=
0
,
maxval
=
100
),
trainable
=
True
,
model_name
=
"bias"
,
)
loss
=
flow
.
math
.
reduce_sum
(
x
*
random_mask
)
flow
.
optimizer
.
SGD
(
flow
.
optimizer
.
PiecewiseScalingScheduler
(
base_lr
=
primary_lr
,
secondary_lr
=
secondary_lr
,
boundaries
=
[],
scale
=
1
,
),
momentum
=
momentum
,
).
minimize
(
loss
)
return
x
checkpoint
=
flow
.
train
.
CheckPoint
()
checkpoint
.
init
()
# generate random number sequences
random_masks_seq
=
[]
for
i
in
range
(
train_iters
+
1
):
random_masks_seq
.
append
(
np
.
random
.
uniform
(
size
=
x_shape
).
astype
(
np
.
float32
))
init_value
=
None
for
i
in
range
(
train_iters
+
1
):
x
=
testSGD
(
random_masks_seq
[
i
])
if
i
==
0
:
init_value
=
np
.
copy
(
x
)
var
=
tf
.
Variable
(
init_value
)
opt
=
tf
.
keras
.
optimizers
.
SGD
(
learning_rate
=
secondary_lr
,
momentum
=
momentum
,
nesterov
=
False
)
for
i
in
range
(
train_iters
):
with
tf
.
GradientTape
()
as
tape
:
random_mask
=
tf
.
Variable
(
random_masks_seq
[
i
])
loss
=
tf
.
reduce_sum
(
var
*
random_mask
)
gradients
=
tape
.
gradient
(
loss
,
var
)
opt
.
apply_gradients
(
zip
([
gradients
],
[
var
]))
assert
np
.
allclose
(
x
.
flatten
(),
var
.
numpy
().
flatten
(),
rtol
=
1e-4
,
atol
=
1e-4
,)
def
unique_grads
(
sparse_ids
,
sparse_grads
):
num_ids
=
np
.
prod
(
sparse_ids
.
shape
)
sparse_grads_shape
=
(
num_ids
,)
+
sparse_grads
.
shape
[
len
(
sparse_ids
.
shape
)
:]
...
...
@@ -1052,6 +1114,17 @@ class TestOptimizers(flow.unittest.TestCase):
for
arg
in
GenArgList
(
arg_dict
):
compare_with_tensorflow_sgd
(
*
arg
)
def
test_sgd_secondary_lr
(
test_case
):
arg_dict
=
OrderedDict
()
arg_dict
[
"device_type"
]
=
[
"cpu"
,
"gpu"
]
arg_dict
[
"x_shape"
]
=
[(
10
,)]
arg_dict
[
"momentum"
]
=
[
0.9
,
0.0
]
arg_dict
[
"primary_lr"
]
=
[
1
]
arg_dict
[
"secondary_lr"
]
=
[
2
]
arg_dict
[
"train_iters"
]
=
[
10
]
for
arg
in
GenArgList
(
arg_dict
):
compare_with_tensorflow_sgd_secondary_lr
(
*
arg
)
def
test_indexed_slices_sgd
(
test_case
):
arg_dict
=
OrderedDict
()
arg_dict
[
"device_type"
]
=
[
"gpu"
,
"cpu"
]
...
...
编辑
预览
Markdown
is supported
0%
请重试
或
添加新附件
.
添加附件
取消
You are about to add
0
people
to the discussion. Proceed with caution.
先完成此消息的编辑!
取消
想要评论请
注册
或
登录