Skip to content
体验新版
项目
组织
正在加载...
登录
切换导航
打开侧边栏
PaddlePaddle
PaddleHub
提交
5653fc55
P
PaddleHub
项目概览
PaddlePaddle
/
PaddleHub
1 年多 前同步成功
通知
283
Star
12117
Fork
2091
代码
文件
提交
分支
Tags
贡献者
分支图
Diff
Issue
200
列表
看板
标记
里程碑
合并请求
4
Wiki
0
Wiki
分析
仓库
DevOps
项目成员
Pages
P
PaddleHub
项目概览
项目概览
详情
发布
仓库
仓库
文件
提交
分支
标签
贡献者
分支图
比较
Issue
200
Issue
200
列表
看板
标记
里程碑
合并请求
4
合并请求
4
Pages
分析
分析
仓库分析
DevOps
Wiki
0
Wiki
成员
成员
收起侧边栏
关闭侧边栏
动态
分支图
创建新Issue
提交
Issue看板
未验证
提交
5653fc55
编写于
5月 28, 2020
作者:
S
Steffy-zxf
提交者:
GitHub
5月 28, 2020
浏览文件
操作
浏览文件
下载
电子邮件补丁
差异文件
update strategy (#636)
* update strategy
上级
4e9a68e6
变更
2
隐藏空白更改
内联
并排
Showing
2 changed file
with
37 addition
and
24 deletion
+37
-24
paddlehub/finetune/strategy.py
paddlehub/finetune/strategy.py
+36
-23
paddlehub/version.py
paddlehub/version.py
+1
-1
未找到文件。
paddlehub/finetune/strategy.py
浏览文件 @
5653fc55
...
@@ -133,39 +133,39 @@ def set_gradual_unfreeze(depth_params_dict, unfreeze_depths):
...
@@ -133,39 +133,39 @@ def set_gradual_unfreeze(depth_params_dict, unfreeze_depths):
class
DefaultStrategy
(
object
):
class
DefaultStrategy
(
object
):
def
__init__
(
self
,
learning_rate
=
1e-4
,
optimizer_name
=
"adam"
):
def
__init__
(
self
,
learning_rate
=
1e-4
,
optimizer_name
=
"adam"
,
**
kwargs
):
self
.
learning_rate
=
learning_rate
self
.
learning_rate
=
learning_rate
self
.
_optimizer_name
=
optimizer_name
self
.
_optimizer_name
=
optimizer_name
if
self
.
_optimizer_name
.
lower
()
==
"sgd"
:
if
self
.
_optimizer_name
.
lower
()
==
"sgd"
:
self
.
optimizer
=
fluid
.
optimizer
.
SGD
(
self
.
optimizer
=
fluid
.
optimizer
.
SGD
(
learning_rate
=
self
.
learning_rate
)
learning_rate
=
self
.
learning_rate
,
**
kwargs
)
elif
self
.
_optimizer_name
.
lower
()
==
"adagrad"
:
elif
self
.
_optimizer_name
.
lower
()
==
"adagrad"
:
self
.
optimizer
=
fluid
.
optimizer
.
Adagrad
(
self
.
optimizer
=
fluid
.
optimizer
.
Adagrad
(
learning_rate
=
self
.
learning_rate
)
learning_rate
=
self
.
learning_rate
,
**
kwargs
)
elif
self
.
_optimizer_name
.
lower
()
==
"adamax"
:
elif
self
.
_optimizer_name
.
lower
()
==
"adamax"
:
self
.
optimizer
=
fluid
.
optimizer
.
Adamax
(
self
.
optimizer
=
fluid
.
optimizer
.
Adamax
(
learning_rate
=
self
.
learning_rate
)
learning_rate
=
self
.
learning_rate
,
**
kwargs
)
elif
self
.
_optimizer_name
.
lower
()
==
"decayedadagrad"
:
elif
self
.
_optimizer_name
.
lower
()
==
"decayedadagrad"
:
self
.
optimizer
=
fluid
.
optimizer
.
DecayedAdagrad
(
self
.
optimizer
=
fluid
.
optimizer
.
DecayedAdagrad
(
learning_rate
=
self
.
learning_rate
)
learning_rate
=
self
.
learning_rate
,
**
kwargs
)
elif
self
.
_optimizer_name
.
lower
()
==
"ftrl"
:
elif
self
.
_optimizer_name
.
lower
()
==
"ftrl"
:
self
.
optimizer
=
fluid
.
optimizer
.
Ftrl
(
self
.
optimizer
=
fluid
.
optimizer
.
Ftrl
(
learning_rate
=
self
.
learning_rate
)
learning_rate
=
self
.
learning_rate
,
**
kwargs
)
elif
self
.
_optimizer_name
.
lower
()
==
"larsmomentum"
:
elif
self
.
_optimizer_name
.
lower
()
==
"larsmomentum"
:
self
.
optimizer
=
fluid
.
optimizer
.
LarsMomentum
(
self
.
optimizer
=
fluid
.
optimizer
.
LarsMomentum
(
learning_rate
=
self
.
learning_rate
)
learning_rate
=
self
.
learning_rate
,
**
kwargs
)
elif
self
.
_optimizer_name
.
lower
()
==
"momentum"
:
elif
self
.
_optimizer_name
.
lower
()
==
"momentum"
:
self
.
optimizer
=
fluid
.
optimizer
.
Momentum
(
self
.
optimizer
=
fluid
.
optimizer
.
Momentum
(
learning_rate
=
self
.
learning_rate
)
learning_rate
=
self
.
learning_rate
,
**
kwargs
)
elif
self
.
_optimizer_name
.
lower
()
==
"decayedadagrad"
:
elif
self
.
_optimizer_name
.
lower
()
==
"decayedadagrad"
:
self
.
optimizer
=
fluid
.
optimizer
.
DecayedAdagrad
(
self
.
optimizer
=
fluid
.
optimizer
.
DecayedAdagrad
(
learning_rate
=
self
.
learning_rate
)
learning_rate
=
self
.
learning_rate
,
**
kwargs
)
elif
self
.
_optimizer_name
.
lower
()
==
"rmsprop"
:
elif
self
.
_optimizer_name
.
lower
()
==
"rmsprop"
:
self
.
optimizer
=
fluid
.
optimizer
.
RMSPropOptimizer
(
self
.
optimizer
=
fluid
.
optimizer
.
RMSPropOptimizer
(
learning_rate
=
self
.
learning_rate
)
learning_rate
=
self
.
learning_rate
,
**
kwargs
)
else
:
else
:
self
.
optimizer
=
fluid
.
optimizer
.
Adam
(
self
.
optimizer
=
fluid
.
optimizer
.
Adam
(
learning_rate
=
self
.
learning_rate
)
learning_rate
=
self
.
learning_rate
,
**
kwargs
)
def
execute
(
self
,
loss
,
data_reader
,
config
,
dev_count
):
def
execute
(
self
,
loss
,
data_reader
,
config
,
dev_count
):
if
self
.
optimizer
is
not
None
:
if
self
.
optimizer
is
not
None
:
...
@@ -186,10 +186,13 @@ class CombinedStrategy(DefaultStrategy):
...
@@ -186,10 +186,13 @@ class CombinedStrategy(DefaultStrategy):
learning_rate
=
1e-4
,
learning_rate
=
1e-4
,
scheduler
=
None
,
scheduler
=
None
,
regularization
=
None
,
regularization
=
None
,
clip
=
None
):
clip
=
None
,
**
kwargs
):
super
(
CombinedStrategy
,
self
).
__init__
(
super
(
CombinedStrategy
,
self
).
__init__
(
optimizer_name
=
optimizer_name
,
learning_rate
=
learning_rate
)
optimizer_name
=
optimizer_name
,
learning_rate
=
learning_rate
,
**
kwargs
)
self
.
kwargs
=
kwargs
# init set
# init set
self
.
scheduler
=
{
self
.
scheduler
=
{
"warmup"
:
0.0
,
"warmup"
:
0.0
,
...
@@ -379,7 +382,9 @@ class CombinedStrategy(DefaultStrategy):
...
@@ -379,7 +382,9 @@ class CombinedStrategy(DefaultStrategy):
# set optimizer
# set optimizer
super
(
CombinedStrategy
,
self
).
__init__
(
super
(
CombinedStrategy
,
self
).
__init__
(
optimizer_name
=
self
.
_optimizer_name
,
learning_rate
=
scheduled_lr
)
optimizer_name
=
self
.
_optimizer_name
,
learning_rate
=
scheduled_lr
,
**
self
.
kwargs
)
# discriminative learning rate
# discriminative learning rate
# based on layer
# based on layer
...
@@ -564,7 +569,8 @@ class AdamWeightDecayStrategy(CombinedStrategy):
...
@@ -564,7 +569,8 @@ class AdamWeightDecayStrategy(CombinedStrategy):
lr_scheduler
=
"linear_decay"
,
lr_scheduler
=
"linear_decay"
,
warmup_proportion
=
0.1
,
warmup_proportion
=
0.1
,
weight_decay
=
0.01
,
weight_decay
=
0.01
,
optimizer_name
=
"adam"
):
optimizer_name
=
"adam"
,
**
kwargs
):
scheduler
=
{
"warmup"
:
warmup_proportion
}
scheduler
=
{
"warmup"
:
warmup_proportion
}
if
lr_scheduler
==
"noam_decay"
:
if
lr_scheduler
==
"noam_decay"
:
scheduler
[
"noam_decay"
]
=
True
scheduler
[
"noam_decay"
]
=
True
...
@@ -583,14 +589,16 @@ class AdamWeightDecayStrategy(CombinedStrategy):
...
@@ -583,14 +589,16 @@ class AdamWeightDecayStrategy(CombinedStrategy):
learning_rate
=
learning_rate
,
learning_rate
=
learning_rate
,
scheduler
=
scheduler
,
scheduler
=
scheduler
,
regularization
=
regularization
,
regularization
=
regularization
,
clip
=
clip
)
clip
=
clip
,
**
kwargs
)
class
L2SPFinetuneStrategy
(
CombinedStrategy
):
class
L2SPFinetuneStrategy
(
CombinedStrategy
):
def
__init__
(
self
,
def
__init__
(
self
,
learning_rate
=
1e-4
,
learning_rate
=
1e-4
,
optimizer_name
=
"adam"
,
optimizer_name
=
"adam"
,
regularization_coeff
=
1e-3
):
regularization_coeff
=
1e-3
,
**
kwargs
):
scheduler
=
{}
scheduler
=
{}
regularization
=
{
"L2SP"
:
regularization_coeff
}
regularization
=
{
"L2SP"
:
regularization_coeff
}
clip
=
{}
clip
=
{}
...
@@ -599,14 +607,16 @@ class L2SPFinetuneStrategy(CombinedStrategy):
...
@@ -599,14 +607,16 @@ class L2SPFinetuneStrategy(CombinedStrategy):
learning_rate
=
learning_rate
,
learning_rate
=
learning_rate
,
scheduler
=
scheduler
,
scheduler
=
scheduler
,
regularization
=
regularization
,
regularization
=
regularization
,
clip
=
clip
)
clip
=
clip
,
**
kwargs
)
class
DefaultFinetuneStrategy
(
CombinedStrategy
):
class
DefaultFinetuneStrategy
(
CombinedStrategy
):
def
__init__
(
self
,
def
__init__
(
self
,
learning_rate
=
1e-4
,
learning_rate
=
1e-4
,
optimizer_name
=
"adam"
,
optimizer_name
=
"adam"
,
regularization_coeff
=
1e-3
):
regularization_coeff
=
1e-3
,
**
kwargs
):
scheduler
=
{}
scheduler
=
{}
regularization
=
{
"L2"
:
regularization_coeff
}
regularization
=
{
"L2"
:
regularization_coeff
}
clip
=
{}
clip
=
{}
...
@@ -616,7 +626,8 @@ class DefaultFinetuneStrategy(CombinedStrategy):
...
@@ -616,7 +626,8 @@ class DefaultFinetuneStrategy(CombinedStrategy):
learning_rate
=
learning_rate
,
learning_rate
=
learning_rate
,
scheduler
=
scheduler
,
scheduler
=
scheduler
,
regularization
=
regularization
,
regularization
=
regularization
,
clip
=
clip
)
clip
=
clip
,
**
kwargs
)
class
ULMFiTStrategy
(
CombinedStrategy
):
class
ULMFiTStrategy
(
CombinedStrategy
):
...
@@ -629,7 +640,8 @@ class ULMFiTStrategy(CombinedStrategy):
...
@@ -629,7 +640,8 @@ class ULMFiTStrategy(CombinedStrategy):
factor
=
2.6
,
factor
=
2.6
,
dis_params_layer
=
None
,
dis_params_layer
=
None
,
frz_blocks
=
3
,
frz_blocks
=
3
,
frz_params_layer
=
None
):
frz_params_layer
=
None
,
**
kwargs
):
scheduler
=
{
scheduler
=
{
"slanted_triangle"
:
{
"slanted_triangle"
:
{
...
@@ -653,4 +665,5 @@ class ULMFiTStrategy(CombinedStrategy):
...
@@ -653,4 +665,5 @@ class ULMFiTStrategy(CombinedStrategy):
learning_rate
=
learning_rate
,
learning_rate
=
learning_rate
,
scheduler
=
scheduler
,
scheduler
=
scheduler
,
regularization
=
regularization
,
regularization
=
regularization
,
clip
=
clip
)
clip
=
clip
,
**
kwargs
)
paddlehub/version.py
浏览文件 @
5653fc55
...
@@ -13,5 +13,5 @@
...
@@ -13,5 +13,5 @@
# See the License for the specific language governing permissions and
# See the License for the specific language governing permissions and
# limitations under the License.
# limitations under the License.
""" PaddleHub version string """
""" PaddleHub version string """
hub_version
=
"1.7.
0
"
hub_version
=
"1.7.
1
"
module_proto_version
=
"1.0.0"
module_proto_version
=
"1.0.0"
编辑
预览
Markdown
is supported
0%
请重试
或
添加新附件
.
添加附件
取消
You are about to add
0
people
to the discussion. Proceed with caution.
先完成此消息的编辑!
取消
想要评论请
注册
或
登录