未验证 提交 8f98cd7b 编写于 作者: W Wenyu 提交者: GitHub

Add eta_min argument to CosineDecay and pass it to CosineAnnealingDecay (#4815)

上级 23c1bc39
...@@ -42,9 +42,10 @@ class CosineDecay(object): ...@@ -42,9 +42,10 @@ class CosineDecay(object):
the max_iters is much larger than the warmup iter the max_iters is much larger than the warmup iter
""" """
def __init__(self, max_epochs=1000, use_warmup=True): def __init__(self, max_epochs=1000, use_warmup=True, eta_min=0):
self.max_epochs = max_epochs self.max_epochs = max_epochs
self.use_warmup = use_warmup self.use_warmup = use_warmup
self.eta_min = eta_min
def __call__(self, def __call__(self,
base_lr=None, base_lr=None,
...@@ -66,7 +67,8 @@ class CosineDecay(object): ...@@ -66,7 +67,8 @@ class CosineDecay(object):
value.append(decayed_lr) value.append(decayed_lr)
return optimizer.lr.PiecewiseDecay(boundary, value) return optimizer.lr.PiecewiseDecay(boundary, value)
return optimizer.lr.CosineAnnealingDecay(base_lr, T_max=max_iters) return optimizer.lr.CosineAnnealingDecay(
base_lr, T_max=max_iters, eta_min=self.eta_min)
@serializable @serializable
......
Markdown is supported
0% .
You are about to add 0 people to the discussion. Proceed with caution.
先完成此消息的编辑!
想要评论请 注册