提交 3e2b7c5e 编写于 作者: G gaoyuan

Adjust local (per-parameter) learning rates

上级 4a02beb9
...@@ -13,7 +13,7 @@ def conv_bn(input, ...@@ -13,7 +13,7 @@ def conv_bn(input,
num_groups=1, num_groups=1,
act='relu', act='relu',
use_cudnn=True): use_cudnn=True):
parameter_attr = ParamAttr(initializer=MSRA()) parameter_attr = ParamAttr(learning_rate=0.1, initializer=MSRA())
conv = fluid.layers.conv2d( conv = fluid.layers.conv2d(
input=input, input=input,
num_filters=num_filters, num_filters=num_filters,
...@@ -25,7 +25,14 @@ def conv_bn(input, ...@@ -25,7 +25,14 @@ def conv_bn(input,
use_cudnn=use_cudnn, use_cudnn=use_cudnn,
param_attr=parameter_attr, param_attr=parameter_attr,
bias_attr=False) bias_attr=False)
return fluid.layers.batch_norm(input=conv, act=act, epsilon=0.00001) parameter_attr = ParamAttr(learning_rate=0.1, initializer=MSRA())
bias_attr = ParamAttr(learning_rate=0.2)
return fluid.layers.batch_norm(
input=conv,
act=act,
epsilon=0.00001,
param_attr=parameter_attr,
bias_attr=bias_attr)
def depthwise_separable(input, num_filters1, num_filters2, num_groups, stride, def depthwise_separable(input, num_filters1, num_filters2, num_groups, stride,
......
...@@ -150,6 +150,7 @@ def _reader_creator(settings, file_list, mode, shuffle): ...@@ -150,6 +150,7 @@ def _reader_creator(settings, file_list, mode, shuffle):
img = np.swapaxes(img, 1, 2) img = np.swapaxes(img, 1, 2)
img = np.swapaxes(img, 1, 0) img = np.swapaxes(img, 1, 0)
img = img[[2, 1, 0], :, :]
img = img.astype('float32') img = img.astype('float32')
img -= settings.img_mean img -= settings.img_mean
img = img.flatten() img = img.flatten()
......
...@@ -45,13 +45,14 @@ def train(train_file_list, ...@@ -45,13 +45,14 @@ def train(train_file_list,
evaluate_difficult=False, evaluate_difficult=False,
ap_version='11point') ap_version='11point')
optimizer = fluid.optimizer.DecayedAdagrad( optimizer = fluid.optimizer.Momentum(
learning_rate=fluid.layers.exponential_decay( learning_rate=fluid.layers.exponential_decay(
learning_rate=learning_rate, learning_rate=learning_rate,
decay_steps=40000, decay_steps=40000,
decay_rate=0.1, decay_rate=0.1,
staircase=True), staircase=True),
regularization=fluid.regularizer.L2Decay(0.0005), ) momentum=0.9,
regularization=fluid.regularizer.L2Decay(0.00005), )
optimizer.minimize(loss) optimizer.minimize(loss)
...@@ -59,7 +60,7 @@ def train(train_file_list, ...@@ -59,7 +60,7 @@ def train(train_file_list,
exe = fluid.Executor(place) exe = fluid.Executor(place)
exe.run(fluid.default_startup_program()) exe.run(fluid.default_startup_program())
load_model.load_and_set_vars(place) load_model.load_paddlev1_vars(place)
train_reader = paddle.batch( train_reader = paddle.batch(
reader.train(data_args, train_file_list), batch_size=batch_size) reader.train(data_args, train_file_list), batch_size=batch_size)
test_reader = paddle.batch( test_reader = paddle.batch(
......
Markdown is supported
0% .
You are about to add 0 people to the discussion. Proceed with caution.
先完成此消息的编辑!
想要评论请 注册