提交 4a6f7cec 编写于 作者: 文幕地方's avatar 文幕地方

pair param with key when load trained model params

上级 91b79f69
...@@ -57,7 +57,7 @@ def load_model(config, model, optimizer=None): ...@@ -57,7 +57,7 @@ def load_model(config, model, optimizer=None):
if checkpoints.endswith('pdparams'): if checkpoints.endswith('pdparams'):
checkpoints = checkpoints.replace('.pdparams', '') checkpoints = checkpoints.replace('.pdparams', '')
assert os.path.exists(checkpoints + ".pdparams"), \ assert os.path.exists(checkpoints + ".pdparams"), \
f"The {checkpoints}.pdparams does not exists!" "The {}.pdparams does not exists!".format(checkpoints)
# load params from trained model # load params from trained model
params = paddle.load(checkpoints + '.pdparams') params = paddle.load(checkpoints + '.pdparams')
...@@ -65,14 +65,15 @@ def load_model(config, model, optimizer=None): ...@@ -65,14 +65,15 @@ def load_model(config, model, optimizer=None):
new_state_dict = {} new_state_dict = {}
for key, value in state_dict.items(): for key, value in state_dict.items():
if key not in params: if key not in params:
logger.warning(f"{key} not in loaded params {params.keys()} !") logger.warning("{} not in loaded params {} !".format(
key, params.keys()))
pre_value = params[key] pre_value = params[key]
if list(value.shape) == list(pre_value.shape): if list(value.shape) == list(pre_value.shape):
new_state_dict[key] = pre_value new_state_dict[key] = pre_value
else: else:
logger.warning( logger.warning(
f"The shape of model params {key} {value.shape} not matched with loaded params shape {pre_value.shape} !" "The shape of model params {} {} not matched with loaded params shape {} !".
) format(key, value.shape, pre_value.shape))
model.set_state_dict(new_state_dict) model.set_state_dict(new_state_dict)
optim_dict = paddle.load(checkpoints + '.pdopt') optim_dict = paddle.load(checkpoints + '.pdopt')
...@@ -99,7 +100,7 @@ def load_pretrained_params(model, path): ...@@ -99,7 +100,7 @@ def load_pretrained_params(model, path):
if path.endswith('pdparams'): if path.endswith('pdparams'):
path = path.replace('.pdparams', '') path = path.replace('.pdparams', '')
assert os.path.exists(path + ".pdparams"), \ assert os.path.exists(path + ".pdparams"), \
f"The {path}.pdparams does not exists!" "The {}.pdparams does not exists!".format(path)
params = paddle.load(path + '.pdparams') params = paddle.load(path + '.pdparams')
state_dict = model.state_dict() state_dict = model.state_dict()
...@@ -109,10 +110,10 @@ def load_pretrained_params(model, path): ...@@ -109,10 +110,10 @@ def load_pretrained_params(model, path):
new_state_dict[k1] = params[k2] new_state_dict[k1] = params[k2]
else: else:
logger.warning( logger.warning(
f"The shape of model params {k1} {state_dict[k1].shape} not matched with loaded params {k2} {params[k2].shape} !" "The shape of model params {} {} not matched with loaded params {} {} !".
) format(k1, state_dict[k1].shape, k2, params[k2].shape))
model.set_state_dict(new_state_dict) model.set_state_dict(new_state_dict)
logger.info(f"load pretrain successful from {path}") logger.info("load pretrain successful from {}".format(path))
return model return model
......
Markdown is supported
0% .
You are about to add 0 people to the discussion. Proceed with caution.
先完成此消息的编辑!
想要评论请 注册