diff --git a/paddle/fluid/operators/checkpoint_notify_op.cc b/paddle/fluid/operators/checkpoint_notify_op.cc index 3e5019dd4b167bf49162aec7fc375b8846d0c7e6..72976e22cacb5fc6c76838f4feff9cddfcf5aa83 100644 --- a/paddle/fluid/operators/checkpoint_notify_op.cc +++ b/paddle/fluid/operators/checkpoint_notify_op.cc @@ -43,7 +43,7 @@ class CheckpointNotifyOp : public framework::OperatorBase { detail::RPCClient::GetInstance(); for (size_t i = 0; i < epmap.size(); i++) { VLOG(3) << "sending " << dir <<" to " << epmap[i] << " to checkpoint notify ... "; - auto serial_looku_table = string::Sprintf("%s/%s.%d", dir, lookup_table_name, i); + auto serial_looku_table = string::Sprintf("%s/%s_%d", dir, lookup_table_name, i); rpc_client->AsyncCheckpointNotify(epmap[i], serial_looku_table); } rpc_client->Wait(); diff --git a/python/paddle/fluid/io.py b/python/paddle/fluid/io.py index ffe0021e96c3c09e0eba93cb38ee872c80bb1ae5..629ded7f7a6e27c16093c479f523384e864a7e15 100644 --- a/python/paddle/fluid/io.py +++ b/python/paddle/fluid/io.py @@ -462,7 +462,6 @@ CHECKPOINT_PREFIX = "checkpoint" MODEL_DIR = "__model__" LOOKUP_TABLE_DIR = "__lookup_table__" TRAINER_PREFIX = "trainer" -PSERVER_PREFIX = "pserver" CHECKPOINT_SEPARATOR = "_" @@ -577,8 +576,7 @@ def load_persist_vars_without_grad(executor, def load_lookup_table_vars(executor, dirname, pserver_id, table_name): lookup_table_dir = os.path.join(dirname, LOOKUP_TABLE_DIR) - table_file = table_name + CHECKPOINT_SEPARATOR + PSERVER_PREFIX + CHECKPOINT_SEPARATOR + str( - pserver_id) + table_file = table_name + CHECKPOINT_SEPARATOR + str(pserver_id) load_vars(executor, lookup_table_dir, vars=table_name, filename=table_file)