diff --git a/paddle/fluid/operators/checkpoint_load_op.cc b/paddle/fluid/operators/checkpoint_load_op.cc index 6c88cbdab0758da5160a14b9353f6d4a40074ebf..18871e56c5017134d7d00f9b809752c684aba333 100644 --- a/paddle/fluid/operators/checkpoint_load_op.cc +++ b/paddle/fluid/operators/checkpoint_load_op.cc @@ -114,8 +114,8 @@ class CheckpointLoadOp : public framework::OperatorBase { std::string dir = Attr("dir"); std::string serial_num_attr = Attr("Serial"); - PADDLE_ENFORCE(IsNumber(serial_num_attr), - "Checkpoint Serial must be a number"); + VLOG(3) << "CheckpointLoadOp get Attr dir: " << dir; + VLOG(3) << "CheckpointLoadOp get Attr Serial: " << serial_num_attr; std::string serial_var_name = std::string(SERIAL_VAR); auto *serial_var = scope.FindVar(serial_var_name); diff --git a/python/paddle/fluid/transpiler/distribute_transpiler.py b/python/paddle/fluid/transpiler/distribute_transpiler.py index 335dc2342d08c01cafd6e7588d8470ea00a2c830..bb1e026a6b1ffdc5af5cec0e6ef536f5c1279a47 100644 --- a/python/paddle/fluid/transpiler/distribute_transpiler.py +++ b/python/paddle/fluid/transpiler/distribute_transpiler.py @@ -654,6 +654,9 @@ class DistributeTranspiler: if os.path.isfile(success_path): return int(cur_dir) + if os.path.isdir(checkpoint_dir): + return "-1" + current_dir = 0 dirs = os.listdir(checkpoint_dir) for cur_dir in dirs: