From a2b70aa698cd2e642d734073a101ec361344b204 Mon Sep 17 00:00:00 2001
From: Meiyim
Date: Mon, 15 Nov 2021 10:59:17 +0800
Subject: [PATCH] Fix for pd22 (#763)

* fix-load-pretrained model
* update readme
* fix path
---
 README.zh.md                            | 2 +-
 demo/distill/distill.py                 | 2 +-
 demo/finetune_classifier.py             | 6 +++---
 demo/finetune_classifier_distributed.py | 6 +++---
 demo/finetune_mrc.py                    | 4 ++--
 demo/finetune_ner.py                    | 4 ++--
 demo/finetune_sentiment_analysis.py     | 6 +++---
 demo/pretrain/pretrain.py               | 2 +-
 demo/seq2seq/decode.py                  | 2 +-
 demo/seq2seq/finetune_seq2seq.py        | 6 +++---
 ernie/modeling_ernie.py                 | 2 +-
 11 files changed, 21 insertions(+), 21 deletions(-)

diff --git a/README.zh.md b/README.zh.md
index 543dbd4..a087240 100644
--- a/README.zh.md
+++ b/README.zh.md
@@ -173,7 +173,7 @@ data/xnli
 - 使用 `动态图` 模型进行finetune:
 
 ```script
-python3 ./ernie_d/demo/finetune_classifier.py \
+python3 ./demo/finetune_classifier.py \
     --from_pretrained ernie-1.0 \
     --data_dir ./data/xnli
 ```
diff --git a/demo/distill/distill.py b/demo/distill/distill.py
index a8c2c34..344e087 100644
--- a/demo/distill/distill.py
+++ b/demo/distill/distill.py
@@ -153,7 +153,7 @@ if not os.path.exists('./teacher_model.bin'):
             if step % 100 == 0:
                 f1 = evaluate_teacher(teacher_model, dev_ds)
                 print('teacher f1: %.5f' % f1)
-    P.save(teacher_model.state_dict(), './teacher_model.bin')
+    P.save(teacher_model.state_dict(), str('./teacher_model.bin'))
 else:
     state_dict = P.load('./teacher_model.bin')
     teacher_model.set_state_dict(state_dict)
diff --git a/demo/finetune_classifier.py b/demo/finetune_classifier.py
index ce14d3e..c5f7c89 100644
--- a/demo/finetune_classifier.py
+++ b/demo/finetune_classifier.py
@@ -162,7 +162,7 @@ model = ErnieModelForSequenceClassification.from_pretrained(
 
 if args.init_checkpoint is not None:
     log.info('loading checkpoint from %s' % args.init_checkpoint)
-    sd = P.load(args.init_checkpoint)
+    sd = P.load(str(args.init_checkpoint))
     model.set_state_dict(sd)
 
 g_clip = P.nn.ClipGradByGlobalNorm(1.0) #experimental
@@ -238,9 +238,9 @@ with LogWriter(
                 log_writer.add_scalar('eval/acc', acc, step=step)
                 log.debug('acc %.5f' % acc)
                 if args.save_dir is not None:
-                    P.save(model.state_dict(), args.save_dir / 'ckpt.bin')
+                    P.save(model.state_dict(), str(args.save_dir / 'ckpt.bin'))
 
 if args.save_dir is not None:
-    P.save(model.state_dict(), args.save_dir / 'ckpt.bin')
+    P.save(model.state_dict(), str(args.save_dir / 'ckpt.bin'))
 if args.inference_model_dir is not None:
     class InferenceModel(ErnieModelForSequenceClassification):
diff --git a/demo/finetune_classifier_distributed.py b/demo/finetune_classifier_distributed.py
index d4b1195..3dfc4b8 100644
--- a/demo/finetune_classifier_distributed.py
+++ b/demo/finetune_classifier_distributed.py
@@ -128,7 +128,7 @@ model = ErnieModelForSequenceClassification.from_pretrained(
 
 if args.init_checkpoint is not None:
     log.info('loading checkpoint from %s' % args.init_checkpoint)
-    sd = P.load(args.init_checkpoint)
+    sd = P.load(str(args.init_checkpoint))
     model.set_state_dict(sd)
 
 model = P.DataParallel(model)
@@ -195,11 +195,11 @@ with P.amp.auto_cast(enable=args.use_amp):
                 #log_writer.add_scalar('eval/acc', acc, step=step)
                 log.debug('acc %.5f' % acc)
                 if args.save_dir is not None:
-                    P.save(model.state_dict(), args.save_dir / 'ckpt.bin')
+                    P.save(model.state_dict(), str(args.save_dir / 'ckpt.bin'))
             # exit
             if step > args.max_steps:
                 break
 
 if args.save_dir is not None and env.dev_id == 0:
-    P.save(model.state_dict(), args.save_dir / 'ckpt.bin')
+    P.save(model.state_dict(), str(args.save_dir / 'ckpt.bin'))
 log.debug('done')
diff --git a/demo/finetune_mrc.py b/demo/finetune_mrc.py
index 9b8ffe0..f5172aa 100644
--- a/demo/finetune_mrc.py
+++ b/demo/finetune_mrc.py
@@ -145,7 +145,7 @@ def train(model, train_dataset, dev_dataset, dev_examples, dev_features,
                 log.debug('[step %d] eval result: f1 %.5f em %.5f' %
                           (step, f1, em))
             if env.dev_id == 0 and args.save_dir is not None:
-                P.save(model.state_dict(), args.save_dir / 'ckpt.bin')
+                P.save(model.state_dict(), str(args.save_dir / 'ckpt.bin'))
 
             if step > max_steps:
                 break
@@ -244,4 +244,4 @@ if __name__ == "__main__":
                        tokenizer, args)
     log.debug('final eval result: f1 %.5f em %.5f' % (f1, em))
     if env.dev_id == 0 and args.save_dir is not None:
-        P.save(model.state_dict(), args.save_dir / 'ckpt.bin')
+        P.save(model.state_dict(), str(args.save_dir / 'ckpt.bin'))
diff --git a/demo/finetune_ner.py b/demo/finetune_ner.py
index 6929afd..46dd2cc 100644
--- a/demo/finetune_ner.py
+++ b/demo/finetune_ner.py
@@ -249,10 +249,10 @@ with LogWriter(
                 log.debug('eval f1: %.5f' % f1)
                 log_writer.add_scalar('eval/f1', f1, step=step)
                 if args.save_dir is not None:
-                    P.save(model.state_dict(), args.save_dir / 'ckpt.bin')
+                    P.save(model.state_dict(), str(args.save_dir / 'ckpt.bin'))
 
     f1 = evaluate(model, dev_ds)
     log.debug('final eval f1: %.5f' % f1)
     log_writer.add_scalar('eval/f1', f1, step=step)
     if args.save_dir is not None:
-        P.save(model.state_dict(), args.save_dir / 'ckpt.bin')
+        P.save(model.state_dict(), str(args.save_dir / 'ckpt.bin'))
diff --git a/demo/finetune_sentiment_analysis.py b/demo/finetune_sentiment_analysis.py
index 16087fa..99b7247 100644
--- a/demo/finetune_sentiment_analysis.py
+++ b/demo/finetune_sentiment_analysis.py
@@ -177,9 +177,9 @@ if not args.eval:
                 log.debug('acc %.5f' % acc)
                 if args.save_dir is not None:
                     P.save(model.state_dict(),
-                           args.save_dir / 'ckpt.bin')
+                           str(args.save_dir / 'ckpt.bin'))
     if args.save_dir is not None:
-        P.save(model.state_dict(), args.save_dir / 'ckpt.bin')
+        P.save(model.state_dict(), str(args.save_dir / 'ckpt.bin'))
 else:
     feature_column = propeller.data.FeatureColumns([
         propeller.data.TextColumn(
@@ -189,7 +189,7 @@ else:
             tokenizer=tokenizer.tokenize),
     ])
 
-    sd = P.load(args.init_checkpoint)
+    sd = P.load(str(args.init_checkpoint))
     model.set_dict(sd)
     model.eval()
 
diff --git a/demo/pretrain/pretrain.py b/demo/pretrain/pretrain.py
index c1521b9..63f0aa1 100644
--- a/demo/pretrain/pretrain.py
+++ b/demo/pretrain/pretrain.py
@@ -394,7 +394,7 @@ if __name__ == '__main__':
                 log.debug(msg)
             if step % 1000 == 0 and env.dev_id == 0:
                 log.debug('saveing...')
-                P.save(model.state_dict(), args.save_dir / 'ckpt.bin')
+                P.save(model.state_dict(), str(args.save_dir / 'ckpt.bin'))
             if step > args.max_steps:
                 break
     log.info('done')
diff --git a/demo/seq2seq/decode.py b/demo/seq2seq/decode.py
index 0d551e7..d0f4427 100644
--- a/demo/seq2seq/decode.py
+++ b/demo/seq2seq/decode.py
@@ -401,7 +401,7 @@ if __name__ == '__main__':
     rev_dict[tokenizer.pad_id] = '' # replace [PAD]
    rev_dict[tokenizer.unk_id] = '' # replace [PAD]
 
-    sd = P.load(args.save_dir)
+    sd = P.load(str(args.save_dir))
     ernie.set_state_dict(sd)
 
     def map_fn(src_ids):
diff --git a/demo/seq2seq/finetune_seq2seq.py b/demo/seq2seq/finetune_seq2seq.py
index 937ad88..07bdada 100644
--- a/demo/seq2seq/finetune_seq2seq.py
+++ b/demo/seq2seq/finetune_seq2seq.py
@@ -308,7 +308,7 @@ def seq2seq(model, tokenizer, args):
                 log.debug(msg)
 
         if args.save_dir is not None and step % 1000 == 0 and env.dev_id == 0:
-            P.save(model.state_dict(), args.save_dir / 'ckpt.bin')
+            P.save(model.state_dict(), str(args.save_dir / 'ckpt.bin'))
 
         if args.predict_output_dir is not None and step > args.skip_eval_steps and step % args.eval_steps == 0:
             assert args.predict_output_dir.exists(), \
@@ -320,7 +320,7 @@ def seq2seq(model, tokenizer, args):
             evaluate(model, dev_ds, step, args)
 
     if args.save_dir is not None:
-        P.save(model.state_dict(), args.save_dir / 'ckpt.bin')
+        P.save(model.state_dict(), str(args.save_dir / 'ckpt.bin'))
 
 
 if __name__ == '__main__':
@@ -414,7 +414,7 @@ if __name__ == '__main__':
 
     if args.init_checkpoint is not None:
         log.info('loading checkpoint from %s' % args.init_checkpoint)
-        sd = P.load(args.init_checkpoint)
+        sd = P.load(str(args.init_checkpoint))
         ernie.set_state_dict(sd)
 
     seq2seq(ernie, tokenizer, args)
diff --git a/ernie/modeling_ernie.py b/ernie/modeling_ernie.py
index e0d5a9f..c8a9808 100644
--- a/ernie/modeling_ernie.py
+++ b/ernie/modeling_ernie.py
@@ -290,7 +290,7 @@ class PretrainedModel(object):
             # log.debug('load pretrained weight from program state')
             # F.io.load_program_state(param_path) #buggy in dygraph.gurad, push paddle to fix
         if state_dict_path.exists():
-            m = P.load(state_dict_path)
+            m = P.load(str(state_dict_path))
             for k, v in model.state_dict().items():
                 if k not in m:
                     log.warn('param:%s not set in pretrained model, skip' % k)
-- 
GitLab
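
Every hunk above applies the same one-line fix: checkpoint paths in the demos are built with `pathlib.Path` (e.g. `args.save_dir / 'ckpt.bin'`), and each `P.save` / `P.load` call (i.e. `paddle.save` / `paddle.load`) now wraps the path in `str(...)`, which Paddle 2.2 (the "pd22" of the commit title) appears to require. A minimal sketch of the pattern, assuming Paddle 2.x is installed; the `./checkpoints` directory and the toy `Linear` layer are illustrative stand-ins for `args.save_dir` and the ERNIE model, not part of this patch:

```python
# Sketch of the str(Path) pattern applied throughout this patch (assumes paddle 2.x).
from pathlib import Path

import paddle

save_dir = Path('./checkpoints')              # illustrative stand-in for args.save_dir
save_dir.mkdir(parents=True, exist_ok=True)

model = paddle.nn.Linear(4, 2)                # toy stand-in for the ERNIE model

ckpt_path = save_dir / 'ckpt.bin'             # a pathlib.Path, not a str
paddle.save(model.state_dict(), str(ckpt_path))   # convert to str before saving
state_dict = paddle.load(str(ckpt_path))          # and again when loading
model.set_state_dict(state_dict)
```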