update mrc

d87bd156 · wangxiao1021 · 78742b4b · d87bd156 · d87bd156 · d87bd156
隐藏空白更改
内联并排

Showing 3 changed files with 6 additions and 7 deletions

README.md README.md +2 -2

examples/mrc/README.md examples/mrc/README.md +1 -1

examples/mrc/run.py examples/mrc/run.py +3 -4

未找到文件。
--- a/README.md
+++ b/README.md
@@ -103,8 +103,8 @@ You can easily re-produce following competitive results with minor codes, which
      <td>94.9</td>
      <td>94.5</td>
      <td>94.7</td>
-      <td>96.3</td>
-      <td>84.0</td>
+      <td>64.3</td>
+      <td>85.2</td>
    </tr>

  </tbody>

--- a/examples/mrc/README.md
+++ b/examples/mrc/README.md
@@ -94,5 +94,5 @@ The evaluation results are as follows:

 ```
 data_num: 3219
-em_sroce: 0.963031997515, f1: 83.9865402973
+em_sroce: 64.3367505436, f1: 85.1781896843
 ```
--- a/examples/mrc/run.py
+++ b/examples/mrc/run.py
@@ -9,7 +9,7 @@ if __name__ == '__main__':
    # configs
    max_seqlen = 512
    batch_size = 8   
-    num_epochs = 8
+    num_epochs = 2
    lr = 3e-5
    doc_stride = 128
    max_query_len = 64
@@ -64,8 +64,7 @@ if __name__ == '__main__':
    # step 8-1*: load pretrained parameters
    trainer.load_pretrain(pre_params)
    # step 8-2*: set saver to save model
-    # save_steps = (n_steps-8)  // 4
-    save_steps = 1520
+    save_steps = 3040
    trainer.set_saver(save_path=save_path, save_steps=save_steps, save_type=save_type)
    # step 8-3: start training
    trainer.train(print_steps=print_steps)
@@ -90,7 +89,7 @@ if __name__ == '__main__':
    trainer.build_predict_forward(pred_ernie, mrc_pred_head)

    # step 6: load checkpoint
-    pred_model_path =  './outputs/ckpt.step'+str(12160)
+    pred_model_path =  './outputs/ckpt.step'+str(3040)
    trainer.load_ckpt(pred_model_path)
    
    # step 7: fit prepared reader and data