refactor: update ted_en_zh/t1 example (README results, pretrained-weight download script, run.sh stages)

7cef93a6 · gongel · 5b5c73f9 · 7cef93a6 · 7cef93a6 · 7cef93a6
6 changed files
--- a/examples/ted_en_zh/t1/README.md
+++ b/examples/ted_en_zh/t1/README.md
@@ -3,13 +3,14 @@
 ## Dataset
-| Data Subset | Duration in Seconds |
+| Data Subset | Duration in Frames |
 | --- | --- |
-| data/manifest.train | 0.942 ~ 60   |
+| data/manifest.train | 94.2 ~ 6000   |
-| data/manifest.dev   | 1.151 ~ 39   |
+| data/manifest.dev   | 115.1 ~ 3900   |
-| data/manifest.test  | 1.1 ~ 42.746 |
+| data/manifest.test  | 110 ~ 4274.6 |
 ## Transformer
-| Model | Params | Config | Char-BLEU |
+| Model | Params | Config | Val loss | Char-BLEU |
-| --- | --- | --- | --- |
+| --- | --- | --- | --- | --- |
-| Transformer+ASR MTL | 50.26M | conf/transformer_joint_noam.yaml | 17.38 |
+| FAT + Transformer+ASR MTL | 50.26M | conf/transformer_mtl_noam.yaml | 62.86 | 19.45 |
+| FAT + Transformer+ASR MTL with word reward | 50.26M | conf/transformer_mtl_noam.yaml | 62.86 | 20.80 |
--- a/examples/ted_en_zh/t1/conf/transformer_joint_noam.yaml
+++ b/examples/ted_en_zh/t1/conf/transformer_joint_noam.yaml
--- a/examples/ted_en_zh/t1/local/convert_torch_to_paddle.py
+++ b/examples/ted_en_zh/t1/local/convert_torch_to_paddle.py
@@ -27,6 +27,7 @@ def torch2paddle(args):
    torch_model = torch.load(args.torch_ckpt, map_location='cpu')
    cnt = 0
    for k, v in torch_model['model'].items():
+        # encoder.embed.* --> encoder.embed.*
        if k.startswith('encoder.embed'):
            if v.ndim == 2:
                v = v.transpose(0, 1)
@@ -35,6 +36,10 @@ def torch2paddle(args):
            logger.info(
                f"Convert torch weight: {k} to paddlepaddle weight: {k}, shape is {v.shape}"
            )
+        # encoder.after_norm.* --> encoder.after_norm.*
+        # encoder.after_norm.* --> decoder.after_norm.*
+        # encoder.after_norm.* --> st_decoder.after_norm.*
        if k.startswith('encoder.after_norm'):
            paddle_model_dict[k] = v.numpy()
            cnt += 1
@@ -47,6 +52,10 @@ def torch2paddle(args):
                f"Convert torch weight: {k} to paddlepaddle weight: {'st_'+ k.replace('en','de')}, shape is {v.shape}"
            )
            cnt += 2
+        # encoder.encoders.* --> encoder.encoders.*
+        # encoder.encoders.* (last six layers) --> decoder.encoders.* (first six layers)
+        # encoder.encoders.* (last six layers) --> st_decoder.encoders.* (first six layers)
        if k.startswith('encoder.encoders'):
            if v.ndim == 2:
                v = v.transpose(0, 1)

--- a/examples/ted_en_zh/t1/local/download_pretrain.sh
+++ b/examples/ted_en_zh/t1/local/download_pretrain.sh
+#!/bin/bash
+# Fetch the pretrained PyTorch checkpoint and convert it to a PaddlePaddle
+# checkpoint. Each step is checked on its own: `$?` only reflects the most
+# recent command, so a single check after the conversion would not catch a
+# failed download directly.
+# download pytorch weight
+if ! wget https://paddlespeech.bj.bcebos.com/s2t/ted_en_zh/st1/snapshot.ep.98 --no-check-certificate; then
+    echo "Failed in downloading!"
+    exit 1
+fi
+# convert pytorch weight to paddlepaddle
+# Or you can download converted weights
+# wget https://paddlespeech.bj.bcebos.com/s2t/ted_en_zh/st1/paddle.98.pdparams --no-check-certificate
+if ! python local/convert_torch_to_paddle.py \
+    --torch_ckpt snapshot.ep.98 \
+    --paddle_ckpt paddle.98.pdparams; then
+    echo "Failed in converting!"
+    exit 1
+fi
+exit 0
\ No newline at end of file
--- a/examples/ted_en_zh/t1/local/train.sh
+++ b/examples/ted_en_zh/t1/local/train.sh
--- a/examples/ted_en_zh/t1/run.sh
+++ b/examples/ted_en_zh/t1/run.sh
@@ -4,8 +4,8 @@ source path.sh
 gpus=0,1,2,3
 stage=1
-stop_stage=100
+stop_stage=4
-conf_path=conf/transformer_joint_noam.yaml
+conf_path=conf/transformer_mtl_noam.yaml
 ckpt_path=paddle.98
 avg_num=5
 data_path=./TED_EnZh # path to unzipped data
@@ -22,21 +22,21 @@ if [ ${stage} -le 0 ] && [ ${stop_stage} -ge 0 ]; then
 fi
 if [ ${stage} -le 1 ] && [ ${stop_stage} -ge 1 ]; then
-    # train model, all `ckpt` under `exp` dir
+    # download pretrained
-    CUDA_VISIBLE_DEVICES=${gpus} ./local/train.sh ${conf_path}  ${ckpt} ${ckpt_path}
+    bash ./local/download_pretrain.sh || exit -1
 fi
 if [ ${stage} -le 2 ] && [ ${stop_stage} -ge 2 ]; then
-    # avg n best model
+    # train model, all `ckpt` under `exp` dir
-    avg.sh best exp/${ckpt}/checkpoints ${avg_num}
+    CUDA_VISIBLE_DEVICES=${gpus} ./local/train_finetune.sh ${conf_path}  ${ckpt} ${ckpt_path}
 fi
 if [ ${stage} -le 3 ] && [ ${stop_stage} -ge 3 ]; then
-    # test ckpt avg_n
+    # avg n best model
-    CUDA_VISIBLE_DEVICES=0 ./local/test.sh ${conf_path} exp/${ckpt}/checkpoints/${avg_ckpt} || exit -1
+    avg.sh best exp/${ckpt}/checkpoints ${avg_num}
 fi
 if [ ${stage} -le 4 ] && [ ${stop_stage} -ge 4 ]; then
-    # export ckpt avg_n
+    # test ckpt avg_n
-    CUDA_VISIBLE_DEVICES= ./local/export.sh ${conf_path} exp/${ckpt}/checkpoints/${avg_ckpt} exp/${ckpt}/checkpoints/${avg_ckpt}.jit
+    CUDA_VISIBLE_DEVICES=0 ./local/test.sh ${conf_path} exp/${ckpt}/checkpoints/${avg_ckpt} || exit -1
 fi
\ No newline at end of file