提交 5b804b70 编写于 作者: L lifuchen

Modified some config names and default paths.

上级 abdc0a72
...@@ -126,10 +126,10 @@ python synthesis.py \ ...@@ -126,10 +126,10 @@ python synthesis.py \
--checkpoint=${CHECKPOINTPATH} \ --checkpoint=${CHECKPOINTPATH} \
--config='configs/ljspeech.yaml' \ --config='configs/ljspeech.yaml' \
--output=${OUTPUTPATH} \ --output=${OUTPUTPATH} \
--vocoder='griffinlim' \ --vocoder='griffin-lim' \
``` ```
We currently support two vocoders, ``griffinlim`` and ``waveflow``. You can set ``--vocoder`` to use one of them. If you want to use ``waveflow`` as your vocoder, you need to set ``--config_vocoder`` and ``--checkpoint_vocoder`` which are the path of the config and checkpoint of vocoder. You can download the pretrain model of ``waveflow`` from [here](https://github.com/PaddlePaddle/Parakeet#vocoders). We currently support two vocoders, the ``Griffin-Lim`` algorithm and ``WaveFlow``. Set ``--vocoder`` to ``griffin-lim`` or ``waveflow`` to choose one of them. If you use ``waveflow`` as your vocoder, you also need to set ``--config_vocoder`` and ``--checkpoint_vocoder``, which are the paths to the vocoder's config file and checkpoint. You can download the pre-trained ``waveflow`` model from [here](https://github.com/PaddlePaddle/Parakeet#vocoders).
Or you can run the script file directly. Or you can run the script file directly.
......
...@@ -39,8 +39,8 @@ def add_config_options_to_parser(parser): ...@@ -39,8 +39,8 @@ def add_config_options_to_parser(parser):
parser.add_argument( parser.add_argument(
"--vocoder", "--vocoder",
type=str, type=str,
default="griffinlim", default="griffin-lim",
choices=['griffinlim', 'waveflow'], choices=['griffin-lim', 'waveflow'],
help="vocoder method") help="vocoder method")
parser.add_argument( parser.add_argument(
"--config_vocoder", type=str, help="path of the vocoder config file") "--config_vocoder", type=str, help="path of the vocoder config file")
...@@ -53,11 +53,11 @@ def add_config_options_to_parser(parser): ...@@ -53,11 +53,11 @@ def add_config_options_to_parser(parser):
) )
parser.add_argument( parser.add_argument(
"--checkpoint", type=str, help="fastspeech checkpoint to synthesis") "--checkpoint", type=str, help="fastspeech checkpoint for synthesis")
parser.add_argument( parser.add_argument(
"--checkpoint_vocoder", "--checkpoint_vocoder",
type=str, type=str,
help="vocoder checkpoint to synthesis") help="vocoder checkpoint for synthesis")
parser.add_argument( parser.add_argument(
"--output", "--output",
...@@ -96,7 +96,7 @@ def synthesis(text_input, args): ...@@ -96,7 +96,7 @@ def synthesis(text_input, args):
_, mel_output_postnet = model(text, pos_text, alpha=args.alpha) _, mel_output_postnet = model(text, pos_text, alpha=args.alpha)
if args.vocoder == 'griffinlim': if args.vocoder == 'griffin-lim':
#synthesis use griffin-lim #synthesis use griffin-lim
wav = synthesis_with_griffinlim(mel_output_postnet, cfg['audio']) wav = synthesis_with_griffinlim(mel_output_postnet, cfg['audio'])
elif args.vocoder == 'waveflow': elif args.vocoder == 'waveflow':
......
...@@ -4,12 +4,12 @@ CUDA_VISIBLE_DEVICES=0 \ ...@@ -4,12 +4,12 @@ CUDA_VISIBLE_DEVICES=0 \
python -u synthesis.py \ python -u synthesis.py \
--use_gpu=1 \ --use_gpu=1 \
--alpha=1.0 \ --alpha=1.0 \
--checkpoint='./checkpoint/fastspeech/step-162000' \ --checkpoint='./fastspeech_ljspeech_ckpt_1.0/fastspeech/step-162000' \
--config='configs/ljspeech.yaml' \ --config='fastspeech_ljspeech_ckpt_1.0/ljspeech.yaml' \
--output='./synthesis' \ --output='./synthesis' \
--vocoder='waveflow' \ --vocoder='waveflow' \
--config_vocoder='../waveflow/checkpoint/waveflow_res128_ljspeech_ckpt_1.0/waveflow_ljspeech.yaml' \ --config_vocoder='./waveflow_res128_ljspeech_ckpt_1.0/waveflow_ljspeech.yaml' \
--checkpoint_vocoder='../waveflow/checkpoint/waveflow_res128_ljspeech_ckpt_1.0/step-2000000' \ --checkpoint_vocoder='./waveflow_res128_ljspeech_ckpt_1.0/step-2000000' \
......
...@@ -95,10 +95,10 @@ python synthesis.py \ ...@@ -95,10 +95,10 @@ python synthesis.py \
--output=${OUTPUTPATH} \ --output=${OUTPUTPATH} \
--config='configs/ljspeech.yaml' \ --config='configs/ljspeech.yaml' \
--checkpoint_transformer=${CHECKPOINTPATH} \ --checkpoint_transformer=${CHECKPOINTPATH} \
--vocoder='griffinlim' \ --vocoder='griffin-lim' \
``` ```
We currently support two vocoders, ``griffinlim`` and ``waveflow``. You can set ``--vocoder`` to use one of them. If you want to use ``waveflow`` as your vocoder, you need to set ``--config_vocoder`` and ``--checkpoint_vocoder`` which are the path of the config and checkpoint of vocoder. You can download the pretrain model of ``waveflow`` from [here](https://github.com/PaddlePaddle/Parakeet#vocoders). We currently support two vocoders, the ``Griffin-Lim`` algorithm and ``WaveFlow``. Set ``--vocoder`` to ``griffin-lim`` or ``waveflow`` to choose one of them. If you use ``waveflow`` as your vocoder, you also need to set ``--config_vocoder`` and ``--checkpoint_vocoder``, which are the paths to the vocoder's config file and checkpoint. You can download the pre-trained ``waveflow`` model from [here](https://github.com/PaddlePaddle/Parakeet#vocoders).
Or you can run the script file directly. Or you can run the script file directly.
......
...@@ -49,19 +49,19 @@ def add_config_options_to_parser(parser): ...@@ -49,19 +49,19 @@ def add_config_options_to_parser(parser):
parser.add_argument( parser.add_argument(
"--checkpoint_transformer", "--checkpoint_transformer",
type=str, type=str,
help="transformer_tts checkpoint to synthesis") help="transformer_tts checkpoint for synthesis")
parser.add_argument( parser.add_argument(
"--vocoder", "--vocoder",
type=str, type=str,
default="griffinlim", default="griffin-lim",
choices=['griffinlim', 'waveflow'], choices=['griffin-lim', 'waveflow'],
help="vocoder method") help="vocoder method")
parser.add_argument( parser.add_argument(
"--config_vocoder", type=str, help="path of the vocoder config file") "--config_vocoder", type=str, help="path of the vocoder config file")
parser.add_argument( parser.add_argument(
"--checkpoint_vocoder", "--checkpoint_vocoder",
type=str, type=str,
help="vocoder checkpoint to synthesis") help="vocoder checkpoint for synthesis")
parser.add_argument( parser.add_argument(
"--output", "--output",
...@@ -124,7 +124,7 @@ def synthesis(text_input, args): ...@@ -124,7 +124,7 @@ def synthesis(text_input, args):
i * 4 + j, i * 4 + j,
dataformats="HWC") dataformats="HWC")
if args.vocoder == 'griffinlim': if args.vocoder == 'griffin-lim':
#synthesis use griffin-lim #synthesis use griffin-lim
wav = synthesis_with_griffinlim(postnet_pred, cfg['audio']) wav = synthesis_with_griffinlim(postnet_pred, cfg['audio'])
elif args.vocoder == 'waveflow': elif args.vocoder == 'waveflow':
......
...@@ -4,11 +4,11 @@ CUDA_VISIBLE_DEVICES=0 \ ...@@ -4,11 +4,11 @@ CUDA_VISIBLE_DEVICES=0 \
python -u synthesis.py \ python -u synthesis.py \
--use_gpu=0 \ --use_gpu=0 \
--output='./synthesis' \ --output='./synthesis' \
--config='configs/ljspeech.yaml' \ --config='transformer_tts_ljspeech_ckpt_1.0/ljspeech.yaml' \
--checkpoint_transformer='./checkpoint/transformer/step-120000' \ --checkpoint_transformer='./transformer_tts_ljspeech_ckpt_1.0/step-120000' \
--vocoder='waveflow' \ --vocoder='waveflow' \
--config_vocoder='../waveflow/checkpoint/waveflow_res128_ljspeech_ckpt_1.0/waveflow_ljspeech.yaml' \ --config_vocoder='./waveflow_res128_ljspeech_ckpt_1.0/waveflow_ljspeech.yaml' \
--checkpoint_vocoder='../waveflow/checkpoint/waveflow_res128_ljspeech_ckpt_1.0/step-2000000' \ --checkpoint_vocoder='./waveflow_res128_ljspeech_ckpt_1.0/step-2000000' \
if [ $? -ne 0 ]; then if [ $? -ne 0 ]; then
echo "Failed in training!" echo "Failed in training!"
......
Markdown is supported
0% .
You are about to add 0 people to the discussion. Proceed with caution.
先完成此消息的编辑!
想要评论请 注册