Merge pull request #1991 from yt605155624/fix_mfa

[TTS]gen lexicon with tone in mfa, test=tts

Merge pull request #1991 from yt605155624/fix_mfa
[TTS]gen lexicon with tone in mfa, test=tts
0c6dddb1 · 小湉湉 · GitHub · aa3d151d · 9a253bc0 · 0c6dddb1
隐藏空白更改
内联并排

Showing 2 changed files with 2 additions and 7 deletions

examples/other/mfa/local/reorganize_baker.py examples/other/mfa/local/reorganize_baker.py +0 -3

examples/other/mfa/run.sh examples/other/mfa/run.sh +2 -4

未找到文件。
--- a/examples/other/mfa/local/reorganize_baker.py
+++ b/examples/other/mfa/local/reorganize_baker.py
@@ -42,9 +42,6 @@ def get_transcripts(path: Union[str, Path]):
    for i in range(0, len(lines), 2):
        sentence_id = lines[i].split()[0]
        transcription = lines[i + 1].strip()
-        # tones are dropped here
-        # since the lexicon does not consider tones, too
-        transcription = " ".join([item[:-1] for item in transcription.split()])
        transcripts[sentence_id] = transcription

    return transcripts

--- a/examples/other/mfa/run.sh
+++ b/examples/other/mfa/run.sh
@@ -4,7 +4,7 @@ mkdir -p $EXP_DIR
 LEXICON_NAME='simple'
 if [ ! -f "$EXP_DIR/$LEXICON_NAME.lexicon" ]; then
    echo "generating lexicon..."
-    python local/generate_lexicon.py "$EXP_DIR/$LEXICON_NAME" --with-r
+    python local/generate_lexicon.py "$EXP_DIR/$LEXICON_NAME" --with-r --with-tone
    echo "lexicon done"
 fi

@@ -16,6 +16,7 @@ if [ ! -d $EXP_DIR/baker_corpus ]; then
    echo "transcription for each audio file is saved with the same namd in $EXP_DIR/baker_corpus "
 fi

+
 echo "detecting oov..."
 python local/detect_oov.py $EXP_DIR/baker_corpus $EXP_DIR/"$LEXICON_NAME.lexicon"
 echo "detecting oov done. you may consider regenerate lexicon if there is unexpected OOVs."
@@ -44,6 +45,3 @@ if [ ! -d "$EXP_DIR/baker_alignment" ]; then
    echo "model: $EXP_DIR/baker_model"
 fi

-
-
-