Merge branch 'develop' of github.com:SmileGoat/PaddleSpeech into add_fbank

bc21a584 · Yang Zhou · 0d4018c2 · a0308992 · bc21a584 · bc21a584
Showing 2 changed files with 18 additions and 18 deletions

examples/other/mfa/local/reorganize_aishell3.py +16 -16

paddlespeech/t2s/exps/voice_cloning.py +2 -2

No files found.
--- a/examples/other/mfa/local/reorganize_aishell3.py
+++ b/examples/other/mfa/local/reorganize_aishell3.py
--- a/paddlespeech/t2s/exps/voice_cloning.py
+++ b/paddlespeech/t2s/exps/voice_cloning.py
@@ -110,10 +110,10 @@ def voice_cloning(args):
        print(f"{utt_id} done!")
    # Randomly generate numbers of 0 ~ 0.2, 256 is the dim of spk_emb
    random_spk_emb = np.random.rand(256) * 0.2
-    random_spk_emb = paddle.to_tensor(random_spk_emb)
+    random_spk_emb = paddle.to_tensor(random_spk_emb, dtype='float32')
    utt_id = "random_spk_emb"
    with paddle.no_grad():
-        wav = voc_inference(am_inference(phone_ids, spk_emb=spk_emb))
+        wav = voc_inference(am_inference(phone_ids, spk_emb=random_spk_emb))
    sf.write(
        str(output_dir / (utt_id + ".wav")),
        wav.numpy(),