未验证 提交 b14da765 编写于 作者: 小湉湉's avatar 小湉湉 提交者: GitHub

rm random spk embedding in voice cloning, test=doc (#2429)

上级 861dc2a9
...@@ -135,16 +135,16 @@ def voice_cloning(args): ...@@ -135,16 +135,16 @@ def voice_cloning(args):
print(f"{utt_id} done!") print(f"{utt_id} done!")
# generate 5 random_spk_emb # generate 5 random_spk_emb
for i in range(5): # for i in range(5):
random_spk_emb = gen_random_embed(args.use_ecapa) # random_spk_emb = gen_random_embed(args.use_ecapa)
utt_id = "random_spk_emb" # utt_id = "random_spk_emb"
with paddle.no_grad(): # with paddle.no_grad():
wav = voc_inference(am_inference(phone_ids, spk_emb=random_spk_emb)) # wav = voc_inference(am_inference(phone_ids, spk_emb=random_spk_emb))
sf.write( # sf.write(
str(output_dir / (utt_id + "_" + str(i) + ".wav")), # str(output_dir / (utt_id + "_" + str(i) + ".wav")),
wav.numpy(), # wav.numpy(),
samplerate=am_config.fs) # samplerate=am_config.fs)
print(f"{utt_id} done!") # print(f"{utt_id} done!")
def parse_args(): def parse_args():
......
Markdown is supported
0% .
You are about to add 0 people to the discussion. Proceed with caution.
先完成此消息的编辑!
想要评论请 注册