diff --git a/demos/streaming_tts_server/test_client.sh b/demos/streaming_tts_server/test_client.sh
index 333ae00d2aac97e05787b79918f00f0920df0308..8698209521d4ed05ca53d4844e7b7bcba06f7cca 100644
--- a/demos/streaming_tts_server/test_client.sh
+++ b/demos/streaming_tts_server/test_client.sh
@@ -1,7 +1,7 @@
 #!/bin/bash
 
 # http client test
-paddlespeech_client tts --server_ip 127.0.0.1 --port 8092 --protocol http --input "您好,欢迎使用百度飞桨语音合成服务。" --output output.wav
+paddlespeech_client tts_online --server_ip 127.0.0.1 --port 8092 --protocol http --input "您好,欢迎使用百度飞桨语音合成服务。" --output output.wav
 
 # websocket client test
-#paddlespeech_client tts --server_ip 127.0.0.1 --port 8092 --protocol websocket --input "您好,欢迎使用百度飞桨语音合成服务。" --output output.wav
\ No newline at end of file
+#paddlespeech_client tts_online --server_ip 127.0.0.1 --port 8092 --protocol websocket --input "您好,欢迎使用百度飞桨语音合成服务。" --output output.wav
diff --git a/paddlespeech/server/utils/audio_process.py b/paddlespeech/server/utils/audio_process.py
index c6dad889128f057db2da39d8b944d60670635b5d..6fb5bb832af4caab8d3b9065cd5a9630ccf2a311 100644
--- a/paddlespeech/server/utils/audio_process.py
+++ b/paddlespeech/server/utils/audio_process.py
@@ -157,7 +157,7 @@ def save_audio(bytes_data, audio_path, sample_rate: int=24000) -> bool:
 
     if audio_path.endswith("pcm"):
         with open(audio_path, "wb") as f:
-            f.write(bubytes_dataffer)
+            f.write(bytes_data)
     elif audio_path.endswith("wav"):
         with open("./tmp.pcm", "wb") as f:
             f.write(bytes_data)
diff --git a/paddlespeech/t2s/modules/predictor/length_regulator.py b/paddlespeech/t2s/modules/predictor/length_regulator.py
index b64aa44ad4ca3b4403ba1092d5ecf22fac15ff71..e4fbf54916ed98948fffe8bf8325a312928efa57 100644
--- a/paddlespeech/t2s/modules/predictor/length_regulator.py
+++ b/paddlespeech/t2s/modules/predictor/length_regulator.py
@@ -49,7 +49,9 @@ class LengthRegulator(nn.Layer):
         encodings: (B, T, C)
         durations: (B, T)
         """
-        batch_size, t_enc = durations.shape
+        #batch_size, t_enc = durations.shape # linux
+        batch_size = paddle.shape(durations)[0] # windows and mac
+        t_enc = paddle.shape(durations)[1] # windows and mac
         durations = durations.numpy()
         slens = np.sum(durations, -1)
         t_dec = np.max(slens)