diff --git a/paddlespeech/t2s/modules/losses.py b/paddlespeech/t2s/modules/losses.py index 93644e24aac93553bb938672ab22065b8740051e..db31bcfbb4361281df49d3afeb00dfb97c59d7f9 100644 --- a/paddlespeech/t2s/modules/losses.py +++ b/paddlespeech/t2s/modules/losses.py @@ -489,7 +489,7 @@ def stft(x, """ # calculate window window = signal.get_window(window, win_length, fftbins=True) - window = paddle.to_tensor(window) + window = paddle.to_tensor(window, dtype=x.dtype) x_stft = paddle.signal.stft( x, fft_size, @@ -896,7 +896,7 @@ class MelSpectrogram(nn.Layer): # calculate window window = signal.get_window( self.window, self.win_length, fftbins=True) - window = paddle.to_tensor(window) + window = paddle.to_tensor(window, dtype=x.dtype) else: window = None