提交 fd009bb0 编写于 作者: C chenfeiyu

Use os.path instead of pathlib for building file paths in the LJSpeech dataset classes.

上级 86fff7a0
...@@ -12,7 +12,7 @@ ...@@ -12,7 +12,7 @@
# See the License for the specific language governing permissions and # See the License for the specific language governing permissions and
# limitations under the License. # limitations under the License.
from pathlib import Path import os
import numpy as np import numpy as np
import pandas as pd import pandas as pd
import librosa import librosa
...@@ -27,13 +27,11 @@ from ..data.batch import TextIDBatcher, SpecBatcher ...@@ -27,13 +27,11 @@ from ..data.batch import TextIDBatcher, SpecBatcher
class LJSpeech(DatasetMixin): class LJSpeech(DatasetMixin):
def __init__(self, root): def __init__(self, root):
super(LJSpeech, self).__init__() super(LJSpeech, self).__init__()
assert isinstance(root, ( self.root = root
str, Path)), "root should be a string or Path object"
self.root = root if isinstance(root, Path) else Path(root)
self.metadata = self._prepare_metadata() self.metadata = self._prepare_metadata()
def _prepare_metadata(self): def _prepare_metadata(self):
csv_path = self.root.joinpath("metadata.csv") csv_path = os.path.join(self.root, "metadata.csv")
metadata = pd.read_csv( metadata = pd.read_csv(
csv_path, csv_path,
sep="|", sep="|",
...@@ -51,7 +49,7 @@ class LJSpeech(DatasetMixin): ...@@ -51,7 +49,7 @@ class LJSpeech(DatasetMixin):
""" """
fname, raw_text, normalized_text = metadatum fname, raw_text, normalized_text = metadatum
wav_path = self.root.joinpath("wavs", fname + ".wav") wav_path = os.path.join(self.root, "wavs", fname + ".wav")
# load -> trim -> preemphasis -> stft -> magnitude -> mel_scale -> logscale -> normalize # load -> trim -> preemphasis -> stft -> magnitude -> mel_scale -> logscale -> normalize
wav, sample_rate = librosa.load( wav, sample_rate = librosa.load(
......
...@@ -12,6 +12,7 @@ ...@@ -12,6 +12,7 @@
# See the License for the specific language governing permissions and # See the License for the specific language governing permissions and
# limitations under the License. # limitations under the License.
import os
import random import random
import librosa import librosa
...@@ -32,7 +33,7 @@ class Dataset(ljspeech.LJSpeech): ...@@ -32,7 +33,7 @@ class Dataset(ljspeech.LJSpeech):
def _get_example(self, metadatum): def _get_example(self, metadatum):
fname, _, _ = metadatum fname, _, _ = metadatum
wav_path = self.root.joinpath("wavs", fname + ".wav") wav_path = os.path.join(self.root, "wavs", fname + ".wav")
loaded_sr, audio = read(wav_path) loaded_sr, audio = read(wav_path)
assert loaded_sr == self.config.sample_rate assert loaded_sr == self.config.sample_rate
......
Markdown is supported
0% .
You are about to add 0 people to the discussion. Proceed with caution.
先完成此消息的编辑!
想要评论请 注册