add audio augmentation

bfa4dd98 · chrisxu2014 · 3d4aba57 · bfa4dd98 · bfa4dd98
Show whitespace changes
Inline / Side-by-side

Showing with 7 additions and 7 deletions

deep_speech_2/data_utils/audio.py deep_speech_2/data_utils/audio.py +3 -3

deep_speech_2/data_utils/speech.py deep_speech_2/data_utils/speech.py +4 -4

No files found.
--- a/deep_speech_2/data_utils/audio.py
+++ b/deep_speech_2/data_utils/audio.py
@@ -88,7 +88,7 @@ class AudioSegment(object):
        :rtype: AudioSegment
        :raises ValueError: If the number of segments is zero, or if the 
                            sample_rate of any two segments does not match.
-        :raises TypeError: If every item in segments is not Audiosegment
+        :raises TypeError: If every item in segments is not AudioSegment
                           instance.
        """
        # Perform basic sanity-checks.
@@ -296,7 +296,7 @@ class AudioSegment(object):
        :type prior_db: float
        :param prior_samples: Prior strength in number of samples.
        :type prior_samples: float
-        :param startup_delay: Default 0.0 s. If provided, this function will
+        :param startup_delay: Default 0.0s. If provided, this function will
                              accrue statistics for the first startup_delay 
                              seconds before applying online normalization.
        :type startup_delay: float
@@ -401,7 +401,7 @@ class AudioSegment(object):
        self.subsegment(start_time, start_time + subsegment_length)
    def convolve(self, impulse_segment, allow_resample=False):
-        """Convolve this audio segment with the given filter.
+        """Convolve this audio segment with the given impulse_segment.
        Note that this is an in-place transformation.

--- a/deep_speech_2/data_utils/speech.py
+++ b/deep_speech_2/data_utils/speech.py
@@ -75,11 +75,11 @@ class SpeechSegment(AudioSegment):
        :rtype: SpeechSegment
        :raises ValueError: If the number of segments is zero, or if the 
                            sample_rate of any two segments does not match.
-        :raises TypeError: If every item in segments is not Audiosegment
+        :raises TypeError: If every item in segments is not SpeechSegment
                           instance.
        """
        if len(segments) == 0:
-            raise ValueError("No audio segments are given to concatenate.")
+            raise ValueError("No speech segments are given to concatenate.")
        sample_rate = segments[0]._sample_rate
        transcripts = ""
        for seg in segments:
@@ -116,7 +116,7 @@ class SpeechSegment(AudioSegment):
        :rtype: SpeechSegment
        """
        audio = Audiosegment.slice_from_file(filepath, start, end)
-        return cls(audio.samples, audio.sample_rate, transcripts)
+        return cls(audio.samples, audio.sample_rate, transcript)
    @classmethod
    def make_silence(cls, duration, sample_rate):
@@ -128,7 +128,7 @@ class SpeechSegment(AudioSegment):
        :param sample_rate: Sample rate.
        :type sample_rate: float
        :return: Silence of the given duration.
-        :rtype: AudioSegment
+        :rtype: SpeechSegment
        """
        audio = AudioSegment.make_silence(duration, sample_rate)
        return cls(audio.samples, audio.sample_rate, "")