fix audio shape bug for audio len

9c0b6c5b · Hui Zhang · 718bd307 · 9c0b6c5b
隐藏空白更改
内联并排

Showing 1 changed file with 3 additions and 3 deletions

deepspeech/io/collator.py deepspeech/io/collator.py +3 -3

未找到文件。
--- a/deepspeech/io/collator.py
+++ b/deepspeech/io/collator.py
@@ -154,8 +154,8 @@ class SpeechCollator():
            random_seed (int, optional): for random generator. Defaults to 0.
            keep_transcription_text (bool, optional): True, when not in training mode, will not do tokenizer; Defaults to False.
            if ``keep_transcription_text`` is False, text is token ids else is raw string.
-        
-        Do augmentations 
+
+        Do augmentations
        Padding audio features with zeros to make them have the same shape (or
        a user-defined shape) within one batch.
        """
@@ -271,7 +271,7 @@ class SpeechCollator():
            utts.append(utt)
            # audio
            audios.append(audio)  # [T, D]
-            audio_lens.append(audio.shape[1])
+            audio_lens.append(audio.shape[0])
            # text
            # for training, text is token ids
            # else text is string, convert to unicode ord