fix add_sos_eos and cmvn

9876bdb4 · Hui Zhang · 28658cc1 · 9876bdb4 · 9876bdb4 · 9876bdb4
4 changed files
--- a/.gitignore
+++ b/.gitignore
@@ -9,3 +9,4 @@ tools/venv
 *.tar
 *.tar.gz
 .ipynb_checkpoints
+*.npz
--- a/.notebook/u2_model.ipynb
+++ b/.notebook/u2_model.ipynb
--- a/deepspeech/frontend/normalizer.py
+++ b/deepspeech/frontend/normalizer.py
@@ -101,7 +101,7 @@ class FeatureNormalizer(object):
            features.append(
                featurize_func(AudioSegment.from_file(instance["feat"])))
        features = np.hstack(features)  #(D, T)
-        self._mean = np.mean(features, axis=1).reshape([1, -1])  #(1, D)
+        self._mean = np.mean(features, axis=1)  #(D,)
-        std = np.std(features, axis=1).reshape([1, -1])  #(1, D)
+        std = np.std(features, axis=1)  #(D,)
        std = np.clip(std, eps, None)
        self._istd = 1.0 / std
--- a/deepspeech/utils/tensor_utils.py
+++ b/deepspeech/utils/tensor_utils.py
@@ -132,7 +132,7 @@ def add_sos_eos(ys_pad: paddle.Tensor, sos: int, eos: int,
    ys_out = paddle.cat([ys_pad, _eos], dim=1)
    ys_out = ys_out.masked_fill(mask_pad, eos)
-    mask_eos = (ys_in == ignore_id)
+    mask_eos = (ys_out == ignore_id)
    ys_out = ys_out.masked_fill(mask_eos, eos)
    ys_out = ys_out.masked_fill(mask_pad, ignore_id)
    return ys_in, ys_out