fix by review

93fecc89 · zhxfl · ec4fb544 · 93fecc89
隐藏空白更改
内联并排

Showing 1 changed file with 13 additions and 12 deletions

fluid/DeepASR/data_utils/data_reader.py fluid/DeepASR/data_utils/data_reader.py +13 -12

未找到文件。
--- a/fluid/DeepASR/data_utils/data_reader.py
+++ b/fluid/DeepASR/data_utils/data_reader.py
@@ -61,9 +61,9 @@ class SampleInfoBucket(object):
        label_bin_paths (list|tuple): Files containing the binary label data.
        label_desc_paths (list|tuple): Files containing the description of
                                       samples' label data.
-        split_perturb(int): split long sentence' perturb sub-sentence length value. 
+        split_perturb(int): Random perturb sub-sentence length when split long sentence. 
-        split_sentence_threshold(int): sentence length large than 
+        split_sentence_threshold(int): Sentence whose length larger than 
-                                    split_sentence_threshold trigger split operator.
+                                the value will trigger split operation.
        split_sub_sentence_len(int): sub-sentence length is equal to 
                                    (split_sub_sentence_len + rand() % split_perturb).
    """
@@ -133,8 +133,8 @@ class SampleInfoBucket(object):
                    remain_frame_num = feature_frame_num
                    while True:
                        if remain_frame_num > self._split_sentence_threshold:
-                            cur_frame_len = self._split_sub_sentence_len + random.randint(
+                            cur_frame_len = self._split_sub_sentence_len + \
-                                0, self._split_perturb)
+                                    self._rng.randint(0, self._split_perturb)
                            if cur_frame_len > remain_frame_num:
                                cur_frame_len = remain_frame_num
                        else:
@@ -291,11 +291,12 @@ class DataReader(object):
                                           sample_info.feature_start,
                                           sample_info.feature_size)
-                assert sample_info.feature_frame_num * sample_info.feature_dim * 4 == len(
+                assert sample_info.feature_frame_num * sample_info.feature_dim * 4 \
-                    feature_bytes), (sample_info.feature_bin_path,
+                        == len(feature_bytes), \
-                                     sample_info.feature_frame_num,
+                        (sample_info.feature_bin_path,
-                                     sample_info.feature_dim,
+                         sample_info.feature_frame_num,
-                                     len(feature_bytes))
+                         sample_info.feature_dim,
+                         len(feature_bytes))
                label_bytes = read_bytes(sample_info.label_bin_path,
                                         sample_info.label_start,
@@ -329,8 +330,8 @@ class DataReader(object):
                    time.sleep(0.001)
                # drop long sentence
-                if self._drop_frame_len == -1 or self._drop_frame_len >= sample_data[
+                if self._drop_frame_len == -1 or \
-                        0].shape[0]:
+                        self._drop_frame_len >= sample_data[0].shape[0]:
                    sample_queue.put(sample_data)
                out_order[0] += 1