From 04a225ae4f8f7f4af068207627bb65b93bdd5fe6 Mon Sep 17 00:00:00 2001 From: Xinghai Sun Date: Wed, 14 Jun 2017 18:14:50 +0800 Subject: [PATCH] Enable min_batch_size in train.py and update train info print. --- compute_mean_std.py | 0 data_utils/__init__.py | 0 data_utils/audio.py | 0 data_utils/augmentor/__init__.py | 0 data_utils/augmentor/augmentation.py | 0 data_utils/augmentor/base.py | 0 data_utils/augmentor/volume_perturb.py | 0 data_utils/featurizer/__init__.py | 0 data_utils/featurizer/audio_featurizer.py | 0 data_utils/featurizer/speech_featurizer.py | 0 data_utils/featurizer/text_featurizer.py | 0 data_utils/normalizer.py | 0 data_utils/speech.py | 0 data_utils/utils.py | 0 datasets/run_all.sh | 0 decoder.py | 0 train.py | 10 ++++++---- 17 files changed, 6 insertions(+), 4 deletions(-) mode change 100755 => 100644 compute_mean_std.py mode change 100755 => 100644 data_utils/__init__.py mode change 100755 => 100644 data_utils/audio.py mode change 100755 => 100644 data_utils/augmentor/__init__.py mode change 100755 => 100644 data_utils/augmentor/augmentation.py mode change 100755 => 100644 data_utils/augmentor/base.py mode change 100755 => 100644 data_utils/augmentor/volume_perturb.py mode change 100755 => 100644 data_utils/featurizer/__init__.py mode change 100755 => 100644 data_utils/featurizer/audio_featurizer.py mode change 100755 => 100644 data_utils/featurizer/speech_featurizer.py mode change 100755 => 100644 data_utils/featurizer/text_featurizer.py mode change 100755 => 100644 data_utils/normalizer.py mode change 100755 => 100644 data_utils/speech.py mode change 100755 => 100644 data_utils/utils.py mode change 100755 => 100644 datasets/run_all.sh mode change 100755 => 100644 decoder.py diff --git a/compute_mean_std.py b/compute_mean_std.py old mode 100755 new mode 100644 diff --git a/data_utils/__init__.py b/data_utils/__init__.py old mode 100755 new mode 100644 diff --git a/data_utils/audio.py b/data_utils/audio.py old mode 100755 new mode 100644 
diff --git a/data_utils/augmentor/__init__.py b/data_utils/augmentor/__init__.py old mode 100755 new mode 100644 diff --git a/data_utils/augmentor/augmentation.py b/data_utils/augmentor/augmentation.py old mode 100755 new mode 100644 diff --git a/data_utils/augmentor/base.py b/data_utils/augmentor/base.py old mode 100755 new mode 100644 diff --git a/data_utils/augmentor/volume_perturb.py b/data_utils/augmentor/volume_perturb.py old mode 100755 new mode 100644 diff --git a/data_utils/featurizer/__init__.py b/data_utils/featurizer/__init__.py old mode 100755 new mode 100644 diff --git a/data_utils/featurizer/audio_featurizer.py b/data_utils/featurizer/audio_featurizer.py old mode 100755 new mode 100644 diff --git a/data_utils/featurizer/speech_featurizer.py b/data_utils/featurizer/speech_featurizer.py old mode 100755 new mode 100644 diff --git a/data_utils/featurizer/text_featurizer.py b/data_utils/featurizer/text_featurizer.py old mode 100755 new mode 100644 diff --git a/data_utils/normalizer.py b/data_utils/normalizer.py old mode 100755 new mode 100644 diff --git a/data_utils/speech.py b/data_utils/speech.py old mode 100755 new mode 100644 diff --git a/data_utils/utils.py b/data_utils/utils.py old mode 100755 new mode 100644 diff --git a/datasets/run_all.sh b/datasets/run_all.sh old mode 100755 new mode 100644 diff --git a/decoder.py b/decoder.py old mode 100755 new mode 100644 diff --git a/train.py b/train.py index 7ac4626f..6074aa35 100644 --- a/train.py +++ b/train.py @@ -143,11 +143,13 @@ def train(): train_batch_reader = train_generator.batch_reader_creator( manifest_path=args.train_manifest_path, batch_size=args.batch_size, + min_batch_size=args.trainer_count, sortagrad=args.use_sortagrad if args.init_model_path is None else False, batch_shuffle=True) test_batch_reader = test_generator.batch_reader_creator( manifest_path=args.dev_manifest_path, batch_size=args.batch_size, + min_batch_size=1, # must be 1, but will have errors. 
sortagrad=False, batch_shuffle=False) @@ -157,11 +159,11 @@ def train(): if isinstance(event, paddle.event.EndIteration): cost_sum += event.cost cost_counter += 1 - if event.batch_id % 50 == 0: - print("\nPass: %d, Batch: %d, TrainCost: %f" % - (event.pass_id, event.batch_id, cost_sum / cost_counter)) + if (event.batch_id + 1) % 100 == 0: + print("\nPass: %d, Batch: %d, TrainCost: %f" % ( + event.pass_id, event.batch_id + 1, cost_sum / cost_counter)) cost_sum, cost_counter = 0.0, 0 - with gzip.open("params_tmp.tar.gz", 'w') as f: + with gzip.open("params.tar.gz", 'w') as f: parameters.to_tar(f) else: sys.stdout.write('.') -- GitLab