diff --git a/examples/librispeech/asr1/conf/chunk_transformer.yaml b/examples/librispeech/asr1/conf/chunk_transformer.yaml index fe533777630a3aa1c26577492457ff2e4c06c848..c2644daf4a76b671e72e8fbae5d8f0278fdc460a 100644 --- a/examples/librispeech/asr1/conf/chunk_transformer.yaml +++ b/examples/librispeech/asr1/conf/chunk_transformer.yaml @@ -11,9 +11,9 @@ data: max_output_input_ratio: 100.0 collator: - vocab_filepath: data/vocab.txt + vocab_filepath: data/lang_char/vocab.txt unit_type: 'spm' - spm_model_prefix: 'data/bpe_unigram_5000' + spm_model_prefix: 'data/lang_char/bpe_unigram_5000' mean_std_filepath: "" augmentation_config: conf/preprocess.yaml batch_size: 64 diff --git a/examples/librispeech/asr2/conf/preprocess.yaml b/examples/librispeech/asr2/conf/preprocess.yaml new file mode 100644 index 0000000000000000000000000000000000000000..bc86d98c1aca87b69e66a3725321a44242c42c60 --- /dev/null +++ b/examples/librispeech/asr2/conf/preprocess.yaml @@ -0,0 +1,16 @@ +process: + # these three processes are a.k.a. SpecAugment + - type: time_warp + max_time_warp: 5 + inplace: true + mode: PIL + - type: freq_mask + F: 30 + n_mask: 2 + inplace: true + replace_with_zero: false + - type: time_mask + T: 40 + n_mask: 2 + inplace: true + replace_with_zero: false diff --git a/examples/librispeech/asr2/conf/transformer.yaml b/examples/librispeech/asr2/conf/transformer.yaml index de1ac347a8f2b57377c3493a804b8d07141f082f..4a50183a9c84ce1470966e833f163efe38a960e5 100644 --- a/examples/librispeech/asr2/conf/transformer.yaml +++ b/examples/librispeech/asr2/conf/transformer.yaml @@ -57,7 +57,7 @@ collator: batch_frames_in: 0 batch_frames_out: 0 batch_frames_inout: 0 - augmentation_config: conf/augmentation.json + augmentation_config: conf/preprocess.yaml num_workers: 0 subsampling_factor: 1 num_encs: 1