From 0780d181d29d8470ba3579aa0d0ef9465c5ad264 Mon Sep 17 00:00:00 2001
From: xiongxinlei
Date: Wed, 2 Mar 2022 20:55:31 +0800
Subject: [PATCH] remove personal code test=doc

---
 dataset/voxceleb/voxceleb1.py        | 106 ++++++++++++++++-----------
 examples/voxceleb/sv0/local/train.py |  24 +++++-
 examples/voxceleb/sv0/run.sh         |   4 +-
 3 files changed, 85 insertions(+), 49 deletions(-)

diff --git a/dataset/voxceleb/voxceleb1.py b/dataset/voxceleb/voxceleb1.py
index 0c9c68dc..b2d5f5c3 100644
--- a/dataset/voxceleb/voxceleb1.py
+++ b/dataset/voxceleb/voxceleb1.py
@@ -11,23 +11,26 @@
 # WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
 # See the License for the specific language governing permissions and
 # limitations under the License.
-
 import collections
 import csv
 import glob
 import os
 import random
-from typing import Dict, List, Tuple
+from typing import Dict
+from typing import List
+from typing import Tuple
 
 from paddle.io import Dataset
-from tqdm import tqdm
 from pathos.multiprocessing import Pool
+from tqdm import tqdm
 
 from paddleaudio.backends import load as load_audio
-from paddleaudio.utils import DATA_HOME, decompress, download_and_decompress
 from paddleaudio.datasets.dataset import feat_funcs
-from utils.utility import unpack
+from paddleaudio.utils import DATA_HOME
+from paddleaudio.utils import decompress
+from paddleaudio.utils import download_and_decompress
 from utils.utility import download
+from utils.utility import unpack
 
 __all__ = ['VoxCeleb1']
@@ -60,12 +63,13 @@ class VoxCeleb1(Dataset):
     ]
     archieves_meta = [
         {
-            'url': 'https://www.robots.ox.ac.uk/~vgg/data/voxceleb/meta/veri_test2.txt',
-            'md5': 'b73110731c9223c1461fe49cb48dddfc',
+            'url':
+            'https://www.robots.ox.ac.uk/~vgg/data/voxceleb/meta/veri_test2.txt',
+            'md5':
+            'b73110731c9223c1461fe49cb48dddfc',
         },
     ]
-
     num_speakers = 1211  # 1211 vox1, 5994 vox2, 7205 vox1+2, test speakers: 41
     sample_rate = 16000
     meta_info = collections.namedtuple(
@@ -74,15 +78,16 @@ class VoxCeleb1(Dataset):
     wav_path = os.path.join(base_path, 'wav')
     subsets = ['train', 'dev', 'enrol', 'test']
 
-    def __init__(self,
-                 subset: str = 'train',
-                 feat_type: str = 'raw',
-                 random_chunk: bool = True,
-                 chunk_duration: float = 3.0,  # seconds
-                 split_ratio: float = 0.9,  # train split ratio
-                 seed: int = 0,
-                 target_dir: str = None,
-                 **kwargs):
+    def __init__(
+            self,
+            subset: str='train',
+            feat_type: str='raw',
+            random_chunk: bool=True,
+            chunk_duration: float=3.0,  # seconds
+            split_ratio: float=0.9,  # train split ratio
+            seed: int=0,
+            target_dir: str=None,
+            **kwargs):
 
         assert subset in self.subsets, \
             'Dataset subset must be one in {}, but got {}'.format(self.subsets, subset)
@@ -95,8 +100,12 @@ class VoxCeleb1(Dataset):
         self.chunk_duration = chunk_duration
         self.split_ratio = split_ratio
         self.target_dir = target_dir if target_dir else self.base_path
-        self.csv_path = os.path.join(target_dir, 'csv') if target_dir else os.path.join(self.base_path, 'csv')
-        self.meta_path = os.path.join(target_dir, 'meta') if target_dir else os.path.join(base_path, 'meta')
+        self.csv_path = os.path.join(
+            target_dir, 'csv') if target_dir else os.path.join(self.base_path,
+                                                               'csv')
+        self.meta_path = os.path.join(
+            target_dir, 'meta') if target_dir else os.path.join(base_path,
+                                                                'meta')
         self.veri_test_file = os.path.join(self.meta_path, 'veri_test2.txt')
         # self._data = self._get_data()[:1000]  # KP: Small dataset test.
         self._data = self._get_data()
@@ -112,10 +121,14 @@ class VoxCeleb1(Dataset):
         print("wav base path: {}".format(self.wav_path))
         if not os.path.isdir(self.wav_path):
             print("start to download the voxceleb1 dataset")
-            download_and_decompress(  # multi-zip parts concatenate to vox1_dev_wav.zip
-                self.archieves_audio_dev, self.base_path, decompress=False)
-            download_and_decompress(  # download the vox1_test_wav.zip and unzip
-                self.archieves_audio_test, self.base_path, decompress=True)
+            download_and_decompress(  # multi-zip parts concatenate to vox1_dev_wav.zip
+                self.archieves_audio_dev,
+                self.base_path,
+                decompress=False)
+            download_and_decompress(  # download the vox1_test_wav.zip and unzip
+                self.archieves_audio_test,
+                self.base_path,
+                decompress=True)
 
             # Download all parts and concatenate the files into one zip file.
             dev_zipfile = os.path.join(self.base_path, 'vox1_dev_wav.zip')
@@ -131,7 +144,7 @@ class VoxCeleb1(Dataset):
         if not os.path.isdir(self.meta_path):
             download_and_decompress(
                 self.archieves_meta, self.meta_path, decompress=False)
-
+
         # Data preparation.
         if not os.path.isdir(self.csv_path):
             os.makedirs(self.csv_path)
@@ -143,8 +156,9 @@ class VoxCeleb1(Dataset):
                 audio_id, duration, wav, start, stop, spk_id = line.strip(
                 ).split(',')
                 data.append(
-                    self.meta_info(audio_id, float(duration), wav, int(start),
-                                   int(stop), spk_id))
+                    self.meta_info(audio_id,
+                                   float(duration), wav,
+                                   int(start), int(stop), spk_id))
 
         with open(os.path.join(self.meta_path, 'spk_id2label.txt'), 'r') as f:
             for line in f.readlines():
@@ -228,14 +242,16 @@ class VoxCeleb1(Dataset):
     def generate_csv(self,
                      wav_files: List[str],
                      output_file: str,
-                     split_chunks: bool = True):
+                     split_chunks: bool=True):
         print(f'Generating csv: {output_file}')
         header = ["id", "duration", "wav", "start", "stop", "spk_id"]
 
         with Pool(64) as p:
             infos = list(
                 tqdm(
-                    p.imap(lambda x: self._get_audio_info(x, split_chunks), wav_files), total=len(wav_files)))
+                    p.imap(lambda x: self._get_audio_info(x, split_chunks),
+                           wav_files),
+                    total=len(wav_files)))
 
         csv_lines = []
         for info in infos:
@@ -272,35 +288,39 @@ class VoxCeleb1(Dataset):
         audio_files = []
         speakers = set()
         for path in [self.wav_path]:
-            for file in glob.glob(os.path.join(path, "**", "*.wav"), recursive=True):
+            for file in glob.glob(
+                    os.path.join(path, "**", "*.wav"), recursive=True):
                 spk = file.split('/wav/')[1].split('/')[0]
                 if spk in test_spks:
                     continue
                 speakers.add(spk)
                 audio_files.append(file)
 
-        print("start to generate the {}".format(os.path.join(self.meta_path, 'spk_id2label.txt')))
+        print("start to generate the {}".format(
+            os.path.join(self.meta_path, 'spk_id2label.txt')))
         # encode the train and dev speakers label to spk_id2label.txt
         with open(os.path.join(self.meta_path, 'spk_id2label.txt'), 'w') as f:
-            for label, spk_id in enumerate(sorted(speakers)):  # 1211 vox1, 5994 vox2, 7205 vox1+2
+            for label, spk_id in enumerate(
+                    sorted(speakers)):  # 1211 vox1, 5994 vox2, 7205 vox1+2
                 f.write(f'{spk_id} {label}\n')
 
         audio_files = sorted(audio_files)
         random.shuffle(audio_files)
         split_idx = int(self.split_ratio * len(audio_files))
         # split_ratio to train
-        train_files, dev_files = audio_files[:split_idx], audio_files[split_idx:]
-
-        self.generate_csv(train_files,
-                          os.path.join(self.csv_path, 'train.csv'))
-        self.generate_csv(dev_files,
-                          os.path.join(self.csv_path, 'dev.csv'))
-        self.generate_csv(enrol_files,
-                          os.path.join(self.csv_path, 'enrol.csv'),
-                          split_chunks=False)
-        self.generate_csv(test_files,
-                          os.path.join(self.csv_path, 'test.csv'),
-                          split_chunks=False)
+        train_files, dev_files = audio_files[:split_idx], audio_files[
+            split_idx:]
+
+        self.generate_csv(train_files, os.path.join(self.csv_path, 'train.csv'))
+        self.generate_csv(dev_files, os.path.join(self.csv_path, 'dev.csv'))
+        self.generate_csv(
+            enrol_files,
+            os.path.join(self.csv_path, 'enrol.csv'),
+            split_chunks=False)
+        self.generate_csv(
+            test_files,
+            os.path.join(self.csv_path, 'test.csv'),
+            split_chunks=False)
 
     def __getitem__(self, idx):
         return self._convert_to_record(idx)
diff --git a/examples/voxceleb/sv0/local/train.py b/examples/voxceleb/sv0/local/train.py
index e8619cca..c0cb1e17 100644
--- a/examples/voxceleb/sv0/local/train.py
+++ b/examples/voxceleb/sv0/local/train.py
@@ -1,5 +1,20 @@
+# Copyright (c) 2022 PaddlePaddle Authors. All Rights Reserved.
+#
+# Licensed under the Apache License, Version 2.0 (the "License");
+# you may not use this file except in compliance with the License.
+# You may obtain a copy of the License at
+#
+#     http://www.apache.org/licenses/LICENSE-2.0
+#
+# Unless required by applicable law or agreed to in writing, software
+# distributed under the License is distributed on an "AS IS" BASIS,
+# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
+# See the License for the specific language governing permissions and
+# limitations under the License.
 import argparse
+
 import paddle
+
 from dataset.voxceleb.voxceleb1 import VoxCeleb1
 
 
@@ -14,12 +29,13 @@ def main(args):
     # stage2: data prepare
     train_ds = VoxCeleb1('train', target_dir=args.data_dir)
 
+
 if __name__ == "__main__":
     # yapf: disable
     parser = argparse.ArgumentParser(__doc__)
-    parser.add_argument('--device',
-                        choices=['cpu', 'gpu'],
-                        default="cpu",
+    parser.add_argument('--device',
+                        choices=['cpu', 'gpu'],
+                        default="cpu",
                         help="Select which device to train model, defaults to gpu.")
     parser.add_argument("--data-dir",
                         default="./data/",
@@ -28,4 +44,4 @@ if __name__ == "__main__":
 
     args = parser.parse_args()
     # yapf: enable
-    main(args)
\ No newline at end of file
+    main(args)
diff --git a/examples/voxceleb/sv0/run.sh b/examples/voxceleb/sv0/run.sh
index c24cbff4..a8debfc6 100755
--- a/examples/voxceleb/sv0/run.sh
+++ b/examples/voxceleb/sv0/run.sh
@@ -5,6 +5,6 @@ export PPAUDIO_HOME=/home/users/xiongxinlei/exprts/v3
 dir=./data/
 mkdir -p ${dir}
 # you can set the variable DATA_HOME to specifiy the downloaded the vox1 and vox2 dataset
-/home/users/xiongxinlei/.conda/envs/xxl_base/bin/python3 \
+python3 \
 local/train.py \
-    --data-dir ${dir}
\ No newline at end of file
+    --data-dir ${dir}
--
GitLab
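Usage note (a minimal sketch, not part of the patch): with this change the dataset
writes its csv/ and meta/ files under whatever directory is passed as target_dir,
which is how local/train.py drives data preparation through the --data-dir
argument. Assuming paddle and paddleaudio are installed and the repository root is
on PYTHONPATH, the prepared dataset could be exercised like this; the data_dir
value simply mirrors the ./data/ default from train.py and run.sh:

    from dataset.voxceleb.voxceleb1 import VoxCeleb1

    data_dir = "./data/"  # same default as --data-dir in local/train.py

    # On first use this downloads VoxCeleb1 if the wav directory is missing, then
    # writes train/dev/enrol/test.csv under <data_dir>/csv and spk_id2label.txt
    # plus veri_test2.txt under <data_dir>/meta before indexing the train split.
    train_ds = VoxCeleb1('train', target_dir=data_dir)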