paddleaudio.datasets.voxceleb module

class paddleaudio.datasets.voxceleb.VoxCeleb(subset: str = 'train', feat_type: str = 'raw', random_chunk: bool = True, chunk_duration: float = 3.0, split_ratio: float = 0.9, seed: int = 0, target_dir: Optional[str] = None, vox2_base_path=None, **kwargs)[source]

Bases: Dataset

Methods

meta_info — alias of META_INFO

generate_csv

prepare_data

archieves_audio_dev = [{'url': 'https://thor.robots.ox.ac.uk/~vgg/data/voxceleb/vox1a/vox1_dev_wav_partaa', 'md5': 'e395d020928bc15670b570a21695ed96'}, {'url': 'https://thor.robots.ox.ac.uk/~vgg/data/voxceleb/vox1a/vox1_dev_wav_partab', 'md5': 'bbfaaccefab65d82b21903e81a8a8020'}, {'url': 'https://thor.robots.ox.ac.uk/~vgg/data/voxceleb/vox1a/vox1_dev_wav_partac', 'md5': '017d579a2a96a077f40042ec33e51512'}, {'url': 'https://thor.robots.ox.ac.uk/~vgg/data/voxceleb/vox1a/vox1_dev_wav_partad', 'md5': '7bb1e9f70fddc7a678fa998ea8b3ba19'}]
archieves_audio_test = [{'url': 'https://thor.robots.ox.ac.uk/~vgg/data/voxceleb/vox1a/vox1_test_wav.zip', 'md5': '185fdc63c3c739954633d50379a3d102'}]
archieves_meta = [{'url': 'https://www.robots.ox.ac.uk/~vgg/data/voxceleb/meta/veri_test2.txt', 'md5': 'b73110731c9223c1461fe49cb48dddfc'}]
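base_path = '/home/docs/.paddleaudio/datasets/vox1' (value as rendered on the documentation build host; the runtime path presumably resolves under the current user's home directory — confirm against the installed package)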
csv_path = '/home/docs/.paddleaudio/datasets/vox1/csv'
generate_csv(wav_files: List[str], output_file: str, split_chunks: bool = True)[source]
meta_info — alias of META_INFO

meta_path = '/home/docs/.paddleaudio/datasets/vox1/meta'
num_speakers = 1211
prepare_data()[source]
sample_rate = 16000
source_url = 'https://thor.robots.ox.ac.uk/~vgg/data/voxceleb/vox1a/'
subsets = ['train', 'dev', 'enroll', 'test']
veri_test_file = '/home/docs/.paddleaudio/datasets/vox1/meta/veri_test2.txt'
wav_path = '/home/docs/.paddleaudio/datasets/vox1/wav'