embedding / config.yaml
Hervé Bredin
feat: initial import 0faaae7
# Dotted identifier of the dataset protocol to train on.
# NOTE(review): presumably resolved by pyannote.database — confirm against the loader.
protocol: VoxCeleb.SpeakerVerification.VoxCeleb_X
# NOTE(review): presumably the early-stopping patience — confirm where this key is read.
patience: 5
# Training task. `_target_` names the class to build; the sibling keys are its
# arguments (assumes Hydra-style instantiation — confirm against the loader).
# Keys must be nested under `task:`; left at column 0 they become top-level
# keys, `task` itself is null, and `_target_` collides with the other sections.
task:
  _target_: pyannote.audio.tasks.SupervisedRepresentationLearningWithArcFace
  min_duration: 2
  duration: 5.0
  num_classes_per_batch: 64
  num_chunks_per_class: 4
  # NOTE(review): margin/scale look like the ArcFace loss hyper-parameters;
  # the unit of `margin` is not visible here — check the task's documentation.
  margin: 10.0
  scale: 50.0
  num_workers: 20
  pin_memory: false
# Model to train. `_target_` is nested under `model:` so that it names this
# section's class instead of being a duplicate top-level key
# (assumes Hydra-style instantiation — confirm against the loader).
model:
  _target_: pyannote.audio.models.embedding.XVectorSincNet
# Optimizer. `_target_` names the optimizer class; the remaining keys are its
# arguments (assumes Hydra-style instantiation — confirm against the loader).
# Everything is nested under `optimizer:` so the section is a mapping rather
# than null followed by stray top-level keys.
optimizer:
  _target_: torch.optim.Adam
  lr: 0.001
  # Two-element sequence, kept as a child of `betas`.
  betas:
    - 0.9
    - 0.999
  eps: 1.0e-08
  weight_decay: 0
  amsgrad: false
# Trainer. `_target_` names the trainer class; every other key is passed to it
# as an argument (assumes Hydra-style instantiation — confirm against the
# loader). All keys are nested under `trainer:` so they no longer leak to the
# top level and `_target_` does not collide with the other sections.
# NOTE(review): the key set looks like a dump of the Trainer's arguments for
# one specific pytorch_lightning release — verify against the installed version.
trainer:
  _target_: pytorch_lightning.Trainer
  accelerator: null
  accumulate_grad_batches: 1
  amp_backend: native
  amp_level: O2
  auto_lr_find: false
  auto_scale_batch_size: false
  auto_select_gpus: true
  benchmark: false
  check_val_every_n_epoch: 1
  checkpoint_callback: true
  deterministic: false
  fast_dev_run: false
  flush_logs_every_n_steps: 100
  gpus: 1
  gradient_clip_val: 0
  limit_test_batches: 1.0
  limit_train_batches: 1.0
  limit_val_batches: 1.0
  log_every_n_steps: 50
  log_gpu_memory: null
  max_epochs: 1000
  max_steps: null
  min_epochs: 1
  min_steps: null
  num_nodes: 1
  num_processes: 1
  num_sanity_val_steps: 2
  overfit_batches: 0.0
  precision: 32
  prepare_data_per_node: true
  process_position: 0
  profiler: null
  progress_bar_refresh_rate: 1
  reload_dataloaders_every_epoch: false
  replace_sampler_ddp: true
  sync_batchnorm: false
  terminate_on_nan: false
  tpu_cores: null
  track_grad_norm: -1
  truncated_bptt_steps: null
  val_check_interval: 1.0
  weights_save_path: null
  weights_summary: top
# Data augmentation pipeline: a `Compose` transform wrapping a list of two
# transforms, each described by a `transform` name and a `params` mapping.
# NOTE(review): the transform/params layout presumably matches the
# torch-audiomentations dict format — confirm against the loader.
# Nesting is required: without it `params`, `mode` and `p` are duplicate keys
# and the two transforms are no longer entries of `transforms`.
augmentation:
  transform: Compose
  params:
    shuffle: false
    transforms:
      - transform: AddBackgroundNoise
        params:
          # Machine-specific absolute path; adjust for the local environment.
          background_paths: /gpfswork/rech/eie/commun/data/background/musan
          min_snr_in_db: 5.0
          max_snr_in_db: 15.0
          mode: per_example
          p: 0.9
      - transform: ApplyImpulseResponse
        params:
          # Machine-specific absolute path; adjust for the local environment.
          ir_paths: /gpfswork/rech/eie/commun/data/rir
          mode: per_example
          p: 0.5