anthonyrusso's picture
upload dependencies
b57c851
raw
history blame
725 Bytes
# @package __global__
# Setup for execute-only runs on AudioCaps, for audio generation
# evaluation with objective metrics.
# execute_only=evaluate
# Dataset overrides. The `evaluate` and `generate` sub-sections each carry
# their own audio-duration and sample-count limits.
dataset:
  max_audio_duration: null
  # ensure the proper values are broadcast here for evaluate
  evaluate:
    min_audio_duration: 1.0  # some metrics require a minimum audio length
    max_audio_duration: null  # all samples from audiocaps should be ~10s
    num_samples: null
    segment_duration: null
  generate:
    min_audio_duration: 1.0
    max_audio_duration: null
    num_samples: 500
# Metric switches for the evaluate stage: each flag below enables one metric.
evaluate:
  metrics:
    fad: true
    kld: true
    text_consistency: true
# Per-metric settings; only the KLD metric's `passt` sub-section is
# overridden here.
metrics:
  kld:
    passt:
      pretrained_length: 10  # similarly to reported results in AudioGen paper