# trttung1610's picture
# Upload 233 files
# 19b5932
# raw
# history blame
# 618 Bytes
# @package __global__
# Execute-only setup for evaluating audio generation on AudioCaps
# with objective metrics.
# execute_only=evaluate
# Dataset limits; the `evaluate` and `generate` sub-sections each carry
# their own duration and sample-count overrides.
dataset:
  max_audio_duration: null
  # ensure the proper values are broadcast here for evaluate
  evaluate:
    min_audio_duration: 1.0  # some metrics require a minimum audio length
    max_audio_duration: null  # all samples from audiocaps should be ~10s
    num_samples: null
    segment_duration: null
  generate:
    min_audio_duration: 1.0
    max_audio_duration: null
    num_samples: 500
# Metrics switched on for the evaluate stage; each flag below is nested
# under `evaluate.metrics`.
evaluate:
  metrics:
    fad: true
    kld: true
    text_consistency: true