File size: 822 Bytes
0d80816
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
# Copyright (c) 2023 Amphion.
#
# This source code is licensed under the MIT license found in the
# LICENSE file in the root directory of this source tree.

from frechet_audio_distance import FrechetAudioDistance


def extract_fad(
    audio_dir1,
    audio_dir2,
    mode="vggish",
    use_pca=False,
    use_activation=False,
    verbose=False,
):
    """Compute the Frechet Audio Distance (FAD) between two audio folders.

    Args:
        audio_dir1: path to the ground truth audio folder.
        audio_dir2: path to the predicted audio folder.
        mode: name of the embedding model, forwarded to
            ``FrechetAudioDistance`` as ``model_name``
            ("vggish", "pann" or "clap").
        use_pca: forwarded unchanged to ``FrechetAudioDistance``.
        use_activation: forwarded unchanged to ``FrechetAudioDistance``.
        verbose: forwarded unchanged to ``FrechetAudioDistance``.

    Returns:
        The value returned by ``FrechetAudioDistance.score`` for the two
        folders.
    """
    # Gather the scorer configuration in one place; the caller-facing
    # ``mode`` argument maps onto the library's ``model_name`` keyword.
    scorer_options = {
        "model_name": mode,
        "use_pca": use_pca,
        "use_activation": use_activation,
        "verbose": verbose,
    }
    scorer = FrechetAudioDistance(**scorer_options)

    # Ground-truth folder first, predicted folder second.
    return scorer.score(audio_dir1, audio_dir2)