File size: 543 Bytes
92740f3
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
# Audio-encoder settings (presumably for the Microsoft CLAP model named in
# `method`; confirm against the code that consumes this file).
clap_config:
  method: 'microsoft-clap'
  # NOTE(review): presumably the width of one audio embedding vector; must
  # agree with whatever the selected checkpoint produces.
  audio_embed_dim: 1024
  # Both paths are relative; they are presumably resolved against the
  # process working directory. Verify before launching from another folder.
  config_root: './ms_clap/src/configs'
  model_name: 'clapcap'
  checkpoint: './clapcap_weights_2023.pth'
  # Sliding-window parameters. The overlap is 75% of the window length
  # (5.25 / 7.0). Units are presumably seconds; confirm with the consumer.
  window_length: 7.0
  window_overlap: 5.25
  # Same value as model_config.audio_transformer_kwargs.max_window_per_audio
  # in this file; presumably the two need to stay in sync.
  max_num_window: 16
  max_num_fewshot: 4

# Language-model and audio-transformer settings.
model_config:
  # Explicit YAML null. A bare `None` is NOT null in YAML: loaders resolve it
  # to the string "None", which a consumer would typically treat as a relative
  # directory name rather than "no cache directory configured".
  # NOTE(review): confirm the consumer accepts a null/None value here.
  cache_dir: null
  # Encoder and tokenizer use the same identifier (presumably a Hugging Face
  # Hub model id; verify). Keep the two in sync when changing either.
  lang_encoder_path: facebook/opt-iml-max-1.3b
  tokenizer_path: facebook/opt-iml-max-1.3b
  cross_attn_every_n_layers: 1
  # Block-style mapping; parses to the same key/value pairs as the former
  # flow-style `{ ... }` form.
  audio_transformer_kwargs:
    n_head: 8
    n_layers: 3
    d_inner: 2048
    max_num_media: 128
    # Same value as clap_config.max_num_window in this file; presumably the
    # two need to stay in sync.
    max_window_per_audio: 16