PommesPeter committed on
Commit
0e8bfde
1 Parent(s): 28a4b5f

added audio model

Browse files
CLAP/CLAP_weights_2022.pth ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:5b917c47fec10547b65cf1d9096e194896fa1c2d6180536c8524289721a4c5b8
3
+ size 2333972488
CLAP/config.yml ADDED
@@ -0,0 +1,26 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ # TEXT ENCODER CONFIG
2
+ text_model: 'bert-base-uncased'
3
+ text_len: 100
4
+ transformer_embed_dim: 768
5
+ freeze_text_encoder_weights: True
6
+
7
+ # AUDIO ENCODER CONFIG
8
+ audioenc_name: 'Cnn14'
9
+ out_emb: 2048
10
+ sampling_rate: 44100
11
+ duration: 5
12
+ fmin: 50
13
+ fmax: 14000
14
+ n_fft: 1028
15
+ hop_size: 320
16
+ mel_bins: 64
17
+ window_size: 1024
18
+
19
+ # PROJECTION SPACE CONFIG
20
+ d_proj: 1024
21
+ temperature: 0.003
22
+
23
+ # TRAINING AND EVALUATION CONFIG
24
+ num_classes: 527
25
+ batch_size: 1024
26
+ demo: False
audio_generation/484.ckpt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:0f359e9ea8bcc511637585a475a31972bedc77751e5656fb6a6597995dcb6b8a
3
+ size 7768056443
bigvnat/args.yml ADDED
@@ -0,0 +1,63 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ resblock: '1'
2
+ num_gpus: 0
3
+ batch_size: 64
4
+ num_mels: 80
5
+ learning_rate: 0.0001
6
+ adam_b1: 0.8
7
+ adam_b2: 0.99
8
+ lr_decay: 0.999
9
+ seed: 1234
10
+ upsample_rates:
11
+ - 4
12
+ - 4
13
+ - 2
14
+ - 2
15
+ - 2
16
+ - 2
17
+ upsample_kernel_sizes:
18
+ - 8
19
+ - 8
20
+ - 4
21
+ - 4
22
+ - 4
23
+ - 4
24
+ upsample_initial_channel: 1536
25
+ resblock_kernel_sizes:
26
+ - 3
27
+ - 7
28
+ - 11
29
+ resblock_dilation_sizes:
30
+ - - 1
31
+ - 3
32
+ - 5
33
+ - - 1
34
+ - 3
35
+ - 5
36
+ - - 1
37
+ - 3
38
+ - 5
39
+ activation: snakebeta
40
+ snake_logscale: true
41
+ resolutions:
42
+ - - 1024
43
+ - 120
44
+ - 600
45
+ - - 2048
46
+ - 240
47
+ - 1200
48
+ - - 512
49
+ - 50
50
+ - 240
51
+ mpd_reshapes:
52
+ - 2
53
+ - 3
54
+ - 5
55
+ - 7
56
+ - 11
57
+ use_spectral_norm: false
58
+ discriminator_channel_mult: 1
59
+ num_workers: 4
60
+ dist_config:
61
+ dist_backend: nccl
62
+ dist_url: tcp://localhost:54341
63
+ world_size: 1
bigvnat/best_netG.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:970ca75ee4d5ce583e9396a4534acb14971ea2b4f1c22e038f476680c868a789
3
+ size 449217313
maa2/maa2.ckpt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:7621db6654b1a96398cf20edd6bc783ba8b7d4bc074e2ac42d609f0426480f19
3
+ size 7308070914