Spaces:
Sleeping
Sleeping
Hugo Flores Garcia
committed on
Commit
•
d48dcc4
1
Parent(s):
b9277bd
upgrade to new codec ckpt
Browse files
- Dockerfile +1 -0
- conf/vampnet-c2f.yml +4 -5
- conf/vampnet.yml +7 -7
- requirements.txt +2 -0
Dockerfile
CHANGED
@@ -13,6 +13,7 @@ RUN pip install --upgrade -r requirements.txt
|
|
13 |
RUN pip install --upgrade tensorflow
|
14 |
RUN pip install --upgrade librosa
|
15 |
RUN pip install --upgrade numba
|
|
|
16 |
ENV PYTHONPATH "$PYTHONPATH:/u/home/src"
|
17 |
ENV NUMBA_CACHE_DIR=/tmp/
|
18 |
|
|
|
13 |
RUN pip install --upgrade tensorflow
|
14 |
RUN pip install --upgrade librosa
|
15 |
RUN pip install --upgrade numba
|
16 |
+
RUN pip install protobuf==3.20
|
17 |
ENV PYTHONPATH "$PYTHONPATH:/u/home/src"
|
18 |
ENV NUMBA_CACHE_DIR=/tmp/
|
19 |
|
conf/vampnet-c2f.yml
CHANGED
@@ -1,15 +1,14 @@
|
|
1 |
$include:
|
2 |
- conf/vampnet.yml
|
3 |
|
4 |
-
VampNet.n_codebooks:
|
5 |
-
VampNet.n_conditioning_codebooks:
|
6 |
|
7 |
VampNet.embedding_dim: 1280
|
8 |
VampNet.n_layers: 16
|
9 |
VampNet.n_heads: 20
|
10 |
|
11 |
-
|
12 |
-
|
13 |
-
test/AudioDataset.duration: 3
|
14 |
|
15 |
AudioDataset.loudness_cutoff: -40.0
|
|
|
1 |
$include:
|
2 |
- conf/vampnet.yml
|
3 |
|
4 |
+
VampNet.n_codebooks: 14
|
5 |
+
VampNet.n_conditioning_codebooks: 4
|
6 |
|
7 |
VampNet.embedding_dim: 1280
|
8 |
VampNet.n_layers: 16
|
9 |
VampNet.n_heads: 20
|
10 |
|
11 |
+
AudioDataset.duration: 3.0
|
12 |
+
|
|
|
13 |
|
14 |
AudioDataset.loudness_cutoff: -40.0
|
conf/vampnet.yml
CHANGED
@@ -1,5 +1,5 @@
|
|
1 |
|
2 |
-
codec_ckpt: /u/home/src/runs/codec-ckpt/
|
3 |
save_path: ckpt
|
4 |
max_epochs: 1000
|
5 |
epoch_length: 1000
|
@@ -26,11 +26,12 @@ NoamScheduler.factor: 2.0
|
|
26 |
NoamScheduler.warmup: 10000
|
27 |
|
28 |
VampNet.vocab_size: 1024
|
29 |
-
VampNet.n_codebooks:
|
30 |
VampNet.n_conditioning_codebooks: 0
|
31 |
-
VampNet.r_cond_dim:
|
|
|
32 |
VampNet.embedding_dim: 1280
|
33 |
-
VampNet.n_layers:
|
34 |
VampNet.n_heads: 20
|
35 |
VampNet.flash_attn: false
|
36 |
VampNet.dropout: 0.05
|
@@ -40,17 +41,16 @@ AudioDataset.loudness_cutoff: -30.0
|
|
40 |
AudioDataset.without_replacement: true
|
41 |
AudioLoader.shuffle: true
|
42 |
|
43 |
-
|
|
|
44 |
train/AudioDataset.n_examples: 10000000
|
45 |
train/AudioLoader.sources:
|
46 |
- /data/spotdl/audio/train
|
47 |
|
48 |
-
val/AudioDataset.duration: 5.0
|
49 |
val/AudioDataset.n_examples: 2000
|
50 |
val/AudioLoader.sources:
|
51 |
- /data/spotdl/audio/val
|
52 |
|
53 |
-
test/AudioDataset.duration: 5.0
|
54 |
test/AudioDataset.n_examples: 1000
|
55 |
test/AudioLoader.sources:
|
56 |
- /data/spotdl/audio/test
|
|
|
1 |
|
2 |
+
codec_ckpt: /u/home/src/runs/codec-ckpt/lac-768x.pth
|
3 |
save_path: ckpt
|
4 |
max_epochs: 1000
|
5 |
epoch_length: 1000
|
|
|
26 |
NoamScheduler.warmup: 10000
|
27 |
|
28 |
VampNet.vocab_size: 1024
|
29 |
+
VampNet.n_codebooks: 4
|
30 |
VampNet.n_conditioning_codebooks: 0
|
31 |
+
VampNet.r_cond_dim: 0
|
32 |
+
VampNet.noise_mode: mask
|
33 |
VampNet.embedding_dim: 1280
|
34 |
+
VampNet.n_layers: 20
|
35 |
VampNet.n_heads: 20
|
36 |
VampNet.flash_attn: false
|
37 |
VampNet.dropout: 0.05
|
|
|
41 |
AudioDataset.without_replacement: true
|
42 |
AudioLoader.shuffle: true
|
43 |
|
44 |
+
AudioDataset.duration: 10.0
|
45 |
+
|
46 |
train/AudioDataset.n_examples: 10000000
|
47 |
train/AudioLoader.sources:
|
48 |
- /data/spotdl/audio/train
|
49 |
|
|
|
50 |
val/AudioDataset.n_examples: 2000
|
51 |
val/AudioLoader.sources:
|
52 |
- /data/spotdl/audio/val
|
53 |
|
|
|
54 |
test/AudioDataset.n_examples: 1000
|
55 |
test/AudioLoader.sources:
|
56 |
- /data/spotdl/audio/test
|
requirements.txt
CHANGED
@@ -4,6 +4,8 @@ rich
|
|
4 |
audiotools @ git+https://github.com/descriptinc/lyrebird-audiotools.git@hf/backup-info
|
5 |
lac @ git+https://github.com/descriptinc/lyrebird-audio-codec.git@hf/vampnet-temp
|
6 |
wavebeat @ git+https://github.com/hugofloresgarcia/wavebeat.git
|
|
|
|
|
7 |
tqdm
|
8 |
tensorboard
|
9 |
google-cloud-logging==2.2.0
|
|
|
4 |
audiotools @ git+https://github.com/descriptinc/lyrebird-audiotools.git@hf/backup-info
|
5 |
lac @ git+https://github.com/descriptinc/lyrebird-audio-codec.git@hf/vampnet-temp
|
6 |
wavebeat @ git+https://github.com/hugofloresgarcia/wavebeat.git
|
7 |
+
torch==1.13.1
|
8 |
+
torchaudio==0.13.1
|
9 |
tqdm
|
10 |
tensorboard
|
11 |
google-cloud-logging==2.2.0
|