Hugo Flores Garcia committed on
Commit
d48dcc4
1 Parent(s): b9277bd

upgrade to new codec ckpt

Browse files
Files changed (4) hide show
  1. Dockerfile +1 -0
  2. conf/vampnet-c2f.yml +4 -5
  3. conf/vampnet.yml +7 -7
  4. requirements.txt +2 -0
Dockerfile CHANGED
@@ -13,6 +13,7 @@ RUN pip install --upgrade -r requirements.txt
13
  RUN pip install --upgrade tensorflow
14
  RUN pip install --upgrade librosa
15
  RUN pip install --upgrade numba
 
16
  ENV PYTHONPATH "$PYTHONPATH:/u/home/src"
17
  ENV NUMBA_CACHE_DIR=/tmp/
18
 
 
13
  RUN pip install --upgrade tensorflow
14
  RUN pip install --upgrade librosa
15
  RUN pip install --upgrade numba
16
+ RUN pip install protobuf==3.20
17
  ENV PYTHONPATH "$PYTHONPATH:/u/home/src"
18
  ENV NUMBA_CACHE_DIR=/tmp/
19
 
conf/vampnet-c2f.yml CHANGED
@@ -1,15 +1,14 @@
1
  $include:
2
  - conf/vampnet.yml
3
 
4
- VampNet.n_codebooks: 9
5
- VampNet.n_conditioning_codebooks: 3
6
 
7
  VampNet.embedding_dim: 1280
8
  VampNet.n_layers: 16
9
  VampNet.n_heads: 20
10
 
11
- train/AudioDataset.duration: 3
12
- val/AudioDataset.duration: 3
13
- test/AudioDataset.duration: 3
14
 
15
  AudioDataset.loudness_cutoff: -40.0
 
1
  $include:
2
  - conf/vampnet.yml
3
 
4
+ VampNet.n_codebooks: 14
5
+ VampNet.n_conditioning_codebooks: 4
6
 
7
  VampNet.embedding_dim: 1280
8
  VampNet.n_layers: 16
9
  VampNet.n_heads: 20
10
 
11
+ AudioDataset.duration: 3.0
12
+
 
13
 
14
  AudioDataset.loudness_cutoff: -40.0
conf/vampnet.yml CHANGED
@@ -1,5 +1,5 @@
1
 
2
- codec_ckpt: /u/home/src/runs/codec-ckpt/codec.pth
3
  save_path: ckpt
4
  max_epochs: 1000
5
  epoch_length: 1000
@@ -26,11 +26,12 @@ NoamScheduler.factor: 2.0
26
  NoamScheduler.warmup: 10000
27
 
28
  VampNet.vocab_size: 1024
29
- VampNet.n_codebooks: 3
30
  VampNet.n_conditioning_codebooks: 0
31
- VampNet.r_cond_dim: 64
 
32
  VampNet.embedding_dim: 1280
33
- VampNet.n_layers: 16
34
  VampNet.n_heads: 20
35
  VampNet.flash_attn: false
36
  VampNet.dropout: 0.05
@@ -40,17 +41,16 @@ AudioDataset.loudness_cutoff: -30.0
40
  AudioDataset.without_replacement: true
41
  AudioLoader.shuffle: true
42
 
43
- train/AudioDataset.duration: 5.0
 
44
  train/AudioDataset.n_examples: 10000000
45
  train/AudioLoader.sources:
46
  - /data/spotdl/audio/train
47
 
48
- val/AudioDataset.duration: 5.0
49
  val/AudioDataset.n_examples: 2000
50
  val/AudioLoader.sources:
51
  - /data/spotdl/audio/val
52
 
53
- test/AudioDataset.duration: 5.0
54
  test/AudioDataset.n_examples: 1000
55
  test/AudioLoader.sources:
56
  - /data/spotdl/audio/test
 
1
 
2
+ codec_ckpt: /u/home/src/runs/codec-ckpt/lac-768x.pth
3
  save_path: ckpt
4
  max_epochs: 1000
5
  epoch_length: 1000
 
26
  NoamScheduler.warmup: 10000
27
 
28
  VampNet.vocab_size: 1024
29
+ VampNet.n_codebooks: 4
30
  VampNet.n_conditioning_codebooks: 0
31
+ VampNet.r_cond_dim: 0
32
+ VampNet.noise_mode: mask
33
  VampNet.embedding_dim: 1280
34
+ VampNet.n_layers: 20
35
  VampNet.n_heads: 20
36
  VampNet.flash_attn: false
37
  VampNet.dropout: 0.05
 
41
  AudioDataset.without_replacement: true
42
  AudioLoader.shuffle: true
43
 
44
+ AudioDataset.duration: 10.0
45
+
46
  train/AudioDataset.n_examples: 10000000
47
  train/AudioLoader.sources:
48
  - /data/spotdl/audio/train
49
 
 
50
  val/AudioDataset.n_examples: 2000
51
  val/AudioLoader.sources:
52
  - /data/spotdl/audio/val
53
 
 
54
  test/AudioDataset.n_examples: 1000
55
  test/AudioLoader.sources:
56
  - /data/spotdl/audio/test
requirements.txt CHANGED
@@ -4,6 +4,8 @@ rich
4
  audiotools @ git+https://github.com/descriptinc/lyrebird-audiotools.git@hf/backup-info
5
  lac @ git+https://github.com/descriptinc/lyrebird-audio-codec.git@hf/vampnet-temp
6
  wavebeat @ git+https://github.com/hugofloresgarcia/wavebeat.git
 
 
7
  tqdm
8
  tensorboard
9
  google-cloud-logging==2.2.0
 
4
  audiotools @ git+https://github.com/descriptinc/lyrebird-audiotools.git@hf/backup-info
5
  lac @ git+https://github.com/descriptinc/lyrebird-audio-codec.git@hf/vampnet-temp
6
  wavebeat @ git+https://github.com/hugofloresgarcia/wavebeat.git
7
+ torch==1.13.1
8
+ torchaudio==0.13.1
9
  tqdm
10
  tensorboard
11
  google-cloud-logging==2.2.0