Spaces:
Runtime error
Runtime error
Hugo Flores Garcia
committed on
Commit
·
d48dcc4
1
Parent(s):
b9277bd
upgrade to new codec ckpt
Browse files
- Dockerfile +1 -0
- conf/vampnet-c2f.yml +4 -5
- conf/vampnet.yml +7 -7
- requirements.txt +2 -0
Dockerfile
CHANGED
|
@@ -13,6 +13,7 @@ RUN pip install --upgrade -r requirements.txt
|
|
| 13 |
RUN pip install --upgrade tensorflow
|
| 14 |
RUN pip install --upgrade librosa
|
| 15 |
RUN pip install --upgrade numba
|
|
|
|
| 16 |
ENV PYTHONPATH "$PYTHONPATH:/u/home/src"
|
| 17 |
ENV NUMBA_CACHE_DIR=/tmp/
|
| 18 |
|
|
|
|
| 13 |
RUN pip install --upgrade tensorflow
|
| 14 |
RUN pip install --upgrade librosa
|
| 15 |
RUN pip install --upgrade numba
|
| 16 |
+
RUN pip install protobuf==3.20
|
| 17 |
ENV PYTHONPATH "$PYTHONPATH:/u/home/src"
|
| 18 |
ENV NUMBA_CACHE_DIR=/tmp/
|
| 19 |
|
conf/vampnet-c2f.yml
CHANGED
|
@@ -1,15 +1,14 @@
|
|
| 1 |
$include:
|
| 2 |
- conf/vampnet.yml
|
| 3 |
|
| 4 |
-
VampNet.n_codebooks:
|
| 5 |
-
VampNet.n_conditioning_codebooks:
|
| 6 |
|
| 7 |
VampNet.embedding_dim: 1280
|
| 8 |
VampNet.n_layers: 16
|
| 9 |
VampNet.n_heads: 20
|
| 10 |
|
| 11 |
-
|
| 12 |
-
|
| 13 |
-
test/AudioDataset.duration: 3
|
| 14 |
|
| 15 |
AudioDataset.loudness_cutoff: -40.0
|
|
|
|
| 1 |
$include:
|
| 2 |
- conf/vampnet.yml
|
| 3 |
|
| 4 |
+
VampNet.n_codebooks: 14
|
| 5 |
+
VampNet.n_conditioning_codebooks: 4
|
| 6 |
|
| 7 |
VampNet.embedding_dim: 1280
|
| 8 |
VampNet.n_layers: 16
|
| 9 |
VampNet.n_heads: 20
|
| 10 |
|
| 11 |
+
AudioDataset.duration: 3.0
|
| 12 |
+
|
|
|
|
| 13 |
|
| 14 |
AudioDataset.loudness_cutoff: -40.0
|
conf/vampnet.yml
CHANGED
|
@@ -1,5 +1,5 @@
|
|
| 1 |
|
| 2 |
-
codec_ckpt: /u/home/src/runs/codec-ckpt/
|
| 3 |
save_path: ckpt
|
| 4 |
max_epochs: 1000
|
| 5 |
epoch_length: 1000
|
|
@@ -26,11 +26,12 @@ NoamScheduler.factor: 2.0
|
|
| 26 |
NoamScheduler.warmup: 10000
|
| 27 |
|
| 28 |
VampNet.vocab_size: 1024
|
| 29 |
-
VampNet.n_codebooks:
|
| 30 |
VampNet.n_conditioning_codebooks: 0
|
| 31 |
-
VampNet.r_cond_dim:
|
|
|
|
| 32 |
VampNet.embedding_dim: 1280
|
| 33 |
-
VampNet.n_layers:
|
| 34 |
VampNet.n_heads: 20
|
| 35 |
VampNet.flash_attn: false
|
| 36 |
VampNet.dropout: 0.05
|
|
@@ -40,17 +41,16 @@ AudioDataset.loudness_cutoff: -30.0
|
|
| 40 |
AudioDataset.without_replacement: true
|
| 41 |
AudioLoader.shuffle: true
|
| 42 |
|
| 43 |
-
|
|
|
|
| 44 |
train/AudioDataset.n_examples: 10000000
|
| 45 |
train/AudioLoader.sources:
|
| 46 |
- /data/spotdl/audio/train
|
| 47 |
|
| 48 |
-
val/AudioDataset.duration: 5.0
|
| 49 |
val/AudioDataset.n_examples: 2000
|
| 50 |
val/AudioLoader.sources:
|
| 51 |
- /data/spotdl/audio/val
|
| 52 |
|
| 53 |
-
test/AudioDataset.duration: 5.0
|
| 54 |
test/AudioDataset.n_examples: 1000
|
| 55 |
test/AudioLoader.sources:
|
| 56 |
- /data/spotdl/audio/test
|
|
|
|
| 1 |
|
| 2 |
+
codec_ckpt: /u/home/src/runs/codec-ckpt/lac-768x.pth
|
| 3 |
save_path: ckpt
|
| 4 |
max_epochs: 1000
|
| 5 |
epoch_length: 1000
|
|
|
|
| 26 |
NoamScheduler.warmup: 10000
|
| 27 |
|
| 28 |
VampNet.vocab_size: 1024
|
| 29 |
+
VampNet.n_codebooks: 4
|
| 30 |
VampNet.n_conditioning_codebooks: 0
|
| 31 |
+
VampNet.r_cond_dim: 0
|
| 32 |
+
VampNet.noise_mode: mask
|
| 33 |
VampNet.embedding_dim: 1280
|
| 34 |
+
VampNet.n_layers: 20
|
| 35 |
VampNet.n_heads: 20
|
| 36 |
VampNet.flash_attn: false
|
| 37 |
VampNet.dropout: 0.05
|
|
|
|
| 41 |
AudioDataset.without_replacement: true
|
| 42 |
AudioLoader.shuffle: true
|
| 43 |
|
| 44 |
+
AudioDataset.duration: 10.0
|
| 45 |
+
|
| 46 |
train/AudioDataset.n_examples: 10000000
|
| 47 |
train/AudioLoader.sources:
|
| 48 |
- /data/spotdl/audio/train
|
| 49 |
|
|
|
|
| 50 |
val/AudioDataset.n_examples: 2000
|
| 51 |
val/AudioLoader.sources:
|
| 52 |
- /data/spotdl/audio/val
|
| 53 |
|
|
|
|
| 54 |
test/AudioDataset.n_examples: 1000
|
| 55 |
test/AudioLoader.sources:
|
| 56 |
- /data/spotdl/audio/test
|
requirements.txt
CHANGED
|
@@ -4,6 +4,8 @@ rich
|
|
| 4 |
audiotools @ git+https://github.com/descriptinc/lyrebird-audiotools.git@hf/backup-info
|
| 5 |
lac @ git+https://github.com/descriptinc/lyrebird-audio-codec.git@hf/vampnet-temp
|
| 6 |
wavebeat @ git+https://github.com/hugofloresgarcia/wavebeat.git
|
|
|
|
|
|
|
| 7 |
tqdm
|
| 8 |
tensorboard
|
| 9 |
google-cloud-logging==2.2.0
|
|
|
|
| 4 |
audiotools @ git+https://github.com/descriptinc/lyrebird-audiotools.git@hf/backup-info
|
| 5 |
lac @ git+https://github.com/descriptinc/lyrebird-audio-codec.git@hf/vampnet-temp
|
| 6 |
wavebeat @ git+https://github.com/hugofloresgarcia/wavebeat.git
|
| 7 |
+
torch==1.13.1
|
| 8 |
+
torchaudio==0.13.1
|
| 9 |
tqdm
|
| 10 |
tensorboard
|
| 11 |
google-cloud-logging==2.2.0
|