Chong Zhang committed on
Commit
ab60f0d
·
verified ·
1 Parent(s): eddcbf6
music_tokenizer/config.json CHANGED
@@ -1,7 +1,7 @@
1
  {
2
  "resblock": "1",
3
  "num_gpus": 8,
4
- "batch_size": 128,
5
  "learning_rate": 0.00002,
6
  "adam_b1": 0.5,
7
  "adam_b2": 0.9,
@@ -11,17 +11,17 @@
11
  "upsample_rates": [8,5,4,2],
12
  "upsample_kernel_sizes": [16,11,8,4],
13
  "upsample_initial_channel": 512,
14
- "resblock_kernel_sizes": [3,7,11],
15
- "resblock_dilation_sizes": [[1,3,5], [1,3,5], [1,3,5]],
16
 
17
- "segment_size": 24000,
18
- "num_mels": 128,
19
  "num_freq": 1024,
20
  "n_fft": 1024,
21
  "hop_size": 240,
22
  "win_size": 1024,
23
 
24
- "sampling_rate": 24000,
25
 
26
  "n_code_groups": 2,
27
  "n_codes": 1024,
@@ -29,10 +29,10 @@
29
  "commitment_loss_lambda": 0.25,
30
 
31
  "fmin": 0,
32
- "fmax": 12000,
33
  "fmax_for_loss": null,
34
 
35
- "num_workers": 32,
36
 
37
  "dist_config": {
38
  "dist_backend": "nccl",
@@ -40,4 +40,3 @@
40
  "world_size": 1
41
  }
42
  }
43
-
 
1
  {
2
  "resblock": "1",
3
  "num_gpus": 8,
4
+ "batch_size": 140,
5
  "learning_rate": 0.00002,
6
  "adam_b1": 0.5,
7
  "adam_b2": 0.9,
 
11
  "upsample_rates": [8,5,4,2],
12
  "upsample_kernel_sizes": [16,11,8,4],
13
  "upsample_initial_channel": 512,
14
+ "resblock_kernel_sizes": [3,5,7,9,11,13],
15
+ "resblock_dilation_sizes": [[1,3,5], [1,3,5], [1,3,5], [1,3,5], [1,3,5], [1,3,5]],
16
 
17
+ "segment_size": 48000,
18
+ "num_mels": 80,
19
  "num_freq": 1024,
20
  "n_fft": 1024,
21
  "hop_size": 240,
22
  "win_size": 1024,
23
 
24
+ "sampling_rate": 48000,
25
 
26
  "n_code_groups": 2,
27
  "n_codes": 1024,
 
29
  "commitment_loss_lambda": 0.25,
30
 
31
  "fmin": 0,
32
+ "fmax": 48000,
33
  "fmax_for_loss": null,
34
 
35
+ "num_workers": 24,
36
 
37
  "dist_config": {
38
  "dist_backend": "nccl",
 
40
  "world_size": 1
41
  }
42
  }
 
music_tokenizer/model.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:08d26564f725b5b4a38d0c9ea3d8d5e7df42173f15eeb4453930c2bfb93ef783
3
- size 254691363
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:ba71efdc50378baf9776d607eb11566907c3810e6f221c316719c02591135626
3
+ size 537087507