Christian J. Steinmetz committed on
Commit
fb0aa71
·
1 Parent(s): e4fc05d

adding dataset download script

Browse files
Files changed (1) hide show
  1. scripts/download.py +58 -0
scripts/download.py ADDED
@@ -0,0 +1,58 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ import os
2
+ import sys
3
+ import glob
4
+ import torch
5
+ import argparse
6
+
7
+
8
def download_zip_dataset(dataset_url: str, output_dir: str):
    """Download a zip archive with ``wget``, extract it, and delete the archive.

    The archive is saved into ``output_dir`` and unpacked with ``unzip`` into
    a sub-directory of ``output_dir`` named after the archive without its
    trailing ``.zip``.

    Args:
        dataset_url: URL of the zip archive. Its final path component is used
            as the local file name.
        output_dir: Directory to download into. A leading ``~`` is expanded
            to the user's home directory.

    Raises:
        subprocess.CalledProcessError: If ``wget`` or ``unzip`` exits with a
            non-zero status.
        FileNotFoundError: If ``wget`` or ``unzip`` is not installed.
    """
    # Local import: keeps this function self-contained without touching the
    # module-level import list.
    import subprocess

    # The commands below run without a shell, so "~" must be expanded here.
    output_dir = os.path.expanduser(output_dir)
    os.makedirs(output_dir, exist_ok=True)

    zip_filename = os.path.basename(dataset_url)
    # Strip only a trailing ".zip"; a ".zip" elsewhere in the name is kept.
    if zip_filename.endswith(".zip"):
        zip_name = zip_filename[: -len(".zip")]
    else:
        zip_name = zip_filename

    zip_path = os.path.join(output_dir, zip_filename)
    extract_dir = os.path.join(output_dir, zip_name)

    # Argument lists (no shell) keep URLs and paths with spaces or shell
    # metacharacters intact; check=True stops at the first failing step so a
    # failed download is never followed by unzip/delete.
    subprocess.run(["wget", "-P", output_dir, dataset_url], check=True)
    subprocess.run(["unzip", zip_path, "-d", extract_dir], check=True)
    os.remove(zip_path)
16
+
17
+
18
def process_dataset(dataset_dir: str, output_dir: str):
    """Dispatch dataset-specific processing based on the dataset directory name.

    Every recognised dataset currently has an empty placeholder branch, so
    the function only validates ``dataset_dir``.

    Args:
        dataset_dir: Name of the extracted dataset directory. Recognised
            values are "VocalSet1-2", "audio_mono-mic", "IDMT-SMT-GUITAR_V2",
            "IDMT-SMT-BASS" and "IDMT-SMT-DRUMS-V2".
        output_dir: Currently unused by every branch.

    Raises:
        NotImplementedError: If ``dataset_dir`` is not a recognised name.
    """
    if dataset_dir == "VocalSet1-2":
        pass  # placeholder: no processing yet
    elif dataset_dir == "audio_mono-mic":
        pass  # placeholder: no processing yet
    elif dataset_dir == "IDMT-SMT-GUITAR_V2":
        pass  # placeholder: no processing yet
    elif dataset_dir == "IDMT-SMT-BASS":
        pass  # placeholder: no processing yet
    elif dataset_dir == "IDMT-SMT-DRUMS-V2":
        pass  # placeholder: no processing yet
    else:
        # NotImplementedError is the exception class; the NotImplemented
        # constant is not callable and would raise TypeError instead.
        raise NotImplementedError(f"Invalid dataset_dir = {dataset_dir}.")
31
+
32
+
33
if __name__ == "__main__":
    # Maps each command-line dataset name to the URL of its zip archive.
    # The keys double as the argparse choices, so every name the CLI accepts
    # is guaranteed to have a URL (previously the IDMT entries were keyed by
    # archive name and could never match a CLI choice).
    dataset_urls = {
        "vocalset": "https://zenodo.org/record/1442513/files/VocalSet1-2.zip",
        "guitarset": "https://zenodo.org/record/3371780/files/audio_mono-mic.zip",
        "idmt-smt-guitar": "https://zenodo.org/record/7544110/files/IDMT-SMT-GUITAR_V2.zip",
        "idmt-smt-bass": "https://zenodo.org/record/7188892/files/IDMT-SMT-BASS.zip",
        "idmt-smt-drums": "https://zenodo.org/record/7544164/files/IDMT-SMT-DRUMS-V2.zip",
    }

    parser = argparse.ArgumentParser()
    parser.add_argument(
        "dataset_names",
        choices=list(dataset_urls),
        nargs="+",
    )
    args = parser.parse_args()

    # Iterate the table rather than the arguments so each requested dataset
    # is downloaded once, in table order, even if it was named twice.
    for dataset_name, dataset_url in dataset_urls.items():
        if dataset_name in args.dataset_names:
            download_zip_dataset(dataset_url, "~/data/remfx-data")