# Save loudness normalized (-14 LUFS) musdb-XL audio files for evaluations of de-limiter import os import argparse import tqdm import musdb import soundfile as sf import librosa import pyloudnorm as pyln from utils import db2linear, str2bool tqdm.monitor_interval = 0 def main(): parser = argparse.ArgumentParser(description="model test.py") parser.add_argument( "--target", type=str, default="mixture", help="target source. all, vocals, drums, bass, other", ) parser.add_argument("--data_root", type=str, default="/path/to/musdb_XL") parser.add_argument( "--data_root_hq", type=str, default="/path/to/musdb18hq", help="this is used when saving loud-norm stem of musdb-XL") parser.add_argument( "--output_directory", type=str, default="/path/to/musdb_XL_loudnorm", ) parser.add_argument( "--loudnorm_input_lufs", type=float, default=-14.0, help="If you want to use loudnorm, input target lufs", ) parser.add_argument( "--save_16k_mono", type=str2bool, default=True, help="Save 16k mono wav files for FAD evaluation.", ) args, _ = parser.parse_known_args() os.makedirs(args.output_directory, exist_ok=True) meter = pyln.Meter(44100) test_tracks = musdb.DB(root=args.data_root, subsets="test", is_wav=True) if args.target != "mixture": hq_tracks = musdb.DB(root=args.data_root_hq, subsets='test', is_wav=True) for idx, track in tqdm.tqdm(enumerate(test_tracks)): track_name = track.name if ( os.path.basename(args.data_root) == "musdb18hq" and track_name == "PR - Oh No" ): # We have to consider this exception because 'PR - Oh No' mixture.wav is left-panned. We will use the linear mixture instead. # Please refer https://github.com/jeonchangbin49/musdb-XL/blob/main/make_L_and_XL.py track_audio = ( track.targets["vocals"].audio + track.targets["drums"].audio + track.targets["bass"].audio + track.targets["other"].audio ) else: track_audio = track.audio print(track_name) augmented_gain = None track_lufs = meter.integrated_loudness(track_audio) augmented_gain = args.loudnorm_input_lufs - track_lufs if os.path.basename(args.data_root) == "musdb18hq": if args.target != "mixture": track_audio = track.targets[args.target].audio track_audio = track_audio * db2linear(augmented_gain, eps=0.0) elif os.path.basename(args.data_root) == "musdb_XL": track_audio = track_audio * db2linear(augmented_gain, eps=0.0) if args.target != "mixture": hq_track = hq_tracks[idx] hq_audio = hq_track.audio hq_stem = hq_track.targets[args.target].audio samplewise_gain = track_audio / (hq_audio + 1e-8) track_audio = samplewise_gain * hq_stem os.makedirs(f"{args.output_directory}/{track_name}", exist_ok=True) sf.write( f"{args.output_directory}/{track_name}/{args.target}.wav", track_audio, 44100 ) if args.save_16k_mono: track_audio_16k_mono = librosa.to_mono(track_audio.T) track_audio_16k_mono = librosa.resample( track_audio_16k_mono, orig_sr=44100, target_sr=16000, ) os.makedirs(f"{args.output_directory}_16k_mono/{track_name}", exist_ok=True) sf.write( f"{args.output_directory}_16k_mono/{track_name}/{args.target}.wav", track_audio_16k_mono, samplerate=16000, ) if __name__ == "__main__": main()