Christian J. Steinmetz committed
Commit: 1b6bb59 · Parent(s): c756b1d

adding mixup augmentation and fixing ordering of labels
cfg/model/cls_panns_16k_mixup.yaml
ADDED
@@ -0,0 +1,16 @@
+# @package _global_
+model:
+  _target_: remfx.models.FXClassifier
+  lr: 3e-4
+  lr_weight_decay: 1e-3
+  sample_rate: ${sample_rate}
+  mixup: True
+  network:
+    _target_: remfx.classifier.Cnn14
+    num_classes: ${num_classes}
+    n_fft: 2048
+    hop_length: 512
+    n_mels: 128
+    sample_rate: 44100
+    model_sample_rate: 16000
+
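For context, these cfg/model files are Hydra configs: _target_ names the class to instantiate and the sibling keys become constructor arguments, with ${...} values interpolated from the top-level config. A minimal sketch of how such a file is turned into objects, assuming the remfx package is importable (the repo's actual training entry point may wire this up differently):

# Hypothetical sketch, not the repo's entry point: shows Hydra's recursive
# instantiation of the nested _target_ fields in cls_panns_16k_mixup.yaml.
from hydra.utils import instantiate
from omegaconf import OmegaConf

cfg = OmegaConf.create(
    """
    sample_rate: 16000
    num_classes: 5
    model:
      _target_: remfx.models.FXClassifier
      lr: 3e-4
      lr_weight_decay: 1e-3
      sample_rate: ${sample_rate}
      mixup: True
      network:
        _target_: remfx.classifier.Cnn14
        num_classes: ${num_classes}
        n_fft: 2048
        hop_length: 512
        n_mels: 128
        sample_rate: 44100
        model_sample_rate: 16000
    """
)
# Builds the inner Cnn14 first, then passes it as `network` to FXClassifier.
model = instantiate(cfg.model)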
cfg/model/cls_panns_44k.yaml
CHANGED
@@ -4,12 +4,14 @@ model:
   lr: 3e-4
   lr_weight_decay: 1e-3
   sample_rate: ${sample_rate}
+  mixup: False
   network:
     _target_: remfx.classifier.Cnn14
     num_classes: ${num_classes}
-    n_fft:
-    hop_length:
+    n_fft: 2048
+    hop_length: 512
     n_mels: 128
     sample_rate: 44100
     model_sample_rate: 44100
-    specaugment:
+    specaugment: False
+
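Because mixup is now an ordinary config field (and these files use # @package _global_, placing model: at the config root), it can be flipped per run with a standard Hydra command-line override instead of editing the YAML. A hypothetical invocation; the entry-point script name is assumed, not taken from the repo:

python train.py model=cls_panns_44k model.mixup=True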
cfg/model/{cls_panns_44k_noaug.yaml → cls_panns_44k_mixup.yaml}
RENAMED
@@ -4,12 +4,14 @@ model:
   lr: 3e-4
   lr_weight_decay: 1e-3
   sample_rate: ${sample_rate}
+  mixup: True
   network:
     _target_: remfx.classifier.Cnn14
     num_classes: ${num_classes}
-    n_fft:
-    hop_length:
-    n_mels:
+    n_fft: 2048
+    hop_length: 512
+    n_mels: 64
     sample_rate: 44100
     model_sample_rate: 44100
-    specaugment: False
+    specaugment: False
+
cfg/model/cls_panns_pt_mixup.yaml
ADDED
@@ -0,0 +1,12 @@
+# @package _global_
+model:
+  _target_: remfx.models.FXClassifier
+  lr: 3e-4
+  lr_weight_decay: 1e-3
+  sample_rate: ${sample_rate}
+  mixup: True
+  network:
+    _target_: remfx.classifier.PANNs
+    num_classes: ${num_classes}
+    sample_rate: ${sample_rate}
+
remfx/models.py
CHANGED
@@ -1,4 +1,5 @@
 import torch
+import numpy as np
 import torchmetrics
 import pytorch_lightning as pl
 from torch import Tensor, nn
@@ -409,6 +410,30 @@ class TCNModel(nn.Module):
         return output


+def mixup(x: torch.Tensor, y: torch.Tensor, alpha: float = 1.0):
+    """Mixup data augmentation for time-domain signals.
+    Args:
+        x (torch.Tensor): Batch of time-domain signals, shape [batch, 1, time].
+        y (torch.Tensor): Batch of labels, shape [batch, n_classes].
+        alpha (float): Beta distribution parameter.
+    Returns:
+        torch.Tensor: Mixed time-domain signals, shape [batch, 1, time].
+        torch.Tensor: Mixed labels, shape [batch, n_classes].
+        torch.Tensor: Lambda
+    """
+    batch_size = x.size(0)
+    if alpha > 0:
+        lam = np.random.beta(alpha, alpha)
+    else:
+        lam = 1
+
+    index = torch.randperm(batch_size).to(x.device)
+    mixed_x = lam * x + (1 - lam) * x[index, :]
+    mixed_y = lam * y + (1 - lam) * y[index, :]
+
+    return mixed_x, mixed_y, lam
+
+
 class FXClassifier(pl.LightningModule):
     def __init__(
         self,
@@ -416,13 +441,15 @@ class FXClassifier(pl.LightningModule):
         lr_weight_decay: float,
         sample_rate: float,
         network: nn.Module,
+        mixup: bool = False,
     ):
         super().__init__()
         self.lr = lr
         self.lr_weight_decay = lr_weight_decay
         self.sample_rate = sample_rate
         self.network = network
-        self.effects = ["
+        self.effects = ["Reverb", "Chorus", "Delay", "Distortion", "Compressor"]
+        self.mixup = mixup

         self.train_f1 = torchmetrics.classification.MultilabelF1Score(
             5, average="none", multidim_average="global"
@@ -441,13 +468,24 @@ class FXClassifier(pl.LightningModule):
         }

     def forward(self, x: torch.Tensor, train: bool = False):
-        return self.network(x)
+        return self.network(x, train=train)

     def common_step(self, batch, batch_idx, mode: str = "train"):
         train = True if mode == "train" else False
         x, y, dry_label, wet_label = batch
-
-
+
+        if mode == "train" and self.mixup:
+            x_mixed, label_mixed, lam = mixup(x, wet_label)
+            pred_label = self(x_mixed, train)
+            loss = nn.functional.cross_entropy(pred_label, label_mixed)
+            print(torch.sigmoid(pred_label[0, ...]))
+            print(label_mixed[0, ...])
+        else:
+            pred_label = self(x, train)
+            loss = nn.functional.cross_entropy(pred_label, wet_label)
+            print(torch.where(torch.sigmoid(pred_label[0, ...]) > 0.5, 1.0, 0.0).long())
+            print(wet_label.long()[0, ...])
+
         self.log(
             f"{mode}_loss",
             loss,
@@ -458,7 +496,7 @@ class FXClassifier(pl.LightningModule):
             sync_dist=True,
         )

-        metrics = self.metrics[mode](pred_label, wet_label.long())
+        metrics = self.metrics[mode](torch.sigmoid(pred_label), wet_label.long())
         avg_metrics = torch.mean(metrics)

         self.log(
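As a quick sanity check of the new mixup helper, the sketch below (self-contained, with the helper's logic restated) confirms that mixed batches keep their shapes and that labels become convex combinations weighted by lam; the batch size, signal length, and class count are made up for illustration. Note that passing such soft targets to nn.functional.cross_entropy, as the new training branch does, requires PyTorch 1.10 or newer.

import numpy as np
import torch

def mixup(x: torch.Tensor, y: torch.Tensor, alpha: float = 1.0):
    # Same logic as the committed helper: a single lambda per batch, drawn
    # from Beta(alpha, alpha), mixes each example with a random partner.
    lam = np.random.beta(alpha, alpha) if alpha > 0 else 1
    index = torch.randperm(x.size(0)).to(x.device)
    mixed_x = lam * x + (1 - lam) * x[index, :]
    mixed_y = lam * y + (1 - lam) * y[index, :]
    return mixed_x, mixed_y, lam

x = torch.randn(4, 1, 16000)             # 4 mono signals, 1 s at 16 kHz
y = torch.randint(0, 2, (4, 5)).float()  # multi-label targets, 5 effect classes
mx, my, lam = mixup(x, y)
assert mx.shape == x.shape and my.shape == y.shape
print(lam, my[0])                        # soft labels in [0, 1], weighted by lam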