asteroid-team · mpariente · Feb 6, 2021 · Feb 2, 2021 · Feb 2, 2021 · Feb 2, 2021
diff --git a/asteroid/models/base_models.py b/asteroid/models/base_models.py
@@ -1,5 +1,6 @@
 import torch
 import warnings
+from typing import Optional
 
 from .. import separate
 from ..masknn import activations
@@ -22,20 +23,24 @@ def _unsqueeze_to_3d(x):
 class BaseModel(torch.nn.Module):
     """Base class for serializable models.
 
-    Defines saving/loading procedures as well as separation methods from
-    file, torch tensors and numpy arrays.
-    Need to overwrite the `forward` method, the `sample_rate` property and
-    the `get_model_args` method.
+    Defines saving/loading procedures, and separation interface to `separate`.
+    Need to overwrite the `forward` and `get_model_args` methods.
 
     Models inheriting from `BaseModel` can be used by :mod:`asteroid.separate`
     and by the `asteroid-infer` CLI. For models whose `forward` doesn't go from
     waveform to waveform tensors, overwrite `forward_wav` to return
     waveform tensors.
+
+    Args:
+        sample_rate (float): Operating sample rate of the model.
+        n_channels (int, optional): Supported number of channels of the model.
+            If None, no checks will be performed.
     """
 
-    def __init__(self, sample_rate: float = 8000.0):
+    def __init__(self, sample_rate: float = 8000.0, n_channels: Optional[int] = 1):
         super().__init__()
         self.__sample_rate = sample_rate
+        self.n_channels = n_channels
 
     def forward(self, *args, **kwargs):
         raise NotImplementedError

diff --git a/asteroid/separate.py b/asteroid/separate.py
@@ -19,7 +19,9 @@ class Protocol:
 class Separatable(Protocol):
     """Things that are separatable."""
 
-    def forward_wav(self, wav, **kwargs):
+    n_channels: int
+
+    def forward_wav(self, wav: torch.Tensor, **kwargs) -> torch.Tensor:
         """
         Args:
             wav (torch.Tensor): waveform tensor.
@@ -34,7 +36,7 @@ def forward_wav(self, wav, **kwargs):
         ...
 
     @property
-    def sample_rate(self):
+    def sample_rate(self) -> float:
         """Operating sample rate of the model (float)."""
         ...
 
@@ -88,6 +90,11 @@ def separate(
 @torch.no_grad()
 def torch_separate(model: Separatable, wav: torch.Tensor, **kwargs) -> torch.Tensor:
     """Core logic of `separate`."""
+    if model.n_channels is not None and wav.shape[-2] != model.n_channels:
+        raise RuntimeError(
+            f"Model supports {model.n_channels}-channel inputs but found audio with {wav.shape[-2]} channels."
+            " Please match the number of channels."
+        )
     # Handle device placement
     input_device = get_device(wav, default="cpu")
     model_device = get_device(model, default="cpu")
@@ -159,7 +166,7 @@ def file_separate(
             f"of {model.sample_rate}Hz. You can pass `resample=True` to resample automatically."
         )
-    # Pass wav as [batch, n_chan, time]; here: [1, 1, time]
-    wav = wav[:, 0][None, None]
+    # Pass wav as [batch, n_chan, time]; here: [1, n_chan, time]
+    wav = wav.T[None]
     (est_srcs,) = numpy_separate(model, wav, **kwargs)
     # Resample to original sr
     est_srcs = [

diff --git a/tests/models/models_test.py b/tests/models/models_test.py
@@ -32,6 +32,24 @@ def test_set_sample_rate_raises_warning():
         model.sample_rate = 16000.0
 
 
+def test_multichannel_model_loading():
+    class MCModel(BaseModel):
+        def __init__(self, sample_rate=8000.0, n_channels=2):
+            super().__init__(sample_rate=sample_rate, n_channels=n_channels)
+
+        def forward(self, x, **kwargs):
+            return x
+
+        def get_model_args(self):
+            return {"sample_rate": self.sample_rate, "n_channels": self.n_channels}
+
+    model = MCModel()
+    model_conf = model.serialize()
+
+    new_model = MCModel.from_pretrained(model_conf)
+    assert model.n_channels == new_model.n_channels
+
+
 def test_convtasnet_sep():
     nnet = ConvTasNet(
         n_src=2,