Skip to content
Open
Show file tree
Hide file tree
Changes from 2 commits
Commits
Show all changes
18 commits
Select commit Hold shift + click to select a range
2e02152
Add separated channel module registry
mcgibbon Mar 11, 2026
fbcc20f
Add SeparatedModuleStep and fix LegacyWrapper state_dict handling
mcgibbon Mar 11, 2026
b447008
Require non-empty prognostic_names_ and test optional forcing/diagnos…
mcgibbon Mar 11, 2026
e91b808
Refactor prognostic_names from property to get_prognostic_names() method
mcgibbon Mar 11, 2026
1d88b0b
Rename prognostic_names_ to prognostic_names in SeparatedModuleStepCo…
mcgibbon Mar 11, 2026
4afeb0d
Address PR review comments on separated module code
mcgibbon Mar 11, 2026
231f3a9
Merge branch 'main' into feature/separated-module-registry
mcgibbon Mar 11, 2026
6a5bb2c
Remove LegacyWrapper/LegacyModuleAdapter, simplify conditional handling
mcgibbon Mar 11, 2026
56d838e
Merge branch 'feature/separated-module-registry' of github.com:ai2cm/…
mcgibbon Mar 11, 2026
237f03f
Clean up unused NullOptimization and move test module out of test file
mcgibbon Mar 11, 2026
9858f11
Merge branch 'main' into feature/separated-module-registry
mcgibbon Mar 12, 2026
5bd9e08
Update fme/core/step/separated_module.py
mcgibbon Mar 12, 2026
6d6df2e
reorder arguments
mcgibbon Mar 20, 2026
2f2e468
Address PR review comments for separated module registry
mcgibbon Mar 20, 2026
91c2910
Fix register_test_types import in test_step.py
mcgibbon Mar 20, 2026
c67142f
Merge branch 'main' into feature/separated-module-registry
mcgibbon Mar 20, 2026
b4e49c7
Merge branch 'main' into feature/separated-module-registry
mcgibbon Mar 21, 2026
a9fbef2
Fix corrector building to use new get_corrector API
mcgibbon Mar 21, 2026
File filter

Filter by extension

Filter by extension

Conversations
Failed to load comments.
Loading
Jump to
Jump to file
Failed to load files.
Loading
Diff view
Diff view
1 change: 1 addition & 0 deletions fme/core/registry/__init__.py
Original file line number Diff line number Diff line change
@@ -1,3 +1,4 @@
from .corrector import CorrectorSelector
from .module import ModuleSelector
from .registry import Registry
from .separated_module import SeparatedModuleSelector
271 changes: 271 additions & 0 deletions fme/core/registry/separated_module.py
Original file line number Diff line number Diff line change
@@ -0,0 +1,271 @@
import abc
import dataclasses
from collections.abc import Callable, Mapping

# we use Type to distinguish from type attr of SeparatedModuleSelector
from typing import Any, ClassVar, Type # noqa: UP035

import dacite
import torch
from torch import nn

from fme.core.dataset_info import DatasetInfo
from fme.core.labels import BatchLabels, LabelEncoding

from .module import CONDITIONAL_BUILDERS, ModuleSelector
Copy link
Contributor Author

Choose a reason for hiding this comment

The reason will be displayed to describe this comment to others. Learn more.

Question: Is it appropriate to re-use the CONDITIONAL_BUILDERS from .module? Or should we be defining these independently for SeparatedModule? Or should all new module types here support conditioning (we don't need backwards compatibility)? At a minimum labels can always be given as broadcasted input variables, right?

Copy link
Contributor Author

Choose a reason for hiding this comment

The reason will be displayed to describe this comment to others. Learn more.

Answer: Good question. Right now we reuse it because the only way to get a conditional separated module is through LegacyModuleAdapter, which delegates to ModuleSelector, so the same builder types apply. When we register native separated modules that support conditioning, we should define an independent CONDITIONAL_BUILDERS list (or a different mechanism) for this registry. For now, reusing it is correct since LegacyModuleAdapter is the only registered type.

from .registry import Registry


@dataclasses.dataclass
class SeparatedModuleConfig(abc.ABC):
    """
    Abstract builder for modules using the separated-channel interface.

    Concrete subclasses produce an nn.Module that takes separate forcing and
    prognostic tensors as input and returns separate prognostic and diagnostic
    tensors as output. The built nn.Module must have the forward signature:

        forward(forcing: Tensor, prognostic: Tensor) -> tuple[Tensor, Tensor]

    where the return value is (prognostic_out, diagnostic_out).
    """

    @abc.abstractmethod
    def build(
        self,
        n_forcing_channels: int,
        n_prognostic_channels: int,
        n_diagnostic_channels: int,
        dataset_info: DatasetInfo,
    ) -> nn.Module:
        """
        Construct an nn.Module with separated forcing/prognostic/diagnostic
        channels.

        Args:
            n_forcing_channels: number of input-only (forcing) channels
            n_prognostic_channels: number of input-output (prognostic) channels
            n_diagnostic_channels: number of output-only (diagnostic) channels
            dataset_info: Information about the dataset, including img_shape,
                horizontal coordinates, vertical coordinate, etc.

        Returns:
            An nn.Module whose forward method takes (forcing, prognostic)
            tensors and returns (prognostic_out, diagnostic_out) tensors.
        """
        ...

    @classmethod
    def from_state(cls, state: Mapping[str, Any]) -> "SeparatedModuleConfig":
        """Reconstruct a config instance from a serialized state mapping.

        Strict dacite config so unknown keys in ``state`` raise instead of
        being silently dropped.
        """
        strict = dacite.Config(strict=True)
        return dacite.from_dict(data_class=cls, data=state, config=strict)


class SeparatedModule:
    """
    Strongly typed wrapper around an nn.Module with the separated channel
    interface.

    The wrapped module takes (forcing, prognostic) tensors and returns
    (prognostic_out, diagnostic_out) tensors. This wrapper additionally
    handles optional label encoding for conditional models, converting
    BatchLabels into the tensor form the underlying module expects.
    """

    def __init__(self, module: nn.Module, label_encoding: LabelEncoding | None):
        """
        Args:
            module: torch module with signature
                forward(forcing, prognostic[, labels]).
            label_encoding: label encoding for conditional models, or None
                for unconditional models.
        """
        self._module = module
        self._label_encoding = label_encoding

    def __call__(
        self,
        forcing: torch.Tensor,
        prognostic: torch.Tensor,
        labels: BatchLabels | None = None,
    ) -> tuple[torch.Tensor, torch.Tensor]:
        """
        Run the wrapped module on one step of inputs.

        Args:
            forcing: input-only channels.
            prognostic: input-output channels.
            labels: batch labels, required if and only if the model is
                conditional (i.e. was built with a label encoding).

        Returns:
            (prognostic_out, diagnostic_out) tensors.

        Raises:
            TypeError: if labels are passed to an unconditional model, or
                omitted for a conditional one.
        """
        if self._label_encoding is None:
            if labels is not None:
                raise TypeError("Labels are not allowed for unconditional models")
            return self._module(forcing, prognostic)
        if labels is None:
            raise TypeError("Labels are required for conditional models")
        encoded_labels = labels.conform_to_encoding(self._label_encoding)
        return self._module(forcing, prognostic, labels=encoded_labels.tensor)

    @property
    def torch_module(self) -> nn.Module:
        """The underlying torch module."""
        return self._module

    def get_state(self) -> dict[str, Any]:
        """Serialize the module weights together with the label encoding."""
        if self._label_encoding is not None:
            label_encoder_state = self._label_encoding.get_state()
        else:
            label_encoder_state = None
        # NOTE(review): a module parameter literally named "label_encoding"
        # would collide with this key — assumed not to occur in practice.
        return {
            **self._module.state_dict(),
            "label_encoding": label_encoder_state,
        }

    def load_state(self, state: dict[str, Any]) -> None:
        """Restore state previously produced by get_state().

        Pops the label encoding entry once; the remaining keys form the
        torch state_dict.
        """
        state = state.copy()
        encoding_state = state.pop("label_encoding", None)
        if encoding_state is not None:
            if self._label_encoding is None:
                self._label_encoding = LabelEncoding.from_state(encoding_state)
            else:
                self._label_encoding.conform_to_state(encoding_state)
        self._module.load_state_dict(state)

    def wrap_module(
        self, callable: Callable[[nn.Module], nn.Module]
    ) -> "SeparatedModule":
        """Return a new wrapper whose torch module is callable(module).

        The parameter name ``callable`` (shadowing the builtin) is kept for
        backward compatibility with keyword callers.
        """
        return SeparatedModule(callable(self._module), self._label_encoding)

    def to(self, device: torch.device) -> "SeparatedModule":
        """Return a new wrapper with the module moved to the given device."""
        return SeparatedModule(self._module.to(device), self._label_encoding)


@dataclasses.dataclass
class SeparatedModuleSelector:
    """
    A dataclass for building SeparatedModuleConfig instances from config dicts.

    Mirrors ModuleSelector but for the separated channel interface.

    Parameters:
        type: the type of the SeparatedModuleConfig
        config: data for a SeparatedModuleConfig instance of the indicated type
        conditional: whether to condition the predictions on batch labels.
    """

    type: str
    config: Mapping[str, Any]
    conditional: bool = False
    # Shared registry of all SeparatedModuleConfig types; populated through
    # the register() decorator, never set per-instance.
    registry: ClassVar[Registry[SeparatedModuleConfig]] = Registry[
        SeparatedModuleConfig
    ]()

    def __post_init__(self):
        # dacite may pass `registry` through from config dicts; reject any
        # instance-level override of the class-level registry.
        if not isinstance(self.registry, Registry):
            raise ValueError(
                "SeparatedModuleSelector.registry should not be set manually"
            )
        if self.conditional and self.type not in CONDITIONAL_BUILDERS:
            raise ValueError(
                "Conditional predictions require a conditional builder, "
                f"got {self.type} (available: {CONDITIONAL_BUILDERS})"
            )
        # Fail fast: resolve the config class at construction time.
        self._instance = self.registry.get(self.type, self.config)

    @property
    def module_config(self) -> SeparatedModuleConfig:
        """The resolved SeparatedModuleConfig instance."""
        return self._instance

    @classmethod
    def register(
        cls, type_name: str
    ) -> Callable[[Type[SeparatedModuleConfig]], Type[SeparatedModuleConfig]]:  # noqa: UP006
        """Return a decorator registering a config class under ``type_name``.

        ``typing.Type`` is used because the dataclass field ``type`` shadows
        the builtin within this class body.
        """
        return cls.registry.register(type_name)

    def build(
        self,
        n_forcing_channels: int,
        n_prognostic_channels: int,
        n_diagnostic_channels: int,
        dataset_info: DatasetInfo,
    ) -> SeparatedModule:
        """
        Build a SeparatedModule with separated forcing/prognostic/diagnostic
        channels.

        Args:
            n_forcing_channels: number of input-only (forcing) channels
            n_prognostic_channels: number of input-output (prognostic) channels
            n_diagnostic_channels: number of output-only (diagnostic) channels
            dataset_info: Information about the dataset, including img_shape.

        Returns:
            a SeparatedModule object

        Raises:
            ValueError: if conditional and the dataset provides no labels.
        """
        if self.conditional:
            if not dataset_info.all_labels:
                raise ValueError("Conditional predictions require labels")
            # Sort for a deterministic label ordering in the encoding.
            label_encoding = LabelEncoding(sorted(dataset_info.all_labels))
        else:
            label_encoding = None
        module = self._instance.build(
            n_forcing_channels=n_forcing_channels,
            n_prognostic_channels=n_prognostic_channels,
            n_diagnostic_channels=n_diagnostic_channels,
            dataset_info=dataset_info,
        )
        return SeparatedModule(module, label_encoding)

    @classmethod
    def get_available_types(cls):
        """Names of all registered SeparatedModuleConfig types.

        NOTE(review): reaches into Registry's private ``_types`` attribute,
        mirroring ModuleSelector; a public accessor on Registry would be
        cleaner.
        """
        return cls.registry._types.keys()


class LegacyWrapper(nn.Module):
    """Adapts an old-style (single tensor in/out) module to the separated
    channel interface.

    Input channels are ordered as [forcing, prognostic] and output channels
    are ordered as [prognostic, diagnostic]. The inner module sees one
    concatenated input tensor and emits one concatenated output tensor.
    """

    def __init__(
        self,
        inner: nn.Module,
        n_prognostic_channels: int,
    ):
        super().__init__()
        self.inner = inner
        self._n_prognostic_channels = n_prognostic_channels

    def forward(
        self, forcing: torch.Tensor, prognostic: torch.Tensor
    ) -> tuple[torch.Tensor, torch.Tensor]:
        # Channel axis is dim -3, i.e. tensors shaped (..., channel, y, x).
        stacked = torch.cat((forcing, prognostic), dim=-3)
        combined_out = self.inner(stacked)
        n_prog = self._n_prognostic_channels
        n_diag = combined_out.shape[-3] - n_prog
        prognostic_out, diagnostic_out = torch.split(
            combined_out, [n_prog, n_diag], dim=-3
        )
        return prognostic_out, diagnostic_out


@SeparatedModuleSelector.register("legacy")
@dataclasses.dataclass
class LegacyModuleAdapter(SeparatedModuleConfig):
    """
    Adapter exposing a legacy ModuleSelector module through the separated
    channel interface.

    Input channels are ordered as [forcing, prognostic] and output channels
    are ordered as [prognostic, diagnostic].

    Parameters:
        legacy_builder: The legacy ModuleSelector for building the inner module.
    """

    legacy_builder: ModuleSelector

    def build(
        self,
        n_forcing_channels: int,
        n_prognostic_channels: int,
        n_diagnostic_channels: int,
        dataset_info: DatasetInfo,
    ) -> nn.Module:
        # The legacy interface sees concatenated channels on both sides.
        total_in = n_forcing_channels + n_prognostic_channels
        total_out = n_prognostic_channels + n_diagnostic_channels

        built = self.legacy_builder.build(
            n_in_channels=total_in,
            n_out_channels=total_out,
            dataset_info=dataset_info,
        )

        return LegacyWrapper(
            inner=built.torch_module,
            n_prognostic_channels=n_prognostic_channels,
        )
Loading
Loading