From fe2435a5a2dd0c5be38f1c2291a5aef8e4a5d871 Mon Sep 17 00:00:00 2001
From: dmarek <damian@flexcompute.com>
Date: Tue, 16 Sep 2025 07:50:17 -0400
Subject: [PATCH] add feature to orthogonalize degenerate modes from mode
 solver

add conjugate option for orthogonalizing degen modes
---
 tidy3d/components/data/monitor_data.py | 100 +++++++++++++++++++++++
 tidy3d/components/mode/solver.py       | 106 +++++++++++++++++++++++++
 2 files changed, 206 insertions(+)

diff --git a/tidy3d/components/data/monitor_data.py b/tidy3d/components/data/monitor_data.py
index bfd0a9a0df..8232feda4d 100644
--- a/tidy3d/components/data/monitor_data.py
+++ b/tidy3d/components/data/monitor_data.py
@@ -708,6 +708,27 @@ def flux(self) -> FluxDataArray:
         """Flux for data corresponding to a 2D monitor."""
         return self.complex_flux.real
 
+    @cached_property
+    def flux_yee(self) -> FluxDataArray:
+        """Flux for data corresponding to a 2D monitor."""
+
+        # Tangential fields are ordered as E1, E2, H1, H2
+        tan_fields = self._tangential_fields
+        dim1, dim2 = self._tangential_dims
+        e_x_h_pos1 = tan_fields["E" + dim1] * tan_fields["H" + dim2].conj()
+        e_x_h_pos2 = tan_fields["E" + dim2] * tan_fields["H" + dim1].conj()
+        cell_sizes = self.grid_expanded._primal_steps.to_dict
+        dual_cell_sizes = self.grid_expanded._dual_steps.to_dict
+        E1_H2_darea = np.outer(cell_sizes[dim1], dual_cell_sizes[dim2])
+        E2_H1_darea = np.outer(dual_cell_sizes[dim1], cell_sizes[dim2])
+
+        term1 = (e_x_h_pos1 * E1_H2_darea[:, :, np.newaxis, np.newaxis]).sum(dim=dim1).sum(dim=dim2)
+        term2 = (
+            -(e_x_h_pos2 * E2_H1_darea[:, :, np.newaxis, np.newaxis]).sum(dim=dim1).sum(dim=dim2)
+        )
+
+        return FluxDataArray((term1 + term2).real / 2)
+
     @cached_property
     def mode_area(self) -> FreqModeDataArray:
         r"""Effective mode area corresponding to a 2D monitor.
@@ -789,6 +810,85 @@ def dot(
 
         return ModeAmpsDataArray(0.25 * integrand.sum(dim=d_area.dims))
 
+    def dot_yee(
+        self, field_data: Union[FieldData, ModeData, ModeSolverData], conjugate: bool = True
+    ) -> ModeAmpsDataArray:
+        r"""Dot product (modal overlap) with another :class:`.FieldData` object. Both datasets have
+        to be frequency-domain data associated with a 2D monitor. Along the tangential directions,
+        the datasets have to have the same discretization. Along the normal direction, the monitor
+        position may differ and is ignored. Other coordinates (``frequency``, ``mode_index``) have
+        to be either identical or broadcastable. Broadcasting is also supported in the case in
+        which the other ``field_data`` has a dimension of size 1 whose coordinate is not in the list
+        of coordinates in the ``self`` dataset along the corresponding dimension. In that case, the
+        coordinates of the ``self`` dataset are used in the output.
+
+        The dot product is defined as:
+
+        .. math:
+
+           \frac{1}{4} \int \left( E_0 \times H_1^* + H_0^* \times E_1 \) \, {\rm d}S
+
+        Parameters
+        ----------
+        field_data : :class:`ElectromagneticFieldData`
+            A data instance to compute the dot product with.
+        conjugate : bool, optional
+            If ``True`` (default), the dot product is defined as above. If ``False``, the definition
+            is similar, but without the complex conjugation of the $H$ fields.
+
+        Note
+        ----
+            The dot product with and without conjugation is equivalent (up to a phase) for
+            modes in lossless waveguides but differs for modes in lossy materials. In that case,
+            the conjugated dot product can be interpreted as the fraction of the power of the first
+            mode carried by the second, but modes are not orthogonal with respect to that product
+            and the sum of carried power fractions may be different from the total flux.
+            In the non-conjugated definition, modes are orthogonal, but the interpretation of the
+            dot product power carried by a given mode is no longer valid.
+        """
+
+        # Tangential fields for current and other field data
+        # fields_self = self._colocated_tangential_fields
+        fields_self = self._tangential_fields
+        # fields_self = {key: field.isel(z=0, drop=True) for key, field in self.field_components.items()}
+
+        if conjugate:
+            fields_self = {key: field.conj() for key, field in fields_self.items()}
+
+        # fields_other = field_data._interpolated_tangential_fields(self._plane_grid_boundaries)
+        fields_other = field_data._tangential_fields
+
+        # Drop size-1 dimensions in the other data
+        fields_other = {key: field.squeeze(drop=True) for key, field in fields_other.items()}
+
+        # Cross products of fields
+        dim1, dim2 = self._tangential_dims
+
+        E1xH2 = (
+            fields_self["E" + dim1] * fields_other["H" + dim2]
+            + fields_self["H" + dim2] * fields_other["E" + dim1]
+        )
+        E2xH1 = (
+            fields_self["E" + dim2] * fields_other["H" + dim1]
+            + fields_self["H" + dim1] * fields_other["E" + dim2]
+        )
+
+        cell_sizes = self.grid_expanded._primal_steps.to_dict
+        dual_cell_sizes = self.grid_expanded._dual_steps.to_dict
+
+        E1_H2_dS = np.outer(cell_sizes[dim1], dual_cell_sizes[dim2])
+        E2_H1_dS = np.outer(dual_cell_sizes[dim1], cell_sizes[dim2])
+
+        term1 = (
+            (E1xH2[:, :, ...] * E1_H2_dS[:, :, np.newaxis, np.newaxis]).sum(dim=dim1).sum(dim=dim2)
+        )
+        term2 = (
+            -(E2xH1[:, :, ...] * E2_H1_dS[:, :, np.newaxis, np.newaxis]).sum(dim=dim1).sum(dim=dim2)
+        )
+
+        # return (term1 + term2) / 4
+        return ModeAmpsDataArray(0.25 * (term1 + term2))
+
     def _interpolated_tangential_fields(self, coords: ArrayFloat2D) -> dict[str, DataArray]:
         """For 2D monitors, interpolate this fields to given coords in the tangential plane.
 
diff --git a/tidy3d/components/mode/solver.py b/tidy3d/components/mode/solver.py
index afb4fc9671..a8ae764de7 100644
--- a/tidy3d/components/mode/solver.py
+++ b/tidy3d/components/mode/solver.py
@@ -18,6 +18,8 @@
 TOL_COMPLEX = 1e-10
 # Tolerance for eigs
 TOL_EIGS = fp_eps / 10
+# Tolerance for to consider modes as degenerate
+TOL_DEGENERATE = fp_eps * 10
 # Tolerance for deciding on the matrix to be diagonal or tensorial
 TOL_TENSORIAL = 1e-6
 # shift target neff by this value, both rel and abs, whichever results in larger shift
@@ -27,6 +29,9 @@
 # Good conductor permittivity cut-off value. Let it be as large as possible so long as not causing overflow in
 # double precision. This value is very heuristic.
 GOOD_CONDUCTOR_CUT_OFF = 1e70
+# Whether to apply additional post-processing to degenerate modes
+# in order to ensure that they are orthogonal with respect to the EM dot definition
+ORTHOGONALIZE_DEGENERATE_MODES = True
 
 if TYPE_CHECKING:
     from scipy import sparse as sp
@@ -54,6 +59,7 @@ def compute_modes(
         direction="+",
         solver_basis_fields=None,
         plane_center: Optional[tuple[float, float]] = None,
+        conjugated_dot_product: bool = True,
     ) -> tuple[Numpy, Numpy, EpsSpecType]:
         """
         Solve for the modes of a waveguide cross-section.
@@ -93,6 +99,9 @@ def compute_modes(
             The center of the mode plane along the tangential axes of the global simulation. Used
             in case of bend modes to offset the coordinates correctly w.r.t. the bend radius, which
             is assumed to refer to the distance from the bend center to the mode plane center.
+        conjugated_dot_product : bool
+            Definition used for the dot product of electromagnetic modes. Currently, only used when
+            building an orthogonal basis from any identified degenerate mode groups.
 
         Returns
         -------
@@ -285,6 +294,17 @@ def compute_modes(
         E = E.reshape((3, Nx, Ny, 1, num_modes))
         H = np.sum(jac_h[..., None] * H[:, None, ...], axis=0)
         H = H.reshape((3, Nx, Ny, 1, num_modes))
+
+        if ORTHOGONALIZE_DEGENERATE_MODES:
+            # Identify and post-process degenerate modes
+            degenerate_groups = cls.identify_degenerate_eigenvalues(
+                neff + keff * 1j, TOL_DEGENERATE
+            )
+            print(degenerate_groups)
+            E, H = cls.make_orthogonal_basis_for_degenerate_modes(
+                degenerate_groups, E, H, dl_f, dl_b, conjugated_dot_product=True
+            )
+
         fields = np.stack((E, H), axis=0)
 
         neff = neff * np.linalg.norm(kp_to_k)
@@ -628,6 +648,7 @@ def conditional_inverted_vec(eps_vec, threshold=1):
                 M=generalized_M,
                 basis_vecs=basis_vecs,
             )
+
         neff, keff = cls.eigs_to_effective_index(vals, mode_solver_type)
 
         # Sort by descending neff
@@ -1089,6 +1110,91 @@ def mode_plane_contain_good_conductor(material_response) -> bool:
             return False
         return np.any(np.abs(material_response) > GOOD_CONDUCTOR_THRESHOLD * np.abs(pec_val))
 
+    @staticmethod
+    def identify_degenerate_eigenvalues(
+        mode_indexes: np.ndarray,
+        tol: float,
+    ) -> list[tuple[int]]:
+        """Inspects mode indices to find groups of degenerate modes."""
+        num_modes = len(mode_indexes)
+        ungrouped = set(range(num_modes))
+        degenerate_groups = []
+
+        while ungrouped:
+            # Start a new group with an ungrouped column
+            seed = ungrouped.pop()
+            current_group = [seed]
+            # Find all columns similar to the seed of the current group
+            for col in list(ungrouped):
+                if np.isclose(mode_indexes[col], mode_indexes[seed], rtol=tol, atol=tol):
+                    current_group.append(col)
+                    ungrouped.remove(col)
+
+            # Only keep groups with more than one mode
+            if len(current_group) >= 2:
+                degenerate_groups.append(sorted(current_group))
+
+        return degenerate_groups
+
+    @staticmethod
+    def make_orthogonal_basis_for_degenerate_modes(
+        degenerate_groups: list[tuple[int]],
+        E_vec: np.ndarray,
+        H_vec: np.ndarray,
+        dl_primal: np.ndarray,
+        dl_dual: np.ndarray,
+        conjugated_dot_product: bool = True,
+    ) -> tuple[np.ndarray, np.ndarray]:
+        """Ensures that groups of degenerate modes are orthogonal, which is not guaranteed for the eigenvectors
+        returned by scipy or the parallel versions of mode solvers."""
+        Ex = E_vec[0, ...]
+        Ey = E_vec[1, ...]
+        # Ez = E_vec[2, ...]
+
+        Hx = H_vec[0, ...]
+        Hy = H_vec[1, ...]
+        # Hz = H_vec[2, ...]
+
+        # Make the differential area elements, which are different for Ex(Hy) and Ey(Hx) on the Yee grid
+        Ex_Hy_dS = np.outer(dl_primal[0], dl_dual[1])
+        Ey_Hx_dS = np.outer(dl_dual[0], dl_primal[1])
+
+        def orthogonal_dot(mode_1: int, mode_2: int) -> complex:
+            """Discrete version of the modal overlap calculation."""
+            Ex_1 = Ex[..., mode_1]
+            Ey_1 = Ey[..., mode_1]
+            Hx_1 = Hx[..., mode_1]
+            Hy_1 = Hy[..., mode_1]
+            if conjugated_dot_product:
+                Ex_1 = Ex[..., mode_1].conj()
+                Ey_1 = Ey[..., mode_1].conj()
+                Hx_1 = Hx[..., mode_1].conj()
+                Hy_1 = Hy[..., mode_1].conj()
+
+            term1 = Ex_1 * Hy[..., mode_2] + Ex[..., mode_2] * Hy_1
+            term1 *= Ex_Hy_dS[..., np.newaxis]
+            term2 = Ey_1 * Hx[..., mode_2] + Ey[..., mode_2] * Hx_1
+            term2 *= Ey_Hx_dS[..., np.newaxis]
+            return np.sum(term1 - term2)
+
+        for degenerate_group in degenerate_groups:
+            num_degenerate_modes = len(degenerate_group)
+            # W is an overlap matrix of the degenerate modes, which should be normal
+            # where the left and right eigenvectors are the same.
+            W = np.zeros((num_degenerate_modes, num_degenerate_modes), dtype=E_vec.dtype)
+            for i in range(num_degenerate_modes):
+                for j in range(num_degenerate_modes):
+                    W[i, j] = orthogonal_dot(i, j)
+
+            # Eigenvectors of the overlap matrix correspond with an orthogonal basis composed of the
+            # raw modes
+            _, Q = np.linalg.eig(W)
+
+            E_vec[..., degenerate_group] = E_vec[..., degenerate_group] @ Q
+            H_vec[..., degenerate_group] = H_vec[..., degenerate_group] @ Q
+
+        return E_vec, H_vec
+
 
 def compute_modes(*args, **kwargs) -> tuple[Numpy, Numpy, str]:
     """A wrapper around ``EigSolver.compute_modes``, which is used in :class:`.ModeSolver`."""