Merge branch 'features/nonzero-updates' into merge_nonzero

brownbaerchen · brownbaerchen · commit b4a5329f05d7 · 2026-06-16T14:29:28.000+02:00
diff --git a/.github/workflows/array-api.yml b/.github/workflows/array-api.yml
@@ -17,7 +17,7 @@ jobs:
       with:
         path: heat
     - name: Setup MPI
-      uses: mpi4py/setup-mpi@dbbb80b116bea57fc1788daf7dbbf7ab3df3a0f1 # v1.4.2
+      uses: mpi4py/setup-mpi@f200dce75b64188be849b46657dcf86c721937b2 # v1.4.3
       with:
         mpi: ${{ matrix.mpi }}
     - name: Use Python ${{ matrix.python-version }}
diff --git a/.github/workflows/push_main.yml b/.github/workflows/push_main.yml
@@ -97,12 +97,12 @@ jobs:
     name: Check REUSE compliance
     steps:
       - name: Harden Runner
-        uses: step-security/harden-runner@a5ad31d6a139d249332a2605b85202e8c0b78450 # v2.19.1
+        uses: step-security/harden-runner@9af89fc71515a100421586dfdb3dc9c984fbf411 # v2.19.4
         with:
           egress-policy: audit
 
       - name: Checkout
-        uses: actions/checkout@de0fac2e4500dabe0009e67214ff5f5447ce83dd # v6.0.2
+        uses: actions/checkout@df4cb1c069e1874edd31b4311f1884172cec0e10 # v6.0.3
 
       - name: Setup Python
         uses: actions/setup-python@a309ff8b426b58ec0e2a45f0f869d46889d02405 # v6.2.0
diff --git a/.github/workflows/weekly.yml b/.github/workflows/weekly.yml
@@ -30,11 +30,11 @@ jobs:
             uses: actions/checkout@df4cb1c069e1874edd31b4311f1884172cec0e10 # v6.0.3
             # Initializes the CodeQL tools for scanning.
           - name: Initialize CodeQL
-            uses: github/codeql-action/init@87557b9c84dde89fdd9b10e88954ac2f4248e463 # v4.36.1
+            uses: github/codeql-action/init@8aad20d150bbac5944a9f9d289da16a4b0d87c1e # v4.36.2
             with:
                 languages: python
           - name: Perform CodeQL Analysis
-            uses: github/codeql-action/analyze@87557b9c84dde89fdd9b10e88954ac2f4248e463 # v4.36.1
+            uses: github/codeql-action/analyze@8aad20d150bbac5944a9f9d289da16a4b0d87c1e # v4.36.2
             with:
                 category: "/language:python"
     scorecard:
@@ -83,7 +83,7 @@ jobs:
 
             # Upload the results to GitHub's code scanning dashboard.
           - name: "Upload to code-scanning"
-            uses: github/codeql-action/upload-sarif@87557b9c84dde89fdd9b10e88954ac2f4248e463 # v4.36.1
+            uses: github/codeql-action/upload-sarif@8aad20d150bbac5944a9f9d289da16a4b0d87c1e # v4.36.2
             with:
                 sarif_file: results.sarif
     check-links:
diff --git a/.pre-commit-config.yaml b/.pre-commit-config.yaml
@@ -26,7 +26,7 @@ repos:
 
   - repo: https://github.com/astral-sh/ruff-pre-commit
     # Ruff version.
-    rev: v0.15.16
+    rev: v0.15.17
     hooks:
       # Run the linter.
       - id: ruff
diff --git a/heat/core/indexing.py b/heat/core/indexing.py
@@ -7,18 +7,18 @@
 from .communication import MPI
 from .dndarray import DNDarray
 from . import factories
+from .sanitation import sanitize_in
 from . import types
 from . import manipulations
-from . import sanitation
 
 __all__ = ["nonzero", "where"]
 
 
 def nonzero(x: DNDarray, as_tuple: bool = True) -> tuple[DNDarray, ...] | DNDarray:
     """
-    Return a Tuple of :class:`~heat.core.dndarray.DNDarray`s, one for each dimension of ``x``,
+    Return a tuple of :class:`~heat.core.dndarray.DNDarray`s, one for each dimension of ``x``,
     containing the indices of the non-zero elements in that dimension. If ``x`` is split then
-    the result is split in the 0th dimension. However, this :class:`~heat.core.dndarray.DNDarray`
+    the result is split in the first dimension. However, this :class:`~heat.core.dndarray.DNDarray`
     can be UNBALANCED as it contains the indices of the non-zero elements on each node.
     The values in ``x`` are always tested and returned in row-major, C-style order.
     The corresponding non-zero values can be obtained with: ``x[nonzero(x)]``.
@@ -54,29 +54,24 @@ def nonzero(x: DNDarray, as_tuple: bool = True) -> tuple[DNDarray, ...] | DNDarr
     >>> y[ht.nonzero(y > 3)]
     DNDarray([4, 5, 6, 7, 8, 9], dtype=ht.int64, device=cpu:0, split=0)
     """
-    sanitation.sanitize_in(x)
-    local_x = x.larray
+    sanitize_in(x)
 
     if not x.is_distributed():
         # nonzero indices as tuple
-        nonzero = torch.nonzero(input=local_x, as_tuple=as_tuple)
-        # ensure output split is consistent with distributed execution
-        out_split = 0 if x.split is not None else None
-
+        nonzero = torch.nonzero(input=x.larray, as_tuple=as_tuple)
         # bookkeeping for final DNDarray construct
         if as_tuple:
             nonzero = list(nonzero)
             for i, nz_tensor in enumerate(nonzero):
-                nonzero[i] = factories.array(
-                    nz_tensor, split=out_split, device=x.device, comm=x.comm
-                )
+                nonzero[i] = factories.array(nz_tensor, device=x.device, comm=x.comm)
             return tuple(nonzero)
-        # nonzero indices as single 2D DNDarray
-        return factories.array(nonzero, split=out_split, device=x.device, comm=x.comm)
+        else:
+            # nonzero indices as single 2D DNDarray
+            return factories.array(nonzero, device=x.device, comm=x.comm)
 
     # distributed case
-    lcl_nonzero = torch.nonzero(input=local_x, as_tuple=False)
-    nonzero_size = torch.tensor(lcl_nonzero.shape[0], dtype=torch.int64)
+    lcl_nonzero = torch.nonzero(input=x.larray, as_tuple=False)
+    nonzero_size = torch.tensor(lcl_nonzero.shape[0], dtype=torch.int64, device="cpu")
     nonzero_dtype = types.canonical_heat_type(lcl_nonzero.dtype)
 
     # global nonzero_size
@@ -85,7 +80,33 @@ def nonzero(x: DNDarray, as_tuple: bool = True) -> tuple[DNDarray, ...] | DNDarr
     _, displs = x.counts_displs()
     lcl_nonzero[:, x.split] += displs[x.comm.rank]
 
-    if x.split != 0:
+    if x.split == 0:
+        # for split=0, the local nonzero indices are already globally ordered along the split axis
+        if as_tuple:  # return indices as tuple of 1D DNDarrays
+            lcl_nonzero = lcl_nonzero.unbind(dim=1)
+            return tuple(
+                DNDarray(
+                    nz_tensor,
+                    gshape=(nonzero_size.item(),),
+                    dtype=nonzero_dtype,
+                    split=0,
+                    device=x.device,
+                    comm=x.comm,
+                    balanced=False,
+                )
+                for nz_tensor in lcl_nonzero
+            )
+        else:  # return indices as single 2D DNDarray
+            return DNDarray(
+                lcl_nonzero,
+                gshape=(nonzero_size.item(), x.ndim),
+                dtype=nonzero_dtype,
+                split=0,
+                device=x.device,
+                comm=x.comm,
+                balanced=False,
+            )
+    else:
         # construct global 2D DNDarray of nz indices:
         shape_2d = (nonzero_size.item(), x.ndim)
         global_nonzero = DNDarray(
@@ -100,59 +121,33 @@ def nonzero(x: DNDarray, as_tuple: bool = True) -> tuple[DNDarray, ...] | DNDarr
         # vectorized sorting of nz indices along axis 0
         global_nonzero.balance_()
         global_nonzero = manipulations.unique(global_nonzero, axis=0)
-        if not as_tuple:
-            # return indices as single 2D DNDarray
-            return global_nonzero
-        # return indices as tuple of 1D DNDarrays
-        lcl_nonzero = global_nonzero.larray.unbind(dim=1)
-        return tuple(
-            DNDarray(
-                nz_tensor,
-                gshape=(nonzero_size.item(),),
-                dtype=nonzero_dtype,
-                split=0,
-                device=x.device,
-                comm=x.comm,
-                balanced=True,
+        if as_tuple:  # return indices as tuple of 1D DNDarrays
+            lcl_nonzero = global_nonzero.larray.unbind(dim=1)
+            return tuple(
+                DNDarray(
+                    nz_tensor,
+                    gshape=(nonzero_size.item(),),
+                    dtype=nonzero_dtype,
+                    split=0,
+                    device=x.device,
+                    comm=x.comm,
+                    balanced=True,
+                )
+                for nz_tensor in lcl_nonzero
             )
-            for nz_tensor in lcl_nonzero
-        )
-
-    # for split=0, the local nonzero indices are already globally ordered along the split axis
-    if not as_tuple:
-        # return indices as single 2D DNDarray
-        return DNDarray(
-            lcl_nonzero,
-            gshape=(nonzero_size.item(), x.ndim),
-            dtype=nonzero_dtype,
-            split=0,
-            device=x.device,
-            comm=x.comm,
-            balanced=False,
-        )
-    # return indices as tuple of 1D DNDarrays
-    lcl_nonzero = lcl_nonzero.unbind(dim=1)
-    return tuple(
-        DNDarray(
-            nz_tensor,
-            gshape=(nonzero_size.item(),),
-            dtype=nonzero_dtype,
-            split=0,
-            device=x.device,
-            comm=x.comm,
-            balanced=False,
-        )
-        for nz_tensor in lcl_nonzero
-    )
+        else:  # return indices as single 2D DNDarray
+            return global_nonzero
 
 
 DNDarray.nonzero = lambda self: nonzero(self, as_tuple=True)
 DNDarray.nonzero.__doc__ = nonzero.__doc__
 
 
 def where(
-    cond: DNDarray, x: None | int | float | DNDarray = None, y: None | int | float | DNDarray = None
-) -> DNDarray | tuple[DNDarray, ...]:
+    cond: DNDarray,
+    x: None | int | float | DNDarray = None,
+    y: None | int | float | DNDarray = None,
+) -> DNDarray:
     """
     Return a :class:`~heat.core.dndarray.DNDarray` containing elements chosen from ``x`` or ``y`` depending on condition.
     Result is a :class:`~heat.core.dndarray.DNDarray` with elements from ``x`` where ``cond`` is True, and from ``y`` elsewhere.
@@ -161,24 +156,38 @@ def where(
 
     Parameters
     ----------
-    cond: DNDarray
-        When True, yield ``x``, otherwise yield ``y``.
-    x, y: DNDarray or scalar, optional
-        Values from which to choose. ``x``, ``y`` and ``cond`` must be broadcastable to some shape.
-        If ``x`` and ``y`` are distributed, they must have the same split axis as ``cond``.
+    cond : DNDarray
+        Condition of interest: where True, yield ``x``; otherwise yield ``y``.
+    x : DNDarray or int or float, optional
+        Values from which to choose. ``x``, ``y`` and ``cond`` need to be broadcastable to a common shape.
+    y : DNDarray or int or float, optional
+        Values from which to choose. ``x``, ``y`` and ``cond`` need to be broadcastable to a common shape.
+
+    Raises
+    ------
+    NotImplementedError
+        If the splits of the two input :class:`~heat.core.dndarray.DNDarray`s differ.
+    TypeError
+        If only one of ``x`` and ``y`` is given, or if they are not DNDarrays or numerical scalars.
+
+    Notes
+    -----
+    When only ``cond`` is provided, this function is a shorthand for :func:`nonzero` and returns a tuple
+    of :class:`~heat.core.dndarray.DNDarray`s, one per dimension, analogously to ``numpy.where``.
 
     Examples
     --------
     >>> import heat as ht
     >>> x = ht.arange(10, split=0)
     >>> ht.where(x < 5, x, 10 * x)
-    DNDarray([ 0,  1,  2,  3,  4, 50, 60, 70, 80, 90], dtype=ht.int64, device=cpu:0, split=0)
-
-    >>> # Indices retrieval (shorthand for nonzero)
-    >>> y = ht.array([[1, 2, 3], [4, 5, 6], [7, 8, 9]], split=0)
-    >>> ht.where(y > 3)
-    (DNDarray([1, 1, 1, 2, 2, 2], dtype=ht.int64, device=cpu:0, split=0),
-     DNDarray([0, 1, 2, 0, 1, 2], dtype=ht.int64, device=cpu:0, split=0))
+    DNDarray(MPI-rank: 0, Shape: (10,), Split: 0, Local Shape: (10,), Device: cpu:0, Dtype: int32, Data:
+         [ 0,  1,  2,  3,  4, 50, 60, 70, 80, 90])
+    >>> y = ht.array([[0, 1, 2], [0, 2, 4], [0, 3, 6]])
+    >>> ht.where(y < 4, y, -1)
+    DNDarray(MPI-rank: 0, Shape: (3, 3), Split: None, Local Shape: (3, 3), Device: cpu:0, Dtype: int64, Data:
+         [[ 0,  1,  2],
+          [ 0,  2, -1],
+          [ 0,  3, -1]])
     """
     # ---- binary where(cond, x, y) branch ------------------------------------
     if cond.split is not None and (isinstance(x, DNDarray) or isinstance(y, DNDarray)):
@@ -198,10 +207,8 @@ def where(
         return cond.dtype(cond == 0) * y + cond * x
 
     # ---- where(cond) "indices only" branch ----------------------------------
-    elif x is None and y is None:
-        # nonzero() properly handles all cases
-        nz = nonzero(cond)
-        return nz
+    elif x is None and y is None:  # delegate to nonzero(cond)
+        return nonzero(cond)  # tuple of DNDarrays, one per dimension
 
     # ---- invalid combinations ----------------------------------------------
     else:
diff --git a/heat/core/linalg/eigh.py b/heat/core/linalg/eigh.py
@@ -75,7 +75,7 @@ def _subspaceiteration(
             device=columnnorms.device,
         )
         * statistics.percentile(columnnorms, 100.0 * (1 - (k + safetyparam) / columnnorms.shape[0]))
-    )
+    )[0]
     X = C[:, idx].balance()
 
     # actual subspace iteration
diff --git a/tests/core/test_indexing.py b/tests/core/test_indexing.py

Original file line number	Diff line number	Diff line change
`@@ -75,7 +75,7 @@ def _subspaceiteration(`
`75`	`75`	`device=columnnorms.device,`
`76`	`76`	`)`
`77`	`77`	`* statistics.percentile(columnnorms, 100.0 * (1 - (k + safetyparam) / columnnorms.shape[0]))`
`78`		`- )`
	`78`	`+ )[0]`
`79`	`79`	`X = C[:, idx].balance()`
`80`	`80`
`81`	`81`	`# actual subspace iteration`