Commit 6e8d699

Add typing and data-consistency checks when distributing/overloading arrays (#8)
* Add all2all_iterations parameter to distribute functions for improved data handling
* add type checking and linting to github actions
* github actions: update action versions
* add tests for multiple iterations
* assert consistent data across ranks in distribute
* assert consistent data for overload and exchange
1 parent 2893f00 commit 6e8d699

23 files changed (+394 / -294 lines)
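The headline change is the new all2all_iterations keyword on the distribution routines: instead of moving all particles in a single MPI_Alltoallv call, the exchange can be split into several smaller rounds, which helps when one collective would exceed message-size or memory limits. A minimal usage sketch follows; it is not part of this commit, and it assumes the usual distribute(partition, box_size, data, coord_keys) calling convention with illustrative toy data.

# Hedged sketch (not from this commit): distributing randomly placed particles
# with the new all2all_iterations keyword. Assumes the usual
# distribute(partition, box_size, data, coord_keys) calling convention.
# Run under MPI, e.g.: mpirun -n 4 python demo.py
import numpy as np
from mpipartition import Partition, distribute

partition = Partition()
rng = np.random.default_rng(seed=partition.rank)

n_local = 100_000
data = {
    "x": rng.random(n_local),
    "y": rng.random(n_local),
    "z": rng.random(n_local),
    "id": partition.rank * n_local + np.arange(n_local, dtype=np.int64),
}

# Split the exchange into 4 smaller all-to-all rounds; with the default
# all2all_iterations=1 the behavior matches the previous implementation.
data = distribute(partition, 1.0, data, ("x", "y", "z"), all2all_iterations=4)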

.flake8

Lines changed: 0 additions & 6 deletions
This file was deleted.

.github/workflows/pypi.yml

Lines changed: 4 additions & 4 deletions
@@ -14,15 +14,15 @@ jobs:
     steps:

       - name: check out
-        uses: actions/checkout@v2
+        uses: actions/checkout@v4
         with:
           fetch-depth: 0
           lfs: true

       - name: Setup Python
-        uses: actions/setup-python@v2
+        uses: actions/setup-python@v5
         with:
-          python-version: 3.8
+          python-version: 3.11

       - name: Install MPI
         uses: mpi4py/setup-mpi@v1
@@ -38,7 +38,7 @@ jobs:

       - name: Load cached venv
         id: cached-poetry-dependencies
-        uses: actions/cache@v2
+        uses: actions/cache@v4
         with:
           path: .venv
           key: venv-${{ runner.os }}-${{ steps.setup-python.outputs.python-version }}-${{ hashFiles('**/pyproject.toml') }}

.github/workflows/sphinx.yml

Lines changed: 4 additions & 4 deletions
@@ -13,15 +13,15 @@ jobs:
     steps:

       - name: check out
-        uses: actions/checkout@v2
+        uses: actions/checkout@v4
         with:
           fetch-depth: 0
           lfs: true

       - name: Setup Python
-        uses: actions/setup-python@v2
+        uses: actions/setup-python@v5
         with:
-          python-version: 3.8
+          python-version: 3.11

       - name: Install MPI
         uses: mpi4py/setup-mpi@v1
@@ -37,7 +37,7 @@ jobs:

       - name: Load cached venv
         id: cached-poetry-dependencies
-        uses: actions/cache@v2
+        uses: actions/cache@v4
         with:
           path: .venv
           key: venv-${{ runner.os }}-${{ steps.setup-python.outputs.python-version }}-${{ hashFiles('**/pyproject.toml') }}

.github/workflows/tests.yml

Lines changed: 10 additions & 4 deletions
@@ -13,7 +13,7 @@ jobs:
       - name: Setup Python
         uses: actions/setup-python@v5
         with:
-          python-version: "3.9"
+          python-version: "3.11"

       - name: Install MPI
         uses: mpi4py/setup-mpi@v1
@@ -29,17 +29,23 @@ jobs:

       - name: Load cached venv
         id: cached-poetry-dependencies
-        uses: actions/cache@v2
+        uses: actions/cache@v4
         with:
           path: .venv
           key: venv-${{ runner.os }}-${{ steps.setup-python.outputs.python-version }}-${{ hashFiles('**/pyproject.toml') }}

       - name: Install dependencies
         if: steps.cached-poetry-dependencies.outputs.cache-hit != 'true'
-        run: poetry install --no-interaction --no-root
+        run: poetry install --no-interaction --no-root --all-extras

       - name: Install library
-        run: poetry install --no-interaction
+        run: poetry install --no-interaction --all-extras
+
+      - name: MyPy Type checking
+        run: poetry run mypy --config-file mypy.ini --show-error-codes
+
+      - name: Ruff Linting
+        run: poetry run ruff check

       - name: Run MPI tests 2 ranks
         run: |

docs/conf.py

Lines changed: 11 additions & 6 deletions
@@ -17,14 +17,16 @@
 # relative to the documentation root, use os.path.abspath to make it
 # absolute, like shown here.
 #
-import os, sys, shutil, subprocess
+import os
+import sys
 import re
 from pathlib import Path
+from typing import TYPE_CHECKING

 DIR = Path(__file__).parent.resolve()
 sys.path.insert(0, os.path.abspath(".."))

-import mpipartition
+import mpipartition  # noqa: E402

 # -- General configuration ---------------------------------------------

@@ -128,7 +130,7 @@

 # -- Options for LaTeX output ------------------------------------------

-latex_elements = {
+latex_elements: dict[str, str] = {
     # The paper size ('letterpaper' or 'a4paper').
     #
     # 'papersize': 'letterpaper',
@@ -181,8 +183,11 @@
     ),
 ]

+if TYPE_CHECKING:
+    from sphinx.application import Sphinx

-def prepare(app):
+
+def prepare(app: Sphinx) -> None:
     with open(DIR.parent / "README.rst") as f:
         contents = f.read()

@@ -194,11 +199,11 @@ def prepare(app):
         f.write(contents)


-def clean_up(app, exception):
+def clean_up(app: Sphinx, exception: Exception) -> None:
     (DIR / "readme.rst").unlink()


-def setup(app):
+def setup(app: Sphinx) -> None:
     app.add_css_file("css/custom.css")
     # Copy the readme in
     app.connect("builder-inited", prepare)

mpipartition/_send_home.py

Lines changed: 127 additions & 0 deletions
@@ -0,0 +1,127 @@
+from __future__ import annotations
+import numpy as np
+from typing import TYPE_CHECKING
+from mpi4py import MPI
+import sys
+
+if TYPE_CHECKING:
+    from .partition import Partition
+    from .spherical_partition import S2Partition
+
+ParticleDataT = dict[str, np.ndarray]
+
+
+def distribute_dataset_by_home(
+    partition: Partition | S2Partition,
+    data: ParticleDataT,
+    home_idx: np.ndarray,
+    *,
+    verbose: int = 0,
+    verify_count: bool = True,
+    all2all_iterations: int = 1,
+) -> ParticleDataT:
+    total_to_send = len(home_idx)
+    nperiteration = total_to_send // all2all_iterations
+    data_new_list: list[ParticleDataT] = []
+
+    # Some general assertions that every rank has valid data
+    keys = list(data.keys())
+    keys_0 = partition.comm.bcast(keys, root=0)
+    assert len(keys) == len(keys_0)
+    assert all(k in keys_0 for k in keys)
+    dtype_string = "".join(data[k].dtype.char for k in keys_0)
+    dtype_string_0 = partition.comm.bcast(dtype_string, root=0)
+    assert dtype_string == dtype_string_0
+
+    for i in range(all2all_iterations):
+        start_idx = i * nperiteration
+        end_idx = (
+            (i + 1) * nperiteration if i < all2all_iterations - 1 else total_to_send
+        )
+        if partition.rank == 0 and verbose > 0:
+            print(f" - Distributing particles iteration {i + 1}/{all2all_iterations}")
+        _data = {k: v[start_idx:end_idx] for k, v in data.items()}
+        _home_idx = home_idx[start_idx:end_idx]
+        _data = _distribute_dataset_by_home(
+            partition,
+            _data,
+            _home_idx,
+            keys_0,
+            verbose=verbose,
+            verify_count=verify_count,
+        )
+        data_new_list.append(_data)
+    # concatenate the data
+    data_new = {k: np.concatenate([d[k] for d in data_new_list]) for k in data.keys()}
+    return data_new
+
+
+def _distribute_dataset_by_home(
+    partition: Partition | S2Partition,
+    data: ParticleDataT,
+    home_idx: np.ndarray,
+    keys: list[str],
+    *,
+    verbose: int = 0,
+    verify_count: bool = True,
+) -> ParticleDataT:
+    total_to_send = len(home_idx)
+    for d in data.values():
+        assert len(d) == total_to_send, "All data arrays must have the same length"
+
+    # sort by rank
+    s = np.argsort(home_idx)
+    home_idx = home_idx[s]
+
+    # offsets and counts
+    send_displacements = np.searchsorted(home_idx, np.arange(partition.nranks))
+    send_displacements = send_displacements.astype(np.int32)
+    send_counts = np.append(send_displacements[1:], total_to_send) - send_displacements
+    send_counts = send_counts.astype(np.int32)
+
+    # announce to each rank how many objects will be sent
+    recv_counts = np.empty_like(send_counts)
+    partition.comm.Alltoall(send_counts, recv_counts)
+    recv_displacements = np.insert(np.cumsum(recv_counts)[:-1], 0, 0)
+
+    # number of objects that this rank will receive
+    total_to_receive = np.sum(recv_counts)
+
+    # debug message
+    if verbose > 1:
+        for i in range(partition.nranks):
+            if partition.rank == i:
+                print(f"Distribute Debug Rank {i}")
+                print(f" - rank has {total_to_send} particles")
+                print(f" - rank receives {total_to_receive} particles")
+                print(f" - send_counts: {send_counts}")
+                print(f" - send_displacements: {send_displacements}")
+                print(f" - recv_counts: {recv_counts}")
+                print(f" - recv_displacements: {recv_displacements}")
+                print("", flush=True)
+            partition.comm.Barrier()
+
+    # send data all-to-all, each array individually
+    data_new = {k: np.empty(total_to_receive, dtype=data[k].dtype) for k in data.keys()}
+
+    for k in keys:
+        d = data[k][s]
+        s_msg = [d, (send_counts, send_displacements), d.dtype.char]
+        r_msg = [data_new[k], (recv_counts, recv_displacements), d.dtype.char]
+        partition.comm.Alltoallv(s_msg, r_msg)
+
+    if verify_count:
+        key0 = keys[0]
+        local_counts = np.array([len(data[key0]), len(data_new[key0])], dtype=np.int64)
+        global_counts = np.empty_like(local_counts)
+        partition.comm.Reduce(local_counts, global_counts, op=MPI.SUM, root=0)
+        if partition.rank == 0 and global_counts[0] != global_counts[1]:
+            print(
+                f"Error in distribute: particle count during distribute was not "
+                f"maintained ({global_counts[0]} -> {global_counts[1]})",
+                file=sys.stderr,
+                flush=True,
+            )
+            partition.comm.Abort()
+
+    return data_new
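The routing bookkeeping in _distribute_dataset_by_home sorts particles by destination rank and then derives send_counts and send_displacements with np.searchsorted. Below is a small MPI-free sketch of that counting step; the toy home_idx values are made up for illustration.

import numpy as np

# Toy example: 7 local particles destined for 4 ranks (values are made up).
nranks = 4
home_idx = np.array([2, 0, 3, 2, 0, 1, 2], dtype=np.int32)

# Sort particles by destination rank, as _distribute_dataset_by_home does.
s = np.argsort(home_idx)
home_idx_sorted = home_idx[s]

# First occurrence of each destination rank -> send displacements;
# differences of consecutive displacements -> per-destination counts.
send_displacements = np.searchsorted(home_idx_sorted, np.arange(nranks)).astype(np.int32)
send_counts = (
    np.append(send_displacements[1:], len(home_idx)) - send_displacements
).astype(np.int32)

print(send_displacements)  # [0 2 3 6]
print(send_counts)         # [2 1 3 1]

These count and displacement arrays are exactly what Alltoall/Alltoallv consume, so a rank that has nothing to send to a given destination simply contributes a zero count.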

mpipartition/distribute.py

Lines changed: 18 additions & 58 deletions
@@ -1,11 +1,12 @@
 import sys
-from typing import List, Mapping, Union
+from typing import List, Union

 import numpy as np

-from .partition import MPI, Partition
+from .partition import Partition
+from ._send_home import distribute_dataset_by_home

-ParticleDataT = Mapping[str, np.ndarray]
+ParticleDataT = dict[str, np.ndarray]


 def distribute(
@@ -16,6 +17,7 @@ def distribute(
     *,
     verbose: Union[bool, int] = False,
     verify_count: bool = True,
+    all2all_iterations: int = 1,
 ) -> ParticleDataT:
     """Distribute data among MPI ranks according to data position and volume partition

@@ -46,6 +48,10 @@ def distribute(
     verify_count:
         If True, make sure that total number of objects is conserved

+    all2all_iterations:
+        The number of iterations to use for the all-to-all communication.
+        This is useful for large datasets, where MPI_Alltoallv may fail
+
     Returns
     -------
     data: ParticleDataT
@@ -59,7 +65,7 @@ def distribute(
     if nranks == 1:
         return data

-    rank = partition.rank
+    # rank = partition.rank
     comm = partition.comm
     dimensions = partition.dimensions
     ranklist = np.array(partition.ranklist)
@@ -92,59 +98,13 @@ def distribute(
         # there are no particles on this rank
         home_idx = np.empty(0, dtype=np.int32)

-    # sort by rank
-    s = np.argsort(home_idx)
-    home_idx = home_idx[s]
-
-    # offsets and counts
-    send_displacements = np.searchsorted(home_idx, np.arange(nranks))
-    send_displacements = send_displacements.astype(np.int32)
-    send_counts = np.append(send_displacements[1:], total_to_send) - send_displacements
-    send_counts = send_counts.astype(np.int32)
-
-    # announce to each rank how many objects will be sent
-    recv_counts = np.empty_like(send_counts)
-    comm.Alltoall(send_counts, recv_counts)
-    recv_displacements = np.insert(np.cumsum(recv_counts)[:-1], 0, 0)
-
-    # number of objects that this rank will receive
-    total_to_receive = np.sum(recv_counts)
-
-    # debug message
-    if verbose > 1:
-        for i in range(nranks):
-            if rank == i:
-                print(f"Distribute Debug Rank {i}")
-                print(f" - rank has {total_to_send} particles")
-                print(f" - rank receives {total_to_receive} particles")
-                print(f" - send_counts: {send_counts}")
-                print(f" - send_displacements: {send_displacements}")
-                print(f" - recv_counts: {recv_counts}")
-                print(f" - recv_displacements: {recv_displacements}")
-                print(f"", flush=True)
-            comm.Barrier()
-
-    # send data all-to-all, each array individually
-    data_new = {k: np.empty(total_to_receive, dtype=data[k].dtype) for k in data.keys()}
-
-    for k in data.keys():
-        d = data[k][s]
-        s_msg = [d, (send_counts, send_displacements), d.dtype.char]
-        r_msg = [data_new[k], (recv_counts, recv_displacements), d.dtype.char]
-        comm.Alltoallv(s_msg, r_msg)
-
-    if verify_count:
-        local_counts = np.array(
-            [len(data[coord_keys[0]]), len(data_new[coord_keys[0]])], dtype=np.int64
-        )
-        global_counts = np.empty_like(local_counts)
-        comm.Reduce(local_counts, global_counts, op=MPI.SUM, root=0)
-        if rank == 0 and global_counts[0] != global_counts[1]:
-            print(
-                f"Error in distribute: particle count during distribute was not maintained ({global_counts[0]} -> {global_counts[1]})",
-                file=sys.stderr,
-                flush=True,
-            )
-            comm.Abort()
+    data_new = distribute_dataset_by_home(
+        partition,
+        data,
+        home_idx=home_idx,
+        verbose=verbose,
+        verify_count=verify_count,
+        all2all_iterations=all2all_iterations,
+    )

     return data_new
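The new consistency checks broadcast the key list and dtype signature from rank 0 and assert that every other rank matches, so callers must provide the same fields with the same dtypes on all ranks, including ranks that currently hold zero particles. A hedged sketch of the calling convention this implies (field names, dtypes, and the box_size argument are illustrative assumptions, not part of this commit):

import numpy as np
from mpipartition import Partition, distribute

partition = Partition()
rng = np.random.default_rng(seed=partition.rank)

# A rank with no local particles must still provide the same keys and dtypes,
# otherwise the bcast-based assertions in distribute_dataset_by_home fail.
n_local = 0 if partition.rank == 0 else 1_000
data = {
    "x": rng.random(n_local),                    # float64 on every rank
    "y": rng.random(n_local),
    "z": rng.random(n_local),
    "mass": np.ones(n_local, dtype=np.float32),  # float32 on every rank
}

data = distribute(partition, 1.0, data, ("x", "y", "z"))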
