# Source: squidpy/src/squidpy/experimental/im/_stain/_conversion.py at 2d7143c0885fd7e3d391ce280860d340435f1cca (scverse/squidpy on GitHub)

"""RGB <-> optical density (SDA) and RGB <-> Ruderman Lab conversions.

All functions operate on :class:`xarray.DataArray` with a channel dimension
named ``"c"`` of length 3. Numpy-backed and dask-backed inputs are both
supported transparently; nothing here forces materialisation of large arrays.
Each public function compiles down to a single :func:`xarray.apply_ufunc`
call so that dask schedules one task per chunk regardless of how many
elementwise and matrix steps the transform contains.
"""

from __future__ import annotations

import numpy as np
import xarray as xr

from squidpy.experimental.im._stain._constants import (
    RUDERMAN_LAB_TO_LMS,
    RUDERMAN_LMS_TO_LAB,
    RUDERMAN_LMS_TO_RGB,
    RUDERMAN_RGB_TO_LMS,
    SDA_SCALE,
)

# Name of the channel dimension that every converter in this module looks up
# on its input; `_check_channel_dim` requires it to be present with length 3.
_CHANNEL_DIM = "c"


def _check_channel_dim(arr: xr.DataArray) -> None:
    """Validate that ``arr`` carries the channel dimension with length 3.

    Raises
    ------
    ValueError
        If the dimension named by ``_CHANNEL_DIM`` is absent from
        ``arr.dims``, or is present with a length other than 3.
    """
    dims = arr.dims
    if _CHANNEL_DIM not in dims:
        raise ValueError(f"Input must have a dimension named {_CHANNEL_DIM!r}; got dims {dims}.")

    n_channels = arr.sizes[_CHANNEL_DIM]
    if n_channels != 3:
        raise ValueError(f"Channel dimension {_CHANNEL_DIM!r} must have length 3; got {n_channels}.")


def _working_dtype(arr: xr.DataArray) -> np.dtype:
    # Integer/uint inputs are promoted to float32 to keep dask graphs cheap
    # on whole-slide images; already-float inputs preserve caller dtype.
    return arr.dtype if np.issubdtype(arr.dtype, np.floating) else np.dtype(np.float32)


def _apply_along_channel(
    arr: xr.DataArray,
    kernel,
    *,
    out_dtype: np.dtype,
    **kwargs,
) -> xr.DataArray:
    """Run a per-chunk kernel that consumes and returns the channel axis.

    ``apply_ufunc`` moves the ``c`` core dim to the end of the output; we
    transpose back to the caller's original dim order so downstream
    consumers see a stable layout.

    Parameters
    ----------
    arr
        Input image. The caller is expected to have validated the channel
        dimension already (see ``_check_channel_dim``).
    kernel
        Callable invoked as ``kernel(block, **kwargs)`` where ``block`` is a
        numpy array whose last axis is the channel axis. It must return an
        array of the same shape.
    out_dtype
        Dtype declared to dask for the output.
    **kwargs
        Forwarded verbatim to ``kernel``.

    Returns
    -------
    DataArray with the same dimension order as ``arr``. The result stays
    lazy when ``arr`` is chunked.
    """
    original_dims = arr.dims

    # ``dask="parallelized"`` raises if a core dimension spans several
    # chunks, which happens for images stored with one chunk per channel.
    # Merging the channel axis into a single chunk is lazy and cheap (the
    # axis only has length 3), so do it here instead of failing.
    if arr.chunks is not None:
        channel_axis = arr.get_axis_num(_CHANNEL_DIM)
        if len(arr.chunks[channel_axis]) > 1:
            arr = arr.chunk({_CHANNEL_DIM: -1})

    out = xr.apply_ufunc(
        kernel,
        arr,
        input_core_dims=[[_CHANNEL_DIM]],
        output_core_dims=[[_CHANNEL_DIM]],
        kwargs=kwargs,
        dask="parallelized",
        output_dtypes=[out_dtype],
    )
    return out.transpose(*original_dims)


def _rgb_to_sda_kernel(x: np.ndarray, *, bg: np.ndarray, dtype: np.dtype) -> np.ndarray:
    """Per-chunk RGB -> SDA transform: ``-log((x + 1) / (bg + 1)) * SDA_SCALE``.

    ``bg`` is broadcast against ``x``; the result is returned in ``dtype``.
    """
    intensity = x.astype(dtype, copy=False)
    # Matched +1 offsets keep the ratio finite when a channel value is zero.
    transmittance = (intensity + 1.0) / (bg + 1.0)
    sda = -np.log(transmittance) * SDA_SCALE
    return sda.astype(dtype, copy=False)


def _sda_to_rgb_kernel(x: np.ndarray, *, bg: np.ndarray, dtype: np.dtype) -> np.ndarray:
    """Per-chunk SDA -> RGB transform, clipped to ``[0, 255]``.

    Computes ``(bg + 1) * exp(-x / SDA_SCALE) - 1`` and returns it in
    ``dtype``.
    """
    sda = x.astype(dtype, copy=False)
    attenuation = np.exp(-sda / SDA_SCALE)
    rgb = (bg + 1.0) * attenuation - 1.0
    # Clip in place: ``rgb`` is a fresh temporary, so no caller data is touched.
    np.clip(rgb, 0.0, 255.0, out=rgb)
    return rgb.astype(dtype, copy=False)


def _rgb_to_lab_kernel(x: np.ndarray, *, dtype: np.dtype) -> np.ndarray:
    """Per-chunk RGB -> Ruderman Lab transform.

    Steps: RGB -> LMS (matrix product over the last axis), ``log(LMS + 1)``,
    then LMS -> Lab (second matrix product). The result is returned in
    ``dtype``.
    """
    rgb_to_lms = RUDERMAN_RGB_TO_LMS.T.astype(dtype, copy=False)
    lms_to_lab = RUDERMAN_LMS_TO_LAB.T.astype(dtype, copy=False)

    pixels = x.astype(dtype, copy=False)
    log_lms = pixels @ rgb_to_lms
    # Overwrite the LMS buffer with its shifted logarithm to avoid keeping a
    # second chunk-sized array alive.
    np.log(log_lms + 1.0, out=log_lms)
    lab = log_lms @ lms_to_lab
    return lab.astype(dtype, copy=False)


def _lab_to_rgb_kernel(x: np.ndarray, *, dtype: np.dtype) -> np.ndarray:
    """Per-chunk Ruderman Lab -> RGB transform, clipped to ``[0, 255]``.

    Steps: Lab -> log-LMS (matrix product over the last axis),
    ``exp(.) - 1``, then LMS -> RGB (second matrix product). The result is
    returned in ``dtype``.
    """
    lab_to_lms = RUDERMAN_LAB_TO_LMS.T.astype(dtype, copy=False)
    lms_to_rgb = RUDERMAN_LMS_TO_RGB.T.astype(dtype, copy=False)

    lab = x.astype(dtype, copy=False)
    log_lms = lab @ lab_to_lms
    # The -1.0 here undoes the +1.0 applied before the log in
    # `_rgb_to_lab_kernel`, so the round trip stays consistent for valid RGB.
    lms = np.exp(log_lms) - 1.0
    rgb = lms @ lms_to_rgb
    np.clip(rgb, 0.0, 255.0, out=rgb)
    return rgb.astype(dtype, copy=False)


def rgb_to_sda(
    rgb: xr.DataArray,
    background_intensity: np.ndarray,
) -> xr.DataArray:
    """Convert RGB intensities to stain-darkness (SDA) space.

    Equivalent to optical density with a per-channel background ``I_0``::

        sda = -log((rgb + 1) / (I_0 + 1)) * SDA_SCALE

    The matched ``+1`` terms avoid ``log(0)`` at fully saturated black
    pixels and guarantee that pixels at the white point map exactly to
    zero. Scaling matches the HistomicsTK convention so that luminosity
    thresholds from the published H&E literature transfer directly.

    Parameters
    ----------
    rgb
        Image with a ``"c"`` dimension of length 3. May be numpy- or
        dask-backed; the operation is purely elementwise and stays lazy.
    background_intensity
        Per-channel white-point ``I_0`` as a shape-``(3,)`` numpy array.
        Required: no scanner produces a pure-white background, so the
        caller must supply either an estimate or, knowingly, an explicit
        ``np.array([255., 255., 255.])``.

    Returns
    -------
    SDA-space DataArray, float dtype, with the same dimension order as
    ``rgb``. Lazy if and only if ``rgb`` was lazy.

    Raises
    ------
    ValueError
        If ``rgb`` lacks a length-3 ``"c"`` dimension, or if
        ``background_intensity`` cannot broadcast against the channel axis.
    """
    _check_channel_dim(rgb)
    dtype = _working_dtype(rgb)
    bg = np.asarray(background_intensity, dtype=dtype)
    # The kernel broadcasts ``bg`` against a trailing channel axis of length
    # 3. A trailing length other than 1 or 3 can never broadcast, and for
    # lazy inputs that would only surface at compute time as an opaque numpy
    # error, so reject it up front.
    if bg.ndim > 0 and bg.shape[-1] not in (1, 3):
        raise ValueError(
            "`background_intensity` must broadcast against the length-3 channel axis "
            f"(expected shape (3,)); got shape {bg.shape}."
        )
    return _apply_along_channel(rgb, _rgb_to_sda_kernel, out_dtype=dtype, bg=bg, dtype=dtype)


def sda_to_rgb(
    sda: xr.DataArray,
    background_intensity: np.ndarray,
) -> xr.DataArray:
    """Convert SDA back to RGB intensities in ``[0, 255]``.

    Inverse of :func:`rgb_to_sda`::

        rgb = (I_0 + 1) * exp(-sda / SDA_SCALE) - 1

    Pass the same ``background_intensity`` used at encode time. The result
    is clipped to ``[0, 255]`` but kept in float dtype; uint8 conversion is
    the caller's choice.

    Parameters
    ----------
    sda
        SDA-space image with a ``"c"`` dimension of length 3. May be numpy-
        or dask-backed.
    background_intensity
        Per-channel white-point ``I_0`` as a shape-``(3,)`` numpy array.

    Returns
    -------
    RGB DataArray, float dtype, with the same dimension order as ``sda``.

    Raises
    ------
    ValueError
        If ``sda`` lacks a length-3 ``"c"`` dimension, or if
        ``background_intensity`` cannot broadcast against the channel axis.
    """
    _check_channel_dim(sda)
    dtype = _working_dtype(sda)
    bg = np.asarray(background_intensity, dtype=dtype)
    # The kernel broadcasts ``bg`` against a trailing channel axis of length
    # 3. A trailing length other than 1 or 3 can never broadcast, and for
    # lazy inputs that would only surface at compute time as an opaque numpy
    # error, so reject it up front.
    if bg.ndim > 0 and bg.shape[-1] not in (1, 3):
        raise ValueError(
            "`background_intensity` must broadcast against the length-3 channel axis "
            f"(expected shape (3,)); got shape {bg.shape}."
        )
    return _apply_along_channel(sda, _sda_to_rgb_kernel, out_dtype=dtype, bg=bg, dtype=dtype)


def rgb_to_lab_ruderman(rgb: xr.DataArray) -> xr.DataArray:
    """Map RGB into the decorrelated Lab space of Ruderman et al. (1998).

    This is the Lab variant that Reinhard et al. (2001) use for colour
    transfer. It is not CIE Lab, so values will not match
    :func:`skimage.color.rgb2lab`.

    The transform chains RGB -> LMS (:data:`RUDERMAN_RGB_TO_LMS`),
    ``log(LMS + 1)``, and LMS -> Lab (:data:`RUDERMAN_LMS_TO_LAB`); all
    three run inside one per-chunk numpy kernel.

    Parameters
    ----------
    rgb
        Image with a ``"c"`` dimension of length 3.

    Returns
    -------
    Lab-space DataArray, float dtype, with the same dimension order as
    ``rgb``.

    Raises
    ------
    ValueError
        If ``rgb`` lacks a length-3 ``"c"`` dimension.
    """
    _check_channel_dim(rgb)
    work_dtype = _working_dtype(rgb)
    return _apply_along_channel(
        rgb,
        _rgb_to_lab_kernel,
        out_dtype=work_dtype,
        dtype=work_dtype,
    )


def lab_ruderman_to_rgb(lab: xr.DataArray) -> xr.DataArray:
    """Map Ruderman Lab values back to RGB; inverse of :func:`rgb_to_lab_ruderman`.

    Parameters
    ----------
    lab
        Lab-space image with a ``"c"`` dimension of length 3.

    Returns
    -------
    RGB DataArray clipped to ``[0, 255]`` and kept in float dtype, with the
    same dimension order as ``lab``. Casting to uint8 is left to the caller.

    Raises
    ------
    ValueError
        If ``lab`` lacks a length-3 ``"c"`` dimension.
    """
    _check_channel_dim(lab)
    work_dtype = _working_dtype(lab)
    return _apply_along_channel(
        lab,
        _lab_to_rgb_kernel,
        out_dtype=work_dtype,
        dtype=work_dtype,
    )