Skip to content

Commit e722114

Browse files
authored
DAS-2292: regression test for the smap-l2-gridder (nasa#130)
1 parent 7baded6 commit e722114

16 files changed

+480
-50
lines changed

.gitattributes

+2
Original file line numberDiff line numberDiff line change
@@ -3,3 +3,5 @@ test/subset-band-name/reference_data/*.hdf filter=lfs diff=lfs merge=lfs -text
33
test/opera-rtc-s1-browse/reference_data/*.png filter=lfs diff=lfs merge=lfs -text
44
test/hybig/reference_data/**/*.png filter=lfs diff=lfs merge=lfs -text
55
test/hybig/reference_data/**/*.jpg filter=lfs diff=lfs merge=lfs -text
6+
test/smap-l2-gridder/reference_files/SPL2SMP_E_reference.nc filter=lfs diff=lfs merge=lfs -text
7+
test/smap-l2-gridder/reference_files/SPL2SMAP_reference.nc filter=lfs diff=lfs merge=lfs -text

.github/workflows/build-all-images.yml

+5
Original file line numberDiff line numberDiff line change
@@ -43,6 +43,11 @@ jobs:
4343
notebook: "SubsetBandName_Regression.ipynb"
4444
shared-utils: "true"
4545
lfs: "true"
46+
-
47+
image: "smap-l2-gridder"
48+
notebook: "smap-l2-gridder_Regression.ipynb"
49+
shared-utils: "true"
50+
lfs: "true"
4651
-
4752
image: "swath-projector"
4853
notebook: "SwathProjector_Regression.ipynb"

.github/workflows/notebook-test-suite.yml

+6-1
Original file line numberDiff line numberDiff line change
@@ -57,6 +57,7 @@ on:
5757
- hoss
5858
- hybig
5959
- query-cmr
60+
- smap-l2-gridder
6061
- subset-band-name
6162
- swath-projector
6263
- trajectory-subsetter
@@ -133,7 +134,11 @@ jobs:
133134
uses: actions/checkout@v4
134135

135136
- name: Pull Docker image
136-
run: docker pull ghcr.io/nasa/regression-tests-${{ matrix.service }}:${{ github.event.client_payload.docker-image-tag || inputs.docker-image-tag || 'latest' }}
137+
run: docker pull ghcr.io/${{github.repository_owner}}/regression-tests-${{ matrix.service }}:${{ github.event.client_payload.docker-image-tag || inputs.docker-image-tag || 'latest' }}
138+
139+
- name: Update Test Image Name
140+
run: |
141+
echo "REGRESSION_TESTS_$(echo "${{ matrix.service }}" | tr '[:lower:]' '[:upper:]' | tr '-' '_')_IMAGE=ghcr.io/${{ github.repository_owner }}/regression-tests-${{ matrix.service }}:${{ github.event.client_payload.docker-image-tag || inputs.docker-image-tag || 'latest' }}" >> $GITHUB_ENV
137142
138143
- name: Execute notebook
139144
id: test-step

CHANGELOG.md

+4
Original file line numberDiff line numberDiff line change
@@ -5,6 +5,10 @@ versioning. Rather than a static releases, this repository contains of a number
55
of regression tests that are each semi-independent. This CHANGELOG file should be used
66
to document pull requests to this repository.
77

8+
## 2025-01-31 ([#130](https://github.com/nasa/harmony-regression-tests/pull/130))
9+
10+
- Add tests and configuration for harmony-smap-l2-gridder.
11+
812
## 2024-12-20([#126](https://github.com/nasa/harmony-regression-tests/pull/126))
913

1014
- Update configuration to run `opera-rtc-s1-browse` tests on HyBIG deployments.

README.md

+2-2
Original file line numberDiff line numberDiff line change
@@ -229,7 +229,7 @@ channels:
229229
- conda-forge
230230
- nodefaults
231231
dependencies:
232-
- python=3.11
232+
- python=3.12
233233
- jupyter
234234
- requests
235235
- netcdf4
@@ -243,7 +243,7 @@ dependencies:
243243

244244
### Versioning
245245

246-
The regression test notebooks follow semantic versioning:
246+
The regression test notebooks try to follow semantic versioning:
247247

248248
```
249249
major.minor.patch
+21-20
Original file line numberDiff line numberDiff line change
@@ -1,22 +1,23 @@
11
{
2-
"all": "harmony,harmony-regression,geoloco,hga,n2z,regridder,hoss,hybig,net2cog,subset-band-name,swath-projector,nsidc-icesat2,trajectory-subsetter,opera-rtc-s1-browse",
3-
"batchee": "TBD",
4-
"geoloco": "geoloco",
5-
"giovanni-adapter": "TBD",
6-
"harmony-gdal-adapter": "hga",
7-
"harmony-netcdf-to-zarr": "n2z",
8-
"harmony-regridder": "regridder",
9-
"harmony-service-example": "harmony-regression",
10-
"hoss": "hoss",
11-
"hybig": "hybig,opera-rtc-s1-browse",
12-
"net2cog": "net2cog",
13-
"podaac-concise": "TBD",
14-
"podaac-l2-subsetter": "TBD",
15-
"query-cmr": "geoloco",
16-
"sds-maskfill": "TBD",
17-
"stitchee": "TBD",
18-
"subset-band-name": "subset-band-name",
19-
"swath-projector": "swath-projector",
20-
"trajectory-subsetter": "nsidc-icesat2,trajectory-subsetter",
21-
"opera-rtc-s1-browse": "opera-rtc-s1-browse"
2+
"all": "harmony,harmony-regression,geoloco,hga,n2z,regridder,hoss,hybig,net2cog,smap-l2-gridder,subset-band-name,swath-projector,nsidc-icesat2,trajectory-subsetter,opera-rtc-s1-browse",
3+
"batchee": "TBD",
4+
"geoloco": "geoloco",
5+
"giovanni-adapter": "TBD",
6+
"harmony-gdal-adapter": "hga",
7+
"harmony-netcdf-to-zarr": "n2z",
8+
"harmony-regridder": "regridder",
9+
"harmony-service-example": "harmony-regression",
10+
"hoss": "hoss",
11+
"hybig": "hybig,opera-rtc-s1-browse",
12+
"net2cog": "net2cog",
13+
"podaac-concise": "TBD",
14+
"podaac-l2-subsetter": "TBD",
15+
"query-cmr": "geoloco",
16+
"smap-l2-gridder": "smap-l2-gridder",
17+
"sds-maskfill": "TBD",
18+
"stitchee": "TBD",
19+
"subset-band-name": "subset-band-name",
20+
"swath-projector": "swath-projector",
21+
"trajectory-subsetter": "nsidc-icesat2,trajectory-subsetter",
22+
"opera-rtc-s1-browse": "opera-rtc-s1-browse"
2223
}

config/services_tests_config_uat.json

+21-20
Original file line numberDiff line numberDiff line change
@@ -1,22 +1,23 @@
11
{
2-
"all": "harmony,harmony-regression,geoloco,hga,n2z,regridder,hoss,variable-subsetter,hybig,net2cog,subset-band-name,swath-projector,nsidc-icesat2,trajectory-subsetter,opera-rtc-s1-browse",
3-
"batchee": "TBD",
4-
"geoloco": "geoloco",
5-
"giovanni-adapter": "TBD",
6-
"harmony-gdal-adapter": "hga",
7-
"harmony-netcdf-to-zarr": "n2z",
8-
"harmony-regridder": "regridder",
9-
"harmony-service-example": "harmony-regression",
10-
"hoss": "hoss, variable-subsetter",
11-
"hybig": "hybig,opera-rtc-s1-browse",
12-
"net2cog": "net2cog",
13-
"podaac-concise": "TBD",
14-
"podaac-l2-subsetter": "TBD",
15-
"query-cmr": "variable-subsetter",
16-
"sds-maskfill": "TBD",
17-
"stitchee": "TBD",
18-
"subset-band-name": "subset-band-name",
19-
"swath-projector": "swath-projector",
20-
"trajectory-subsetter": "nsidc-icesat2,trajectory-subsetter",
21-
"opera-rtc-s1-browse": "opera-rtc-s1-browse"
2+
"all": "harmony,harmony-regression,geoloco,hga,n2z,regridder,hoss,variable-subsetter,hybig,net2cog,smap-l2-gridder,subset-band-name,swath-projector,nsidc-icesat2,trajectory-subsetter,opera-rtc-s1-browse",
3+
"batchee": "TBD",
4+
"geoloco": "geoloco",
5+
"giovanni-adapter": "TBD",
6+
"harmony-gdal-adapter": "hga",
7+
"harmony-netcdf-to-zarr": "n2z",
8+
"harmony-regridder": "regridder",
9+
"harmony-service-example": "harmony-regression",
10+
"hoss": "hoss, variable-subsetter",
11+
"hybig": "hybig,opera-rtc-s1-browse",
12+
"net2cog": "net2cog",
13+
"podaac-concise": "TBD",
14+
"podaac-l2-subsetter": "TBD",
15+
"query-cmr": "variable-subsetter",
16+
"smap-l2-gridder": "smap-l2-gridder",
17+
"sds-maskfill": "TBD",
18+
"stitchee": "TBD",
19+
"subset-band-name": "subset-band-name",
20+
"swath-projector": "swath-projector",
21+
"trajectory-subsetter": "nsidc-icesat2,trajectory-subsetter",
22+
"opera-rtc-s1-browse": "opera-rtc-s1-browse"
2223
}

script/test-in-bamboo.sh

+18-1
Original file line numberDiff line numberDiff line change
@@ -42,7 +42,24 @@ echo "harmony host url: ${harmony_host_url}"
4242
## e.g. if REGRESSION_TESTS_N2Z_IMAGE environment was set, the value would be used instead of the default.
4343

4444
image_names=()
45-
all_tests=(harmony harmony-regression hoss hga n2z nsidc-icesat2 swath-projector trajectory-subsetter variable-subsetter regridder hybig geoloco net2cog subset-band-name opera-rtc-s1-browse)
45+
all_tests=(
46+
geoloco
47+
harmony
48+
harmony-regression
49+
hga
50+
hoss
51+
hybig
52+
n2z
53+
net2cog
54+
nsidc-icesat2
55+
opera-rtc-s1-browse
56+
regridder
57+
smap-l2-gridder
58+
subset-band-name
59+
swath-projector
60+
trajectory-subsetter
61+
variable-subsetter
62+
)
4663
for image in "${all_tests[@]}"; do
4764
image_names+=($(image_name "$image" true))
4865
done

test/Makefile

+6
Original file line numberDiff line numberDiff line change
@@ -31,6 +31,11 @@ regridder-image: Dockerfile regridder/environment.yaml
3131
docker build -t ghcr.io/nasa/regression-tests-regridder:latest -f ./Dockerfile \
3232
--build-arg notebook=Regridder_Regression.ipynb --build-arg sub_dir=regridder .
3333

34+
smap-l2-gridder-image: Dockerfile smap-l2-gridder/environment.yaml
35+
docker build -t ghcr.io/nasa/regression-tests-smap-l2-gridder:latest -f ./Dockerfile \
36+
--build-arg notebook=smap-l2-gridder_Regression.ipynb --build-arg sub_dir=smap-l2-gridder \
37+
--build-arg shared_utils=true .
38+
3439
swath-projector-image: Dockerfile swath-projector/environment.yaml
3540
docker build -t ghcr.io/nasa/regression-tests-swath-projector:latest -f ./Dockerfile \
3641
--build-arg notebook=SwathProjector_Regression.ipynb --build-arg sub_dir=swath-projector .
@@ -69,6 +74,7 @@ images: harmony-image \
6974
n2z-image \
7075
nsidc-icesat2-image \
7176
regridder-image \
77+
smap-l2-gridder-image \
7278
subset-band-name-image \
7379
swath-projector-image \
7480
trajectory-subsetter-image \

test/run_notebooks.sh

+18-1
Original file line numberDiff line numberDiff line change
@@ -15,7 +15,24 @@ echo "Running regression tests"
1515

1616
# Specify the test images to run, by default all built by the Makefile. If
1717
# the script is invoked with a list of images, only run those.
18-
all_images=(harmony harmony-regression hoss hga n2z nsidc-icesat2 swath-projector trajectory-subsetter variable-subsetter regridder hybig geoloco net2cog subset-band-name opera-rtc-s1-browse)
18+
all_images=(
19+
geoloco
20+
harmony
21+
harmony-regression
22+
hga
23+
hoss
24+
hybig
25+
n2z
26+
net2cog
27+
nsidc-icesat2
28+
opera-rtc-s1-browse
29+
regridder
30+
smap-l2-gridder
31+
subset-band-name
32+
swath-projector
33+
trajectory-subsetter
34+
variable-subsetter
35+
)
1936
specified_images=()
2037
# Parse command line arguments
2138
while [[ $# -gt 0 ]]; do

test/shared_utils/compare.py

+58-5
Original file line numberDiff line numberDiff line change
@@ -18,17 +18,35 @@ def compare_results_to_reference_file(
1818
reference_file_name: str,
1919
identical: bool = True,
2020
coordinates_to_fix: list[str] | None = None,
21+
subset_selector: dict | None = None,
2122
) -> None:
22-
"""Use `DataTree` functionality to compare data values, variables,
23-
coordinates, metadata, and all their corresponding attributes of
24-
downloaded results to a reference file.
23+
"""Compare two files as DataTrees
24+
25+
Args:
26+
results_file_name: Path to the results file to validate
27+
28+
reference_file_name: Path to the reference file to compare against
29+
30+
identical: If True, use strict comparison including attributes; if
31+
False, compare only values
32+
33+
coordinates_to_fix: List of coordinate names to be renamed in the case
34+
that the input has "unalignable" names.
35+
36+
subset_selector: Dict of top level group names to selection
37+
dictionaries used to subset the input DataTree to the
38+
previously subsetted reference data. (see
39+
`subset_datatree`'s doc string for more information)
40+
41+
Raises:
42+
AssertionError: when files don't match according to comparison criteria.
2543
2644
"""
2745
if coordinates_to_fix is None:
2846
coordinates_to_fix = []
2947

30-
reference_groups = open_groups(reference_file_name)
31-
results_groups = open_groups(results_file_name)
48+
reference_groups = open_groups(reference_file_name, decode_times=False)
49+
results_groups = open_groups(results_file_name, decode_times=False)
3250

3351
# Fix unalignable coordinates
3452
for coord in coordinates_to_fix:
@@ -38,6 +56,10 @@ def compare_results_to_reference_file(
3856
reference_data = DataTree.from_dict(reference_groups)
3957
results_data = DataTree.from_dict(results_groups)
4058

59+
# Limit comparison of data
60+
if subset_selector is not None:
61+
results_data = subset_datatree(results_data, subset_selector)
62+
4163
if identical:
4264
assert results_data.identical(
4365
reference_data
@@ -51,6 +73,37 @@ def compare_results_to_reference_file(
5173
results_data = None
5274

5375

76+
def subset_datatree(dt: DataTree, selectors: dict[str, dict]) -> DataTree:
77+
"""Using a selector dictionary return a subset of the input DataTree.
78+
79+
Args:
80+
dt: Input Datatree to subset
81+
selectors: Dictionary mapping top level group names to dictionaries,
82+
where each dictionary contains dimension names to indices
83+
selected by slice.
84+
85+
a sample selector dictionary:
86+
selectors = {
87+
"Soil_Moisture_Retrieval_Data_3km": {
88+
"y-dim": slice(1000, 2000),
89+
"x-dim": slice(8800, 9800),
90+
},
91+
"Soil_Moisture_Retrieval_Data": {
92+
"y-dim": slice(0, 1000),
93+
"x-dim": slice(2500, 3500),
94+
},
95+
}
96+
97+
This is used to subset the SPL2SMAP granule, the data groups are the keys
98+
and the dimensions are subset into 1000x1000 grids that include valid
99+
output data.
100+
"""
101+
out_dt = dt.copy()
102+
for group_name, slices in selectors.items():
103+
out_dt[group_name] = out_dt[group_name].isel(slices)
104+
return out_dt
105+
106+
54107
def unalign_groups(
55108
dict_of_datasets: dict[str, Dataset], coordinate: str
56109
) -> dict[str, Dataset]:

test/smap-l2-gridder/environment.yaml

+14
Original file line numberDiff line numberDiff line change
@@ -0,0 +1,14 @@
1+
name: papermill-smap-l2-gridder
2+
channels:
3+
- conda-forge
4+
- nodefaults
5+
dependencies:
6+
- python=3.12
7+
- netCDF4=1.7.2
8+
- notebook=7.2.2
9+
- numpy=2.1.3
10+
- papermill=2.6.0
11+
- pip
12+
- pip:
13+
- harmony-py==0.4.15
14+
- xarray==2025.1.2
Original file line numberDiff line numberDiff line change
@@ -0,0 +1,3 @@
1+
version https://git-lfs.github.com/spec/v1
2+
oid sha256:3acdb7f4643f7b78a8a476d7fd7f30799c08fdd5e97d1d6c5099f94161ce3e38
3+
size 8324662
Original file line numberDiff line numberDiff line change
@@ -0,0 +1,3 @@
1+
version https://git-lfs.github.com/spec/v1
2+
oid sha256:befba2b98fea018e6dce1d2f9cd3a284c3577894d7134791abcbba5d404e4720
3+
size 18809225

0 commit comments

Comments
 (0)