E3SM-Project
diff --git a/‎components/eamxx/cime_config/SystemTests/est.py‎
Lines changed: 198 additions & 0 deletions b/‎components/eamxx/cime_config/SystemTests/est.py‎
Lines changed: 198 additions & 0 deletions
diff --git a/‎components/eamxx/cime_config/SystemTests/est_perts.py‎
Lines changed: 86 additions & 0 deletions b/‎components/eamxx/cime_config/SystemTests/est_perts.py‎
Lines changed: 86 additions & 0 deletions
@@ -0,0 +1,198 @@
+"""
+Ensemble Statistical Test using multi-instance capability.
+
+This test runs multiple EAMxx instances with different perturbation seeds
+and uses statistical tests to check that the resulting climate state is
+statistically indistinguishable from that of the baseline ensemble.
+
+EST inherits from SystemTestsCommon and only overrides:
+- setup_phase (to setup multi-instance with per-instance perturbed seeds)
+- _generate_baseline (move needed hist files to baseline directory)
+- _compare_baseline methods (to run the statistical tests)
+
+EST relies on two util files:
+- est_perts.py: functions to duplicate and modify yaml files
+- est_stats.py: functions to conduct statistical testing
+"""
+
+import os
+import glob
+import logging
+import sys
+
+import CIME.test_status
+import CIME.utils
+from CIME.status import append_testlog
+from CIME.SystemTests.system_tests_common import SystemTestsCommon
+from CIME.case.case_setup import case_setup
+
+logger = logging.getLogger(__name__)
+
+
+# pylint: disable=too-few-public-methods
+class EST(SystemTestsCommon):
+    """Ensemble Statistical Test using multi-instance capability.
+
+    YAML editing lives in ``est_perts``; the statistics in ``est_stats``.
+    """
+
+    @staticmethod
+    def _require_sibling(file_name):
+        """Check ``file_name`` sits next to this file; make it importable.
+
+        Raises:
+            ImportError: If ``file_name`` does not exist next to this file.
+        """
+        here = os.path.dirname(__file__)
+        sibling = os.path.join(here, file_name)
+        if not os.path.exists(sibling):
+            raise ImportError(f"Cannot find {file_name} at {sibling}")
+        if here not in sys.path:
+            sys.path.insert(0, here)
+
+    # pylint: disable=too-many-arguments, too-many-positional-arguments
+    def setup_phase(
+        self,
+        clean=False,
+        test_mode=False,
+        reset=False,
+        keep=False,
+        disable_git=False,
+    ):
+        """Set up the case and create per-instance perturbed YAML inputs.
+
+        Raises:
+            ValueError: If ``NINST_ATM`` is not greater than 1.
+            ImportError: If ``est_perts.py`` is not next to this file.
+            FileNotFoundError: If a per-instance YAML copy is missing.
+        """
+        # first call the parent method and flush
+        self.setup_indv(
+            clean=clean,
+            test_mode=test_mode,
+            reset=reset,
+            keep=keep,
+            disable_git=disable_git,
+        )
+        self._case.flush()
+        # NOTE(review): why a second setup pass (reset=True) is needed: confirm
+        case_setup(self._case, test_mode=False, reset=True)
+
+        run_dir = self._case.get_value("RUNDIR")
+        n_inst = int(self._case.get_value("NINST_ATM"))
+        # we really don't want people to run this test with n_inst=1
+        if n_inst <= 1:
+            msg = (
+                f"NINST_ATM = {n_inst}. This test requires NINST_ATM > 1. "
+                "Consider setting NINST_ATM > 1 in your env_run.xml "
+                "or use _C# specifier in test name for a multi-driver "
+                "multi-instance setup (producing # pelayout copies), "
+                "or _N# for a single-driver multi-instance setup "
+                "(dividing specified pelayout among # instances)."
+            )
+            raise ValueError(msg)
+
+        self._require_sibling("est_perts.py")
+        # pylint: disable=import-outside-toplevel
+        from est_perts import duplicate_yaml_file, update_yaml_file
+
+        # update mode -> template file that gets one copy per instance
+        templates = {
+            "pert": f"{run_dir}/data/scream_input.yaml",
+            "out": f"{run_dir}/data/monthly_average.yaml",
+        }
+        for template in templates.values():
+            duplicate_yaml_file(template, n_inst)
+
+        # give every instance its own seed and its own output file names
+        for i in range(1, n_inst + 1):
+            copies = [(m, f"{t}_{i:04d}") for m, t in templates.items()]
+            for _, path in copies:
+                if not os.path.isfile(path):
+                    raise FileNotFoundError(f"File {path} does not exist.")
+            for mode, path in copies:
+                update_yaml_file(path, i, mode)
+
+    def _generate_baseline(self):
+        """Generate the parent baseline, then add the ensemble history files.
+
+        Every ``*scream_????.h.AVERAGE.*.nc`` file found in ``RUNDIR`` is
+        copied to ``BASELINE_ROOT/BASEGEN_CASE``, replacing an existing copy.
+        """
+        super()._generate_baseline()
+
+        with CIME.utils.SharedArea():
+            base_gen_dir = os.path.join(
+                self._case.get_value("BASELINE_ROOT"),
+                self._case.get_value("BASEGEN_CASE"),
+            )
+            run_dir = self._case.get_value("RUNDIR")
+
+            pattern = os.path.join(run_dir, "*scream_????.h.AVERAGE.*.nc")
+            hists = sorted(glob.glob(pattern))
+            if not hists:
+                # make an empty match visible instead of silently copying nothing
+                logger.warning("No history files match %s", pattern)
+
+            for src in hists:
+                tgt = os.path.join(base_gen_dir, os.path.basename(src))
+                # remove baselines if they exist
+                # this is safe because cime forces users to use -o
+                if os.path.exists(tgt):
+                    os.remove(tgt)
+
+                logger.info(
+                    "Copying ... \n \t %s \n ... to ... \n \t %s \n\n",
+                    src, tgt
+                )
+                CIME.utils.safe_copy(src, tgt, preserve_meta=False)
+
+    def _compare_baseline(self):
+        """Compare this run's ensemble against the baseline ensemble.
+
+        Sets ``BASELINE_PHASE`` to PASS or FAIL according to the result of
+        ``est_stats.run_stats_comparison`` and appends its comments to the
+        test log. When ``RESUBMIT`` > 0 the phase is marked PASS without
+        running the comparison.
+        """
+        with self._test_status as ts:
+            # if we are resubmitting, then we don't do the comparison
+            if int(self._case.get_value("RESUBMIT")) > 0:
+                ts.set_status(
+                    CIME.test_status.BASELINE_PHASE,
+                    CIME.test_status.TEST_PASS_STATUS
+                )
+                return
+
+            # set to FAIL to start with, will update later
+            ts.set_status(
+                CIME.test_status.BASELINE_PHASE,
+                CIME.test_status.TEST_FAIL_STATUS
+            )
+
+            run_dir = self._case.get_value("RUNDIR")
+            base_dir = os.path.join(
+                self._case.get_value("BASELINE_ROOT"),
+                self._case.get_value("BASECMP_CASE"),
+            )
+
+            self._require_sibling("est_stats.py")
+            # import the whole module here to avoid import errors of needed pkgs
+            # pylint: disable=import-outside-toplevel
+            import est_stats as est
+            comments, new_ts = est.run_stats_comparison(
+                run_dir,
+                base_dir,
+                analysis_type="spatiotemporal",
+                test_type="ks",
+                alpha=0.01,
+            )
+
+            if new_ts == "PASS":
+                out_ts = CIME.test_status.TEST_PASS_STATUS
+            else:
+                out_ts = CIME.test_status.TEST_FAIL_STATUS
+
+            # log the results and set the test status
+            append_testlog(comments, self._orig_caseroot)
+            ts.set_status(CIME.test_status.BASELINE_PHASE, out_ts)
@@ -0,0 +1,86 @@
+"""
+Perturbation functions for EST system test.
+"""
+
+import os
+import shutil
+
+
+def duplicate_yaml_file(yaml_file, num_copies):
+    """Copy ``yaml_file`` to ``<yaml_file>_0001`` ... ``<yaml_file>_NNNN``."""
+    if not os.path.isfile(yaml_file):
+        raise FileNotFoundError(f"The file {yaml_file} does not exist.")
+
+    # copies are numbered from 1, zero-padded to four digits
+    targets = (f"{yaml_file}_{idx:04d}" for idx in range(1, num_copies + 1))
+    for target in targets:
+        shutil.copyfile(yaml_file, target)
+
+
+def update_yaml_file(yaml_file, seed, pert_out):
+    """Rewrite one per-instance YAML copy in place for instance ``seed``.
+
+    Args:
+        yaml_file: Path of the YAML file to modify.
+        seed: Instance number; written as the perturbation seed and, padded
+            to four digits, used as the file-name suffix.
+        pert_out: ``"pert"`` sets ``perturbation_random_seed`` and renames
+            ``monthly_average.yaml`` references; ``"out"`` renames
+            ``.scream`` on the ``filename_prefix:`` line.
+
+    Raises:
+        ValueError: If ``pert_out`` is neither ``"pert"`` nor ``"out"``, or
+            a required entry is not found (the file is then left untouched).
+    """
+    if pert_out not in ("pert", "out"):
+        raise ValueError(f"Unknown pert_out '{pert_out}' for {yaml_file}")
+
+    with open(yaml_file, "r", encoding="utf-8") as file:
+        lines = file.readlines()
+
+    tag = f"_{seed:04d}"
+    is_pert = pert_out == "pert"
+    found = set()
+    new_lines = []
+    # edit matching lines and remember which required entries were seen
+    for line in lines:
+        entry = line.strip()
+        if is_pert and entry.startswith("perturbation_random_seed:"):
+            line = _set_seed_value(line, seed)
+            found.add("seed")
+        elif is_pert and "monthly_average.yaml" in entry:
+            line = line.replace(
+                "monthly_average.yaml", f"monthly_average.yaml{tag}"
+            )
+            found.add("output")
+        elif not is_pert and entry.startswith("filename_prefix:"):
+            line = line.replace(".scream", f".scream{tag}")
+            found.add("prefix")
+        new_lines.append(line)
+
+    # validate before writing so a failed update leaves the file unchanged
+    if is_pert and "seed" not in found:
+        raise ValueError(f"'perturbation_random_seed' NOT in {yaml_file}")
+    if is_pert and "output" not in found:
+        raise ValueError(f"'monthly_average.yaml' NOT in {yaml_file}")
+    if not is_pert and "prefix" not in found:
+        raise ValueError(f"Couldn't find 'filename_prefix' in {yaml_file}")
+
+    with open(yaml_file, "w", encoding="utf-8") as file:
+        file.writelines(new_lines)
+
+
+def _set_seed_value(line, seed):
+    """Return ``line`` with its seed value replaced by ``seed``.
+
+    Any existing value is replaced, not only the default ``0``; a trailing
+    comment and the line ending are kept.
+    """
+    head, key, tail = line.partition("perturbation_random_seed:")
+    rest = tail.lstrip(" \t")
+    gap = tail[: len(tail) - len(rest)] or " "
+    old = rest.split(None, 1)[0] if rest.strip() else ""
+    if old.startswith("#"):
+        # no value at all, only a comment: keep it separated from the seed
+        return f"{head}{key}{gap}{seed} {rest}"
+    return f"{head}{key}{gap}{seed}{rest[len(old):]}"