add dashboard scripts and unified compy cron job

jaelynlitz · jaelynlitz · commit 2b410bbe4921 · 2025-08-01T17:58:27.000-07:00
diff --git a/jenkins/compy_cron.sh b/jenkins/compy_cron.sh
@@ -0,0 +1,84 @@
+#!/bin/bash
+
+main() {
+
+    #---------------------------------------------------------------
+    # User-defined configuration
+    #---------------------------------------------------------------
+    #path to E3SM
+    code_root="/compyfs/litz372/e3sm_scratch/performance_testing/E3SM"
+    
+    #machine to run the test on
+    mach="compy"
+
+    #compiler
+    compiler=intel
+
+    #set resolution
+    resolution=ne30pg2_ne30pg2
+
+    #set the length of the simulation (ie Ld5 for 5 days or Ln5 for 5 timesteps) 
+    simulation_length=Ld5
+
+    #directory for all the past and current data
+    data_dest="/qfs/projects/eagles/litz372/performance_data/${simulation_length}"
+
+    #path where the latest time series plot is saved, accessible to the whole project
+    share_dest="/compyfs/www/litz372/performance_data"
+    
+    #url where the plot will be available - based on the share_dest
+    share_url_ne30="https://compy-dtn.pnl.gov/litz372/performance_data/performance_comp_${resolution}_${simulation_length}.png"
+
+    #load modules
+    source /etc/profile.d/modules.sh
+    module load python/3.11.5
+
+    ulimit -d unlimited
+    ulimit -s unlimited
+    ulimit -c unlimited
+
+    #---------------------------------------------------------------
+    # User-defined configuration ENDs
+    #---------------------------------------------------------------
+
+    #---------------------------------------------------------------
+    # RUN NE30 SIMULATION 
+    #---------------------------------------------------------------
+
+    /compyfs/litz372/e3sm_scratch/performance_testing/E3SM_test_scripts/jenkins/mam4xx_compare_performance.sh -r $resolution -c $compiler -t $simulation_length -m $mach -p $code_root -d $data_dest -s $share_dest -u $share_url_ne30
+
+    #---------------------------------------------------------------
+    # RUN NE4 SIMULATION 
+    #---------------------------------------------------------------
+
+    resolution=ne4pg2_ne4pg2
+    share_url_ne4="https://compy-dtn.pnl.gov/litz372/performance_data/performance_comp_${resolution}_${simulation_length}.png"
+    /compyfs/litz372/e3sm_scratch/performance_testing/E3SM_test_scripts/jenkins/mam4xx_compare_performance.sh -r $resolution -c $compiler -t $simulation_length -m $mach -p $code_root -d $data_dest -s $share_dest -u $share_url_ne4
+
+    #---------------------------------------------------------------
+    # RUN PERFORMANCE BREAKDOWN 
+    #---------------------------------------------------------------
+
+    module unload python
+    module load python/miniconda4.12.0
+    /compyfs/litz372/e3sm_scratch/compare_model_performance/E3SM_test_scripts/jenkins/compy_model_performance.sh
+
+    #---------------------------------------------------------------
+    # APPEND LINE GRAPHS TO BREAKDOWN 
+    #---------------------------------------------------------------
+
+    #plot line in dash comp
+    source ${code_root}/../.venv/bin/activate
+    output_graph=${share_dest}/../compare_performance/plot.html
+    echo $share_url_ne4 
+    echo $share_url_ne30
+    echo $output_graph
+    python3 /compyfs/litz372/e3sm_scratch/compare_model_performance/E3SM_test_scripts/jenkins/plot_html.py -i ${share_url_ne4} -o ${output_graph} 
+    python3 /compyfs/litz372/e3sm_scratch/compare_model_performance/E3SM_test_scripts/jenkins/plot_html.py -i ${share_url_ne30} -o ${output_graph} 
+
+}
+
+#--------------------------
+# Start the script
+#--------------------------
+main 
diff --git a/jenkins/compy_model_performance.sh b/jenkins/compy_model_performance.sh
@@ -0,0 +1,206 @@
+#!/bin/bash
+
+#-------------------------------------------------------------------------------
+#-------------------------------------------------------------------------------
+# Description:
+#   This script automates the process of comparing model performance between master and development branches of E3SM.
+#
+# Usage:
+#   Customize the user input section below before running the script.
+#---------------------------------------------------------------------------
+#---------------------------------------------------------------------------
+
+main() {
+
+    #---------------------------------------------------------------
+    # User-defined configuration
+    #---------------------------------------------------------------
+
+    # Perlmutter
+    # machine=pm-cpu 
+    # compiler=gnu 
+    # project=e3sm 
+    # workdir=/pscratch/sd/m/meng/compare_model_performance 
+    # plotdir=/global/cfs/cdirs/e3sm/www/meng/compare_performance  # make sure this a www in your Community directory to check the plot as a html page
+    # html_address=https://portal.nersc.gov/cfs/e3sm/meng/compare_performance
+    # module load python 
+
+    # Compy
+    machine=compy
+    compiler=intel
+    project=e3sm 
+    workdir=/compyfs/litz372/e3sm_scratch/compare_model_performance 
+    plotdir=/compyfs/www/litz372/compare_performance
+    html_address=https://compy-dtn.pnl.gov/litz372/compare_performance  
+    source /etc/profile.d/modules.sh
+    module load python/miniconda4.12.0 
+    source /share/apps/python/miniconda4.12.0/etc/profile.d/conda.sh
+    source ${workdir}/venv/bin/activate
+
+    if [ ! -d $plotdir ]; then
+        mkdir -p $plotdir 
+    fi
+
+    compset=F2010-EAMxx-MAM4xx   #F2010-SCREAMv1 
+#    resolution=ne4pg2_oQU480 
+    resolution=ne30pg2_ne30pg2
+    pe=P32
+    runtime=Ln5 
+    queue=debug
+    wallclock_time=00:05:00
+
+    # SMS test run
+    case=SMS_$pe_$runtime.$resolution.$compset.${machine}_$compiler
+
+    branch1=master
+
+    datestr=`date +'%Y%m%d_%H%M%S'`
+    casename1=master
+
+    code_root1=$workdir/E3SM-$casename1 
+
+    do_fetch_code=true
+    do_run_case=true
+
+    # If you only need to tweak the plot, set the plot_str to the date string of the run.
+    do_plot=true 
+    #plot_str=20250703_030001
+
+    #---------------------------------------------------------------
+    # User-defined configuration ENDs
+    #---------------------------------------------------------------
+
+    # Fetch code from GitHub 
+    fetch_code $branch1 $code_root1 &
+    wait 
+
+    if [ $? != 0 ]; then
+        echo "Error fetching code from GitHub"
+        exit 1
+    fi
+
+    # Create SMS test case and run it 
+    run_case $code_root1 $casename1 &
+    wait 
+
+    if [ $? != 0 ]; then
+        echo "Error compiling or running case"
+        exit 1
+    fi
+
+    # Grab timing data and do the plotting
+    if [ "${do_plot,,}" != "true" ]; then
+        echo $'\n----- Skipping plot -----\n'
+        return
+    fi
+    if [ -z "${plot_str+x}" ]; then
+        plot_str=$datestr 
+    fi
+
+    case_root1=$workdir/$case.${casename1}_${plot_str}  
+
+    python ${workdir}/E3SM_test_scripts/jenkins/mam4xx_compare_model_performance_plot.py \
+        --case1 $case_root1 --casename1 $casename1 \
+        --outdir $plotdir --html $html_address              
+
+    if [ $? != 0 ]; then
+        echo "Error plotting model performance"
+        exit 1
+    fi
+
+    echo "Model performance comparison complete!"
+
+}
+
+#---------------------
+# Function Definitions
+#---------------------
+
+fetch_code() {    
+    if [ "${do_fetch_code,,}" != "true" ]; then
+        echo $'\n----- Skipping fetch_code -----\n'
+        return
+    fi
+    local branch=$1 
+    local path=$2 
+
+    echo "Fetching code from $branch branch to $path..."
+    if [ -d $path ]; then
+        echo "Code directory $path already exists. Removing it..."
+        rm -rf $path 
+    fi 
+    
+    mkdir -p $path 
+    pushd $path 
+    git clone git@github.com:E3SM-Project/E3SM.git .     
+    if [ '$branch' != 'master' ]; then
+        git checkout $branch
+    fi
+    git submodule update --init --recursive     
+    popd
+} 
+
+run_case() {
+    if [ "${do_run_case,,}" != "true" ]; then
+        echo $'\n----- Skipping create_newcase -----\n'
+        return
+    fi
+
+    local code_root=$1 
+    local casename=$2 
+
+    local interval=60  # seconds to wait between each check 
+
+    path=$workdir/$case.${casename}_${datestr} 
+
+    # create new case and build it 
+    echo "Creating case $case.${casename}_${datestr}..."
+    $code_root/cime/scripts/create_test $case \
+        -t ${casename}_${datestr} -p $project -q $queue --output-root $workdir --no-run #--no-build   
+
+    if [ $? != 0 ]; then
+        echo "Error creating case $case"
+        exit 1
+    fi   
+
+    # submit job and monitor status
+    pushd $path 
+    ./xmlchange JOB_WALLCLOCK_TIME=$wallclock_time 
+    ./case.submit >& log.submit 
+
+    if [ $? != 0 ]; then
+        echo "Error submitting job for $case"
+        exit 1
+    fi
+
+    jobID=`awk -F " " '($1=="Submitted") {print $NF}' log.submit | tail -n 1 `
+    
+    while true; do 
+        sacct --job $jobID > log.job_stat
+        jobST=` awk "{if(NR==3) print}" log.job_stat | awk '{printf"%s\n",$6}'`
+
+        if [ "${jobST}" == "COMPLETED" ]; then
+            printf "%s Run complete: %-30s jobID: %s\n" "$(date +'%Y-%m-%d %H:%M:%S')" "$casename" "$jobID"
+            break 
+        elif [[ ("${jobST}" == "FAILED") || ("${jobST}" == *"CANCELLED"*) || ("${jobST}" == "TIMEOUT") ]]; then
+            printf "%s Run failed: %-30s jobID: %s\n" "$(date +'%Y-%m-%d %H:%M:%S')" "$casename" "$jobID"
+            exit 1 
+        else
+            printf "%s Waiting for case: %-30s to complete...  jobID: %s\n" "$(date +'%Y-%m-%d %H:%M:%S')" "$casename" "$jobID"
+            sleep $interval
+        fi
+    done 
+
+    popd 
+}
+
+# Silent versions of popd and pushd
+pushd() {
+    command pushd "$@" > /dev/null
+}
+popd() {
+    command popd "$@" > /dev/null
+}
+
+# Run the script
+main 
diff --git a/jenkins/plot_html.py b/jenkins/plot_html.py
@@ -0,0 +1,28 @@
+import argparse
+import matplotlib.pyplot as plt
+import sys
+
+def parse_args(argv):
+  parser = argparse.ArgumentParser(description='Plot EAMxx-MAM4xx performance data')
+  parser.add_argument('-i', '--input', metavar='r', type=ascii, nargs='+',
+                     help='input performance comp graph')
+
+  parser.add_argument('-o', '--output', metavar='m', type=ascii, nargs='+',
+                     help='html output dash graph')
+
+  args = vars(parser.parse_args())
+
+  input_graph = args["input"][0].strip("'""'")
+  output_graph = args["output"][0].strip("'""'")
+
+  return input_graph, output_graph 
+
+input_graph, output_graph = parse_args(sys.argv[1:])
+
+# Append the image to the HTML file
+html_content = f'<img src="{input_graph}" alt="comparison between EAMxx and EAMxx+MAM4xx">\n'
+with open(f'{output_graph}', "a") as html_file:
+    html_file.write(html_content)
+
+# Display the HTML file path
+print(f"HTML file generated: {output_graph}")