release_evaluation_tool2/reval.py at main · AWI-ESM/release_evaluation_tool2 · GitHub

1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
134
135
136
137
138
139
140
141
142
143
144
145
146
147
148
149
150
151
152
153
154
155
156
157
158
159
160
161
162
163
164
165
166
167
168
169
170
171
172
173
174
175
176
177
178
179
180
181
182
183
184
185
186
187
188
189
190
191
192
193
194
195
196
197
198
199
200
201
202
203
204
205
206
207
208
209
"""
AWI-CM3 Release Evaluation Tool (Reval.py)

This script provides a comprehensive evaluation framework for analyzing and visualizing
data from the AWI-CM-v3.3 climate model. It integrates scientific libraries for data
processing, statistical analysis, and high-quality visualizations, enabling effective
assessment of model performance against observations and reanalysis datasets.

Key Features:
- Data Processing & Analysis:
  - Uses PyFESOM2, xarray, SciPy, and scikit-learn for structured climate data handling.
- Visualization:
  - Leverages Matplotlib, Seaborn, Cartopy, and cmocean for high-quality plots.
- FESOM-Specific Routines:
  - Includes functions for handling FESOM2 mesh structures, model data, and
    meridional overturning circulation (MOC).
- Automated Job Submission:
  - Supports SLURM-based batch processing for large-scale evaluations.
- Multi-Experiment Support:
  - Handles spin-up, preindustrial control, and historical simulations with
    configurable paths and settings.


2021-12-10: Jan Streffing:                First jupyter notebook version for https://doi.org/10.5194/gmd-15-6399-2022
2024-04-03: Jan Streffing:                Addition of significance metrics for https://doi.org/10.5194/egusphere-2024-2491
2025-02-04: Jan Streffing:                Re-write has parallel scripts
"""

import os
import sys
import subprocess
import argparse
from natsort import natsorted
import shutil

############################
# Slurm Configuration      #
############################

SBATCH_SETTINGS = """\
#!/bin/bash
#SBATCH --job-name={job_name}
#SBATCH --output=logs/{job_name}.log
#SBATCH --error=logs/{job_name}.log
#SBATCH --time=02:00:00
#SBATCH --ntasks=128
#SBATCH --ntasks-per-node=128
#SBATCH --partition=compute
#SBATCH -A bb1469
"""


############################
# Script Execution         #
############################

# Parse command line arguments
parser = argparse.ArgumentParser(
    description='AWI-CM3 Release Evaluation Tool - Submit analysis jobs',
    formatter_class=argparse.RawDescriptionHelpFormatter,
    epilog='''
Examples:
  python reval.py --config configs/AWI-CM3-v3.3.py
  python reval.py --status
''')
parser.add_argument(
    '-c', '--config',
    help='Path to configuration file in configs/ folder (e.g., configs/AWI-CM3-v3.3.py)')
parser.add_argument(
    '-s', '--status',
    action='store_true',
    help='Show status of all scripts and exit')
args = parser.parse_args()

# Handle --status
if args.status:
    from bg_routines.update_status import get_all_status
    status = get_all_status()
    if not status:
        print("No status information found yet.")
    else:
        print(f"{'Script':<40} {'Status'}")
        print("-" * 70)
        for script, stat in status.items():
            print(f"{script:<40} {stat}")
    sys.exit(0)

# Require --config for job submission
if not args.config:
    parser.error("--config is required when submitting jobs")

# Validate config file exists
if not os.path.exists(args.config):
    print(f"ERROR: Config file not found: {args.config}")
    print("\nAvailable configs in configs/:")
    for f in sorted(os.listdir('configs')):
        if f.endswith('.py'):
            print(f"  - configs/{f}")
    sys.exit(1)

config_path = os.path.abspath(args.config)
print(f"Using configuration: {config_path}")
print(f"{'='*60}\n")

# Ensure required directories exist
os.makedirs("logs", exist_ok=True)
os.makedirs("tmp", exist_ok=True)

# Locate all part##_*.py analysis scripts in the "scripts" subfolder
script_files = natsorted(
    [f for f in os.listdir("scripts") if f.endswith(".py") and f.startswith("part")]
)

# Default: Disable all scripts (set to True to enable)
SCRIPTS = {script: False for script in script_files}  # All disabled by default

# Enable scripts manually here:
SCRIPTS.update({
    "part1_mesh_plot.py":           True,
    "part2_rad_balance.py":         True,
    "part3_hovm_temp.py":           True,
    "part4_cmpi.py":                True,
    "part5_sea_ice_thickness.py":   True,
    "part6_ice_conc_timeseries.py": True,
    "part7_mld.py":                 True,
    "part8_t2m_vs_era5.py":         True,
    "part9_rad_vs_ceres.py":        True,
    "part10_clt_vs_modis.py":       True,
    "part11_zonal_plots.py":        True,
    "part12_qbo.py":                True,
    "part13_fesom_temp_bias.py":    True,
    "part14_fesom_salt_bias.py":    True,
    "part15_enso.py":               True,
    "part16_clim_change.py":        True,
    "part17_moc.py":                True,
    "part18_precip_vs_gpcp.py":     True,
    "part19_ocean_temp_sections.py":True,
    "part20_gregory_plot.py":       True,
    "part21_crf_bias_maps.py":      True,
    "part22_masks.py":              True,
    "part23_ice_cavity_velocities.py": True,
    "part24_lpjg_lai.py":           True,
    "part25_lpjg_carbon.py":        True,
    "part26_lpjg_pft.py":           True,
})

# Submit jobs and collect job IDs for the report dependency
submitted_job_ids = []

for script, run in SCRIPTS.items():
    if run:
        job_script = f"slurm_{script}.sh"
        script_path = os.path.join("scripts", script)

        # Write the SLURM script
        with open(job_script, "w") as f:
            f.write(SBATCH_SETTINGS.format(job_name=script))
            f.write(f"\nsource $HOME/loadconda.sh\n")  # Load Python module if required
            f.write("\nconda activate reval\n")  # Load Python module if required
            f.write(f"\nexport REVAL_CONFIG={config_path}\n")  # Pass config file path
            f.write(f"python {script_path}\n")

        # Submit job and capture job ID
        print(f"Submitting {script} as:")
        result = subprocess.run(["sbatch", job_script], capture_output=True, text=True)
        print(result.stdout.strip())
        # Parse job ID from "Submitted batch job 12345678"
        if result.returncode == 0 and "Submitted" in result.stdout:
            try:
                job_id = result.stdout.strip().split()[-1]
                submitted_job_ids.append(job_id)
            except (IndexError, ValueError):
                pass
        destination = f"tmp/{job_script}"
        shutil.move(job_script, destination)
    else:
        print(f"Skipped {script} (disabled)")

# Submit HTML report generation after all analysis jobs finish
if submitted_job_ids:
    print(f"\n{'='*60}")
    print(f"Submitting HTML report generator (after {len(submitted_job_ids)} jobs)...")

    SBATCH_REPORT = """\
#!/bin/bash
#SBATCH --job-name=generate_report
#SBATCH --output=logs/generate_report.log
#SBATCH --error=logs/generate_report.log
#SBATCH --time=00:10:00
#SBATCH --ntasks=1
#SBATCH --partition=compute
#SBATCH -A bb1469
"""
    report_script = "slurm_generate_report.sh"
    dep_str = ":".join(submitted_job_ids)
    with open(report_script, "w") as f:
        f.write(SBATCH_REPORT)
        f.write(f"\nsource $HOME/loadconda.sh\n")
        f.write("conda activate reval\n")
        f.write(f"\nexport REVAL_CONFIG={config_path}\n")
        f.write("python scripts/generate_report.py\n")

    result = subprocess.run(
        ["sbatch", f"--dependency=afterany:{dep_str}", report_script],
        capture_output=True, text=True)
    print(result.stdout.strip())
    shutil.move(report_script, f"tmp/{report_script}")
    print("Report will be generated after all analysis jobs complete.")