|
| 1 | +#!/usr/bin/env python3 |
| 2 | +"""Convert an MITgcm binary pickup file to individual init files. |
| 3 | +
|
| 4 | +Reads the pickup.<iter>.data/.meta pair and writes: |
| 5 | + T.init.bin, S.init.bin, U.init.bin, V.init.bin, Eta.init.bin |
| 6 | +
|
| 7 | +The pickup is float64 (MITgcm default for checkpoints); init files are |
| 8 | +written as float32 (matching readBinaryPrec=32 in data PARM01). |
| 9 | +
|
| 10 | +Usage: |
| 11 | + python pickup_to_init.py <pickup_prefix> <output_dir> [--nx 768] [--ny 424] [--nr 50] |
| 12 | +
|
| 13 | +Example: |
| 14 | + python pickup_to_init.py repeat-year-50/001/pickup.0000087600 repeat-year-50/002/ |
| 15 | +""" |
| 16 | + |
| 17 | +import argparse |
| 18 | +import re |
| 19 | +import sys |
| 20 | +from pathlib import Path |
| 21 | + |
| 22 | +import numpy as np |
| 23 | + |
| 24 | + |
def parse_pickup_meta(meta_path: Path) -> dict:
    """Parse a MITgcm .meta file and return dims, precision, and field list."""
    contents = meta_path.read_text()

    # Grid dimensions: take entries 0 and 3 of the flattened dimList
    # (MITgcm writes a (size, start, end) triplet per dimension, so those
    # positions hold the global nx and ny).
    dims_m = re.search(r"dimList\s*=\s*\[\s*([\d\s,]+)\]", contents)
    if dims_m is None:
        raise ValueError(f"Cannot parse dimList from {meta_path}")
    dim_values = [int(tok) for tok in dims_m.group(1).replace(",", " ").split()]
    nx, ny = dim_values[0], dim_values[3]

    # Precision: any dataprec containing "64" means float64; default float32.
    prec_m = re.search(r"dataprec\s*=\s*\[\s*'(\w+)'\s*\]", contents)
    if prec_m is not None and "64" in prec_m.group(1):
        dtype = np.float64
    else:
        dtype = np.float32

    # Total record count, if declared.
    nrec_m = re.search(r"nrecords\s*=\s*\[\s*(\d+)\s*\]", contents)
    nrecords = None if nrec_m is None else int(nrec_m.group(1))

    # Field names, in pickup order (entries are quoted, space-padded).
    flds_m = re.search(r"fldList\s*=\s*\{([^}]+)\}", contents)
    if flds_m is None:
        raise ValueError(f"Cannot parse fldList from {meta_path}")
    fields = re.findall(r"'(\w+)\s*'", flds_m.group(1))

    return {
        "nx": nx,
        "ny": ny,
        "dtype": dtype,
        "nrecords": nrecords,
        "fields": fields,
    }
| 51 | + |
| 52 | + |
def pickup_to_init(pickup_prefix: str, output_dir: str, nx: int, ny: int, nr: int):
    """Read a pickup file and write individual init .bin files.

    Parameters
    ----------
    pickup_prefix : path prefix of the pickup pair (without .data/.meta)
    output_dir    : directory for the .init.bin files (created if missing)
    nx, ny, nr    : grid dimensions used to size each horizontal record
                    and each 3D field

    Raises
    ------
    FileNotFoundError : if either half of the .data/.meta pair is missing.
    ValueError        : if the computed level count disagrees with the
                        field map, or the .data file is truncated.
    """
    meta_path = Path(pickup_prefix + ".meta")
    data_path = Path(pickup_prefix + ".data")
    out = Path(output_dir)

    if not meta_path.exists():
        raise FileNotFoundError(f"Meta file not found: {meta_path}")
    if not data_path.exists():
        raise FileNotFoundError(f"Data file not found: {data_path}")

    meta = parse_pickup_meta(meta_path)
    dtype = meta["dtype"]
    fields = meta["fields"]
    rec_size = nx * ny

    print(f"Pickup: {data_path}")
    print(f" Grid: {nx} x {ny} x {nr}")
    print(f" Precision: {dtype}")
    print(f" Fields: {fields}")
    print(f" Total records: {meta['nrecords']}")

    # Map pickup field names to init file names and their depth (nr for 3D, 1 for 2D)
    field_map = {
        "Uvel": ("U.init.bin", nr),
        "Vvel": ("V.init.bin", nr),
        "Theta": ("T.init.bin", nr),
        "Salt": ("S.init.bin", nr),
        "EtaN": ("Eta.init.bin", 1),
    }

    # Byte size of one horizontal slab in the pickup's native precision.
    bytes_per_val = np.dtype(dtype).itemsize
    rec_bytes = rec_size * bytes_per_val

    # Build offset table: walk through fields in pickup order.  The listed
    # surface fields occupy one record; every other field is assumed 3D.
    offsets = {}
    current_rec = 0
    for fld in fields:
        nlevels = 1 if fld in ("EtaN", "dEtaHdt", "EtaH") else nr
        offsets[fld] = (current_rec, nlevels)
        current_rec += nlevels

    # Cross-check the walked layout against the record count declared in the
    # .meta so a wrong --nr (or an unlisted 2D field) is caught immediately
    # instead of silently producing garbage offsets.
    if meta["nrecords"] is not None and current_rec != meta["nrecords"]:
        print(
            f" WARNING: computed {current_rec} records but meta declares "
            f"{meta['nrecords']}; check --nr and the 2D field list"
        )

    print(f" Computed record layout: {offsets}")

    # Read and write the fields we need
    out.mkdir(parents=True, exist_ok=True)
    with open(data_path, "rb") as f:
        for fld_name, (init_name, nlevels) in field_map.items():
            if fld_name not in offsets:
                print(f" WARNING: field '{fld_name}' not found in pickup, skipping")
                continue

            start_rec, expected_levels = offsets[fld_name]
            # Real validation, not `assert`: asserts vanish under `python -O`.
            if expected_levels != nlevels:
                raise ValueError(
                    f"Level mismatch for {fld_name}: expected {nlevels}, got {expected_levels}"
                )

            # Seek to field start and read exactly one field's worth of values.
            f.seek(start_rec * rec_bytes)
            count = rec_size * nlevels
            data = np.fromfile(f, dtype=dtype, count=count)
            if data.size != count:
                # np.fromfile returns short on EOF without raising; surface
                # a truncated pickup explicitly rather than via reshape.
                raise ValueError(
                    f"Truncated pickup: wanted {count} values for {fld_name}, "
                    f"read {data.size}"
                )
            data = data.reshape((nlevels, ny, nx))

            # Convert to float32 for init files (readBinaryPrec=32)
            init_path = out / init_name
            data.astype(np.float32).tofile(init_path)
            size_mb = init_path.stat().st_size / 1e6
            print(f" Wrote {init_path} ({size_mb:.1f} MB)")

    print("Done.")
| 127 | + |
| 128 | + |
def main():
    """CLI entry point: parse command-line arguments and run the conversion."""
    ap = argparse.ArgumentParser(description="Convert MITgcm pickup to init files")
    ap.add_argument("pickup_prefix", help="Path prefix (without .data/.meta)")
    ap.add_argument("output_dir", help="Directory to write init files")
    # Grid-size flags share a shape; declare them table-driven.
    for flag, default, axis in (("--nx", 768, "X"), ("--ny", 424, "Y"), ("--nr", 50, "Z")):
        ap.add_argument(flag, type=int, default=default, help=f"Grid points in {axis}")
    ns = ap.parse_args()

    pickup_to_init(ns.pickup_prefix, ns.output_dir, ns.nx, ns.ny, ns.nr)
| 139 | + |
| 140 | + |
# Run the converter only when executed as a script (not on import).
if __name__ == "__main__":
    main()
0 commit comments