Python API#

The Python API provides programmatic access to the coastal calibration workflow, enabling integration with other tools and custom automation.

Basic Usage#

from coastal_calibration import CoastalCalibConfig, CoastalCalibRunner

# Load configuration from YAML
config = CoastalCalibConfig.from_yaml("config.yaml")

# Create a runner
runner = CoastalCalibRunner(config)

# Validate configuration
errors = runner.validate()
if errors:
    for error in errors:
        print(f"Error: {error}")
else:
    # Submit the job
    result = runner.submit(wait=True)

    if result.success:
        print(f"Job {result.job_id} completed successfully")
    else:
        print(f"Job failed: {result.errors}")

Configuration#

Loading Configuration#

from coastal_calibration import CoastalCalibConfig

# From YAML file
config = CoastalCalibConfig.from_yaml("config.yaml")

# Access configuration values
print(config.slurm.job_name)
print(config.simulation.coastal_domain)
print(config.paths.work_dir)
print(config.model)  # "schism" or "sfincs"

Creating SCHISM Configuration Programmatically#

from datetime import datetime
from pathlib import Path
from coastal_calibration import (
    CoastalCalibConfig,
    SlurmConfig,
    SimulationConfig,
    BoundaryConfig,
    PathConfig,
    SchismModelConfig,
    MonitoringConfig,
    DownloadConfig,
)

config = CoastalCalibConfig(
    slurm=SlurmConfig(
        job_name="my_simulation",
    ),
    simulation=SimulationConfig(
        start_date=datetime(2021, 6, 11),
        duration_hours=24,
        coastal_domain="hawaii",
        meteo_source="nwm_ana",
    ),
    boundary=BoundaryConfig(source="stofs"),
    paths=PathConfig(
        work_dir=Path("/ngen-test/coastal/your_username/my_run"),
        raw_download_dir=Path("/ngen-test/coastal/your_username/downloads"),
    ),
    model_config=SchismModelConfig(
        nodes=2,
        ntasks_per_node=18,
    ),
)

# Save to YAML
config.to_yaml("generated_config.yaml")

Enabling NOAA Observation Station Comparison#

To automatically discover NOAA CO-OPS water level stations within the model domain and generate comparison plots after the SCHISM run, set include_noaa_gages=True in the model configuration:

config = CoastalCalibConfig(
    slurm=SlurmConfig(
        job_name="hawaii_with_obs",
    ),
    simulation=SimulationConfig(
        start_date=datetime(2021, 6, 11),
        duration_hours=24,
        coastal_domain="hawaii",
        meteo_source="nwm_ana",
    ),
    boundary=BoundaryConfig(source="stofs"),
    paths=PathConfig(
        work_dir=Path("/ngen-test/coastal/your_username/hawaii_obs"),
        raw_download_dir=Path("/ngen-test/coastal/your_username/downloads"),
    ),
    model_config=SchismModelConfig(
        nodes=2,
        ntasks_per_node=18,
        include_noaa_gages=True,  # Enable station discovery & comparison plots
    ),
)

This activates two additional stages in the pipeline:

schism_obs discovers NOAA CO-OPS stations via the concave hull of the open boundary nodes and writes station.in and station_noaa_ids.txt.
schism_plot reads SCHISM station output (staout_1), fetches observations from the CO-OPS API (with MLLW→MSL datum conversion), and saves comparison plots to figs/.

Creating SFINCS Configuration Programmatically#

from datetime import datetime
from pathlib import Path
from coastal_calibration import (
    CoastalCalibConfig,
    SlurmConfig,
    SimulationConfig,
    BoundaryConfig,
    PathConfig,
    SfincsModelConfig,
)

TEXAS_DIR = Path("/path/to/texas/model")

config = CoastalCalibConfig(
    slurm=SlurmConfig(),
    simulation=SimulationConfig(
        start_date=datetime(2025, 6, 1),
        duration_hours=168,
        coastal_domain="atlgulf",
        meteo_source="nwm_ana",
    ),
    boundary=BoundaryConfig(source="stofs"),
    paths=PathConfig(
        work_dir=Path("/tmp/sfincs_run"),
        raw_download_dir=Path("/tmp/sfincs_downloads"),
    ),
    model_config=SfincsModelConfig(
        prebuilt_dir=TEXAS_DIR,
        discharge_locations_file=TEXAS_DIR / "sfincs_nwm.src",
        observation_points=[
            {"x": 830344.95, "y": 3187383.41, "name": "Sargent"},
        ],
        merge_observations=False,
        merge_discharge=False,
        include_noaa_gages=True,
        include_precip=True,
        include_wind=True,
        include_pressure=True,
        forcing_to_mesh_offset_m=0.0,  # STOFS already in mesh datum
        vdatum_mesh_to_msl_m=0.171,  # mesh datum (NAVD88) → MSL for obs comparison
        meteo_res=2000,  # meteo output resolution in metres (auto-derived if None)
    ),
)

Configuration Validation#

config = CoastalCalibConfig.from_yaml("config.yaml")

# Validate and get list of errors
errors = config.validate()

if errors:
    print("Configuration errors:")
    for error in errors:
        print(f"  - {error}")
else:
    print("Configuration is valid")

Workflow Execution#

Submit to SLURM#

Both run() and submit() execute the same stage pipeline. submit() automatically partitions stages: Python-only stages run on the login node, while container stages are bundled into a SLURM job.

from coastal_calibration import CoastalCalibConfig, CoastalCalibRunner

config = CoastalCalibConfig.from_yaml("config.yaml")
runner = CoastalCalibRunner(config)

# Submit and return immediately
result = runner.submit(wait=False)
print(f"Job {result.job_id} submitted")

# Submit and wait for completion
result = runner.submit(wait=True)
if result.success:
    print(f"Job completed in {result.duration_seconds:.1f}s")

# Submit partial pipeline
result = runner.submit(wait=True, start_from="boundary_conditions")
result = runner.submit(wait=True, stop_after="post_forcing")

Run Directly#

For testing or when already inside a SLURM job:

# Run complete workflow
result = runner.run()

# Run partial workflow
result = runner.run(start_from="pre_forcing", stop_after="post_forcing")

# Run from a specific stage to the end
result = runner.run(start_from="pre_schism")

Workflow Result#

The WorkflowResult object contains information about the execution:

result = runner.submit(wait=True)

print(f"Success: {result.success}")
print(f"Job ID: {result.job_id}")
print(f"Duration: {result.duration_seconds}s")

if not result.success:
    for error in result.errors:
        print(f"Error: {error}")

# Stage timing (if enable_timing is True)
for stage, duration in result.stage_durations.items():
    print(f"  {stage}: {duration:.1f}s")

Data Sources#

Check Available Date Ranges#

from coastal_calibration.downloader import validate_date_ranges

# Validate dates for your configuration
errors = validate_date_ranges(
    start_time=datetime(2021, 6, 11),
    end_time=datetime(2021, 6, 12),
    meteo_source="nwm_ana",
    boundary_source="stofs",
    coastal_domain="hawaii",
)

if errors:
    print("Date range errors:", errors)

Supported Data Sources#

Source	Date Range	Description
`nwm_retro`	1979-02-01 to 2023-01-31	NWM Retrospective 3.0
`nwm_ana`	2018-09-17 to present	NWM Analysis
`stofs`	2020-12-30 to present	STOFS water levels
`glofs`	2005-09-30 to present	Great Lakes OFS

Logging#

Configure logging for the workflow:

import logging
from coastal_calibration.utils.logging import setup_logger

# Set up logging
logger = setup_logger(log_level="DEBUG", log_file="workflow.log")

# Now run your workflow
config = CoastalCalibConfig.from_yaml("config.yaml")
runner = CoastalCalibRunner(config)
result = runner.submit(wait=True)

Example: Batch Processing#

Run multiple simulations with different parameters:

from datetime import datetime, timedelta
from coastal_calibration import CoastalCalibConfig, CoastalCalibRunner

# Load base configuration
base_config = CoastalCalibConfig.from_yaml("base_config.yaml")

# Run simulations for multiple dates
start_dates = [
    datetime(2021, 6, 1),
    datetime(2021, 6, 15),
    datetime(2021, 7, 1),
]

results = []
for start_date in start_dates:
    # Modify configuration for this run
    config = CoastalCalibConfig.from_yaml("base_config.yaml")
    config.simulation.start_date = start_date

    # Update work directory for this run
    date_str = start_date.strftime("%Y%m%d")
    config.paths.work_dir = config.paths.work_dir.parent / f"run_{date_str}"

    # Submit
    runner = CoastalCalibRunner(config)
    result = runner.submit(wait=False)  # Don't wait, submit all jobs
    results.append((start_date, result))

# Report job IDs
for start_date, result in results:
    print(f"{start_date}: Job {result.job_id}")

Example: Domain Comparison#

Run the same simulation across multiple domains:

domains = ["hawaii", "prvi", "atlgulf", "pacific"]

for domain in domains:
    config = CoastalCalibConfig.from_yaml("base_config.yaml")
    config.simulation.coastal_domain = domain

    runner = CoastalCalibRunner(config)
    errors = runner.validate()

    if errors:
        print(f"{domain}: Validation failed - {errors}")
        continue

    result = runner.submit(wait=True)
    print(f"{domain}: {'Success' if result.success else 'Failed'}")