openclimatefix
diff --git a/‎pyproject.toml‎
Lines changed: 9 additions & 5 deletions b/‎pyproject.toml‎
Lines changed: 9 additions & 5 deletions
diff --git a/‎tests/__init__.py‎ ‎src/__init__.py‎tests/__init__.py renamed to src/__init__.py b/‎tests/__init__.py‎ ‎src/__init__.py‎tests/__init__.py renamed to src/__init__.py
diff --git a/‎src/cloudcasting_metrics/__init__.py‎ b/‎src/cloudcasting_metrics/__init__.py‎
diff --git a/‎src/cloudcasting_metrics/app.py‎
Lines changed: 196 additions & 0 deletions b/‎src/cloudcasting_metrics/app.py‎
Lines changed: 196 additions & 0 deletions
diff --git a/‎tests/conftest.py‎
Lines changed: 65 additions & 13 deletions b/‎tests/conftest.py‎
Lines changed: 65 additions & 13 deletions
diff --git a/‎tests/test_cloudcasting_app/__init__.py‎ b/‎tests/test_cloudcasting_app/__init__.py‎
diff --git a/‎tests/test_app.py‎ ‎tests/test_cloudcasting_app/test_app.py‎tests/test_app.py renamed to tests/test_cloudcasting_app/test_app.py
Lines changed: 3 additions & 3 deletions b/‎tests/test_app.py‎ ‎tests/test_cloudcasting_app/test_app.py‎tests/test_app.py renamed to tests/test_cloudcasting_app/test_app.py
Lines changed: 3 additions & 3 deletions
diff --git a/‎tests/test_cloudcasting_metrics/__init__.py‎ b/‎tests/test_cloudcasting_metrics/__init__.py‎
@@ -6,7 +6,7 @@ build-backend = "setuptools.build_meta"
 
 # Metadata (see https://peps.python.org/pep-0621/)
 [project]
-name = "cloudcasting-app"
+name = "cloudcasting-mlops"
 dynamic = ["version"] # Set automtically using git: https://setuptools-git-versioning.readthedocs.io/en/stable/
 description = "An app for running the OCF cloudcasting model in production"
 readme = {file = "README.md", content-type = "text/markdown"}
@@ -20,14 +20,15 @@ classifiers = [
     "License :: OSI Approved :: MIT License",
 ]
 dependencies = [
-    "fsspec==2025.7.0",
+    "fsspec==2025.9.0",
     "huggingface-hub==0.28.1",
     "hydra-core==1.3.2",
+    "icechunk==1.1.5",
     "loguru == 0.7.3",
     "numpy==2.1.2",
     "ocf-data-sampler==0.5.27",
     "pandas==2.2.3",
-    "s3fs==2025.7.0",
+    "s3fs==2025.9.0",
     "safetensors==0.5.2",
     "sat_pred @ git+https://github.com/openclimatefix/sat_pred.git@main",
     # Since torch distributes CPU only packages as wheels, have to specify the target platform in order to pull the wheel compiled for that specific platform
@@ -57,6 +58,9 @@ cloudcasting-app = "cloudcasting_app.app:main"
 [project.urls]
 repository = "https://github.com/openclimatefix/cloudcasting-app"
 
+[tool.setuptools.packages.find]
+where = ["src"]
+
 [tool.setuptools]
 include-package-data = false
 
@@ -125,8 +129,8 @@ docstring-code-line-length = 100
 # --- DOCUMENTATION CONFIGURATION --- #
 
 [tool.pydoctor]
-add-package = ["src/cloudcasting_app"]
-project-base-dir = "src/cloudcasting_app"
+add-package = ["cloudcasting_app", "cloudcasting_metrics"]
+project-base-dir = "src"
 docformat = "google"
 html-output = "docs"
 theme = "classic"
 
@@ -0,0 +1,196 @@
+"""Runs metric calculations on cloudcasting for a given input day and appends to zarr store
+
+This app expects these environment variables to be available:
+ - SATELLITE_ICECHUNK_ARCHIVE (str): Path at which ground truth satellite data can be found
+ - CLOUDCASTING_PREDICTION_DIRECTORY (str): The directory where the cloudcasting forecasts are
+   saved
+ - METRIC_ZARR_PATH (str): The path where the metric values will be saved
+
+If SATELLITE_ICECHUNK_ARCHIVE is an s3 path, then the environment variables
+AWS_ACCESS_KEY_ID, AWS_SECRET_ACCESS_KEY and AWS_REGION must also be set.
+"""
+
+import os
+import re
+import fsspec
+import numpy as np
+import pandas as pd
+from tqdm import tqdm
+
+import xarray as xr
+import icechunk
+from loguru import logger
+
+# ---------------------------------------------------------------------------
+
+# Horizon steps (lead times) produced by each forecast: every 15 minutes from 15 minutes up to
+# and including 180 minutes after the init-time
+FORECAST_STEPS = pd.timedelta_range(start="15min", end="180min", freq="15min")
+# Interval between consecutive forecast runs, i.e. between expected init-times
+FORECAST_FREQ = pd.Timedelta("30min")
+
+
+def open_icechunk(path: str) -> xr.Dataset:
+    """Open the "main" branch of an icechunk repository as a read-only xarray Dataset.
+
+    Args:
+        path: Location of the icechunk store. A path starting with "s3://" is opened from S3
+            using the AWS_ACCESS_KEY_ID, AWS_SECRET_ACCESS_KEY and AWS_REGION environment
+            variables; any other path is treated as a local filesystem store.
+
+    Returns:
+        The dataset opened from a read-only session on the "main" branch.
+    """
+    s3_scheme = "s3://"
+
+    if not path.startswith(s3_scheme):
+        storage = icechunk.local_filesystem_storage(path=path)
+    else:
+        # Split "s3://<bucket>/<prefix>" into the bucket name and the key prefix
+        bucket_name, _, key_prefix = path.removeprefix(s3_scheme).partition("/")
+        storage = icechunk.s3_storage(
+            bucket=bucket_name,
+            prefix=key_prefix,
+            access_key_id=os.environ["AWS_ACCESS_KEY_ID"],
+            secret_access_key=os.environ["AWS_SECRET_ACCESS_KEY"],
+            region=os.environ["AWS_REGION"],
+        )
+
+    readonly_session = icechunk.Repository.open(storage).readonly_session("main")
+    return xr.open_zarr(readonly_session.store)
+
+
+def app(date: pd.Timestamp | None = None) -> None:
+    """Runs metric calculations on cloudcasting for a given input day and appends to zarr store
+
+    Every forecast found in the prediction directory whose filename starts with the given day
+    is scored against the satellite archive using the absolute error. The error is reduced to
+    three mean-absolute-error (MAE) summaries (per step, per variable and per pixel) which are
+    written to the metric zarr store, creating the store if it does not exist yet.
+
+    Args:
+        date: The day for which the cloudcasting predictions will be scored. Any time-of-day
+            component is floored away. Defaults to yesterday (UTC).
+
+    Raises:
+        KeyError: If one of the required environment variables is not set.
+        ValueError: If an init-time cannot be parsed from a forecast path, or if none of the
+            day's forecasts can be scored.
+        Exception: If the day is too recent to be scored, or if the new MAEs are inconsistent
+            with the existing metric store (duplicate init-times or differing coordinates).
+    """
+
+    # Unpack environmental variables
+    sat_path = os.environ["SATELLITE_ICECHUNK_ARCHIVE"]
+    prediction_dir = os.environ["CLOUDCASTING_PREDICTION_DIRECTORY"]
+    metric_zarr_path = os.environ["METRIC_ZARR_PATH"]
+
+    # All timestamps are handled as timezone-naive UTC
+    now = pd.Timestamp.now(tz="UTC").replace(tzinfo=None)
+
+    # Default to yesterday
+    if date is None:
+        date = now.floor("1D") - pd.Timedelta("1D")
+
+    start_dt = date.floor("1D")
+    end_dt = date.floor("1D") + pd.Timedelta("1D")
+
+    if now <= end_dt + FORECAST_STEPS.max():
+        raise Exception(
+            f"We cannot score forecast with init-time {end_dt} until after the last valid-time."
+        )
+
+    # Open the satellite data store
+    ds_sat = open_icechunk(path=sat_path)
+
+    # Slice to only the timesteps we need for scoring
+    ds_sat = ds_sat.sel(time=slice(start_dt, end_dt + FORECAST_STEPS.max()))
+
+    # It is better to preload if we have the RAM space
+    # - This eliminates any costs of repeatedly streaming data from the bucket
+    # - It's also faster
+    ds_sat = ds_sat.compute()
+
+    # Find recent forecasts
+    date_string = start_dt.strftime("%Y-%m-%d")
+    remote_path = f"{prediction_dir}/{date_string}*.zarr"
+    fs, path = fsspec.core.url_to_fs(remote_path)
+
+    file_list = fs.glob(path)
+
+    # Filter forecasts
+    # - We only score forecasts we have the satellite data for
+    # - If we are missing one satellite image we will skip scoring all forecasts that require it
+    forecasts_to_score = []
+
+    for file in file_list:
+        # Find the datetime of this forecast
+        match = re.search(r'\d{4}-\d{2}-\d{2}T\d{2}:\d{2}', file)
+        if match is None:
+            # Raise explicitly rather than assert, since asserts are stripped under `python -O`
+            raise ValueError(f"Could not parse an init-time from forecast path: {file}")
+
+        # Check the satellite data required to score it is present
+        init_time = pd.Timestamp(match.group(0))
+        if np.isin(init_time + FORECAST_STEPS, ds_sat.time).all():
+            forecasts_to_score.append(file)
+        else:
+            # loguru has no `warn` method, only `warning`
+            logger.warning(f"Cannot score {file} due to missing satellite data")
+
+    # Fail with a clear message instead of letting xr.concat raise on an empty list
+    if not forecasts_to_score:
+        raise ValueError(f"No forecasts could be scored for {date_string}")
+
+    ds_mae_list = []
+
+    for file in tqdm(forecasts_to_score):
+        ds_forecast = xr.open_zarr(fs.get_mapper(file)).compute()
+
+        # Convert the forecast from (init_time, step) to valid-time so it aligns with ds_sat
+        valid_times = pd.Timestamp(ds_forecast.init_time.item()) + ds_forecast.step
+
+        ds_forecast = (
+            ds_forecast
+            .assign_coords(time=valid_times)
+            .swap_dims({"step": "time"})
+        )
+
+        ds_sat_sel = ds_sat.sel(
+            time=ds_forecast.time,
+            x_geostationary=ds_forecast.x_geostationary,
+            y_geostationary=ds_forecast.y_geostationary,
+            variable=ds_forecast.variable,
+        )
+
+        # Absolute error, moved back onto the step dimension so forecasts can be concatenated
+        da_mae = np.abs(
+            (ds_sat_sel.data - ds_forecast.sat_pred)
+            .swap_dims({"time": "step"})
+            .drop_vars("time")
+        )
+
+        # Create reductions of the full MAE matrix
+        da_mae_step = da_mae.mean(dim=("x_geostationary", "y_geostationary", "variable"))
+        da_mae_variable = da_mae.mean(dim=("x_geostationary", "y_geostationary", "step"))
+        da_mae_spatial = da_mae.mean(dim=("step", "variable"))
+
+        ds_mae_reductions = xr.Dataset(
+            {
+                "mae_step": da_mae_step,
+                "mae_variable": da_mae_variable,
+                "mae_spatial": da_mae_spatial,
+            }
+        )
+
+        ds_mae_list.append(ds_mae_reductions)
+
+    # Concat all the MAE scores and in-fill missing init times with NaNs
+    # - Filling with NaNs makes the chunking easier
+    ds_all_maes = xr.concat(ds_mae_list, dim="init_time")
+    expected_init_times = pd.date_range(start_dt, end_dt, freq=FORECAST_FREQ, inclusive="left")
+    ds_all_maes = ds_all_maes.reindex(init_time=expected_init_times, method=None)
+
+    # Chunk the data ready for saving
+    ds_all_maes = ds_all_maes.chunk(
+        {
+            "x_geostationary": -1,
+            "y_geostationary": -1,
+            "step": -1,
+            "variable": -1,
+            "init_time": 48,
+        }
+    )
+
+    # If it exists, open the archive of MAE values and check the coordinates against them
+    fs, stripped = fsspec.core.url_to_fs(metric_zarr_path)
+    if fs.exists(stripped):
+        ds_maes_archive = xr.open_zarr(metric_zarr_path)
+
+        if np.isin(ds_all_maes.init_time, ds_maes_archive.init_time).any():
+            raise Exception("init-times in new MAEs already exist in MAE store")
+
+        for coord in ["variable", "step", "x_geostationary", "y_geostationary"]:
+            if not ds_maes_archive[coord].identical(ds_all_maes[coord]):
+                raise Exception(f"Found differences in coord: {coord}")
+
+        ds_all_maes.to_zarr(metric_zarr_path, mode="a-", append_dim="init_time")
+
+    else:
+        ds_all_maes.to_zarr(metric_zarr_path, mode="w")
+
+
+
+if __name__ == "__main__":
+    # With no date given, app() scores yesterday's (UTC) forecasts
+    app()
@@ -1,35 +1,31 @@
-import os
-
-import fsspec
+from pathlib import Path
 import numpy as np
 import pandas as pd
 import pytest
 import xarray as xr
 import zarr
+from cloudcasting_metrics.app import FORECAST_STEPS, FORECAST_FREQ
+import icechunk
+from icechunk.xarray import to_icechunk
 
 xr.set_options(keep_attrs=True)
 
 @pytest.fixture()
-def test_t0():
+def init_time():
     return pd.Timestamp.now(tz="UTC").replace(tzinfo=None).floor("30min")
 
 
-def make_sat_data(test_t0, freq_mins):
+def make_sat_data(times: pd.DatetimeIndex):
 
     # Load dataset which only contains coordinates, but no data
-    shell_path = f"{os.path.dirname(os.path.abspath(__file__))}/test_data/non_hrv_shell.zarr.zip"
+    shell_path = f"{Path(__file__).parent}/test_data/non_hrv_shell.zarr.zip"
     with zarr.storage.ZipStore(shell_path, mode="r") as store:
         ds = xr.open_zarr(store)
 
     # Remove original time dim
     ds = ds.drop_vars("time")
 
     # Add new times so they lead up to present
-    times = pd.date_range(
-        test_t0 - pd.Timedelta("3h"),
-        test_t0,
-        freq=f"{freq_mins}min",
-    )
     ds = ds.expand_dims(time=times)
 
     # Add data to dataset
@@ -51,5 +47,61 @@ def make_sat_data(test_t0, freq_mins):
 
 
 @pytest.fixture()
-def sat_5_data(test_t0):
-    return make_sat_data(test_t0, freq_mins=5)
+def sat_5_data(init_time):
+    """Synthetic satellite data at 5-minute intervals for the 3 hours up to `init_time`."""
+    times = pd.date_range(
+        init_time - pd.Timedelta("3h"),
+        init_time,
+        freq="5min",
+    )
+    return make_sat_data(times)
+
+
+@pytest.fixture()
+def today():
+    """Midnight at the start of the current UTC day, as a timezone-naive timestamp."""
+    utc_now = pd.Timestamp.now(tz="UTC")
+    return utc_now.replace(tzinfo=None).floor("1D")
+
+
+@pytest.fixture()
+def init_times_tuple(today) -> tuple[pd.DatetimeIndex, pd.DatetimeIndex]:
+    """The first three forecast init-times of two days ago and of yesterday, in that order."""
+
+    def first_init_times(days_ago: str) -> pd.DatetimeIndex:
+        # Three init-times spaced FORECAST_FREQ apart, starting at midnight of that day
+        return pd.date_range(today - pd.Timedelta(days_ago), freq=FORECAST_FREQ, periods=3)
+
+    return first_init_times("2D"), first_init_times("1D")
+
+
+@pytest.fixture()
+def forecast_directory(tmp_path_factory, init_times_tuple) -> str:
+    """Write one synthetic forecast zarr per init-time and yield the directory holding them.
+
+    Each forecast is saved as "<init-time formatted as %Y-%m-%dT%H:%M>.zarr".
+    """
+    pred_dir = str(tmp_path_factory.mktemp("pred_dir"))
+
+    for day_init_times in init_times_tuple:
+        for t0 in day_init_times:
+            # Build synthetic satellite data at the forecast valid-times, then reshape it into
+            # forecast form: indexed by step, with a length-1 init_time dim, variable "sat_pred"
+            ds_forecast = (
+                make_sat_data(times=t0 + FORECAST_STEPS)
+                .assign_coords(step=("time", FORECAST_STEPS))
+                .swap_dims({"time": "step"})
+                .drop_vars("time")
+                .expand_dims({"init_time": [t0]})
+                .rename({"data": "sat_pred"})
+            )
+            ds_forecast.to_zarr(t0.strftime(f"{pred_dir}/%Y-%m-%dT%H:%M.zarr"))
+
+    yield pred_dir
+
+@pytest.fixture()
+def sat_icechunk_path(tmp_path, init_times_tuple) -> str:
+    """Create a local icechunk store of synthetic satellite data and yield its path.
+
+    The store covers every valid-time (init-time + step) of the forecasts described by
+    `init_times_tuple`, committed to the "main" branch.
+    """
+    store_path = str(tmp_path / "sat.icechunk")
+
+    # Unique valid-times over all forecasts, since neighbouring forecasts overlap in time
+    valid_times = {
+        valid_time
+        for day_init_times in init_times_tuple
+        for t0 in day_init_times
+        for valid_time in t0 + FORECAST_STEPS
+    }
+    ds_sat = make_sat_data(pd.to_datetime(sorted(valid_times)))
+
+    storage = icechunk.local_filesystem_storage(store_path)
+    session = icechunk.Repository.create(storage).writable_session(branch="main")
+
+    to_icechunk(ds_sat, session)
+    session.commit("Commit test data")
+
+    yield store_path
@@ -7,7 +7,7 @@
 from cloudcasting_app.app import app
 
 
-def test_app(sat_5_data, tmp_path, test_t0):
+def test_app(sat_5_data, tmp_path, init_time):
 
     os.chdir(tmp_path)
 
@@ -23,7 +23,7 @@ def test_app(sat_5_data, tmp_path, test_t0):
 
     # Check the two output files have been created
     latest_zarr_path = f"{tmp_path}/latest.zarr"
-    t0_string_zarr_path = test_t0.strftime(f"{tmp_path}/%Y-%m-%dT%H:%M.zarr")
+    t0_string_zarr_path = init_time.strftime(f"{tmp_path}/%Y-%m-%dT%H:%M.zarr")
     assert os.path.exists(latest_zarr_path)
     assert os.path.exists(t0_string_zarr_path)
 
@@ -37,7 +37,7 @@ def test_app(sat_5_data, tmp_path, test_t0):
     )
 
     # Make sure all the coords are correct
-    assert ds_y_hat.init_time == test_t0
+    assert ds_y_hat.init_time == init_time
     assert len(ds_y_hat.step)==12
     assert (ds_y_hat.x_geostationary==sat_5_data.x_geostationary).all()
     assert (ds_y_hat.y_geostationary==sat_5_data.y_geostationary).all()