replaced datapipe with ocf-data-sampler #323

Open · wants to merge 8 commits into main
18 changes: 13 additions & 5 deletions scripts/backtest_sites.py
@@ -35,6 +35,7 @@
import xarray as xr
from huggingface_hub import hf_hub_download
from huggingface_hub.constants import CONFIG_NAME, PYTORCH_WEIGHTS_NAME
from ocf_data_sampler.config import load_yaml_configuration
from ocf_data_sampler.torch_datasets.datasets.site import SitesDataset
from omegaconf import DictConfig
from torch.utils.data import DataLoader
@@ -161,7 +162,7 @@ def get_sites_ds(config_path: str) -> xr.Dataset:
class ModelPipe:
"""A class to conveniently make and process predictions from batches"""

-    def __init__(self, model, ds_site: xr.Dataset):
+    def __init__(self, model, ds_site: xr.Dataset, config_path: str):
"""A class to conveniently make and process predictions from batches

Args:
@@ -170,6 +171,7 @@ def __init__(self, model, ds_site: xr.Dataset):
"""
self.model = model
self.ds_site = ds_site
self.config_path = config_path

def predict_batch(self, sample: dict) -> xr.Dataset:
"""Run the sample through the model and compile the predictions into an xarray DataArray
@@ -183,14 +185,20 @@ def predict_batch(self, sample: dict) -> xr.Dataset:
# Convert sample to tensor and move to device
sample_tensor = {k: torch.from_numpy(v).to(device) for k, v in sample.items()}

config = load_yaml_configuration(self.config_path)

interval_start = np.timedelta64(config.input_data.site.interval_start_minutes, "m")
interval_end = np.timedelta64(config.input_data.site.interval_end_minutes, "m")
time_resolution = np.timedelta64(config.input_data.site.time_resolution_minutes, "m")
Contributor:

Also, I would probably unpack the config in the init, or maybe even move the whole thing to main and pass the extracted interval_end (or whatever you end up using) to avoid doing it again and again for every batch.
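A minimal sketch of the suggestion above: parse the intervals once instead of on every `predict_batch` call. The `site_cfg` object here is a hypothetical stand-in for `load_yaml_configuration(config_path).input_data.site`, and the interval values are illustrative, not taken from the PR.

```python
from types import SimpleNamespace

import numpy as np


def unpack_site_intervals(site_cfg):
    """Convert the site interval settings to numpy timedeltas once, up front."""
    return (
        np.timedelta64(site_cfg.interval_start_minutes, "m"),
        np.timedelta64(site_cfg.interval_end_minutes, "m"),
        np.timedelta64(site_cfg.time_resolution_minutes, "m"),
    )


# Stand-in config: 60 min of history, 480 min of forecast, 30-min steps
site_cfg = SimpleNamespace(
    interval_start_minutes=-60,
    interval_end_minutes=480,
    time_resolution_minutes=30,
)

# Done once (e.g. in __init__); predict_batch would then reuse these
interval_start, interval_end, time_resolution = unpack_site_intervals(site_cfg)
```

Storing the three timedeltas as attributes in `__init__` (or computing them in `main` and passing them in) keeps the per-batch path free of YAML parsing.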


t0 = pd.Timestamp(sample["site_init_time_utc"][0])
site_id = sample["site_id"][0]

# Get valid times for this forecast
valid_times = pd.date_range(
-            start=t0 + pd.Timedelta(minutes=FREQ_MINS),
-            periods=len(sample["site_target_time_utc"]),
-            freq=f"{FREQ_MINS}min",
+            start=t0 + pd.Timedelta(interval_start),
+            end=t0 + pd.Timedelta(interval_end),
+            freq=f"{time_resolution.astype(int)}min",
Contributor:

Lifting from config is a good way to do it, but the sample ModelPipe is getting already has history, so the first time in it is not t0, it's t0 + interval_start. You can get t0 from the last time minus interval_end, for example, or the first time minus interval_start (you can see how that happens in this function).
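The two recovery routes mentioned above can be sketched quickly. All values here are hypothetical (a made-up t0 and interval settings), chosen only to show that both derivations land on the same t0 when the sample's time axis spans [t0 + interval_start, t0 + interval_end].

```python
import pandas as pd

interval_start = pd.Timedelta(minutes=-60)  # 60 min of history (negative)
interval_end = pd.Timedelta(minutes=480)    # 8 h forecast horizon

# Hypothetical sample time axis covering history and forecast
t0_true = pd.Timestamp("2025-02-26 12:00")
times = pd.date_range(
    t0_true + interval_start, t0_true + interval_end, freq="30min"
)

# Route 1: last time minus interval_end
t0_from_last = times[-1] - interval_end
# Route 2: first time minus interval_start (subtracting a negative adds)
t0_from_first = times[0] - interval_start
```

Either route works; using the last timestamp is slightly safer if the sample's history could ever be truncated at the front.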

Author @zaryab-ali (Feb 26, 2025):
let me know if the following logic is ok:

```python
last_time = pd.Timestamp(sample["site_target_time_utc"][-1])
t0 = last_time - pd.Timedelta(interval_end)

valid_times = pd.date_range(
    start=t0 + pd.Timedelta(interval_start),
    end=t0 + pd.Timedelta(interval_end),
    freq=f"{time_resolution.astype(int)}min",
)
```

Contributor:

Sorry, I should've explained better how time windows in our samples work. When a forecast is made at time t0 (which we also sometimes refer to as the init time), it creates a forecast for x minutes forward, which is what interval_end governs (in that case, interval_end = x). To do that, the model also needs information on what the generation was just before, so we supply it with y minutes of history, which is what interval_start governs (interval_start = -y in this example). So any sample contains y + x minutes of generation data, some for history and some to check the forecast against at training time. When running inference, we are only interested in the [t0, t0 + interval_end] period, so these are the dates we need to extract from the sample.
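A sketch of the window described above: recover t0 from the end of the sample's time axis, then build only the forecast-side valid times, leaving the history out. The timestamps and interval values are hypothetical, and `last_time` stands in for `sample["site_target_time_utc"][-1]`.

```python
import pandas as pd

interval_start = pd.Timedelta(minutes=-60)  # y = 60 min of history
interval_end = pd.Timedelta(minutes=480)    # x = 480 min of forecast
resolution = pd.Timedelta(minutes=30)

# Stand-in for sample["site_target_time_utc"][-1]
last_time = pd.Timestamp("2025-02-26 20:00")
t0 = last_time - interval_end  # 2025-02-26 12:00

# Forecast steps strictly after t0, up to and including t0 + interval_end;
# starting at t0 + interval_start would wrongly include the history window
valid_times = pd.date_range(
    start=t0 + resolution, end=t0 + interval_end, freq=resolution
)
```

With these numbers the range runs from 12:30 to 20:00 in 30-minute steps, i.e. x / resolution = 16 forecast timestamps and none of the 60 minutes of history.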

)

# Get capacity for this site
@@ -280,7 +288,7 @@ def main(config: DictConfig):
model = model.eval().to(device)

# Create object to make predictions
-    model_pipe = ModelPipe(model, ds_site)
+    model_pipe = ModelPipe(model, ds_site, config.datamodule.configuration)

# Loop through the samples
pbar = tqdm(total=len(dataset))