test for once and 1pace eval_ways

OuyangWenyu · OuyangWenyu · commit cab2e2ac1f73 · 2025-04-21T17:23:03.000+08:00
diff --git a/torchhydro/configs/config.py b/torchhydro/configs/config.py
@@ -1269,6 +1269,8 @@ def update_cfg(cfg_file, new_args):
         cfg_file["training_cfgs"]["lr_scheduler"] = new_args.lr_scheduler
     if new_args.valid_batch_mode is not None:
         cfg_file["training_cfgs"]["valid_batch_mode"] = new_args.valid_batch_mode
+    if new_args.evaluator is not None:
+        cfg_file["evaluation_cfgs"]["evaluator"] = new_args.evaluator
     # print("the updated config:\n", json.dumps(cfg_file, indent=4, ensure_ascii=False))
 
 
diff --git a/torchhydro/datasets/data_sets.py b/torchhydro/datasets/data_sets.py
@@ -654,6 +654,7 @@ def _create_lookup_table(self):
         for basin in tqdm(range(basin_coordinates), file=sys.stdout, disable=False):
             if not self.train_mode:
                 # we don't need to ignore those with full nan in target vars for prediction without loss calculation
+                # all samples should be included so that we can recover results to specified basins easily
                 lookup.extend(
                     (basin, f)
                     for f in range(warmup_length, max_time_length - rho - horizon + 1)
diff --git a/torchhydro/trainers/train_utils.py b/torchhydro/trainers/train_utils.py
@@ -13,7 +13,6 @@
 import os
 import re
 import shutil
-import dask
 from functools import reduce
 from pathlib import Path
 import pandas as pd
@@ -280,6 +279,9 @@ def get_evaluation(
             )
         else:
             # TODO: need more test
+            raise NotImplementedError(
+                "we only support the case that the stride is equal to 1 now, others need to be implemented"
+            )
             obss_xr = _rolling_once_evaluate(
                 (basin_num, horizon, nf),
                 target_scaler.rho,
@@ -297,17 +299,14 @@ def get_evaluation(
                 output.reshape(batch_size, horizon, nf),
             )
     elif evaluator["eval_way"] == "1pace":
-        # TODO: to be implemented
-        # in this case, you should set calc_metrics = False in the evaluation config or use BasinBatchSampler in your data config
-        # baceuse we need to calculate the metrics for each time step
-        # but we have multi-outputs for each time step in this case
-        o = output[:, length + prec, :].reshape(basin_num, batch_size, len(target_col))
-        l = labels[:, length + prec, :].reshape(basin_num, batch_size, len(target_col))
-        valdataset = valorte_data_loader.dataset
-        preds_xr = valdataset.denormalize(output)
-        obss_xr = valdataset.denormalize(labels)
-        obs = obss_xr[col].to_numpy()
-        pred = preds_xr[col].to_numpy()
+        pace_idx = evaluator["pace_idx"]
+        # for 1pace with pace_idx meaning which value of output was chosen to show
+        # 1st, we need to transpose data to 4-dim to show the whole data
+        pred = _recover_samples_to_basin(output, valorte_data_loader, pace_idx)
+        obs = _recover_samples_to_basin(labels, valorte_data_loader, pace_idx)
+        valte_dataset = valorte_data_loader.dataset
+        preds_xr = valte_dataset.denormalize(pred)
+        obss_xr = valte_dataset.denormalize(obs)
     elif evaluator["eval_way"] == "rolling":
         # TODO: to be implemented
         raise NotImplementedError(
@@ -318,6 +317,46 @@ def get_evaluation(
     return obss_xr, preds_xr
 
 
+def _recover_samples_to_basin(arr_3d, valorte_data_loader, pace_idx):
+    """Reorganize the 3D prediction results by basin
+
+    Parameters
+    ----------
+    arr_3d : np.ndarray
+        A 3D prediction array with the shape (total number of samples, number of time steps, number of features).
+    valorte_data_loader: DataLoader
+        The corresponding data loader used to obtain the basin-time index mapping.
+    pace_idx: int
+        Which time step was chosen to show.
+
+    Returns
+        -------
+        np.ndarray
+            The reorganized 3D array with the shape (number of basins, length of time, number of features).
+    """
+    dataset = valorte_data_loader.dataset
+    basin_num = len(dataset.t_s_dict["sites_id"])
+    nt = dataset.nt
+    rho = dataset.rho
+    warmup_len = dataset.warmup_length
+    horizon = dataset.horizon
+    nf = dataset.noutputvar
+
+    basin_array = np.full((basin_num, nt, nf), np.nan)
+
+    for sample_idx in range(arr_3d.shape[0]):
+        # Get the basin and start time index corresponding to this sample
+        basin, start_time = dataset.lookup_table[sample_idx]
+        # Take the value at the last time step of this sample (at the position of rho + horizon)
+        value = arr_3d[sample_idx, pace_idx, :]
+        # Calculate the time position in the result array
+        result_time_idx = start_time + warmup_len + rho + horizon + pace_idx
+        # Fill in the corresponding position
+        basin_array[basin, result_time_idx, :] = value
+
+    return basin_array
+
+
 def evaluate_validation(
     validation_data_loader,
     output,