SimonBlanke · himelds · Apr 22, 2026 · Apr 25, 2026 · Apr 25, 2026 · Apr 25, 2026
diff --git a/...rfaces/test_functions/machine_learning/hyperparameter_optimization/timeseries/__init__.py b/...rfaces/test_functions/machine_learning/hyperparameter_optimization/timeseries/__init__.py
@@ -11,13 +11,15 @@
     ExpSmoothingForecasterFunction,
     GradientBoostingForecasterFunction,
     RandomForestForecasterFunction,
+    TimeSeriesPipelineForecasterFunction,
 )
 
 __all__ = [
     # Forecasting
     "GradientBoostingForecasterFunction",
     "RandomForestForecasterFunction",
     "ExpSmoothingForecasterFunction",
+    "TimeSeriesPipelineForecasterFunction",
     # Classification
     "RandomForestTSClassifierFunction",
     "KNNTSClassifierFunction",

diff --git a/...functions/machine_learning/hyperparameter_optimization/timeseries/forecasting/__init__.py b/...functions/machine_learning/hyperparameter_optimization/timeseries/forecasting/__init__.py
@@ -6,10 +6,12 @@
     ExpSmoothingForecasterFunction,
     GradientBoostingForecasterFunction,
     RandomForestForecasterFunction,
+    TimeSeriesPipelineForecasterFunction,
 )
 
 __all__ = [
     "GradientBoostingForecasterFunction",
     "RandomForestForecasterFunction",
     "ExpSmoothingForecasterFunction",
+    "TimeSeriesPipelineForecasterFunction",
 ]
diff --git a/...ne_learning/hyperparameter_optimization/timeseries/forecasting/test_functions/__init__.py b/...ne_learning/hyperparameter_optimization/timeseries/forecasting/test_functions/__init__.py
@@ -5,9 +5,10 @@
 from .exp_smoothing_forecaster import ExpSmoothingForecasterFunction
 from .gradient_boosting_forecaster import GradientBoostingForecasterFunction
 from .random_forest_forecaster import RandomForestForecasterFunction
-
+from .time_series_pipeline_forecaster import TimeSeriesPipelineForecasterFunction
 __all__ = [
     "GradientBoostingForecasterFunction",
     "RandomForestForecasterFunction",
     "ExpSmoothingForecasterFunction",
+    "TimeSeriesPipelineForecasterFunction",
 ]
diff --git a/...ter_optimization/timeseries/forecasting/test_functions/time_series_pipeline_forecaster.py b/...ter_optimization/timeseries/forecasting/test_functions/time_series_pipeline_forecaster.py
@@ -0,0 +1,215 @@
+import numpy as np
+from typing import Any, Dict, List, Optional
+from numpy.lib.stride_tricks import sliding_window_view
+
+# Surfaces library base class and data
+from .._base_forecasting import BaseForecasting
+from ..datasets import DATASETS
+
+
+def apply_time_series_features(
+    y: np.ndarray,
+    n_lags: int,
+    rolling_window: int,
+    differencing: int,
+) -> tuple[np.ndarray, np.ndarray]:
+    """
+    Build supervised learning features from a univariate time series.
+
+    Every target ``y[t]`` is paired with features computed only from
+    observations strictly before ``t``: the ``n_lags`` previous values and,
+    optionally, the mean and standard deviation of the ``rolling_window``
+    previous values.
+
+    Parameters
+    ----------
+    y            : 1-D array of observations (oldest -> newest)
+    n_lags       : number of lag features (0 = none)
+    rolling_window: window size for rolling mean/std (0 = skip)
+    differencing : order of differencing applied before feature extraction
+
+    Returns
+    -------
+    X        : 2-D array with one row per target; columns are lag 1..n_lags
+               followed by rolling mean and rolling std (when enabled)
+    y_target : 1-D array of targets, i.e. the (differenced) series with its
+               first ``max(n_lags, rolling_window)`` values dropped
+
+    Raises
+    ------
+    ValueError
+        If both ``n_lags`` and ``rolling_window`` are 0, or if the
+        (differenced) series is not longer than
+        ``max(n_lags, rolling_window)``.
+    """
+    if n_lags == 0 and rolling_window == 0:
+        raise ValueError("At least one of n_lags or rolling_window must be > 0.")
+
+    # Accept any array-like and guarantee that y_target is an ndarray.
+    y = np.asarray(y)
+    if differencing > 0:
+        y = np.diff(y, n=differencing)
+
+    n_samples = len(y)
+    # Number of leading observations that cannot be used as targets because
+    # their full feature history is not available.
+    offset = max(n_lags, rolling_window)
+
+    if n_samples <= offset:
+        raise ValueError(
+            f"Series length {n_samples} is too short for "
+            f"n_lags={n_lags} / rolling_window={rolling_window}."
+        )
+
+    features = []
+
+    # Lag features: column k holds y[t - k] for every target index t.
+    for lag in range(1, n_lags + 1):
+        features.append(y[offset - lag : n_samples - lag])
+
+    # Vectorised rolling statistics
+    if rolling_window > 0:
+        # windows[i] == y[i : i + rolling_window], so the window made of the
+        # values right before target t starts at t - rolling_window. The
+        # stop index drops the final window, which ends at the last
+        # observation and has no target after it; without it the rolling
+        # columns would be one row longer than the lag columns and targets.
+        windows = sliding_window_view(y, window_shape=rolling_window)
+        history = windows[offset - rolling_window : n_samples - rolling_window]
+        features.append(history.mean(axis=1))
+        # A sample std (ddof=1) of a single value is undefined (NaN); fall
+        # back to the population std, which is 0.0 for a one-value window.
+        ddof = 1 if rolling_window > 1 else 0
+        features.append(history.std(axis=1, ddof=ddof))
+
+    X = np.column_stack(features)
+    y_target = y[offset:]
+
+    return X, y_target
+
+
+class TimeSeriesPipelineForecasterFunction(BaseForecasting):
+    """
+    A hyperparameter-searchable time series forecasting pipeline.
+
+    Each evaluation builds lag / rolling features with
+    ``apply_time_series_features``, optionally scales them, fits the
+    selected scikit-learn regressor on the first ``train_size`` share of
+    the feature rows and scores it on the remaining rows.
+
+    The objective function returns negative MAE (higher = better).
+
+    Parameters
+    ----------
+    dataset    : key into ``DATASETS`` selecting the data loader
+    objective, modifiers, memory, collect_data, **kwargs :
+                 forwarded unchanged to ``BaseForecasting.__init__``
+    train_size : fraction of feature rows used for fitting (0 < x < 1)
+
+    Raises
+    ------
+    ValueError
+        If ``dataset`` is not a key of ``DATASETS`` or ``train_size`` is
+        outside the open interval (0, 1).
+    """
+
+    _name_ = "time_series_pipeline_forecaster"
+    _dependencies = {"ml": ["sklearn"]}
+
+    para_names = [
+        "n_lags",
+        "rolling_window",
+        "differencing",
+        "scaler",
+        "model",
+        "model__regularization"
+    ]
+
+    # Default candidate values per hyperparameter; these are the single
+    # source of truth used by _default_search_space().
+    n_lags_default = [3, 5, 7, 10, 14, 21]
+    rolling_window_default = [0, 3, 7, 14]
+    differencing_default = [0, 1, 2]
+    scaler_default = ["none", "standard", "minmax"]
+    model_default = ["ridge", "rf", "gb"]
+    model__regularization_default = [0.001, 0.01, 0.1, 1.0, 10.0]
+
+    def _default_search_space(self) -> Dict[str, List]:
+        """Define the default hyperparameter search space.
+
+        The space is built from the ``*_default`` class attributes so the
+        two cannot drift apart. Each value is a fresh list, so callers may
+        mutate the result without touching the class-level defaults.
+        """
+        return {
+            "n_lags": list(self.n_lags_default),
+            "rolling_window": list(self.rolling_window_default),
+            "differencing": list(self.differencing_default),
+            "scaler": list(self.scaler_default),
+            "model": list(self.model_default),
+            "model__regularization": list(self.model__regularization_default),
+        }
+
+    def _get_surrogate_params(self, params: Dict[str, Any]) -> Dict[str, Any]:
+        """Include fixed parameters for surrogate model support.
+
+        Returns a new dict containing ``params`` plus the instance's
+        ``dataset`` and ``train_size``; ``params`` itself is not modified.
+        """
+        return {
+            **params,
+            "dataset": self.dataset,
+            "train_size": self.train_size
+        }
+
+    def __init__(
+        self,
+        dataset: str = "airline",
+        objective: str = "maximize",
+        modifiers: Optional[List] = None,
+        memory: bool = False,
+        collect_data: bool = True,
+        train_size: float = 0.8,
+        **kwargs: Any,
+    ) -> None:
+        """Validate the configuration, store it, then initialise the base."""
+        if dataset not in DATASETS:
+            raise ValueError(f"Unknown dataset '{dataset}'.")
+        if not 0.0 < train_size < 1.0:
+            raise ValueError("train_size must be between 0 and 1 exclusive.")
+
+        # Instance state is assigned before the base-class initialiser runs.
+        self.dataset = dataset
+        self.train_size = train_size
+        self._dataset_loader = DATASETS[dataset]
+        # Filled on first use by _get_training_data().
+        self._cached_data: Optional[tuple] = None
+
+        super().__init__(
+            objective=objective,
+            modifiers=modifiers,
+            memory=memory,
+            collect_data=collect_data,
+            **kwargs,
+        )
+
+    def _get_training_data(self) -> tuple[np.ndarray, np.ndarray]:
+        """Load and cache the dataset.
+
+        The loader is called at most once per instance; later calls return
+        the cached result.
+        """
+        if self._cached_data is None:
+            self._cached_data = self._dataset_loader()
+        return self._cached_data
+
+    @staticmethod
+    def _build_scaler(scaler_type: str):
+        """Return an unfitted scaler for ``scaler_type`` (lazy sklearn import).
+
+        ``"standard"`` -> ``StandardScaler``, ``"minmax"`` -> ``MinMaxScaler``,
+        ``"none"`` -> ``None`` (no scaling).
+
+        Raises
+        ------
+        ValueError
+            For any other ``scaler_type``.
+        """
+        from sklearn.preprocessing import StandardScaler, MinMaxScaler
+        if scaler_type == "standard":
+            return StandardScaler()
+        if scaler_type == "minmax":
+            return MinMaxScaler()
+        if scaler_type == "none":
+            return None
+        raise ValueError(f"Unknown scaler type: {scaler_type!r}")
+
+    @staticmethod
+    def _build_model(model_type: str, reg: float):
+        """Construct a scikit-learn regressor.
+
+        ``reg`` is the single ``model__regularization`` value and is
+        interpreted differently per model:
+
+        * ``"ridge"`` - used directly as ``alpha``
+        * ``"rf"``    - truncated to an int (minimum 1) and used as
+          ``max_depth``
+        * ``"gb"``    - clipped to [1e-4, 1.0] and used as ``learning_rate``
+
+        Raises
+        ------
+        ValueError
+            For any other ``model_type``.
+        """
+        from sklearn.linear_model import Ridge
+        from sklearn.ensemble import (
+            RandomForestRegressor,
+            GradientBoostingRegressor
+        )
+
+        if model_type == "ridge":
+            return Ridge(alpha=reg)
+        if model_type == "rf":
+            return RandomForestRegressor(
+                n_estimators=100,
+                max_depth=max(1, int(reg)),
+                random_state=42,
+            )
+        if model_type == "gb":
+            return GradientBoostingRegressor(
+                n_estimators=100,
+                learning_rate=float(np.clip(reg, 1e-4, 1.0)),
+                random_state=42,
+            )
+        raise ValueError(f"Unknown model type: {model_type!r}")
+
+    def _ml_objective(self, params: Dict[str, Any]) -> float:
+        """Evaluate a single hyperparameter configuration.
+
+        Returns the negative mean absolute error on the held-out rows, or
+        ``-inf`` when features cannot be built for ``params`` or the
+        train/test split would leave one side empty.
+        """
+        from sklearn.metrics import mean_absolute_error
+
+        # Only the second element returned by the loader is used here.
+        _, y_raw = self._get_training_data()
+
+        try:
+            X, y = apply_time_series_features(
+                y_raw,
+                n_lags=params["n_lags"],
+                rolling_window=params["rolling_window"],
+                differencing=params["differencing"],
+            )
+        except ValueError:
+            # Infeasible configuration: report the worst possible score
+            # instead of aborting the search.
+            return -float("inf")
+
+        # Ordered split (no shuffling): leading rows train, trailing rows test.
+        split_idx = int(len(X) * self.train_size)
+        if split_idx == 0 or split_idx == len(X):
+            return -float("inf")
+
+        X_train, X_test = X[:split_idx], X[split_idx:]
+        y_train, y_test = y[:split_idx], y[split_idx:]
+
+        scaler = self._build_scaler(params["scaler"])
+        if scaler is not None:
+            # Fit on the training rows only, then reuse for the test rows.
+            X_train = scaler.fit_transform(X_train)
+            X_test = scaler.transform(X_test)
+
+        model = self._build_model(params["model"], params["model__regularization"])
+        model.fit(X_train, y_train)
+        mae = mean_absolute_error(y_test, model.predict(X_test))
+
+        return -mae
+
+    def __repr__(self) -> str:
+        """Return ``ClassName(dataset=..., train_size=...)``."""
+        return (
+            f"{self.__class__.__name__}("
+            f"dataset={self.dataset!r}, "
+            f"train_size={self.train_size!r})"
+        )
diff --git a/tests/full/suites/test_ml.py b/tests/full/suites/test_ml.py
@@ -413,3 +413,20 @@ def test_polynomial_feature_transformation(self, quick_ml_params):
 
         assert isinstance(result, (int, float))
         assert np.isfinite(result)
+
+@pytest.mark.ml
+class TestTimeSeriesFunctions:
+    """Checks for the time-series ML test functions."""
+
+    def test_time_series_pipeline_forecaster(self):
+        """A default pipeline forecaster yields a finite numeric score."""
+        # Imported at call time rather than at module import time.
+        from surfaces.test_functions.machine_learning.hyperparameter_optimization.timeseries.forecasting.test_functions.time_series_pipeline_forecaster import (
+            TimeSeriesPipelineForecasterFunction,
+        )
+
+        objective_fn = TimeSeriesPipelineForecasterFunction()
+        sample = get_sample_params(objective_fn)
+        score = objective_fn(sample)
+
+        assert isinstance(score, (int, float))
+        assert np.isfinite(score)