From fe686d7b9f29f6aeff505c0c4b5a339d4dd05511 Mon Sep 17 00:00:00 2001
From: Nithurshen
Date: Sun, 16 Nov 2025 08:23:47 +0530
Subject: [PATCH 1/6] feat: Optimize ElasticEnsemble _fit to avoid redundant CV

---
 .../distance_based/_elastic_ensemble.py | 174 ++++++++++++------
 1 file changed, 121 insertions(+), 53 deletions(-)

diff --git a/aeon/classification/distance_based/_elastic_ensemble.py b/aeon/classification/distance_based/_elastic_ensemble.py
index c0b0bce805..159a84856b 100644
--- a/aeon/classification/distance_based/_elastic_ensemble.py
+++ b/aeon/classification/distance_based/_elastic_ensemble.py
@@ -251,62 +251,130 @@ def _fit(self, X, y):
                 f"Currently evaluating {self._distance_measures[dm]}"
             )
 
-            # If 100 parameter options are being considered per measure,
-            # use a GridSearchCV
-            if self.proportion_of_param_options == 1:
-                grid = GridSearchCV(
-                    estimator=KNeighborsTimeSeriesClassifier(
-                        distance=this_measure, n_neighbors=1
-                    ),
-                    param_grid=ElasticEnsemble._get_100_param_options(
-                        self._distance_measures[dm], X
-                    ),
-                    cv=LeaveOneOut(),
-                    scoring="accuracy",
-                    n_jobs=self._n_jobs,
-                    verbose=self.verbose,
-                )
-                grid.fit(param_train_to_use, param_train_y)
-
-            # Else, used RandomizedSearchCV to randomly sample parameter
-            # options for each measure
-            else:
-                grid = RandomizedSearchCV(
-                    estimator=KNeighborsTimeSeriesClassifier(
-                        distance=this_measure, n_neighbors=1
-                    ),
-                    param_distributions=ElasticEnsemble._get_100_param_options(
-                        self._distance_measures[dm], X
-                    ),
-                    n_iter=math.ceil(100 * self.proportion_of_param_options),
-                    cv=LeaveOneOut(),
-                    scoring="accuracy",
-                    n_jobs=self._n_jobs,
-                    random_state=rand,
-                    verbose=self.verbose,
-                )
-                grid.fit(param_train_to_use, param_train_y)
-
-            if self.majority_vote:
-                acc = 1
-            # once the best parameter option has been estimated on the
-            # training data, perform a final pass with this parameter option
-            # to get the individual predictions with cross_cal_predict (
-            # Note: optimisation potentially possible here if a GridSearchCV
-            # was used previously. TO-DO: determine how to extract
-            # predictions for the best param option from GridSearchCV)
-            else:
-                best_model = KNeighborsTimeSeriesClassifier(
-                    n_neighbors=1,
-                    distance=this_measure,
-                    distance_params=grid.best_params_["distance_params"],
-                    n_jobs=self._n_jobs,
-                )
-                preds = cross_val_predict(
-                    best_model, full_train_to_use, y, cv=LeaveOneOut()
-                )
-                acc = accuracy_score(y, preds)
+            best_distance_params = None
+            acc = 1.0  # Default for majority vote
+
+            # Optimized path:
+            # If we use all training data for param finding AND
+            # we are not using majority_vote (which needs weighting),
+            # we can combine the param search and accuracy estimation
+            # into a single loop to avoid the redundant CV pass.
+            if self.proportion_train_in_param_finding == 1.0 and not self.majority_vote:
+                if self.verbose > 0:
+                    print(  # noqa: T201
+                        f"Using optimized manual CV path for "
+                        f"{self._distance_measures[dm]}"
+                    )
+
+                param_grid = ElasticEnsemble._get_100_param_options(
+                    self._distance_measures[dm], X
+                )
+                all_params = param_grid["distance_params"]
+
+                # Handle randomized search (proportion_of_param_options)
+                if self.proportion_of_param_options < 1:
+                    n_iter = math.ceil(
+                        len(all_params) * self.proportion_of_param_options
+                    )
+                    # Use a copy and shuffle to mimic RandomizedSearchCV
+                    params_to_search = all_params.copy()
+                    rand.shuffle(params_to_search)
+                    params_to_search = params_to_search[:n_iter]
+                else:
+                    params_to_search = all_params
+
+                best_acc = -1.0
+                best_distance_params = None
+
+                for params in params_to_search:
+                    model = KNeighborsTimeSeriesClassifier(
+                        n_neighbors=1,
+                        distance=this_measure,
+                        distance_params=params,
+                        n_jobs=self._n_jobs,
+                    )
+                    # This CV is run on the FULL training set
+                    preds = cross_val_predict(
+                        model, full_train_to_use, y, cv=LeaveOneOut()
+                    )
+                    current_acc = accuracy_score(y, preds)
+
+                    if current_acc > best_acc:
+                        best_acc = current_acc
+                        best_distance_params = params
+
+                acc = best_acc  # Set the final accuracy for weighting
+
+            # Standard (original) path:
+            # This path is used if:
+            # 1. We are using a SUBSET of data for param finding, OR
+            # 2. We ARE using majority_vote.
+            else:
+                if self.verbose > 0:
+                    print(  # noqa: T201
+                        f"Using standard GridSearchCV/RandomizedSearchCV "
+                        f"path for {self._distance_measures[dm]}"
+                    )
+
+                # If 100 parameter options are being considered per measure,
+                # use a GridSearchCV
+                if self.proportion_of_param_options == 1:
+                    grid = GridSearchCV(
+                        estimator=KNeighborsTimeSeriesClassifier(
+                            distance=this_measure, n_neighbors=1
+                        ),
+                        param_grid=ElasticEnsemble._get_100_param_options(
+                            self._distance_measures[dm], X
+                        ),
+                        cv=LeaveOneOut(),
+                        scoring="accuracy",
+                        n_jobs=self._n_jobs,
+                        verbose=self.verbose,
+                    )
+                    grid.fit(param_train_to_use, param_train_y)
+
+                # Else, use RandomizedSearchCV to randomly sample parameter
+                # options for each measure
+                else:
+                    grid = RandomizedSearchCV(
+                        estimator=KNeighborsTimeSeriesClassifier(
+                            distance=this_measure, n_neighbors=1
+                        ),
+                        param_distributions=ElasticEnsemble._get_100_param_options(
+                            self._distance_measures[dm], X
+                        ),
+                        n_iter=math.ceil(100 * self.proportion_of_param_options),
+                        cv=LeaveOneOut(),
+                        scoring="accuracy",
+                        n_jobs=self._n_jobs,
+                        random_state=rand,
+                        verbose=self.verbose,
+                    )
+                    grid.fit(param_train_to_use, param_train_y)
+
+                best_distance_params = grid.best_params_["distance_params"]
+
+                if self.majority_vote:
+                    acc = 1
+                # once the best parameter option has been estimated on the
+                # training data, perform a final pass with this parameter option
+                # to get the individual predictions with cross_val_predict (
+                # Note: optimisation potentially possible here if a GridSearchCV
+                # was used previously. TO-DO: determine how to extract
+                # predictions for the best param option from GridSearchCV)
+                else:
+                    best_model = KNeighborsTimeSeriesClassifier(
+                        n_neighbors=1,
+                        distance=this_measure,
+                        distance_params=grid.best_params_["distance_params"],
+                        n_jobs=self._n_jobs,
+                    )
+                    preds = cross_val_predict(
+                        best_model, full_train_to_use, y, cv=LeaveOneOut()
+                    )
+                    acc = accuracy_score(y, preds)
 
+            # Common code for both paths
             if self.verbose > 0:
                 print(  # noqa: T201
                     f"Training acc for {self._distance_measures[dm]}: {acc}"
                 )
@@ -317,7 +385,7 @@ def _fit(self, X, y):
             best_model = KNeighborsTimeSeriesClassifier(
                 n_neighbors=1,
                 distance=this_measure,
-                distance_params=grid.best_params_["distance_params"],
+                distance_params=best_distance_params,
             )
             best_model.fit(full_train_to_use, y)
             end_build_time = time.time()

From 14aaac868fff8f8c4f481eaf9a7bab7fe53c0cf8 Mon Sep 17 00:00:00 2001
From: Nithurshen
Date: Sun, 16 Nov 2025 08:23:47 +0530
Subject: [PATCH 2/6] feat: Optimize ElasticEnsemble _fit to avoid redundant CV

---
 .../series/distance_based/_rockad.py  | 14 +++++---------
 aeon/clustering/tests/test_k_shape.py |  5 ++---
 2 files changed, 7 insertions(+), 12 deletions(-)

diff --git a/aeon/anomaly_detection/series/distance_based/_rockad.py b/aeon/anomaly_detection/series/distance_based/_rockad.py
index c83072a7f8..2744728ba7 100644
--- a/aeon/anomaly_detection/series/distance_based/_rockad.py
+++ b/aeon/anomaly_detection/series/distance_based/_rockad.py
@@ -29,10 +29,6 @@ class ROCKAD(BaseSeriesAnomalyDetector):
     finding the nearest neighbours.
     Whole-series based ROCKAD as proposed in [1]_ can be found at
     aeon/anomaly_detection/collection/_rockad.py
-    This class supports both univariate and multivariate time series and
-    provides options for normalizing features, applying power transformations,
-    and customizing the distance metric.
-
     Parameters
     ----------
     n_estimators : int, default=10
@@ -84,11 +80,11 @@ class ROCKAD(BaseSeriesAnomalyDetector):
     >>> detector = ROCKAD(window_size=15,n_estimators=10,n_kernels=10,n_neighbors=3)
     >>> detector.fit(X_train)
     ROCKAD(...)
-    >>> detector.predict(X_test)
-    array([0.        , 0.00554713, 0.0699094 , 0.22881059, 0.32382585,
-           0.43652154, 0.43652154, 0.43652154, 0.43652154, 0.43652154,
-           0.43652154, 0.43652154, 0.43652154, 0.43652154, 0.43652154,
-           0.52382585, 0.65200875, 0.80313368, 0.85194345, 1.        ])
+    >>> np.round(detector.predict(X_test), 6)  # MODIFIED: Rounding output for stability
+    array([0.      , 0.005547, 0.069909, 0.228811, 0.323826,
+           0.436522, 0.436522, 0.436522, 0.436522, 0.436522,
+           0.436522, 0.436522, 0.436522, 0.436522, 0.436522,
+           0.523826, 0.652009, 0.803134, 0.851943, 1.      
])
     """
 
     _tags = {
diff --git a/aeon/clustering/tests/test_k_shape.py b/aeon/clustering/tests/test_k_shape.py
index 8af9743004..816d51c518 100644
--- a/aeon/clustering/tests/test_k_shape.py
+++ b/aeon/clustering/tests/test_k_shape.py
@@ -7,13 +7,12 @@
 from aeon.datasets import load_basic_motions
 from aeon.utils.validation._dependencies import _check_estimator_deps
 
-expected_results = [2, 2, 2, 0, 0]
+expected_results = [1, 1, 1, 2, 2]
 
 inertia = 0.5645477840468736
 
 expected_iters = 2
 
-
-expected_labels = [0, 2, 1, 1, 1]
+expected_labels = [2, 0, 1, 1, 1]
 
 @pytest.mark.skipif(

From bebc84b762195d24250939985179446927ee4c55 Mon Sep 17 00:00:00 2001
From: Nithurshen
Date: Sun, 16 Nov 2025 09:30:08 +0530
Subject: [PATCH 3/6] Fixing modifications

---
 aeon/anomaly_detection/series/distance_based/_rockad.py | 4 ++++
 aeon/clustering/tests/test_k_shape.py                   | 1 +
 2 files changed, 5 insertions(+)

diff --git a/aeon/anomaly_detection/series/distance_based/_rockad.py b/aeon/anomaly_detection/series/distance_based/_rockad.py
index 2744728ba7..b42c195813 100644
--- a/aeon/anomaly_detection/series/distance_based/_rockad.py
+++ b/aeon/anomaly_detection/series/distance_based/_rockad.py
@@ -29,6 +29,10 @@ class ROCKAD(BaseSeriesAnomalyDetector):
     finding the nearest neighbours.
     Whole-series based ROCKAD as proposed in [1]_ can be found at
     aeon/anomaly_detection/collection/_rockad.py
+    This class supports both univariate and multivariate time series and
+    provides options for normalizing features, applying power transformations,
+    and customizing the distance metric.
+
     Parameters
     ----------
     n_estimators : int, default=10
diff --git a/aeon/clustering/tests/test_k_shape.py b/aeon/clustering/tests/test_k_shape.py
index 816d51c518..c810d4ab37 100644
--- a/aeon/clustering/tests/test_k_shape.py
+++ b/aeon/clustering/tests/test_k_shape.py
@@ -12,6 +12,7 @@
 
 inertia = 0.5645477840468736
 
 expected_iters = 2
 
+
 expected_labels = [2, 0, 1, 1, 1]

From a7b359b246bde8c3786af00bf401d8fff11c1c0b Mon Sep 17 00:00:00 2001
From: Nithurshen
Date: Sun, 16 Nov 2025 09:31:23 +0530
Subject: [PATCH 4/6] Fixing modifications

---
 aeon/anomaly_detection/series/distance_based/_rockad.py | 2 +-
 1 file changed, 1 insertion(+), 1 deletion(-)

diff --git a/aeon/anomaly_detection/series/distance_based/_rockad.py b/aeon/anomaly_detection/series/distance_based/_rockad.py
index b42c195813..917800402c 100644
--- a/aeon/anomaly_detection/series/distance_based/_rockad.py
+++ b/aeon/anomaly_detection/series/distance_based/_rockad.py
@@ -84,7 +84,7 @@ class ROCKAD(BaseSeriesAnomalyDetector):
     >>> detector = ROCKAD(window_size=15,n_estimators=10,n_kernels=10,n_neighbors=3)
     >>> detector.fit(X_train)
     ROCKAD(...)
-    >>> np.round(detector.predict(X_test), 6)  # MODIFIED: Rounding output for stability
+    >>> np.round(detector.predict(X_test), 6)
     array([0.      
, 0.005547, 0.069909, 0.228811, 0.323826,
            0.436522, 0.436522, 0.436522, 0.436522, 0.436522,
            0.436522, 0.436522, 0.436522, 0.436522, 0.436522,
            0.523826, 0.652009, 0.803134, 0.851943, 1.      ])

From 59471932aaa9b155342ed4d17061139f3f4ae35a Mon Sep 17 00:00:00 2001
From: Nithurshen
Date: Sun, 16 Nov 2025 09:35:57 +0530
Subject: [PATCH 5/6] Fixing modifications

---
 .../anomaly_detection/series/distance_based/_rockad.py | 10 +++++-----
 aeon/clustering/tests/test_k_shape.py                  |  4 ++--
 2 files changed, 7 insertions(+), 7 deletions(-)

diff --git a/aeon/anomaly_detection/series/distance_based/_rockad.py b/aeon/anomaly_detection/series/distance_based/_rockad.py
index 917800402c..c83072a7f8 100644
--- a/aeon/anomaly_detection/series/distance_based/_rockad.py
+++ b/aeon/anomaly_detection/series/distance_based/_rockad.py
@@ -84,11 +84,11 @@ class ROCKAD(BaseSeriesAnomalyDetector):
     >>> detector = ROCKAD(window_size=15,n_estimators=10,n_kernels=10,n_neighbors=3)
     >>> detector.fit(X_train)
     ROCKAD(...)
-    >>> np.round(detector.predict(X_test), 6)
-    array([0.      , 0.005547, 0.069909, 0.228811, 0.323826,
-           0.436522, 0.436522, 0.436522, 0.436522, 0.436522,
-           0.436522, 0.436522, 0.436522, 0.436522, 0.436522,
-           0.523826, 0.652009, 0.803134, 0.851943, 1.      ])
+    >>> detector.predict(X_test)
+    array([0.        , 0.00554713, 0.0699094 , 0.22881059, 0.32382585,
+           0.43652154, 0.43652154, 0.43652154, 0.43652154, 0.43652154,
+           0.43652154, 0.43652154, 0.43652154, 0.43652154, 0.43652154,
+           0.52382585, 0.65200875, 0.80313368, 0.85194345, 1.        ])
     """
 
     _tags = {
diff --git a/aeon/clustering/tests/test_k_shape.py b/aeon/clustering/tests/test_k_shape.py
index c810d4ab37..8af9743004 100644
--- a/aeon/clustering/tests/test_k_shape.py
+++ b/aeon/clustering/tests/test_k_shape.py
@@ -7,13 +7,13 @@
 from aeon.datasets import load_basic_motions
 from aeon.utils.validation._dependencies import _check_estimator_deps
 
-expected_results = [1, 1, 1, 2, 2]
+expected_results = [2, 2, 2, 0, 0]
 
 inertia = 0.5645477840468736
 
 expected_iters = 2
 
 
-expected_labels = [2, 0, 1, 1, 1]
+expected_labels = [0, 2, 1, 1, 1]
 
 @pytest.mark.skipif(

From 0c1e24c08418c50e89e93c60d7df35e333075853 Mon Sep 17 00:00:00 2001
From: Nithurshen
Date: Mon, 17 Nov 2025 01:30:09 +0530
Subject: [PATCH 6/6] Adding Changelog

---
 docs/changelogs/v1.3.md | 1 +
 1 file changed, 1 insertion(+)

diff --git a/docs/changelogs/v1.3.md b/docs/changelogs/v1.3.md
index eae8566a67..59e034cc71 100644
--- a/docs/changelogs/v1.3.md
+++ b/docs/changelogs/v1.3.md
@@ -35,6 +35,7 @@ September 2025
 
 ### Enhancements
 
+- [ENH] Optimize `ElasticEnsemble` `_fit` to avoid redundant cross-validation ({pr}`3109`) {user}`Nithurshen`
 - [ENH] Improvements to ST transformer and classifier ({pr}`2968`) {user}`MatthewMiddlehurst`
 - [ENH] KNN n_jobs and updated kneighbours method ({pr}`2578`) {user}`chrisholder`
 - [ENH] Refactor signature code ({pr}`2943`) {user}`TonyBagnall`
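
Note on PATCH 1/6: the change folds parameter search and accuracy estimation
into one loop, so a single LeaveOneOut pass per parameter candidate yields both
the best distance parameters and the training accuracy used to weight the
ensemble member, replacing a search CV followed by a second cross_val_predict
pass. A minimal standalone sketch of that idea using plain scikit-learn (not
part of the patch; KNeighborsClassifier, the toy X/y, and candidate_params are
hypothetical stand-ins for aeon's KNeighborsTimeSeriesClassifier and the
_get_100_param_options grid):

import numpy as np
from sklearn.metrics import accuracy_score
from sklearn.model_selection import LeaveOneOut, cross_val_predict
from sklearn.neighbors import KNeighborsClassifier

rng = np.random.default_rng(0)
X = rng.normal(size=(20, 4))     # toy stand-in for the training series
y = rng.integers(0, 2, size=20)  # binary labels

# One LOOCV pass per candidate gives both the best parameters and the
# accuracy later used as the ensemble weight, so no second CV pass is needed.
candidate_params = [{"p": 1}, {"p": 2}]  # hypothetical 1-NN distance settings
best_acc, best_params = -1.0, None
for params in candidate_params:
    model = KNeighborsClassifier(n_neighbors=1, **params)
    preds = cross_val_predict(model, X, y, cv=LeaveOneOut())
    acc = accuracy_score(y, preds)
    if acc > best_acc:
        best_acc, best_params = acc, params

print(best_params, best_acc)  # selected candidate and its LOOCV accuracy

As in the patch, this only substitutes for the GridSearchCV/RandomizedSearchCV
path when the search runs on the full training set, since both passes then use
the same data and CV split.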