started working on adaptation

aeon-toolkit · Jul 12, 2024 · 43993de · 43993de
1 parent 3a01b53
commit 43993de
Show file tree

Hide file tree

Showing 7 changed files with 268 additions and 11 deletions.
diff --git a/aeon/clustering/averaging/__init__.py b/aeon/clustering/averaging/__init__.py
@@ -5,9 +5,11 @@
     "mean_average",
     "petitjean_barycenter_average",
     "subgradient_barycenter_average",
+    "holdit_barycenter_average",
     "VALID_BA_METRICS",
 ]
 from aeon.clustering.averaging._averaging import mean_average
+from aeon.clustering.averaging._ba_holdit import holdit_barycenter_average
 from aeon.clustering.averaging._ba_petitjean import petitjean_barycenter_average
 from aeon.clustering.averaging._ba_subgradient import subgradient_barycenter_average
 from aeon.clustering.averaging._ba_utils import VALID_BA_METRICS

diff --git a/aeon/clustering/averaging/_ba_holdit.py b/aeon/clustering/averaging/_ba_holdit.py
@@ -0,0 +1,229 @@
+from typing import Optional, Union
+
+import numpy as np
+from numba import njit
+from sklearn.utils import check_random_state
+
+from aeon.clustering.averaging._ba_utils import (
+    _get_alignment_path,
+    _get_init_barycenter,
+)
+
+
+def holdit_barycenter_average(
+    X: np.ndarray,
+    distance: str = "dtw",
+    max_iters: int = 30,
+    tol=1e-5,
+    init_barycenter: Union[np.ndarray, str] = "mean",
+    initial_step_size: float = 0.05,
+    final_step_size: float = 0.005,
+    weights: Optional[np.ndarray] = None,
+    precomputed_medoids_pairwise_distance: Optional[np.ndarray] = None,
+    verbose: bool = False,
+    random_state: Optional[int] = None,
+    num_ts_to_use_percentage: float = 0.5,
+    **kwargs,
+) -> np.ndarray:
+    """Compute the stochastic subgradient barycenter average of time series.
+
+    Parameters
+    ----------
+    X: np.ndarray, of shape (n_cases, n_channels, n_timepoints) or
+            (n_cases, n_timepoints)
+        A collection of time series instances to take the average from.
+    distance: str, default='dtw'
+        String defining the distance to use for averaging. Distance to
+        compute similarity between time series. A list of valid strings for metrics
+        can be found in the documentation form
+        :func:`aeon.distances.get_distance_function`.
+    max_iters: int, default=30
+        Maximum number iterations for dba to update over.
+    tol : float (default: 1e-5)
+        Tolerance to use for early stopping: if the decrease in cost is lower
+        than this value, the Expectation-Maximization procedure stops.
+    init_barycenter: np.ndarray or, default=None
+        The initial barycenter to use for the minimisation. If a np.ndarray is provided
+        it must be of shape ``(n_channels, n_timepoints)``. If a str is provided it must
+        be one of the following: ['mean', 'medoids', 'random'].
+    initial_step_size : float (default: 0.05)
+        Initial step size for the subgradient descent algorithm.
+        Default value is suggested by [2]_.
+    final_step_size : float (default: 0.005)
+        Final step size for the subgradient descent algorithm.
+        Default value is suggested by [2]_.
+    weights: Optional[np.ndarray] of shape (n_cases,), default=None
+        The weights associated to each time series instance, if None a weight
+        of 1 will be associated to each instance.
+    precomputed_medoids_pairwise_distance: np.ndarray (of shape (len(X), len(X)),
+                default=None
+        Precomputed medoids pairwise.
+    verbose: bool, default=False
+        Boolean that controls the verbosity.
+    random_state: int or None, default=None
+        Random state to use for the barycenter averaging.
+    num_ts_to_use_percentage: float, default=0.5
+        Percentage of time series to use in each iteration.
+    **kwargs
+        Keyword arguments to pass to the distance metric.
+
+    Returns
+    -------
+    np.ndarray of shape (n_channels, n_timepoints)
+        Time series that is the average of the collection of instances provided.
+
+    References
+    ----------
+    .. [1] F. Petitjean, A. Ketterlin & P. Gancarski. A global averaging method
+       for dynamic time warping, with applications to clustering. Pattern
+       Recognition, Elsevier, 2011, Vol. 44, Num. 3, pp. 678-693
+    .. [2] D. Schultz and B. Jain. Nonsmooth Analysis and Subgradient Methods
+       for Averaging in Dynamic Time Warping Spaces.
+       Pattern Recognition, 74, 340-358.
+    """
+    if len(X) <= 1:
+        return X
+
+    if X.ndim == 3:
+        _X = X
+    elif X.ndim == 2:
+        _X = X.reshape((X.shape[0], 1, X.shape[1]))
+    else:
+        raise ValueError("X must be a 2D or 3D array")
+
+    if weights is None:
+        weights = np.ones(len(_X))
+
+    barycenter = _get_init_barycenter(
+        _X,
+        init_barycenter,
+        distance,
+        precomputed_medoids_pairwise_distance,
+        random_state,
+        **kwargs,
+    )
+
+    random_state = check_random_state(random_state)
+
+    cost_prev = np.inf
+    if distance == "wdtw" or distance == "wddtw":
+        if "g" not in kwargs:
+            kwargs["g"] = 0.05
+
+    current_step_size = initial_step_size
+    X_size = _X.shape[0]
+
+    num_ts_to_use = min(X_size, max(10, int(num_ts_to_use_percentage * X_size)))
+
+    for i in range(max_iters):
+        shuffled_indices = random_state.permutation(X_size)[:num_ts_to_use]
+        barycenter, cost, current_step_size = _ba_one_iter_subgradient(
+            barycenter,
+            _X,
+            shuffled_indices,
+            distance,
+            initial_step_size,
+            final_step_size,
+            current_step_size,
+            weights,
+            i,
+            **kwargs,
+        )
+        if abs(cost_prev - cost) < tol:
+            break
+        elif cost_prev < cost:
+            break
+        else:
+            cost_prev = cost
+
+        if verbose:
+            print(f"[DBA] epoch {i}, cost {cost}")  # noqa: T001, T201
+    return barycenter
+
+
+@njit(cache=True, fastmath=True)
+def _ba_one_iter_subgradient(
+    barycenter: np.ndarray,
+    X: np.ndarray,
+    shuffled_indices: np.ndarray,
+    distance: str = "dtw",
+    initial_step_size: float = 0.05,
+    final_step_size: float = 0.005,
+    current_step_size: float = 0.05,
+    weights: Optional[np.ndarray] = None,
+    iteration: int = 0,
+    window: Union[float, None] = None,
+    g: float = 0.0,
+    epsilon: Union[float, None] = None,
+    nu: float = 0.001,
+    lmbda: float = 1.0,
+    independent: bool = True,
+    c: float = 1.0,
+    descriptor: str = "identity",
+    reach: int = 30,
+    warp_penalty: float = 1.0,
+    transformation_precomputed: bool = False,
+    transformed_x: Optional[np.ndarray] = None,
+    transformed_y: Optional[np.ndarray] = None,
+):
+
+    X_size, X_dims, X_timepoints = X.shape
+    cost = 0.0
+    # Only update current_step_size on the first iteration
+    step_size_reduction = 0.0
+    if iteration == 0:
+        step_size_reduction = (initial_step_size - final_step_size) / X_size
+
+    barycenter_copy = np.copy(barycenter)
+
+    for i in shuffled_indices:
+        curr_ts = X[i]
+        curr_alignment, curr_cost = _get_alignment_path(
+            barycenter_copy,
+            X[i],
+            distance,
+            window,
+            g,
+            epsilon,
+            nu,
+            lmbda,
+            independent,
+            c,
+            descriptor,
+            reach,
+            warp_penalty,
+            transformation_precomputed,
+            transformed_x,
+            transformed_y,
+        )
+
+        new_ba = np.zeros((X_dims, X_timepoints))
+        for j, k in curr_alignment:
+            new_ba[:, k] += barycenter_copy[:, k] - curr_ts[:, j]
+
+        barycenter_copy -= (2.0 * current_step_size) * new_ba * weights[i]
+
+        current_step_size -= step_size_reduction
+        cost = curr_cost * weights[i]
+    return barycenter_copy, cost, current_step_size
+
+
+if __name__ == "__main__":
+    from aeon.clustering.averaging import elastic_barycenter_average
+    from aeon.testing.data_generation import make_example_3d_numpy
+
+    X_train = make_example_3d_numpy(4, 2, 10, random_state=1, return_y=False)
+    distance = "dtw"
+
+    average_ts = elastic_barycenter_average(
+        X_train, distance=distance, window=0.2, independent=False
+    )
+
+    subgradient_ts = elastic_barycenter_average(
+        X_train, distance=distance, window=0.2, independent=False, method="subgradient"
+    )
+
+    holdit_ts = elastic_barycenter_average(
+        X_train, distance=distance, window=0.2, independent=False, method="holdit"
+    )
+    stop = ""
diff --git a/aeon/clustering/averaging/_barycenter_averaging.py b/aeon/clustering/averaging/_barycenter_averaging.py
@@ -4,6 +4,7 @@
 
 import numpy as np
 
+from aeon.clustering.averaging._ba_holdit import holdit_barycenter_average
 from aeon.clustering.averaging._ba_petitjean import petitjean_barycenter_average
 from aeon.clustering.averaging._ba_subgradient import subgradient_barycenter_average
 
@@ -21,6 +22,7 @@ def elastic_barycenter_average(
     precomputed_medoids_pairwise_distance: Optional[np.ndarray] = None,
     verbose: bool = False,
     random_state: Optional[int] = None,
+    holdit_num_ts_to_use_percentage: float = 0.5,
     **kwargs,
 ) -> np.ndarray:
     """Compute the barycenter average of time series using a elastic distance.
@@ -128,6 +130,22 @@ def elastic_barycenter_average(
             random_state=random_state,
             **kwargs,
         )
+    elif method == "holdit":
+        return holdit_barycenter_average(
+            X,
+            distance=distance,
+            max_iters=max_iters,
+            tol=tol,
+            init_barycenter=init_barycenter,
+            initial_step_size=initial_step_size,
+            final_step_size=final_step_size,
+            weights=weights,
+            precomputed_medoids_pairwise_distance=precomputed_medoids_pairwise_distance,
+            verbose=verbose,
+            random_state=random_state,
+            num_ts_to_use_percentage=holdit_num_ts_to_use_percentage,
+            **kwargs,
+        )
     else:
         raise ValueError(
             f"Invalid method: {method}. Please use one of the following: "

diff --git a/aeon/clustering/averaging/tests/test_dba.py b/aeon/clustering/averaging/tests/test_dba.py
@@ -218,10 +218,16 @@ def test_elastic_dba_variations(distance):
         X_train, distance=distance, window=0.2, independent=False, method="subgradient"
     )
 
+    holdit_ts = elastic_barycenter_average(
+        X_train, distance=distance, window=0.2, independent=False, method="holdit"
+    )
+
     assert isinstance(average_ts, np.ndarray)
     assert isinstance(subgradient_ts, np.ndarray)
+    assert isinstance(holdit_ts, np.ndarray)
     assert average_ts.shape == X_train[0].shape
     assert subgradient_ts.shape == X_train[0].shape
+    assert holdit_ts.shape == X_train[0].shape
 
 
 @pytest.mark.parametrize(

diff --git a/examples/datasets/provided_data.ipynb b/examples/datasets/provided_data.ipynb
@@ -242,8 +242,7 @@
    ],
    "metadata": {
     "collapsed": false
-   },
-   "outputs": []
+   }
   },
   {
    "cell_type": "code",
@@ -299,8 +298,7 @@
    ],
    "metadata": {
     "collapsed": false
-   },
-   "outputs": []
+   }
   },
   {
    "cell_type": "code",

diff --git a/examples/segmentation/hidalgo_segmentation.ipynb b/examples/segmentation/hidalgo_segmentation.ipynb
@@ -32,11 +32,20 @@
     "X[60:, 1:] = 0\n",
     "hidalgo = HidalgoSegmenter(K=2, burn_in=0.8, n_iter=1000, seed=10)\n",
     "\n",
-    "hidalgo.fit_predict(X, axis=0)"
+    "hidalgo.fit_predict(X)"
    ],
    "metadata": {
     "collapsed": false
    }
+  },
+  {
+   "cell_type": "code",
+   "execution_count": 1,
+   "outputs": [],
+   "source": [],
+   "metadata": {
+    "collapsed": false
+   }
   }
  ],
  "metadata": {

diff --git a/pyproject.toml b/pyproject.toml
@@ -183,12 +183,7 @@ convention = "numpy"
 testpaths = "aeon"
 addopts = '''
     --doctest-modules
-    --durations 20
-    --timeout 600
-    --showlocals
-    --dist worksteal
-    --reruns 2
-    --only-rerun "crashed while running"
+
 '''
 filterwarnings = '''
     ignore::UserWarning