time-series-machine-learning
diff --git a/‎.codecov.yml‎
Lines changed: 4 additions & 0 deletions b/‎.codecov.yml‎
Lines changed: 4 additions & 0 deletions
diff --git a/‎.github/workflows/tests.yml‎
Lines changed: 28 additions & 2 deletions b/‎.github/workflows/tests.yml‎
Lines changed: 28 additions & 2 deletions
diff --git a/‎.pre-commit-config.yaml‎
Lines changed: 7 additions & 7 deletions b/‎.pre-commit-config.yaml‎
Lines changed: 7 additions & 7 deletions
diff --git a/‎LICENSE‎
Lines changed: 1 addition & 1 deletion b/‎LICENSE‎
Lines changed: 1 addition & 1 deletion
diff --git a/‎docs/conf.py‎
Lines changed: 1 addition & 1 deletion b/‎docs/conf.py‎
Lines changed: 1 addition & 1 deletion
diff --git a/‎pyproject.toml‎
Lines changed: 4 additions & 3 deletions b/‎pyproject.toml‎
Lines changed: 4 additions & 3 deletions
diff --git a/‎requirements.txt‎
Lines changed: 0 additions & 1 deletion b/‎requirements.txt‎
Lines changed: 0 additions & 1 deletion
diff --git a/‎tsml/base.py‎
Lines changed: 52 additions & 53 deletions b/‎tsml/base.py‎
Lines changed: 52 additions & 53 deletions
diff --git a/‎tsml/convolution_based/__init__.py‎
Lines changed: 2 additions & 0 deletions b/‎tsml/convolution_based/__init__.py‎
Lines changed: 2 additions & 0 deletions
diff --git a/‎tsml/datasets/EqualMinimalJapaneseVowels/EqualMinimalJapaneseVowels_TEST.ts‎
Lines changed: 1 addition & 1 deletion b/‎tsml/datasets/EqualMinimalJapaneseVowels/EqualMinimalJapaneseVowels_TEST.ts‎
Lines changed: 1 addition & 1 deletion
@@ -16,6 +16,10 @@ coverage:
 # post comment on PR
 comment: false
 
+# report to GitHub status checks, but without inline annotations on the PR diff
+github_checks:
+  annotations: false
+
 # ignore files
 ignore:
   - ".github/"
 
@@ -28,7 +28,13 @@ jobs:
           extra_args: --files ${{ steps.file_changes.outputs.files }}
 
   pytest:
-    runs-on: ubuntu-latest
+    runs-on: ${{ matrix.os }}
+
+    strategy:
+      matrix:
+        os: [ ubuntu-latest, macOS-latest, windows-latest ]
+        python-version: [ '3.8', '3.9', '3.10' ]
+
     steps:
       - uses: actions/checkout@v3
 
@@ -37,9 +43,29 @@ jobs:
           python-version: "3.10"
 
       - name: Install
-        run: python -m pip install .[dev]
+        run: python -m pip install .[dev,optional_dependencies]
 
       - name: Tests
         run: python -m pytest
 
+
+  codecov:
+    runs-on: ubuntu-latest
+
+    steps:
+      - uses: actions/checkout@v3
+
+      - uses: actions/setup-python@v4
+        with:
+          python-version: "3.10"
+
+      - name: Disable Numba JIT
+        run: echo "NUMBA_DISABLE_JIT=1" >> $GITHUB_ENV
+
+      - name: Install
+        run: python -m pip install .[dev,optional_dependencies]
+
+      - name: Tests
+        run: python -m pytest --cov=tsml --cov-report=xml
+
       - uses: codecov/codecov-action@v3
@@ -1,6 +1,6 @@
 repos:
   - repo: https://github.com/pre-commit/pre-commit-hooks
-    rev: v4.3.0
+    rev: v4.4.0
     hooks:
     - id: check-added-large-files
       args: ["--maxkb=10000"]
@@ -15,26 +15,26 @@ repos:
     - id: trailing-whitespace
 
   - repo: https://github.com/pycqa/isort
-    rev: 5.10.1
+    rev: 5.12.0
     hooks:
       - id: isort
         name: isort (python)
         args: ["--profile=black"]
 
   - repo: https://github.com/psf/black
-    rev: 22.10.0
+    rev: 23.1.0
     hooks:
       - id: black
         language_version: python3
 
   - repo: https://github.com/pycqa/flake8
-    rev: 5.0.4
+    rev: 6.0.0
     hooks:
       - id: flake8
         additional_dependencies: [ flake8-bugbear, flake8-print, Flake8-pyproject ]
 
   - repo: https://github.com/nbQA-dev/nbQA
-    rev: 1.5.3
+    rev: 1.6.1
     hooks:
       - id: nbqa-isort
         additional_dependencies: [ isort==5.10.1 ]
@@ -47,14 +47,14 @@ repos:
         args: [ "--nbqa-dont-skip-bad-cells", "--extend-ignore=E402,E203" ]
 
   - repo: https://github.com/pycqa/pydocstyle
-    rev: 6.1.1
+    rev: 6.3.0
     hooks:
       - id: pydocstyle
         args: ["--convention=numpy", "--match=^((?!_wip).)*$"]
         additional_dependencies: [ toml ]
 
   - repo: https://github.com/pre-commit/mirrors-mypy
-    rev: v0.991
+    rev: v1.0.1
     hooks:
       - id: mypy
         files: tsml_estimator_evaluation/
 
@@ -1,6 +1,6 @@
 BSD 3-Clause License
 
-Copyright (c) 2022 - 2023, The Time Series Machine Learning (tsml) developers.
+Copyright (c) The Time Series Machine Learning (tsml) developers.
 All rights reserved.
 
 Redistribution and use in source and binary forms, with or without
 
@@ -38,7 +38,7 @@
 # https://www.sphinx-doc.org/en/master/usage/configuration.html#project-information
 
 project = "tsml"
-copyright = "2022 - 2023, The tsml developers (BSD-3 License)"
+copyright = "The tsml developers (BSD-3 License)"
 author = "Matthew Middlehurst"
 
 
 
@@ -4,7 +4,7 @@ build-backend = "setuptools.build_meta"
 
 [project]
 name = "tsml"
-version = "0.0.1"
+version = "0.0.2"
 description = "A toolkit for time series machine learning algorithms."
 authors = [
     {name = "Matthew Middlehurst", email = "m.middlehurst@uea.ac.uk"},
@@ -41,6 +41,9 @@ dependencies = [
 ]
 
 [project.optional-dependencies]
+optional_dependencies = [
+    "pycatch22",
+]
 dev = [
     "pre-commit",
     "pytest",
@@ -90,6 +93,4 @@ addopts = '''
     --showlocals
     --doctest-modules
     --numprocesses auto
-    --cov tsml
-    --cov-report xml
 '''
@@ -1,13 +1,15 @@
 # -*- coding: utf-8 -*-
+"""Base classes for estimators."""
 
 __author__ = ["MatthewMiddlehurst"]
 __all__ = [
     "BaseTimeSeriesEstimator",
-    "clone_estimator",
+    "_clone_estimator",
 ]
 
-from typing import Union
+from typing import Tuple, Union
 
+import numpy as np
 from numpy.random import RandomState
 from sklearn.base import BaseEstimator, clone
 from sklearn.ensemble._base import _set_random_states
@@ -18,69 +20,64 @@
 
 
 class BaseTimeSeriesEstimator(BaseEstimator):
+    """Base class for time series estimators in tsml."""
+
     def _validate_data(
         self,
-        X="no_validation",
-        y="no_validation",
-        reset=True,
+        X: object = "no_validation",
+        y: object = "no_validation",
+        reset: bool = True,
         **check_params,
-    ):
+    ) -> Union[
+        Tuple[np.ndarray, object],
+        Tuple[list[np.ndarray], object],
+        np.ndarray,
+        list[np.ndarray],
+    ]:
         """Validate input data and set or check the `n_features_in_` attribute.
 
         Uses the `scikit-learn` 1.2.1 `_validate_data` function as a base.
 
         Parameters
         ----------
-        X : {array-like, sparse matrix, dataframe} of shape \
-                (n_samples, n_features), default='no validation'
-            The input samples.
+        X : ndarray or list of ndarrays of shape (n_samples, n_dimensions, \
+                series_length), array-like, or 'no validation', default='no validation'
+            The input samples. Ideally a 3D numpy array or a list of 2D numpy
+            arrays.
             If `'no_validation'`, no validation is performed on `X`. This is
             useful for meta-estimator which can delegate input validation to
             their underlying estimator(s). In that case `y` must be passed and
-            the only accepted `check_params` are `multi_output` and
-            `y_numeric`.
-
-        y : array-like of shape (n_samples,), default='no_validation'
-            The targets.
+            the only accepted `check_params` is `y_numeric`.
+        y : array-like of shape (n_samples,), 'no_validation' or None, \
+                default='no_validation'
+            The target labels.
 
-            - If `None`, `check_array` is called on `X`. If the estimator's
+            - If `None`, `check_X` is called on `X`. If the estimator's
               requires_y tag is True, then an error will be raised.
-            - If `'no_validation'`, `check_array` is called on `X` and the
+            - If `'no_validation'`, `check_X` is called on `X` and the
               estimator's requires_y tag is ignored. This is a default
               placeholder and is never meant to be explicitly set. In that case
               `X` must be passed.
             - Otherwise, only `y` with `_check_y` or both `X` and `y` are
-              checked with either `check_array` or `check_X_y` depending on
-              `validate_separately`.
-
+              checked with `check_X_y`.
         reset : bool, default=True
             Whether to reset the `n_features_in_` attribute.
             If False, the input will be checked for consistency with data
             provided when reset was last True.
             .. note::
-               It is recommended to call reset=True in `fit` and in the first
-               call to `partial_fit`. All other methods that validate `X`
-               should set `reset=False`.
-
-        validate_separately : False or tuple of dicts, default=False
-            Only used if y is not None.
-            If False, call validate_X_y(). Else, it must be a tuple of kwargs
-            to be used for calling check_array() on X and y respectively.
-
-            `estimator=self` is automatically added to these dicts to generate
-            more informative error message in case of invalid input data.
-
+               It is recommended to call reset=True in `fit`. All other methods that
+               validate `X` should set `reset=False`.
         **check_params : kwargs
-            Parameters passed to :func:`sklearn.utils.check_array` or
-            :func:`sklearn.utils.check_X_y`. Ignored if validate_separately
-            is not False.
+            Parameters passed to :func:`tsml.utils.validation.check_X`,
+            `sklearn.utils.validation._check_y` or
+            :func:`tsml.utils.validation.check_X_y`.
 
             `estimator=self` is automatically added to these params to generate
             more informative error message in case of invalid input data.
 
         Returns
         -------
-        out : {ndarray, sparse matrix} or tuple of these
+        out : np.ndarray, list of np.ndarray or tuple of these
             The validated input. A tuple is returned if both `X` and `y` are
             validated.
         """
@@ -90,7 +87,7 @@ def _validate_data(
                 "requires y to be passed, but the target y is None."
             )
 
-        no_val_X = X is None or (isinstance(X, str) and X == "no_validation")
+        no_val_X = isinstance(X, str) and X == "no_validation"
         no_val_y = y is None or (isinstance(y, str) and y == "no_validation")
 
         default_check_params = {"estimator": self}
@@ -112,24 +109,26 @@ def _validate_data(
 
         return out
 
-    def _check_n_features(self, X, reset):
+    def _check_n_features(self, X: Union[np.ndarray, list[np.ndarray]], reset: bool):
         """Set the `n_features_in_` attribute, or check against it.
 
         Uses the `scikit-learn` 1.2.1 `_check_n_features` function as a base.
 
         Parameters
         ----------
-        X : {ndarray, sparse matrix} of shape (n_samples, n_features)
-            The input samples.
+        X : ndarray or list of ndarrays of shape \
+                (n_samples, n_dimensions, series_length)
+            The input samples. Should be a 3D numpy array or a list of 2D numpy
+            arrays.
         reset : bool
-            If True, the `n_features_in_` attribute is set to `X.shape[1]`.
+            If True, the `n_features_in_` attribute is set to
+            `(n_dimensions, min_series_length, max_series_length)`.
             If False and the attribute exists, then check that it is equal to
-            `X.shape[1]`. If False and the attribute does *not* exist, then
-            the check is skipped.
+            `(n_dimensions, min_series_length, max_series_length)`.
+            If False and the attribute does *not* exist, then the check is skipped.
             .. note::
-               It is recommended to call reset=True in `fit` and in the first
-               call to `partial_fit`. All other methods that validate `X`
-               should set `reset=False`.
+               It is recommended to call reset=True in `fit`. All other methods that
+               validate `X` should set `reset=False`.
         """
         try:
             n_features = _num_features(X)
@@ -167,11 +166,13 @@ def _check_n_features(self, X, reset):
                 f"is expecting {self.n_features_in_[1]} series length as input."
             )
 
-    def _more_tags(self):
+    def _more_tags(self) -> dict:
         return _DEFAULT_TAGS
 
     @classmethod
-    def get_test_params(cls, parameter_set=None):
+    def get_test_params(
+        cls, parameter_set: Union[str, None] = None
+    ) -> Union[dict, list[dict]]:
         """Return unit test parameter settings for the estimator.
 
         Parameters
@@ -182,11 +183,8 @@ def get_test_params(cls, parameter_set=None):
 
         Returns
         -------
-        params : dict or list of dict, default = {}
-            Parameters to create testing instances of the class
-            Each dict are parameters to construct an "interesting" test instance, i.e.,
-            `MyClass(**params)` or `MyClass(**params[i])` creates a valid test instance.
-            `create_test_instance` uses the first (or only) dictionary in `params`
+        params : dict or list of dict
+            Parameters to create testing instances of the class.
         """
         if parameter_set is None:
             # default parameters = empty dict
@@ -197,9 +195,10 @@ def get_test_params(cls, parameter_set=None):
             )
 
 
-def clone_estimator(
+def _clone_estimator(
     base_estimator: BaseEstimator, random_state: Union[None, int, RandomState] = None
 ) -> BaseEstimator:
+    """Clone an estimator and set the random state if available."""
     estimator = clone(base_estimator)
 
     if random_state is not None:
 
@@ -0,0 +1,2 @@
+# -*- coding: utf-8 -*-
+"""Convolution based estimators."""
@@ -1,7 +1,7 @@
 % This is a cut down version of the problem JapaneseVowels, useful for code examples and unit tests
 % http://www.timeseriesclassification.com/description.php?Dataset=JapaneseVowels
 % The train set is reduced from 270 cases to 20 cases and the test set is reduced from 370 to 20
-% The dataset has been transformed into an equal length version, with 24 length
+% The dataset has been transformed into an equal length version, with 25 length
 %
 @problemName EqualMinimalJapaneseVowels
 @timestamps false
Original file line number	Diff line number	Diff line change
`@@ -0,0 +1,2 @@`
	`1`	`+# -*- coding: utf-8 -*-`
	`2`	`+"""Convolution based estimators."""`
Original file line number	Diff line number	Diff line change
`@@ -1,7 +1,7 @@`
`1`	`1`	`% This is a cut down version of the problem JapaneseVowels, useful for code examples and unit tests`
`2`	`2`	`% http://www.timeseriesclassification.com/description.php?Dataset=JapaneseVowels`
`3`	`3`	`% The train set is reduced from 270 cases to 20 cases and the test set is reduced from 370 to 20`
`4`		`-% The dataset has been transformed into an equal length version, with 24 length`
	`4`	`+% The dataset has been transformed into an equal length version, with 25 length`
`5`	`5`	`%`
`6`	`6`	`@problemName EqualMinimalJapaneseVowels`
`7`	`7`	`@timestamps false`