# Quote the requirement: unquoted square brackets are glob characters in
# shells such as zsh, where the command would fail with "no matches found".
pip install "tslearn[all_features]"

from sklearn.cluster import KMeans
from tslearn.utils import to_sklearn_dataset

# Baseline: scikit-learn's KMeans on the training series, after converting
# them with tslearn's to_sklearn_dataset helper.
X_sklearn = to_sklearn_dataset(X_train)
model = KMeans(random_state=0, max_iter=10, n_clusters=3).fit(X_sklearn)
plot_clustering(model, X_sklearn)

from tslearn.metrics import dtw_path

# Align the two series with Dynamic Time Warping: `path` is the matching path
# (pairs of aligned indices) and `sim` is the associated DTW score.
path, sim = dtw_path(s_y1, s_y2)
# plot_dtw is a helper defined outside this excerpt; presumably it draws both
# series together with the alignment path.
plot_dtw(s_y1, s_y2, path)

from tslearn.clustering import TimeSeriesKMeans

# Same clustering setup as before (3 clusters, 10 iterations, fixed seed), but
# using tslearn's k-means with DTW as the metric, fitted directly on X_train.
model = TimeSeriesKMeans(
    metric="dtw",
    n_clusters=3,
    max_iter=10,
    random_state=0,
).fit(X_train)
plot_clustering(model, X_train)

from sklearn.model_selection import GridSearchCV, StratifiedKFold
from sklearn.pipeline import Pipeline
from tslearn.neighbors import KNeighborsTimeSeriesClassifier
from tslearn.preprocessing import TimeSeriesScalerMeanVariance

# Grid-search a two-step pipeline (time-series scaling, then k-NN
# classification) over the number of neighbours and the weighting scheme,
# scoring each candidate with shuffled, stratified k-fold cross-validation.
n_splits = 3

knn_pipeline = Pipeline([
    ('normalize', TimeSeriesScalerMeanVariance()),
    ('knn', KNeighborsTimeSeriesClassifier()),
])
knn_param_grid = {
    'knn__n_neighbors': [2, 5, 25],
    'knn__weights': ['uniform', 'distance'],
}
stratified_cv = StratifiedKFold(
    n_splits=n_splits,
    shuffle=True,
    random_state=42,
)

# Note: `pipeline` names the GridSearchCV wrapper, not the bare Pipeline.
pipeline = GridSearchCV(knn_pipeline, knn_param_grid, cv=stratified_cv)
pipeline.fit(X_train, y_train)

import pandas as pd
# Tabulate the grid-search results, keeping only the two tuned parameters and
# the mean test score of each candidate.
summary_columns = [
    'param_knn__n_neighbors',
    'param_knn__weights',
    'mean_test_score',
]
pd.DataFrame(pipeline.cv_results_, columns=summary_columns)

# Parameter combination that obtained the best cross-validated score.
pipeline.best_params_

{'knn__n_neighbors': 5, 'knn__weights': 'distance'}

# We will extract 2 shapelets and align them with the time series
# (the dict maps a shapelet length to the number of shapelets of that length,
# i.e. two shapelets of length 20 here).
shapelet_sizes = {20: 2}

# Define the model and fit it using the training data
# NOTE(review): LearningShapelets and Adam are not imported in the visible
# code -- presumably they come from tslearn.shapelets and a Keras optimizers
# module; confirm the imports exist elsewhere.
shp_clf = LearningShapelets(n_shapelets_per_size=shapelet_sizes,
                            weight_regularizer=0.0001,
                            optimizer=Adam(0.01),
                            max_iter=300,
                            verbose=0,
                            scale=True,
                            random_state=42)
shp_clf.fit(X_train, y_train)

@misc{tslearn,
      title={tslearn: A machine learning toolkit dedicated to time-series
             data},
      author={Romain Tavenard and Johann Faouzi and Gilles Vandewiele and
              Felix Divo and Guillaume Androz and Chester Holtz and Marie
              Payne and Roman Yurchak and Marc Ru{\ss}wurm and Kushal
              Kolar and Eli Woods},
      year={2017},
      note={\url{https://github.com/tslearn-team/tslearn}}
}

time series + ML + Python = ❤️ (& `tslearn`)

What's `tslearn`?

Why use a dedicated library for time series?

Use time series metrics

$k$-means + DTW

Benefit from great `scikit-learn` features

And now for something very similar

What's next

If you use `tslearn`, please cite us!

Q & A

	param_knn__n_neighbors	param_knn__weights	mean_test_score
0	2	uniform	0.640931
1	2	distance	0.740196
2	5	uniform	0.681373
3	5	distance	0.762255
4	25	uniform	0.617647
5	25	distance	0.738971

time series + ML + Python = ❤️ (& tslearn)

What's tslearn?

Why use a dedicated library for time series?

Use time series metrics

$k$-means + DTW

Benefit from great scikit-learn features

And now for something very similar

What's next

If you use tslearn, please cite us!

Q & A

time series + ML + Python = ❤️ (& `tslearn`)

What's `tslearn`?

Benefit from great `scikit-learn` features

If you use `tslearn`, please cite us!