Using Theil-Sen estimator

In non-parametric statistics, the Theil–Sen estimator is a method for robustly fitting a line to sample points in the plane (simple linear regression) by choosing the median of the slopes of all lines through pairs of points.

 # Libraries
 import numpy as np
 import pandas as pd

 # Libraries.
 import matplotlib.pyplot as plt

 # Import pyamr
 from pyamr.datasets.load import make_timeseries
 from pyamr.core.regression.theilsens import TheilSensWrapper

 # Tune how pandas renders the outputs printed by this example.
 for _option, _value in (('display.max_colwidth', 14),
                         ('display.width', 150),
                         ('display.precision', 4)):
     pd.set_option(_option, _value)

 def make_line(length, offset, slope):
     """Create a noisy straight-line series.

     Parameters
     ----------
     length: int
         Number of samples to generate.
     offset: float
         Intercept of the line.
     slope: float
         Gradient of the line.

     Returns
     -------
     x, y: tuple of np.ndarray
         The sample positions ``0, 1, ..., length - 1`` and the values
         ``slope * x + offset`` plus uniform noise drawn from [0, 1).
     """
     # Sample positions.
     x = np.arange(length)
     # The slope has to scale x (not the random noise); otherwise the
     # series always grows with gradient 1 whatever slope is requested.
     y = slope * x + offset + np.random.rand(length)
     return x, y

 # ----------------------------
 # create data
 # ----------------------------
 # Settings for the synthetic straight line; they are only consumed
 # by the commented-out make_line call below.
 length, offset, slope = 100, 100, 10

 # Alternative input: straight line series.
 #x, y = make_line(length, offset, slope)

 # Input used in this example: timeseries data.
 x, y, f = make_timeseries()

 # Build the wrapper, then fit it to the data.
 theilsens = TheilSensWrapper()
 theilsens = theilsens.fit(x=x, y=y)

 # Show the fitted object in its series form.
 print("\nSeries:", theilsens.as_series(), sep="\n")

 # Show the fitted object in its summary form.
 print("\nSummary:", theilsens.as_summary(), sep="\n")

Series:
theilsens-slope               3.7184
theilsens-intercept         237.4303
theilsens-ci_lower            3.0622
theilsens-ci_upper            4.3009
theilsens-x            [0, 1, 2, ...
theilsens-y            [40.118153...
theilsens-model        (3.7183711...
theilsens-id               THEILSENS
dtype: object

Summary:
         TheilSens Slope
==================================
slope:                      3.7184
intercept:                237.4303
ci_lower:                   3.0622
ci_upper:                   4.3009
==================================

Let's visualise the predictions.

 # -----------------
 #  Predictions
 # -----------------
 # Prediction range; the start is left unset.
 start = None
 end = 180

 # Ask the fitted model for its predictions over that range.
 preds = theilsens.get_prediction(start=start, end=end)

 # Single-axes figure.
 fig, ax = plt.subplots(nrows=1, ncols=1, figsize=(11, 5))

 # Observed values: faint line with outlined circular markers.
 observed_style = dict(color='#A6CEE3', alpha=0.5, marker='o',
                       markeredgecolor='k', markeredgewidth=0.5,
                       markersize=5, linewidth=0.75, label='Observed')
 ax.plot(x, y, **observed_style)

 # Forecast: row 0 of preds against row 1, labelled with the
 # identifier reported by the model.
 forecast_style = dict(color='#FF0000', alpha=1.00, linewidth=2.0,
                       label=theilsens._identifier())
 ax.plot(preds[0, :], preds[1, :], **forecast_style)

 # Confidence intervals: shade between rows 2 and 3 of preds.
 ax.fill_between(preds[0, :], preds[2, :], preds[3, :],
                 color='r', alpha=0.1)

 # Legend
 plt.legend()

 # Show
 plt.show()

Let’s perform a grid search.

 # ----------
 # Grid search
 # -----------
 # Candidate values for each parameter: the same data every time,
 # with two alternative alpha values.
 grid_params = dict(x=[x], y=[y], alpha=[0.05, 0.1])

 # Run the grid search and keep the result it returns.
 summary = TheilSensWrapper() \
     .grid_search_dataframe(grid_params=grid_params)

 # Plot result
 #print("Grid Search:")
 #print(summary)

 summary

	0	1
theilsens-slope	3.7184	3.7184
theilsens-intercept	237.4303	237.4303
theilsens-ci_lower	3.0622	3.1688
theilsens-ci_upper	4.3009	4.218
theilsens-alpha	0.05	0.1
theilsens-x	[0, 1, 2, ...	[0, 1, 2, ...
theilsens-y	[40.118153...	[40.118153...
theilsens-model	(3.7183711...	(3.7183711...
theilsens-id	THEILSENS	THEILSENS

Total running time of the script: ( 0 minutes 0.088 seconds)

Gallery generated by Sphinx-Gallery