Source code for croston.croston

"""
croston model for intermittent time series
"""

import numpy as np
import pandas as pd
from scipy.optimize import minimize

[docs]def fit_croston( input_endog, forecast_length, croston_variant = 'original' ): """ :param input_endog: numpy array of intermittent demand time series :param forecast_length: forecast horizon :param croston_variant: croston model type :return: dictionary of model parameters, in-sample forecast, and out-of-sample forecast """ input_series = np.asarray(input_endog) epsilon = 1e-7 input_length = len(input_series) nzd = np.where(input_series != 0)[0] if list(nzd) != [0]: try: w_opt = _croston_opt( input_series = input_series, input_series_length = input_length, croston_variant = croston_variant, epsilon = epsilon, w = None, nop = 1 ) croston_training_result = _croston( input_series = input_series, input_series_length = input_length, croston_variant = croston_variant, w = w_opt, h = forecast_length, epsilon = epsilon, ) croston_model = croston_training_result['model'] croston_fittedvalues = croston_training_result['in_sample_forecast'] croston_forecast = croston_training_result['out_of_sample_forecast'] except Exception as e: croston_model = None croston_fittedvalues = None croston_forecast = None print(str(e)) else: croston_model = None croston_fittedvalues = None croston_forecast = None return { 'croston_model': croston_model, 'croston_fittedvalues': croston_fittedvalues, 'croston_forecast': croston_forecast }
[docs]def _croston( input_series, input_series_length, croston_variant, w, h, epsilon ): # Croston decomposition nzd = np.where(input_series != 0)[0] # find location of non-zero demand k = len(nzd) z = input_series[nzd] # demand x = np.concatenate([[nzd[0]], np.diff(nzd)]) # intervals # initialize init = [z[0], np.mean(x)] zfit = np.array([None] * k) xfit = np.array([None] * k) # assign initial values and prameters zfit[0] = init[0] xfit[0] = init[1] if len(w) == 1: a_demand = w[0] a_interval = w[0] else: a_demand = w[0] a_interval = w[1] # compute croston variant correction factors # sba: syntetos-boylan approximation # sbj: shale-boylan-johnston # tsb: teunter-syntetos-babai if croston_variant == 'sba': correction_factor = 1 - (a_interval / 2) elif croston_variant == 'sbj': correction_factor = (1 - a_interval / (2 - a_interval + epsilon)) else: correction_factor = 1 # fit model for i in range(1,k): zfit[i] = zfit[i-1] + a_demand * (z[i] - zfit[i-1]) # demand xfit[i] = xfit[i-1] + a_interval * (x[i] - xfit[i-1]) # interval cc = correction_factor * zfit / (xfit + epsilon) croston_model = { 'a_demand': a_demand, 'a_interval': a_interval, 'demand_series': pd.Series(zfit), 'interval_series': pd.Series(xfit), 'demand_process': pd.Series(cc), 'correction_factor': correction_factor } # calculate in-sample demand rate frc_in = np.zeros(input_series_length) tv = np.concatenate([nzd, [input_series_length]]) # Time vector used to create frc_in forecasts for i in range(k): frc_in[tv[i]:min(tv[i+1], input_series_length)] = cc[i] # forecast out_of_sample demand rate if h > 0: frc_out = np.array([cc[k-1]] * h) else: frc_out = None return_dictionary = { 'model': croston_model, 'in_sample_forecast': frc_in, 'out_of_sample_forecast': frc_out } return return_dictionary
[docs]def _croston_opt( input_series, input_series_length, croston_variant, epsilon, w = None, nop = 1 ): p0 = np.array([0.1] * nop) wopt = minimize( fun = _croston_cost, x0 = p0, method='Nelder-Mead', args=(input_series, input_series_length, croston_variant, epsilon) ) constrained_wopt = np.minimum([1], np.maximum([0], wopt.x)) return constrained_wopt
[docs]def _croston_cost( p0, input_series, input_series_length, croston_variant, epsilon ): # cost function for croston and variants frc_in = _croston( input_series = input_series, input_series_length = input_series_length, croston_variant = croston_variant, w=p0, h=0, epsilon = epsilon )['in_sample_forecast'] E = input_series - frc_in E = E[E != np.array(None)] E = np.mean(E ** 2) return E