#!/usr/bin/python # -*- coding: utf8 -*- import numpy as np from statsmodels.tsa.arima_model import ARIMA as stats_arima import scipy.stats as st from pyFTS import fts class ARIMA(fts.FTS): """ Façade for statsmodels.tsa.arima_model """ def __init__(self, name, **kwargs): super(ARIMA, self).__init__(1, "ARIMA"+name) self.name = "ARIMA" self.detail = "Auto Regressive Integrated Moving Average" self.is_high_order = True self.has_point_forecasting = True self.has_interval_forecasting = True self.model = None self.model_fit = None self.trained_data = None self.p = 1 self.d = 0 self.q = 0 self.benchmark_only = True self.min_order = 1 self.alpha = (1 - kwargs.get("alpha", 0.90))/2 def train(self, data, sets, order, parameters=None): self.p = order[0] self.d = order[1] self.q = order[2] self.order = self.p + self.q self.shortname = "ARIMA(" + str(self.p) + "," + str(self.d) + "," + str(self.q) + ")" old_fit = self.model_fit try: self.model = stats_arima(data, order=(self.p, self.d, self.q)) self.model_fit = self.model.fit(disp=0) print(np.sqrt(self.model_fit.sigma2)) except Exception as ex: print(ex) self.model_fit = None def ar(self, data): return data.dot(self.model_fit.arparams) def ma(self, data): return data.dot(self.model_fit.maparams) def forecast(self, data, **kwargs): if self.model_fit is None: return np.nan ndata = np.array(self.doTransformations(data)) l = len(ndata) ret = [] if self.d == 0: ar = np.array([self.ar(ndata[k - self.p: k]) for k in np.arange(self.p, l+1)]) #+1 to forecast one step ahead given all available lags else: ar = np.array([ndata[k] + self.ar(ndata[k - self.p: k]) for k in np.arange(self.p, l+1)]) if self.q > 0: residuals = np.array([ndata[k] - ar[k - self.p] for k in np.arange(self.p, l)]) ma = np.array([self.ma(residuals[k - self.q: k]) for k in np.arange(self.q, len(residuals)+1)]) ret = ar[self.q:] + ma else: ret = ar ret = self.doInverseTransformations(ret, params=[data[self.order - 1:]]) return ret def forecastInterval(self, data, **kwargs): if self.model_fit is None: return np.nan sigma = np.sqrt(self.model_fit.sigma2) ndata = np.array(self.doTransformations(data)) l = len(ndata) ret = [] for k in np.arange(self.order, l+1): tmp = [] sample = [ndata[i] for i in np.arange(k - self.order, k)] mean = self.forecast(sample)[0] tmp.append(mean + st.norm.ppf(self.alpha) * sigma) tmp.append(mean + st.norm.ppf(1 - self.alpha) * sigma) ret.append(tmp) ret = self.doInverseTransformations(ret, params=[data[self.order - 1:]], interval=True) return ret def forecastAheadInterval(self, data, steps, **kwargs): if self.model_fit is None: return np.nan smoothing = kwargs.get("smoothing",0.2) alpha = (1 - kwargs.get("alpha", 0.95))/2 sigma = np.sqrt(self.model_fit.sigma2) ndata = np.array(self.doTransformations(data)) l = len(ndata) means = self.forecastAhead(data,steps,kwargs) ret = [] for k in np.arange(0, steps): tmp = [] hsigma = (1 + k*smoothing)*sigma tmp.append(means[k] + st.norm.ppf(alpha) * hsigma) tmp.append(means[k] + st.norm.ppf(1 - alpha) * hsigma) ret.append(tmp) ret = self.doInverseTransformations(ret, params=[data[self.order - 1:]]) return ret