~vincent-vincentdavis/statsmodels/sum-stats-devel3

« back to all changes in this revision

Viewing changes to scikits/statsmodels/tsa/arma_mle.py

Committer: Vincent Davis
Date: 2010-10-17 03:41:15 UTC
mfrom: (2020.1.11 statsmodels-devel)
Revision ID: vincent@vincentdavis.net-20101017034115-w4ycsu053uy5i706

merged with devel

files added:
scikits/statsmodels/examples/tsa

scikits/statsmodels/examples/tsa/ex_arma.py

scikits/statsmodels/examples/tsa/iterate.dat

scikits/statsmodels/graphics

scikits/statsmodels/graphics/tsaplots.py

scikits/statsmodels/miscmodels/try_mlecov.py

scikits/statsmodels/nonparametric

scikits/statsmodels/resampling

scikits/statsmodels/sandbox/mcevaluate

scikits/statsmodels/sandbox/mcevaluate/arma.py

scikits/statsmodels/sandbox/stats/tests/test_weightstats.py

scikits/statsmodels/sandbox/tsa/notes_organize.txt

scikits/statsmodels/stats

scikits/statsmodels/tsa/arma_mle.py

scikits/statsmodels/tsa/mlemodel.py

scikits/statsmodels/tsa/tests/results/AROLSNoConstantPredict.csv

scikits/statsmodels/tsa/y_arma22.txt

tools

files renamed:
scikits/statsmodels/sandbox/regression/ex_mle_arma.py => scikits/statsmodels/sandbox/tsa/examples/ex_mle_arma.py

scikits/statsmodels/sandbox/regression/ex_mle_garch.py => scikits/statsmodels/sandbox/tsa/examples/ex_mle_garch.py

scikits/statsmodels/sandbox/regression/mle.py => scikits/statsmodels/sandbox/tsa/garch.py

scikits/statsmodels/sandbox/tsa/arima.py => scikits/statsmodels/tsa/arima_process.py

scikits/statsmodels/sandbox/tsa/varma_tools.py => scikits/statsmodels/tsa/varma_process.py

files modified:
scikits/statsmodels/decorators.py

scikits/statsmodels/discretemod.py

scikits/statsmodels/examples/tut_ols.py

scikits/statsmodels/glm.py

scikits/statsmodels/model.py

scikits/statsmodels/sandbox/examples/bayesprior.py

scikits/statsmodels/sandbox/regression/__init__.py

scikits/statsmodels/sandbox/regression/numdiff.py

scikits/statsmodels/sandbox/regression/try_ols_anova.py

scikits/statsmodels/sandbox/smoothers.py

scikits/statsmodels/sandbox/stats/distributions_extras.py

scikits/statsmodels/sandbox/stats/tests/testtransf.py

scikits/statsmodels/sandbox/stats/weightstats.py

scikits/statsmodels/sandbox/tests/test_pcatsa.py

scikits/statsmodels/sandbox/tests/test_tsa_tools.py

scikits/statsmodels/sandbox/tsa/__init__.py

scikits/statsmodels/sandbox/tsa/example_arma.py

scikits/statsmodels/sandbox/tsa/kalmanf.py

scikits/statsmodels/sandbox/tsa/varma.py

scikits/statsmodels/tsa/stattools.py

scikits/statsmodels/tsa/tests/results/results_ar.py

scikits/statsmodels/tsa/tests/test_ar.py

scikits/statsmodels/tsa/tests/test_stattools.py

scikits/statsmodels/tsa/tests/test_var.py

scikits/statsmodels/tsa/tsatools.py

scikits/statsmodels/tsa/var.py

Show diffs side-by-side

added added

removed removed

scikits/statsmodels/tsa/arma_mle.py

"""

Created on Sun Oct 10 14:57:50 2010

Author: josef-pktd, Skipper Seabold

License: BSD

TODO: check everywhere initialization of signal.lfilter

"""

import numpy as np

from scipy import signal, optimize

from scikits.statsmodels.model import LikelihoodModel, GenericLikelihoodModel

#copied from sandbox/regression/mle.py

#rename until merge of classes is complete

class Arma(GenericLikelihoodModel):  #switch to generic mle
    """
    Univariate Autoregressive Moving Average (ARMA) model.

    The model is estimated without a constant.  Two estimation paths are
    available: `fit` (conditional least squares on the filtered errors) and
    `fit_mle` (maximization of the conditional Gaussian likelihood through
    the generic MLE machinery of the base class).

    Parameters
    ----------
    endog : array_like
        The observed time series.
    exog : array_like, optional
        Passed through to the base class; not used by the methods
        defined here.

    Notes
    -----
    Work in progress; this class may later subclass TSMLEModel.

    The lag orders are stored in `nar` and `nma` and default to
    ARMA(1,1).  `fit` overwrites them with the requested order.

    Layout of the parameter vector: the first `nar` entries are the AR
    coefficients, the next `nma` entries are the MA coefficients.  The
    likelihood methods additionally read the last entry as the standard
    deviation of the errors.
    """

    def __init__(self, endog, exog=None):
        #need to override p,q (nar,nma) correctly
        super(Arma, self).__init__(endog, exog)
        #set default arma(1,1)
        self.nar = 1
        self.nma = 1
        #self.initialize()

    def initialize(self):
        """Do nothing; overrides the initialization hook with a no-op."""
        pass

    def geterrors(self, params):
        """
        Filter `endog` with the given lag polynomials to get the errors.

        Parameters
        ----------
        params : array_like
            Parameter vector.  ``params[:nar]`` are the AR coefficients and
            ``params[nar:nar+nma]`` the MA coefficients; any trailing
            entries (e.g. the scale used by `loglike`) are ignored.

        Returns
        -------
        errorsest : ndarray
            Output of ``signal.lfilter(rhoy, rhoe, endog)`` where `rhoy`
            and `rhoe` are the AR and MA coefficients with a leading 1.
        """
        #copied from sandbox.tsa.arima.ARIMA
        p, q = self.nar, self.nma
        rhoy = np.concatenate(([1], params[:p]))
        rhoe = np.concatenate(([1], params[p:p+q]))
        return signal.lfilter(rhoy, rhoe, self.endog)

    def loglike(self, params):
        """
        Conditional Gaussian loglikelihood of the arma model.

        Parameters
        ----------
        params : array_like
            AR coefficients, MA coefficients and, as last element, the
            standard deviation of the errors.

        Returns
        -------
        llike : float or ndarray
            Loglikelihood; the squared errors are summed over axis 0.

        Notes
        -----
        The ancillary parameter is assumed to be the last element of
        the params vector.  Its square is bounded below by 1e-6 so that
        the log and the division stay finite.
        """
        errorsest = self.geterrors(params)
        sigma2 = np.maximum(params[-1]**2, 1e-6)
        axis = 0
        nobs = len(errorsest)
        #this doesn't help for exploding paths
        #errorsest[np.isnan(errorsest)] = 100
        llike = -0.5 * (nobs*np.log(sigma2)
                        + np.sum((errorsest**2)/sigma2, axis)
                        + nobs*np.log(2*np.pi))
        return llike

    #add for Jacobian calculation bsejac in GenericMLE, copied from loglike
    def nloglikeobs(self, params):
        """
        Negative loglikelihood of the arma model for each observation.

        Parameters
        ----------
        params : array_like
            AR coefficients, MA coefficients and, as last element, the
            standard deviation of the errors.

        Returns
        -------
        nllike : ndarray
            Negative loglikelihood contribution of each observation; no
            summation is performed.

        Notes
        -----
        The ancillary parameter is assumed to be the last element of
        the params vector.  Its square is bounded below by 1e-6.
        """
        errorsest = self.geterrors(params)
        sigma2 = np.maximum(params[-1]**2, 1e-6)
        #this doesn't help for exploding paths
        #errorsest[np.isnan(errorsest)] = 100
        llike = 0.5 * (np.log(sigma2)
                       + (errorsest**2)/sigma2
                       + np.log(2*np.pi))
        return llike

    #score and hessian: use generic instead
    #(earlier numdifftools based versions were removed)

    #copied from arima.ARIMA, needs splitting out of method specific code
    def fit(self, order=(0,0,0), method="ls", rhoy0=None, rhoe0=None):
        '''
        Estimate lag coefficients of an ARIMA process.

        Parameters
        ----------
        order : sequence
            p,d,q where p is the number of AR lags, d is the number of
            differences to induce stationarity, and q is the number of
            MA lags to estimate.
        method : str {"ls", "ssm"}
            Method of estimation.  LS is conditional least squares.
            SSM is state-space model and the Kalman filter is used to
            maximize the exact likelihood; it is not implemented yet.
            Any other value minimizes the sum of squared errors with
            ``optimize.fmin_bfgs`` (also conditional least squares).
        rhoy0, rhoe0 : array_like (optional)
            starting values for estimation, default is 0.5 for each lag

        Returns
        -------
        rh, cov_x, infodict, mesg, ier : output of scipy.optimize.leastsq
        rh :
            estimate of lag parameters, concatenated [rhoy, rhoe]
        cov_x :
            unscaled (!) covariance matrix of coefficient estimates
            (for the bfgs path this is the inverse Hessian approximation
            returned by the optimizer, and infodict, mesg are None)

        Raises
        ------
        ValueError
            If `order` is not iterable or if d > 0.
        NotImplementedError
            If ``method`` is "ssm".

        Notes
        -----
        Sets the attributes `nar`, `nma`, `params`, `ar_est`, `ma_est`
        and `error_estimate` as a side effect.
        '''
        if not hasattr(order, '__iter__'):
            raise ValueError("order must be an iterable sequence. Got type "
                             "%s instead" % type(order))

        p, d, q = order

        if d > 0:
            raise ValueError("Differencing not implemented yet")
        # assume no constant, ie mu = 0

        method = method.lower()
        if method == "ssm":
            # previously this branch fell through and failed with a
            # NameError because no estimate was ever computed
            raise NotImplementedError("method 'ssm' is not implemented yet")

        # only change the state after the arguments have been validated
        self.nar = p  # needed for geterrors, needs cleanup
        self.nma = q

        #replace with start_params
        if rhoy0 is None:
            rhoy0 = 0.5 * np.ones(p)
        if rhoe0 is None:
            rhoe0 = 0.5 * np.ones(q)
        start = np.r_[rhoy0, rhoe0]

        if method == "ls":
            rh, cov_x, infodict, mesg, ier = \
                optimize.leastsq(self.geterrors, start, ftol=1e-10,
                                 full_output=True)
            #TODO: need missing parameter estimates for LS, scale, residual-sdt
            #TODO: integrate this into the MLE.fit framework?
        else:  #this is also conditional least squares
            # fmin_bfgs is slow or doesn't work yet
            def errfnsum(rho):
                return np.sum(self.geterrors(rho)**2)
            #xopt, fopt, gopt, Hopt, func_calls, grad_calls, warnflag
            rh, fopt, gopt, cov_x, _, _, ier = \
                optimize.fmin_bfgs(errfnsum, start, maxiter=2,
                                   full_output=True)
            infodict, mesg = None, None

        self.params = rh
        self.ar_est = np.concatenate(([1], rh[:p]))
        self.ma_est = np.concatenate(([1], rh[p:]))  #rh[-q:] doesnt work for q=0
        self.error_estimate = self.geterrors(rh)
        return rh, cov_x, infodict, mesg, ier

    #renamed and needs check with other fit
    def fit_mle(self, start_params=None, maxiter=5000, method='nm', tol=1e-08):
        """
        Estimate the model through the `fit` method of the base class.

        Parameters
        ----------
        start_params : array_like, optional
            Starting values.  Default is 0.05 for each of the
            ``nar + nma`` lag coefficients and 1 for the last (scale)
            parameter.
        maxiter : int
            Forwarded to the base class `fit`.
        method : str
            Forwarded to the base class `fit`.
        tol : float
            Forwarded to the base class `fit`.

        Returns
        -------
        mlefit
            Whatever the base class `fit` returns.
        """
        if start_params is None:
            start_params = np.concatenate((0.05*np.ones(self.nar + self.nma),
                                           [1]))
        mlefit = super(Arma, self).fit(start_params=start_params,
                                       maxiter=maxiter, method=method,
                                       tol=tol)
        return mlefit

    #copied from arima.ARIMA
    def predicted(self, ar=None, ma=None):
        '''past predicted values of time series

        just added, not checked yet

        Requires that `fit` has been called, because `error_estimate`
        is set there.  `ar` and `ma` are currently not used.
        '''
        # self.x was never assigned in this class; use the squeezed endog,
        # which is what `fit` used as x
        # NOTE(review): the sign of the error term looks unverified
        # (observed minus error would be the usual fitted value) - confirm
        return self.endog.squeeze() + self.error_estimate

    #copied from arima.ARIMA
    def forecast(self, ar=None, ma=None, nperiod=10):
        '''nperiod ahead forecast at the end of the data period

        Parameters
        ----------
        ar, ma : array_like, optional
            Lag polynomials including the leading 1.  Default are the
            estimates `ar_est` and `ma_est` stored by `fit`.
        nperiod : int
            Number of zero errors appended to the estimated errors.

        Returns
        -------
        ndarray
            ``signal.lfilter(ma, ar, eta)`` for the estimated errors
            extended by `nperiod` zeros; the result covers the sample
            period followed by the `nperiod` forecast periods.
        '''
        eta = np.r_[self.error_estimate, np.zeros(nperiod)]
        if ar is None:
            ar = self.ar_est
        if ma is None:
            ma = self.ma_est
        return signal.lfilter(ma, ar, eta)

    #copied from arima.ARIMA
    #TODO: is this needed as a method at all?
    #JP: not needed in this form, but can be replace with using the parameters
    @classmethod
    def generate_sample(cls, ar, ma, nsample, std=1):
        """
        Simulate a sample by filtering normal random numbers.

        Parameters
        ----------
        ar, ma : array_like
            Denominator and numerator coefficients passed to
            ``signal.lfilter(ma, ar, eta)``.
        nsample : int
            Number of observations to generate.
        std : float
            Scale applied to the ``np.random.randn`` draws.

        Returns
        -------
        ndarray
            The filtered random sample of length `nsample`.
        """
        eta = std * np.random.randn(nsample)
        return signal.lfilter(ma, ar, eta)

248

Older »