\\\\( \nonumber \newcommand{\bevisslut}{$\blacksquare$} \newenvironment{matr}[1]{\hspace{-.8mm}\begin{bmatrix}\hspace{-1mm}\begin{array}{#1}}{\end{array}\hspace{-1mm}\end{bmatrix}\hspace{-.8mm}} \newcommand{\transp}{\hspace{-.6mm}^{\top}} \newcommand{\maengde}[2]{\left\lbrace \hspace{-1mm} \begin{array}{c|c} #1 & #2 \end{array} \hspace{-1mm} \right\rbrace} \newenvironment{eqnalign}[1]{\begin{equation}\begin{array}{#1}}{\end{array}\end{equation}} \newcommand{\eqnl}{} \newcommand{\matind}[3]{{_\mathrm{#1}\mathbf{#2}_\mathrm{#3}}} \newcommand{\vekind}[2]{{_\mathrm{#1}\mathbf{#2}}} \newcommand{\jac}[2]{{\mathrm{Jacobi}_\mathbf{#1} (#2)}} \newcommand{\diver}[2]{{\mathrm{div}\mathbf{#1} (#2)}} \newcommand{\rot}[1]{{\mathbf{rot}\mathbf{(#1)}}} \newcommand{\am}{\mathrm{am}} \newcommand{\gm}{\mathrm{gm}} \newcommand{\E}{\mathrm{E}} \newcommand{\Span}{\mathrm{span}} \newcommand{\mU}{\mathbf{U}} \newcommand{\mA}{\mathbf{A}} \newcommand{\mB}{\mathbf{B}} \newcommand{\mC}{\mathbf{C}} \newcommand{\mD}{\mathbf{D}} \newcommand{\mE}{\mathbf{E}} \newcommand{\mF}{\mathbf{F}} \newcommand{\mK}{\mathbf{K}} \newcommand{\mI}{\mathbf{I}} \newcommand{\mM}{\mathbf{M}} \newcommand{\mN}{\mathbf{N}} \newcommand{\mQ}{\mathbf{Q}} \newcommand{\mT}{\mathbf{T}} \newcommand{\mV}{\mathbf{V}} \newcommand{\mW}{\mathbf{W}} \newcommand{\mX}{\mathbf{X}} \newcommand{\ma}{\mathbf{a}} \newcommand{\mb}{\mathbf{b}} \newcommand{\mc}{\mathbf{c}} \newcommand{\md}{\mathbf{d}} \newcommand{\me}{\mathbf{e}} \newcommand{\mn}{\mathbf{n}} \newcommand{\mr}{\mathbf{r}} \newcommand{\mv}{\mathbf{v}} \newcommand{\mw}{\mathbf{w}} \newcommand{\mx}{\mathbf{x}} \newcommand{\mxb}{\mathbf{x_{bet}}} \newcommand{\my}{\mathbf{y}} \newcommand{\mz}{\mathbf{z}} \newcommand{\reel}{\mathbb{R}} \newcommand{\mL}{\bm{\Lambda}} \newcommand{\mnul}{\mathbf{0}} \newcommand{\trap}[1]{\mathrm{trap}(#1)} \newcommand{\Det}{\operatorname{Det}} \newcommand{\adj}{\operatorname{adj}} \newcommand{\Ar}{\operatorname{Areal}} \newcommand{\Vol}{\operatorname{Vol}} \newcommand{\Rum}{\operatorname{Rum}} \newcommand{\diag}{\operatorname{\bf{diag}}} \newcommand{\bidiag}{\operatorname{\bf{bidiag}}} \newcommand{\spanVec}[1]{\mathrm{span}{#1}} \newcommand{\Div}{\operatorname{Div}} \newcommand{\Rot}{\operatorname{\mathbf{Rot}}} \newcommand{\Jac}{\operatorname{Jacobi}} \newcommand{\Tan}{\operatorname{Tan}} \newcommand{\Ort}{\operatorname{Ort}} \newcommand{\Flux}{\operatorname{Flux}} \newcommand{\Cmass}{\operatorname{Cm}} \newcommand{\Imom}{\operatorname{Im}} \newcommand{\Pmom}{\operatorname{Pm}} \newcommand{\IS}{\operatorname{I}} \newcommand{\IIS}{\operatorname{II}} \newcommand{\IIIS}{\operatorname{III}} \newcommand{\Le}{\operatorname{L}} \newcommand{\app}{\operatorname{app}} \newcommand{\M}{\operatorname{M}} \newcommand{\re}{\mathrm{Re}} \newcommand{\im}{\mathrm{Im}} \newcommand{\compl}{\mathbb{C}} \newcommand{\e}{\mathrm{e}} \\\\)

Exercise with focus on how eXogeneous input in the arima() R function works. Contains:

  1. Example: Investigate if arima() does fit a transfer function
  2. ARX model model for a transfer function
  3. Harmonic oscillation + noise
  4. Example: Linear trend + noise, using Arima from forecast package which automatically includes a slope

Paste the code into R and answer the following questions (the code part are maked with same numbers). Answers are below the code:

  • (1) Does an ARX model model a transfer function?
  • (2) Run with amplitude 5, how does the suggested ARIMA(0,1,0) validate?
  • (3) Try rerunning with amplitude 10 instead of 5, how does the suggested ARIMA(0,1,0) validate?
  • (4) For amplitude 10 what model would you try?
  • (5) Let us try to predict with this model?
  • (6) What happens when using the harmonics input model, which model would you prefer?

Code:

# ----------------------------------------------------------------
# Example, investigate if arima() does fit a transfer function

# Generate a step input
n <- 500
x <- c(rep(0,100), rep(1,n-100))
# Add a step
plot(x, type="s")

# Make an output vector "filtered" by the system: y_t = 0.98 * y_t + x_t
y <- filter(x,0.98,"recursive")
# Add AR noise
y <- y + c(arima.sim(list(ar=c(0.7,0,0)), n))
# Plot the output
plot(y)

# Try to model with arima
m1 <- arima(y, xreg=x, order=c(2,0,0))
m1
tsdiag(m1)

# Predict to see the predicted one-step output
pred1 <- predict(m1, newxreg=x, n.ahead = 1)
plot(pred1<span>$pred)
# There is no exponential response, so xreg is not included as a transfer function!

# Try to recreate the arima() with xreg is hard!
# Just LS directly, get parameters very different
lm(y ~ x)

# Conclusion:
# arima() does IN ONE GO: a linear model with xreg together with ARMA on residuals, 
# like e.g. ML estimation of ARMA(1,1) with one xreg: 
#   
#     (Y_t - beta_0 + x_t beta_1) = phi1 * (Y_{t-1} - beta_0 + x_{t-1} beta_1) + theta_0 eps_t + theta_1 eps_{t-1}
# 
# The parameters are estimated to minimize the squared residuals using an optimizer (so very close to maximum likelihood with normal distributed error)
# ----------------------------------------------------------------


# ----------------------------------------------------------------
# (1) ARX model model for a transfer function
# Make AR lags
y.l1 <- c(0,y[-n])
y.l2 <- c(0,y.l1[-n])

# Fit and one-step predictions with ARX(1)
arx1 <- lm(y ~ y.l1 + x)
summary(arx1)
plot(x, type="s")
plot(predict(arx1), type="l")
# ----------------------------------------------------------------


# ----------------------------------------------------------------
# Simulating some AR noise
set.seed(2)
noise <- arima.sim(model=list(ar=0.9), n = 300)
plot(noise)
# ----------------------------------------------------------------


# ----------------------------------------------------------------
# Harmonic oscillation + noise

# (2-3) Deterministic part with an amplitude:
amplitude <- 5
det <- amplitude * sin(0.1*(1:300)+1) + 2 
signal <- det + noise
plot(signal)
acf(signal) # Not stationary
acf(diff(signal)) # Looks like something odd creating a little correlation but no clear structure
(a1 <- arima(signal, order=c(0,1,0)))
# Validates?
tsdiag(a1) 
pacf(residuals(a1))
plot(residuals(a1))

# (4) Other model for amplitude 10
(a2 <- arima(signal, order=c(?,?,?)))
tsdiag(a2) # Looks good 

# (5) Let us try to predict with this model
plot(signal, xlim=c(0,400))
a2.pred <- predict(a2, n.ahead = 100)
matlines(301:400, a2.pred$</span>pred + 1.96*cbind(0, -a2.pred<span>$se, a2.pred$</span>se), col=2, lty=c(1,2,2))

# (6) Let us try a model using xreg with sin and cos with the true period
x <- cbind(sin = sin(0.1*(1:300)), cos = cos(0.1*(1:300)))
# We can fit a simple LM model:
lm1 <- lm(signal~x)
qqnorm(residuals(lm1)) # Looks fine
qqline(residuals(lm1))
summary(lm1) # All significant
acf(residuals(lm1)) # Ups - we should not trust the LM as residuals are correlated
pacf(residuals(lm1))
# Looks like AR(1)

# Using the same predictors and AR(1) structure for residuals
(a3 <- arima(signal, order=c(1,0,0), xreg = x, include.mean = TRUE))
tsdiag(a3) # Looks good

# Predict with harmonics model
plot(signal, xlim=c(0,400))
# We have to provide the xreg for the future
xpred <- cbind(sin = sin(0.1*(301:400)), cos = cos(0.1*(301:400)))
a3.pred <- predict(a3, n.ahead = 100, newxreg = xpred)
matlines(301:400, a2.pred<span>$pred + 1.96*cbind(0, -a2.pred$</span>se, a2.pred<span>$se), col=2, lty=c(1,2,2))
matlines(301:400, a3.pred$</span>pred + 1.96*cbind(0, -a3.pred<span>$se, a3.pred$</span>se), col=3, lty=c(1,2,2))
legend("bottomleft", legend = c("Using diff", "Using harmonic xreg"), lty=1, col=2:3, bg="white")
# ----------------------------------------------------------------


# ----------------------------------------------------------------
# Example: Linear trend + noise, using Arima from forecast package which automatically includes a slope
set.seed(2)
noise <- arima.sim(model=list(ar=0.9, ma=0.6), n = 300)
plot(noise)

det <- 0.05*(1:300+1) + 2
signal <- det + noise
plot(signal)
acf(signal) # Non stationary
acf(diff(signal)) 
pacf(diff(signal)) # More in PACF than ACF so maybe ARIMA(0,1,1)

a1 <- arima(signal, order=c(0,1,1))
tsdiag(a1) # Looks good
pacf(residuals(a1)) # Looks good
a1 # Note that you only estimate the ma1 parameter. There is no mean nor slope

# Predicting
plot(signal, xlim=c(0,400), ylim=c(-5,40))
# We have to provide the xreg for the future
a1.pred <- predict(a1, n.ahead = 100)
matlines(301:400, a1.pred<span>$pred + 1.96*cbind(0, -a1.pred$</span>se, a1.pred<span>$se), col=2, lty=c(1,2,2))
legend("bottomleft", legend = c("ARIMA(0,1,1)"), lty=1, col=2)
#Note that the prediction is a constant.
# 'arima' cannot estimate the slope of a trend without specifying it 

# The 'Arima' function from the forecast library can 'include.drift' (a slope)
library(forecast)
?Arima 
Arima # If you dig in you will see that it creates xreg ... see at the end

# Restarting with a simple linear regression (Same as lm(y~time))
a3 <- Arima(signal, order=c(0,0,0), include.drift = TRUE)
tsdiag(a3) # ACF is exponential
pacf(residuals(a3)) # Let us try an AR(1)

a4 <- Arima(signal, order=c(1,0,0), include.drift = TRUE)
tsdiag(a4) # Better but still something in lag 1
pacf(residuals(a4)) # Both lags 1 and 2 so try adding MA(1)

a5 <- Arima(signal, order=c(1,0,1), include.drift = TRUE)
tsdiag(a5) # Looks good
pacf(residuals(a5)) # Also good

# Fitting the same model using 'xreg' in 'arima'
a5b <- arima(signal, order=c(1,0,1), xreg = cbind(inter = 1, trend = 1:length(signal)), include.mean = FALSE)

# But let us try to predict with this model
plot(signal, xlim=c(0,400), ylim=c(-5,40))
# We have to provide the xreg for the future
lm.pred <- cbind(inter = 1, trend = (301:400))
a5b.pred <- predict(a5b, n.ahead = 100, newxreg = lm.pred)
matlines(301:400, a1.pred$</span>pred + 1.96*cbind(0, -a1.pred<span>$se, a1.pred$</span>se), col=2, lty=c(1,2,2))
matlines(301:400, a5b.pred<span>$pred + 1.96*cbind(0, -a5b.pred$</span>se, a5b.pred<span>$se), col=3, lty=c(1,2,2))
legend("topleft", legend = c("Using diff", "Using linear xreg"), lty=1, col=2:3)

Answers:

  • (1) Yes, it does, although cannot directly include MA part, it actually works very well in many practical applications
  • (2) Looks good for amplitude 5
  • (3) With an amplitude of 10 there are signals in both ACF and PACF
  • (4) ARIMA(1,1,1) gets a good validation
  • (5) Prediction converges to a constant and PI explodes
  • (6) The predictions using the “correct” xreg makes a much better model, but it doesn’t