LFS_model.R

# This R-script is party based on "An Introduction to State Space Models" by Marc Wildi.

# The function "LFS_univ" performs the estimation of the LFS model, without auxiliary series. It requires the following arguments:
# par: initial values for the model's parameters (9x1 vector).
# y: 5xT matrix of the unemployed labour force (T=185).
# opti: if TRUE, optimizes the function.
# k: Tx5 matrix of the standard errors of the GREG estimates.
# outofsample: if TRUE, computes the log-likelihood based on the out-of-sample forecast errors.
# parP10: large number for the diffuse initialization.
# nstates: number of state variables in the model.

# Packages required to run the scripts:
library(magic)
library(ucminf)


is.scalar <- function(x) is.atomic(x) && length(x) == 1L


LFS_univ <- function(par,y,opti,k,outofsample,parP10,nstates){
    
  len <- length(y[1,])      # sample size.
  sigma_Ry <- par[1]      # variance of the slope's innovation.
  sigma_omegay <- par[2]      # variance of the seasonal component's innovation.
  sigma_lambda <- par[3]      # variance of the RGB component's innovation.
  sd_nu <- diag(exp(c(par[4], par[5], par[6], par[7], par[8])), 5,5)        # covariance matrix of the survey errors' innovations.
  x10 <- rep(0,nstates)
  Pttm1 <- lapply(seq_len(len+1), function(X) matrix(0,nstates,nstates))      # list to store the estimated state variances.
  Ptt <- lapply(seq_len(len), function(X) matrix(0,nstates,nstates))      # list to store the updated state variances' estimates.
  delta <- par[9]      # autocorrelation parameter of the survey errors.
  P10 <- diag(c(rep(parP10[1],17),c(1,rep((1-delta^2),4),1,rep((1-delta^2),3),1,rep((1-delta^2),3)),rep(parP10[1],nstates-30)),nstates,nstates)     
  Pttm1[[1]] <- P10      # initialization of the state variances.
  xtt <- matrix(0,nstates,(len))     # matrix to store the updated state variables' estimates.
  xttm1 <- matrix(0,nstates,(len+1))    # matrix to store the estimated state variables.
  xttm1[,1] <- x10      # initialization of the state variables.
  R <- diag(1,nstates,nstates)
  D <- adiag(0, exp(sigma_Ry), exp(sigma_omegay)*diag(11), exp(sigma_lambda)*diag(4), sd_nu, diag(0,8,8))
  Q <- D%*%R%*%D      # states innovations' covariance matrix.  
  
  # Bulid T (the tranistion matrix):
  Tymu <- matrix(c(1,1,0,1),2,2, byrow=T)      # transition matrix of the trend's level and slope.
  C <- array(0,dim=c(2,2,5))
  for (l in 1:5){
    C[,,l] <- matrix(c(cos((pi*l)/6),  sin((pi*l)/6), -sin((pi*l)/6), cos((pi*l)/6)),2,2,byrow=TRUE)
  }
  Tyomega <- adiag(C[,,1],C[,,2],C[,,3],C[,,4],C[,,5],-1)      # transition matrix of the seasonal component.
  Tylambda <- diag(4)      # transition matrix of the RGB component.
  TyE <- rbind(matrix(0,9,5), cbind(diag(4), c(0,0,0,0)))      # transition matrix of the survey errors component.
  TyE <- cbind(TyE, rbind(c(0,0,0,0),diag(delta,nrow=4,ncol=4),matrix(0,8,4)))
  TyE <- cbind(TyE, rbind(matrix(0,5,4),diag(4),matrix(0,4,4)))
  Ty <- adiag(Tymu, Tyomega, Tylambda, TyE)
  Tmatrix <- Ty
  
  # initialization of log-likelihood:
  logl <- 0
  
  # Start of KF recursions:
  for (i in 1:len){
    
    # Bulid Z:
    Zy <- c(1,0)
    Zy <- rep(Zy,6)
    Zy <- c(Zy,1)
    Zy <- rbind(Zy,Zy,Zy,Zy,Zy)
    Zy <- cbind(Zy,rbind(c(0,0,0,0),diag(4)))
    Zy <- cbind(Zy, diag(as.numeric(k[i,]), nrow=5, ncol=5), matrix(0, nrow=5, ncol=8))
    Z <- Zy
    ncol(Z)
    nrow(Z)
    
    W <- diag(1,length(y[,i]))     # matrix to treat missing observations.
    if (length(which(is.na(y[,i]))) > 0 && length(which(is.na(y[,i]))) < length(y[,i])){      # some, but not all, variables have have missing observations in i.
      W <- matrix(W[-which(is.na(y[,i])),], nrow=(length(y[,i])-length(which(is.na(y[,i])))), ncol=ncol(W))
      Z <- W%*%Z
      y[which(is.na(y[,i])),i] <- 0
    }
    
    if (length(which(is.na(y[,i]))) > 0 && length(which(is.na(y[,i]))) == length(y[,i])){     # all series have missing observations in i.     
      xtt[,i] <- xttm1[,i]
      Ptt[[i]] <- Pttm1[[i]]
      Pttm1[[i+1]] <- Tmatrix%*%Pttm1[[i]]%*%t(Tmatrix) + Q
      xttm1[,i+1] <- Tmatrix%*%xttm1[,i]      
    } else {     
      epshatoutofsample <- W%*%y[,i] - Z%*%xttm1[,i]      # out-of-sample forecas errors.
      Fmatrix <- Z%*%Pttm1[[i]]%*%t(Z)
      if (is.scalar(Fmatrix) == TRUE){
        Fmatrix.inv = 1/Fmatrix
      } else {
        svdFmatrix <- svd(Fmatrix)
        Fmatrix.inv <- svdFmatrix$v%*%diag(1/svdFmatrix$d)%*%t(svdFmatrix$u)
      }
      Kg <- Tmatrix%*%Pttm1[[i]]%*%t(Z)%*%Fmatrix.inv      # Kalman gain.
      xtt[,i] <- xttm1[,i]+Pttm1[[i]]%*%t(Z)%*%Fmatrix.inv%*%epshatoutofsample       # compute updated estimates of the state variables.
      epshatinsample <- W%*%y[,i]-Z%*%xtt[,i]      # in-sample forecast errors (after y_t has been observed).
      Ptt[[i]] <- Pttm1[[i]]-Pttm1[[i]]%*%t(Z)%*%Fmatrix.inv%*%Z%*%Pttm1[[i]]       # compute updated estimates of the state variables' covariance matrix.
      Pttm1[[i+1]] <- Tmatrix%*%Pttm1[[i]]%*%t(Tmatrix-Kg%*%Z)+Q      # compute one-step-ahead forecasts of the state variables' covariance matrix.
      xttm1[,i+1] <- Tmatrix%*%xttm1[,i] + Kg%*%epshatoutofsample      # compute one-step-ahead forecasts of the state variables.
        
    }
    
    # The optimization criterion
    if (outofsample) {
      if (i <= (30-13) ){      # 30-13 is the number of state variables for which a diffuse initialization is employed.
        logl <- logl - nrow(y)/2*log(2*pi)
      } else if (i > (30-13) ){      # diffuse log-likelihood.
        logl <- logl - nrow(y)/2*log(2*pi) - 1/2*log(det(Fmatrix)) - 1/2*t(epshatoutofsample)%*%Fmatrix.inv%*%epshatoutofsample
        if ((NaN %in% logl)==T){       # push the log-likelihood away from the current parameters if there are NaN values in the log-likelihood.
          logl<- -P10[1]
        }
      }
    } else {
      if (i <= (30-13) ){
        logl <- logl - nrow(y)/2*log(2*pi)
      } else if (i > (30-13) ){      
        logl <- logl - nrow(y)/2*log(2*pi) - 1/2*log(det(Fmatrix)) - 1/2*t(epshatinsample)%*%Fmatrix.inv%*%epshatinsample
        if ((NaN %in% logl)==T){
          logl<- -P10[1]
        }
      }
    }
  }
  if (opti) {
    return(-logl)
  }
  else {
    return(list(logl=-logl, xtt=xtt,xttm1=xttm1,Pttm1=Pttm1,Ptt=Ptt))
  }
}
                
                
objopt <- ucminf(par=c(log(2000),log(0.02),log(900),log(1.07),log(0.99*(1-0.21^2)),
                 log(1.01*(1-0.21^2)),log(1.13*(1-0.21^2)),log(1.06*(1-0.21^2)), 0.21),
                 LFS_univ,y,k,opti=T,outofsample=T,parP10=1000000000000,nstates=30,hessian=2, 
                 control=list(grad="central", gradstep = c(1e-2, 1e-3)))      # optimize the function.
                
par <- objopt$par      # estimated hperparameters.
                
obj <- LFS_univ(par=objopt$par,y,k,opti=F,outofsample=T,parP10=1000000000000,nstates=30)      # Kalman filter estimation.