📄 oscorespls.fit.r

📁 做主成分回归和偏最小二乘回归
💻 R
字号:
### oscorespls.fit.R: The multiresponse orthogonal scores algorithm###### $Id: oscorespls.fit.R 133 2007-08-24 09:21:56Z bhm $###### Implements an adapted version of the `orthogonal scores' algorithm as###   described in Martens and Naes, pp. 121--122 and 157--158.oscorespls.fit <- function(X, Y, ncomp, stripped = FALSE,                           tol = .Machine$double.eps^0.5, ...){    ## Initialise    Y <- as.matrix(Y)    if (!stripped) {        ## Save dimnames        dnX <- dimnames(X)        dnY <- dimnames(Y)    }    ## Remove dimnames for performance (doesn't seem to matter; in fact,    ## as far as it has any effect, it hurts a tiny bit in most situations.    dimnames(X) <- dimnames(Y) <- NULL    nobj <- dim(X)[1]    npred <- dim(X)[2]    nresp <- dim(Y)[2]    W <- P <- matrix(0, nrow = npred, ncol = ncomp)    tQ <- matrix(0, nrow = ncomp, ncol = nresp) # Y loadings; transposed    B <- array(0, dim = c(npred, nresp, ncomp))    if (!stripped) {        TT <- U <- matrix(0, nrow = nobj, ncol = ncomp)        tsqs <- numeric(ncomp)          # t't        fitted <- residuals <- array(0, dim = c(nobj, nresp, ncomp))    }    ## C1    Xmeans <- colMeans(X)    X <- X - rep(Xmeans, each = nobj)    Ymeans <- colMeans(Y)    Y <- Y - rep(Ymeans, each = nobj)    ## Must be done here due to the deflation of X    if (!stripped) Xtotvar <- sum(X * X)    for(a in 1:ncomp) {        ## Initial values:        if (nresp == 1) {               # pls1            u.a <- Y                    # FIXME: scale?        } else {                        # pls2            ## The coloumn of Y with largest sum of squares:            u.a <- Y[,which.max(colSums(Y * Y))]            t.a.old <- 0        }        repeat {            ## C2.1            w.a <- crossprod(X, u.a)            w.a <- w.a / sqrt(c(crossprod(w.a)))            ## C2.2            t.a <- X %*% w.a            ## C2.3            tsq <- c(crossprod(t.a))            t.tt <- t.a / tsq            ## C2.4            q.a <- crossprod(Y, t.tt)            if (nresp == 1)                break                   # pls1: no iteration            ## C2.4b-c            ## Convergence check for pls2:            if (sum(abs((t.a - t.a.old) / t.a), na.rm = TRUE) < tol)                break            else {                u.a <- Y %*% q.a / c(crossprod(q.a))                t.a.old <- t.a          # Save for comparison            }        }        ## C2.3 contd.        p.a <- crossprod(X, t.tt)        ## C2.5        X <- X - t.a %*% t(p.a)        Y <- Y - t.a %*% t(q.a)        ## Save scores etc:        W[,a] <- w.a        P[,a] <- p.a        tQ[a,] <- q.a        if (!stripped) {            TT[,a] <- t.a            U[,a] <- u.a            tsqs[a] <- tsq            ## (For very tall, slim X and Y, X0 %*% B[,,a] is slightly faster,            ## due to less overhead.)            fitted[,,a] <- TT[,1:a] %*% tQ[1:a,, drop=FALSE]            residuals[,,a] <- Y        }    }    ## Calculate rotation matrix:    if (ncomp == 1) {        ## For 1 component, R == W:        R <- W    } else {        PW <- crossprod(P, W)        ## It is known that P^tW is right bi-diagonal (one response) or upper        ## triangular (multiple responses), with all diagonal elements equal to 1.        if (nresp == 1) {            ## For single-response models, direct calculation of (P^tW)^-1 is            ## simple, and faster than using backsolve.            PWinv <- diag(ncomp)            bidiag <- - PW[row(PW) == col(PW)-1]            for (a in 1:(ncomp - 1))                PWinv[a,(a+1):ncomp] <- cumprod(bidiag[a:(ncomp-1)])        } else {            PWinv <- backsolve(PW, diag(ncomp))        }    R <- W %*% PWinv    }    ## Calculate regression coefficients:    for (a in 1:ncomp) {        B[,,a] <- R[,1:a, drop=FALSE] %*% tQ[1:a,, drop=FALSE]    }    if (stripped) {        ## Return as quickly as possible        list(coefficients = B, Xmeans = Xmeans, Ymeans = Ymeans)    } else {        fitted <- fitted + rep(Ymeans, each = nobj) # Add mean        ## Add dimnames and classes:        objnames <- dnX[[1]]        if (is.null(objnames)) objnames <- dnY[[1]]        prednames <- dnX[[2]]        respnames <- dnY[[2]]        compnames <- paste("Comp", 1:ncomp)        nCompnames <- paste(1:ncomp, "comps")        dimnames(TT) <- dimnames(U) <- list(objnames, compnames)        dimnames(R) <- dimnames(W) <- dimnames(P) <-            list(prednames, compnames)        dimnames(tQ) <- list(compnames, respnames)        dimnames(B) <- list(prednames, respnames, nCompnames)        dimnames(fitted) <- dimnames(residuals) <-            list(objnames, respnames, nCompnames)        class(TT) <- class(U) <- "scores"        class(P) <- class(W) <- class(tQ) <- "loadings"        list(coefficients = B,             scores = TT, loadings = P,             loading.weights = W,             Yscores = U, Yloadings = t(tQ),             projection = R,             Xmeans = Xmeans, Ymeans = Ymeans,             fitted.values = fitted, residuals = residuals,             Xvar = colSums(P * P) * tsqs,             Xtotvar = Xtotvar)    }}
⌨️ 快捷键说明

复制代码 Ctrl + C
搜索代码 Ctrl + F
全屏模式 F11
切换主题 Ctrl + Shift + D
显示快捷键 ?
增大字号 Ctrl + =
减小字号 Ctrl + -