📄 simpls.fit.r

📁 做主成分回归和偏最小二乘回归
💻 R
字号:
### simpls.fit.R: SimPLS fit algorithm.
### $Id: simpls.fit.R 133 2007-08-24 09:21:56Z bhm $
###
### Implements an adapted version of the SIMPLS algorithm described in
###   de Jong, S. (1993) SIMPLS: an alternative approach to partial least
###   squares regression.  \emph{Chemometrics and Intelligent Laboratory
###   Systems}, \bold{18}, 251--263.
###
### Arguments:
###   X         predictors, one row per object.  Coerced with as.matrix(),
###             so a matrix, a data frame or a plain vector (one predictor)
###             is accepted.
###   Y         responses, one row per object.  Coerced with as.matrix().
###   ncomp     number of components to extract; must be at least 1.
###   stripped  if TRUE, only the coefficients and the column means are
###             computed and returned.
###   ...       accepted but not used by this function.
###
### Value:
###   If stripped is TRUE, a list with
###     coefficients  npred x nresp x ncomp array; slice [,,a] holds the
###                   regression coefficients using the first a components.
###     Xmeans, Ymeans  column means of X and Y.
###   Otherwise the list additionally contains
###     scores, loadings     X scores (class "scores") and X loadings
###                          (class "loadings").
###     Yscores, Yloadings   Y scores (class "scores") and Y loadings.
###     projection           weights mapping centred X to the scores.
###     fitted.values, residuals
###                          nobj x nresp x ncomp arrays.
###     Xvar                 column sums of the squared X loadings.
###     Xtotvar              sum of squares of the centred X.

simpls.fit <- function(X, Y, ncomp, stripped = FALSE, ...)
{
    ## Coerce both blocks the same way, so that a data frame or a plain
    ## vector (single predictor / response) works for X as it does for Y.
    X <- as.matrix(X)
    Y <- as.matrix(Y)

    ## Fail early with a clear message instead of an obscure subscript
    ## error from inside the component loop.
    if (length(ncomp) != 1 || is.na(ncomp) || ncomp < 1)
        stop("'ncomp' must be a single number >= 1")

    if (!stripped) {
        ## Save dimnames:
        dnX <- dimnames(X)
        dnY <- dimnames(Y)
    }

    ## Remove dimnames during calculation (doesn't seem to matter; in fact,
    ## as far as it has any effect, it hurts a tiny bit in most situations).
    dimnames(X) <- dimnames(Y) <- NULL

    nobj <- dim(X)[1] # n in paper
    npred <- dim(X)[2] # p in paper
    nresp <- dim(Y)[2]

    V <- R <- matrix(0, nrow = npred, ncol = ncomp)
    tQ <- matrix(0, nrow = ncomp, ncol = nresp) # Y loadings; transposed
    B <- array(0, dim = c(npred, nresp, ncomp))
    if (!stripped) {
        P <- R
        U <- TT <- matrix(0, nrow = nobj, ncol = ncomp)
        fitted <- array(0, dim = c(nobj, nresp, ncomp))
    }

    ## Center variables:
    Xmeans <- colMeans(X)
    X <- X - rep(Xmeans, each = nobj)   # This is not strictly necessary
                                        # (but might be good for accuracy?)!
    Ymeans <- colMeans(Y)
    Y <- Y - rep(Ymeans, each = nobj)

    S <- crossprod(X, Y)

    for (a in seq_len(ncomp)) {
        ## A more efficient way of calculating the Y block factor weights
        ## q.a <- svd(S)$v[,1]:
        if (nresp == 1) {
            q.a <- 1
        } else {
            if (nresp < npred) {
                ## Eigen-decompose the smaller (nresp x nresp) matrix
                q.a <- eigen(crossprod(S), symmetric = TRUE)$vectors[, 1]
            } else {
                ## Eigen-decompose the smaller (npred x npred) matrix and
                ## map the leading vector back to the response space
                q.a <- c(crossprod(S, eigen(S %*% t(S),
                                            symmetric = TRUE)$vectors[, 1]))
                q.a <- q.a / sqrt(c(crossprod(q.a)))
            }
        }
        r.a <- S %*% q.a                 # X block factor weights
        t.a <- X %*% r.a
        t.a <- t.a - mean(t.a)           # center scores
        tnorm <- sqrt(c(crossprod(t.a)))
        t.a <- t.a / tnorm               # normalize scores
        r.a <- r.a / tnorm               # adapt weights accordingly
        p.a <- crossprod(X, t.a)         # X block factor loadings
        q.a <- crossprod(Y, t.a)         # Y block factor loadings
        v.a <- p.a                       # init orthogonal loadings
        if (a > 1) {
            ## Columns of V not yet filled are zero, so using all of V
            ## only removes the contribution of the previous loadings.
            v.a <- v.a - V %*% crossprod(V, p.a) # v.a orth to previous loadings
        }
        v.a <- v.a / sqrt(c(crossprod(v.a))) # normalize orthogonal loadings
        S <- S - v.a %*% crossprod(v.a, S) # deflate S

        R[, a] <- r.a
        tQ[a, ] <- q.a
        V[, a] <- v.a

        B[, , a] <- R[, seq_len(a), drop = FALSE] %*%
            tQ[seq_len(a), , drop = FALSE]

        if (!stripped) {
            u.a <- Y %*% q.a # Y block factor scores
            if (a > 1)
                u.a <- u.a - TT %*% crossprod(TT, u.a) # u.a orth to previous t.a values
            P[, a] <- p.a
            TT[, a] <- t.a
            U[, a] <- u.a
            ## (For very tall, slim X and Y, X %*% B[,,a] is slightly faster,
            ## due to less overhead.)
            fitted[, , a] <- TT[, seq_len(a), drop = FALSE] %*%
                tQ[seq_len(a), , drop = FALSE]
        }
    }

    if (stripped) {
        ## Return as quickly as possible
        list(coefficients = B, Xmeans = Xmeans, Ymeans = Ymeans)
    } else {
        ## c(Y) is recycled over the third (component) dimension of fitted
        residuals <- - fitted + c(Y)
        fitted <- fitted + rep(Ymeans, each = nobj) # Add mean

        ## Add dimnames and classes:
        objnames <- dnX[[1]]
        if (is.null(objnames)) objnames <- dnY[[1]]
        prednames <- dnX[[2]]
        respnames <- dnY[[2]]
        compnames <- paste("Comp", seq_len(ncomp))
        nCompnames <- paste(seq_len(ncomp), "comps")
        dimnames(TT) <- dimnames(U) <- list(objnames, compnames)
        dimnames(R) <- dimnames(P) <- list(prednames, compnames)
        dimnames(tQ) <- list(compnames, respnames)
        dimnames(B) <- list(prednames, respnames, nCompnames)
        dimnames(fitted) <- dimnames(residuals) <-
            list(objnames, respnames, nCompnames)
        class(TT) <- class(U) <- "scores"
        class(P) <- class(tQ) <- "loadings"

        list(coefficients = B,
             scores = TT, loadings = P,
             Yscores = U, Yloadings = t(tQ),
             projection = R,
             Xmeans = Xmeans, Ymeans = Ymeans,
             fitted.values = fitted, residuals = residuals,
             Xvar = colSums(P * P), Xtotvar = sum(X * X))
    }
}
⌨️ 快捷键说明

复制代码 Ctrl + C
搜索代码 Ctrl + F
全屏模式 F11
切换主题 Ctrl + Shift + D
显示快捷键 ?
增大字号 Ctrl + =
减小字号 Ctrl + -