📄 widekernelpls.fit.r

📁 做主成分回归和偏最小二乘回归
💻 R
字号:
### widekernelpls.fit.R: Kernel PLS fit algorithm for wide data.
### $Id: widekernelpls.fit.R 138 2007-09-28 15:24:29Z bhm $
###
### Implements an adapted version of the algorithm described in
###  Rannar, S., Lindgren, F., Geladi, P. and Wold, S. (1994) A PLS
###  Kernel Algorithm for Data Sets with Many Variables and Fewer
###  Objects.  Part 1: Theory and Algorithm.
###  \emph{Journal of Chemometrics}, \bold{8}, 111--125.

## Fit a PLS regression using the wide kernel algorithm, which works on the
## nobj x nobj matrices XX' and YY' instead of on X and Y directly.
##
## Arguments:
##   X        numeric matrix of predictors (nobj x npred).
##   Y        responses; coerced with as.matrix() (nobj x nresp).
##   ncomp    number of components to extract.
##   stripped if TRUE, only the coefficients and the column means of X and Y
##            are returned; no fitted values, scores, loadings or dimnames.
##   tol      convergence threshold for the score iteration: the iteration
##            stops when the summed absolute relative change of the score
##            vector drops below tol.
##   maxit    maximum number of iterations per component; a warning is
##            issued when it is reached without convergence.
##   ...      not used by this function.
##
## Value:
##   If stripped is TRUE, a list with components coefficients (array
##   npred x nresp x ncomp), Xmeans and Ymeans.  Otherwise the list
##   additionally holds scores, loadings, loading.weights, Yscores,
##   Yloadings, projection, fitted.values, residuals, Xvar, Xtotvar and
##   nits (the number of iterations used for each component).
widekernelpls.fit <- function(X, Y, ncomp, stripped = FALSE,
                              tol = .Machine$double.eps^0.5,
                              maxit = 100, ...)
{
    ## Initialise
    Y <- as.matrix(Y)
    if (!stripped) {
        ## Save dimnames:
        dnX <- dimnames(X)
        dnY <- dimnames(Y)
    }
    ## Remove dimnames during calculation.
    dimnames(X) <- dimnames(Y) <- NULL

    nobj <- dim(X)[1]
    npred <- dim(X)[2]
    nresp <- dim(Y)[2]

    TT <- U <- matrix(0, ncol = ncomp, nrow = nobj) # scores
    B <- array(0, c(npred, nresp, ncomp))
    In <- diag(nobj)
    nits <- numeric(ncomp)              # for debugging
    if (!stripped) {
        fitted <- array(0, dim = c(nobj, nresp, ncomp))
        Xresvar <- numeric(ncomp)
    }

    ## Center variables:
    Xmeans <- colMeans(X)
    X <- X - rep(Xmeans, each = nobj)
    Ymeans <- colMeans(Y)
    Y <- Y - rep(Ymeans, each = nobj)

    XXt <- tcrossprod(X)
    YYt <- tcrossprod(Y)

    if (!stripped) Xtotvar <- sum(diag(XXt))

    for (a in seq_len(ncomp)) {
        XXtYYt <- XXt %*% YYt
        ## This avoids problems with negative eigenvalues due to roundoff
        ## errors in zero rank cases, and can potentially give slightly
        ## faster and/or more accurate results:
        XXtYYt <- XXtYYt %*% XXtYYt

        ## Initial values:
        t.a.old <- Y[, 1]
        nit <- 0                        # for debugging
        ## Repeatedly multiply by XXtYYt and rescale to unit length until
        ## the score vector stops changing.
        repeat {
            nit <- nit + 1              # for debugging
            t.a <- XXtYYt %*% t.a.old
            t.a <- t.a / sqrt(c(crossprod(t.a)))
            ## na.rm = TRUE drops the 0/0 terms produced by zero elements.
            if (sum(abs((t.a - t.a.old) / t.a), na.rm = TRUE) < tol)
                break
            t.a.old <- t.a
            if (nit >= maxit) {         # for debugging
                ## warning() pastes its arguments without a separator, so
                ## the spaces must be part of the strings.
                warning("No convergence in ", maxit, " iterations\n")
                break
            }
        }
        nits[a] <- nit                  # for debugging

        u.a <- YYt %*% t.a
        utmp <- u.a / c(crossprod(t.a, u.a))
        wpw <- sqrt(c(crossprod(utmp, XXt) %*% utmp))
        TT[, a] <- t.a * wpw
        U[, a] <- utmp * wpw

        ## Deflate both kernels with G = I - t t' (t.a has unit length).
        G <- In - tcrossprod(t.a)
        XXt <- G %*% XXt %*% G
        YYt <- G %*% YYt %*% G

        if (!stripped) Xresvar[a] <- sum(diag(XXt))
    }

    W <- crossprod(X, U)
    W <- W / rep(sqrt(colSums(W * W)), each = npred)

    ## nrow must be given explicitly: for ncomp == 1, diag() of a length-one
    ## vector would otherwise build an identity matrix of order
    ## as.integer(x) instead of a 1 x 1 matrix holding x.
    TTtTinv <- TT %*% diag(1 / colSums(TT * TT), nrow = ncomp)
    P <- crossprod(X, TTtTinv)
    Q <- crossprod(Y, TTtTinv)

    ## Calculate rotation matrix:
    if (ncomp == 1) {
        ## For 1 component, R == W:
        R <- W
    } else {
        PW <- crossprod(P, W)
        ## It is known that P^tW is right bi-diagonal (one response) or upper
        ## triangular (multiple responses), with all diagonal elements equal
        ## to 1.
        if (nresp == 1) {
            ## For single-response models, direct calculation of (P^tW)^-1 is
            ## simple, and faster than using backsolve.
            PWinv <- diag(ncomp)
            bidiag <- - PW[row(PW) == col(PW) - 1]
            for (a in seq_len(ncomp - 1))
                PWinv[a, (a + 1):ncomp] <- cumprod(bidiag[a:(ncomp - 1)])
        } else {
            PWinv <- backsolve(PW, diag(ncomp))
        }
        R <- W %*% PWinv
    }

    ## Calculate regression coefficients:
    for (a in seq_len(ncomp)) {
        B[, , a] <- tcrossprod(R[, 1:a, drop = FALSE], Q[, 1:a, drop = FALSE])
    }

    if (stripped) {
        ## Return as quickly as possible
        list(coefficients = B, Xmeans = Xmeans, Ymeans = Ymeans)
    } else {
        ## Fitted values, residuals etc:
        for (a in seq_len(ncomp))
            fitted[, , a] <- tcrossprod(TT[, 1:a, drop = FALSE],
                                        Q[, 1:a, drop = FALSE])
        ## c(Y) is recycled over the ncomp slices of fitted.
        residuals <- - fitted + c(Y)
        fitted <- fitted + rep(Ymeans, each = nobj) # Add mean
        Xvar <- diff(-c(Xtotvar, Xresvar))

        ## Add dimnames:
        objnames <- dnX[[1]]
        if (is.null(objnames)) objnames <- dnY[[1]]
        prednames <- dnX[[2]]
        respnames <- dnY[[2]]
        compnames <- paste("Comp", seq_len(ncomp))
        nCompnames <- paste(seq_len(ncomp), "comps")
        dimnames(TT) <- dimnames(U) <- list(objnames, compnames)
        dimnames(R) <- dimnames(W) <- dimnames(P) <-
            list(prednames, compnames)
        dimnames(Q) <- list(respnames, compnames)
        dimnames(B) <- list(prednames, respnames, nCompnames)
        dimnames(fitted) <- dimnames(residuals) <-
            list(objnames, respnames, nCompnames)
        names(Xvar) <- compnames
        class(TT) <- class(U) <- "scores"
        class(P) <- class(W) <- class(Q) <- "loadings"

        list(coefficients = B,
             scores = TT, loadings = P,
             loading.weights = W,
             Yscores = U, Yloadings = Q,
             projection = R,
             Xmeans = Xmeans, Ymeans = Ymeans,
             fitted.values = fitted, residuals = residuals,
             Xvar = Xvar, Xtotvar = Xtotvar,
             nits = nits)               # for debugging
    }
}
⌨️ 快捷键说明

复制代码 Ctrl + C
搜索代码 Ctrl + F
全屏模式 F11
切换主题 Ctrl + Shift + D
显示快捷键 ?
增大字号 Ctrl + =
减小字号 Ctrl + -