Bioconductor Code: qmtools

Browse code

Added manual for poplin_reduce.

Jaehyun Joo authored on 30/11/2021 03:11:39
Showing 5 changed files

R/reduction-methods.R index 03ca879..242e8d4 100644
man/poplin_reduce.Rd index ba09103..532cc35 100644
man/poplin_reduce_pca.Rd index 0000000..1f70fab
man/poplin_reduce_plsda.Rd index 0000000..cb05f03
man/poplin_reduce_tsne.Rd index 0000000..90bb966

History View file @ ecaba5d

@@ -1,11 +1,36 @@
                      ##' Dimension reduction methods
                      ##'
                     +##' In metabolomics, dimension reduction methods are often used for modeling
                     +##' and visualization.
                     +##' [poplin_reduce] is a wrapper for the following set of functions:
                     +##' \describe{
                     +##' \item{\code{\link{poplin_reduce_pca}}:}{
                     +##' principal component analysis (PCA)
                     +##' }
                     +##' \item{\code{\link{poplin_reduce_plsda}}:}{
                     +##' partial least squares-discriminant analysis (PLS-DA)
                     +##' }
                     +##' \item{\code{\link{poplin_reduce_tsne}}:}{
                     +##' t-distributed stochastic neighbor embedding (t-SNE)
                     +##' }
                     +##' }
                     +##' @param x A matrix or \linkS4class{poplin} object.
                     +##' @param method A dimension reduction method. Default is 'pca'.
                     +##' @param poplin_in Name of a data matrix to retrieve.
                     +##' @param poplin_out Name of a data matrix to store.
                     +##' @param y A factor vector for discrete outcome required for PLS-DA. Ignored
                     +##'   otherwise.
                     +##' @param ncomp Output dimensionality.
                     +##' @param ... Arguments passed to a specific dimension reduction method.
                     +##' @return A matrix or \linkS4class{poplin} object with the same number of rows
                     +##'   as \code{ncol(x)} containing the dimension reduction result.
                      ##' @name poplin_reduce
                     +##' @family data reduction methods
                      setMethod(
                        "poplin_reduce",
                        "matrix",
                     -  function(x, method, ...) {
                     -    .poplin_reduce(x, method = method, ...)
                     +  function(x, method = c("pca", "tsne", "plsda"), y, ncomp = 2, ...) {
                     +    .poplin_reduce(x, method = method, y = y, ncomp = ncomp, ...)
+                       }
+                     )
@@ -13,67 +38,154 @@ setMethod(
                      setMethod(
                        "poplin_reduce",
                        "poplin",
                     -  function(x, method, poplin_in, poplin_out, ...) {
                     +  function(x, method = c("pca", "tsne", "plsda"), poplin_in, poplin_out,
                     +           y, ncomp = 2, ...) {
                          m <- .verify_and_extract_input(x, poplin_in)
                     -    poplin_reduced(x, poplin_out) <- .poplin_reduce(m, method = method, ...)
                     +    poplin_reduced(x, poplin_out) <- .poplin_reduce(m, method = method, y = y,
                     +                                                    ncomp = ncomp, ...)
+                         x
+                       }
+                     )
                     -##' @rdname poplin_reduce
                     +##' Principal component analysis (PCA)
                     +##'
                     +##' Apply PCA to a matrix or \linkS4class{poplin} object. For data without
                     +##' missing values, PCA is performed via a singular value decomposition.
                     +##' Otherwise, Bayesian PCA is performed using [pcaMethods::bpca] from the
                     +##' \pkg{pcaMethods} package. Note that Bayesian PCA does not force
                     +##' orthogonality between factor loadings.
                     +##'
                     +##' @references
                     +##' Shigeyuki Oba, Masa-aki Sato, Ichiro Takemasa, Morito Monden, Ken-ichi
                     +##' Matsubara, Shin Ishii, A Bayesian missing value estimation method for gene
                     +##' expression profile data, Bioinformatics, Volume 19, Issue 16, 1 November
                     +##' 2003, Pages 2088–2096, https://doi.org/10.1093/bioinformatics/btg287
                     +##'
                     +##' @param x A matrix or \linkS4class{poplin} object.
                     +##' @param poplin_in Name of a data matrix to retrieve.
                     +##' @param poplin_out Name of a data matrix to store.
                     +##' @param ncomp Output dimensionality.
                     +##' @param center A logical indicating mean-centering prior to PCA.
                     +##' @param scale A logical indicating unit variance scaling prior to PCA.
                     +##' @param ... Additional arguments passed to [pcaMethods::bpca].
                     +##' @return A poplin.pca matrix or \linkS4class{poplin} object with the same
                     +##'   number of rows as \code{ncol(x)} containing the dimension reduction
                     +##'   result.
                     +##' @name poplin_reduce_pca
                     +##' @family data reduction methods
                      setMethod(
                        "poplin_reduce_pca",
                        "matrix",
                     -  function(x, ...) {
                     -    .poplin_impute_pca(x, ...)
                     +  function(x, ncomp = 2, center = TRUE, scale = FALSE, ...) {
                     +    .poplin_impute_pca(x, ncomp = ncomp, center = center, scale = scale, ...)
+                       }
+                     )
                     -##' @rdname poplin_reduce
                     +##' @rdname poplin_reduce_pca
                      setMethod(
                        "poplin_reduce_pca",
                        "poplin",
                     -  function(x, poplin_in, poplin_out, ...) {
                     +  function(x, poplin_in, poplin_out, ncomp = 2, center = 2, scale = FALSE, ...) {
                          .reduced_extract_and_assign(x, .poplin_reduce_pca,
                     -                               poplin_in, poplin_out, ...)
                     +                                poplin_in, poplin_out,
                     +                                ncomp = ncomp, center = center, scale = scale, ...)
+                       }
+                     )
                     -##' @rdname poplin_reduce
                     +##' t-distributed stochastic neighbor embedding (t-SNE)
                     +##'
                     +##' Apply t-SNE to a matrix or \linkS4class{poplin} object. This is an interface
                     +##' to [Rtsne::Rtsne] from the \pkg{Rtsne} package. t-SNE is well-suited for
                     +##' visualizing high-dimensional data by giving each data point a location in a
                     +##' two or three-dimensional map.
                     +##'
                     +##' @references
                     +##'
                     +##' L.J.P. van der Maaten and G.E. Hinton. Visualizing High-Dimensional Data
                     +##' Using t-SNE. Journal of Machine Learning Research 9(Nov):2579-2605, 2008.
                     +##'
                     +##' L.J.P. van der Maaten. Accelerating t-SNE using Tree-Based Algorithms.
                     +##' Journal of Machine Learning Research 15(Oct):3221-3245, 2014.
                     +##'
                     +##' Jesse H. Krijthe (2015). Rtsne: T-Distributed Stochastic Neighbor Embedding
                     +##' using a Barnes-Hut Implementation, URL: https://github.com/jkrijthe/Rtsne
                     +##'
                     +##' @param x A matrix or \linkS4class{poplin} object.
                     +##' @param poplin_in Name of a data matrix to retrieve.
                     +##' @param poplin_out Name of a data matrix to store.
                     +##' @param ncomp Number of components to calculate.
                     +##' @param normalize If \code{TRUE}, the input matrix is mean-centered and
                     +##'   scaled so that the largest absolute value of the centered matrix is equal
                     +##'   to unity. See [Rtsne::normalize_input] for details.
                     +##' @param ... Additional arguments passed to [Rtsne::Rtsne].
                     +##' @return A poplin.tsne matrix or \linkS4class{poplin} object with the same
                     +##'   number of rows as \code{ncol(x)} containing the dimension reduction
                     +##'   result.
                     +##' @name poplin_reduce_tsne
                     +##' @family data reduction methods
                      setMethod(
                        "poplin_reduce_tsne",
                        "matrix",
                     -  function(x, ...) {
                     -    .poplin_impute_tsne(x, ...)
                     +  function(x, ncomp = 2, normalize = TRUE, ...) {
                     +    .poplin_impute_tsne(x, ncomp = ncomp, normalize = normalize, ...)
+                       }
+                     )
                     -##' @rdname poplin_reduce
                     +##' @rdname poplin_reduce_tsne
                      setMethod(
                        "poplin_reduce_tsne",
                        "poplin",
                     -  function(x, poplin_in, poplin_out, ...) {
                     +  function(x, poplin_in, poplin_out, ncomp = 2, normalize = TRUE, ...) {
                          .reduced_extract_and_assign(x, .poplin_reduce_tsne,
                     -                                poplin_in, poplin_out, ...)
                     +                                poplin_in, poplin_out,
                     +                                ncomp = ncomp, normalize = normalize, ...)
+                       }
+                     )
                     -##' @rdname poplin_reduce
                     +##' Partial least squares-discriminant analysis (PLS-DA)
                     +##'
                     +##' Apply PLS-DA to a matrix or \linkS4class{poplin} object. It performs
                     +##' standard PLS for classification using [pls::plsr]. If the \pkg{pls} package
                     +##' is not installed, this function will stop with a note about installing it.
                     +##'
                     +##' @references
                     +##'  Kristian Hovde Liland, Bjørn-Helge Mevik and Ron Wehrens (2021). pls:
                     +##'  Partial Least Squares and Principal Component Regression. R package version
                     +##'  2.8-0. https://CRAN.R-project.org/package=pls
                     +##'
                     +##' @param x A matrix or \linkS4class{poplin} object.
                     +##' @param method A dimension reduction method. Default is 'pca'.
                     +##' @param poplin_in Name of a data matrix to retrieve.
                     +##' @param poplin_out Name of a data matrix to store.
                     +##' @param y A factor vector for discrete outcome.
                     +##' @param ncomp Output dimensionality.
                     +##' @param center A logical indicating mean-centering prior to PLS-DA.
                     +##' @param scale A logical indicating unit variance scaling prior to PLS-DA.
                     +##' @param ... Additional arguments passed to [pls::plsr].
                     +##' @return A poplin.plsda matrix or \linkS4class{poplin} object with the same
                     +##'   number of rows as \code{ncol(x)} containing the dimension reduction
                     +##'   result.
                     +##' @name poplin_reduce_plsda
                     +##' @family data reduction methods
                      setMethod(
                        "poplin_reduce_plsda",
                        "matrix",
                     -  function(x, ...) {
                     -    .poplin_impute_plsda(x, ...)
                     +  function(x, y, ncomp = 2, center = TRUE, scale = FALSE, ...) {
                     +    .poplin_impute_plsda(x, y = y, ncomp = ncomp,
                     +                         center = center, scale = scale, ...)
+                       }
+                     )
                     -##' @rdname poplin_reduce
                     +##' @rdname poplin_reduce_plsda
                      setMethod(
                        "poplin_reduce_plsda",
                        "poplin",
                     -  function(x, poplin_in, poplin_out, ...) {
                     +  function(x, poplin_in, poplin_out, y,
                     +           ncomp = 2, center = TRUE, scale = FALSE, ...) {
                          .reduced_extract_and_assign(x, .poplin_reduce_plsda,
                     -                                poplin_in, poplin_out, ...)
                     +                                poplin_in, poplin_out,
                     +                                y = y, ncomp = ncomp,
                     +                                center = center, scale = scale, ...)
+                       }
+                     )

man/poplin_reduce.Rd

History View file @ ecaba5d

@@ -3,30 +3,60 @@
                      \name{poplin_reduce}
                      \alias{poplin_reduce}
                      \alias{poplin_reduce,poplin-method}
                     -\alias{poplin_reduce_pca,matrix-method}
                     -\alias{poplin_reduce_pca,poplin-method}
                     -\alias{poplin_reduce_tsne,matrix-method}
                     -\alias{poplin_reduce_tsne,poplin-method}
                     -\alias{poplin_reduce_plsda,matrix-method}
                     -\alias{poplin_reduce_plsda,poplin-method}
                      \title{Dimension reduction methods}
                      \usage{
                     -\S4method{poplin_reduce}{matrix}(x, method, ...)
                     +\S4method{poplin_reduce}{matrix}(x, method = c("pca", "tsne", "plsda"), y, ncomp = 2, ...)
                     -\S4method{poplin_reduce}{poplin}(x, method, poplin_in, poplin_out, ...)
                     +\S4method{poplin_reduce}{poplin}(
                     +  x,
                     +  method = c("pca", "tsne", "plsda"),
                     +  poplin_in,
                     +  poplin_out,
                     +  y,
                     +  ncomp = 2,
                     +  ...
                     +)
                     +}
                     +\arguments{
                     +\item{x}{A matrix or \linkS4class{poplin} object.}
                     -\S4method{poplin_reduce_pca}{matrix}(x, ...)
                     +\item{method}{A dimension reduction method. Default is 'pca'.}
                     -\S4method{poplin_reduce_pca}{poplin}(x, poplin_in, poplin_out, ...)
                     +\item{y}{A factor vector for discrete outcome required for PLS-DA. Ignored
                     +otherwise.}
                     -\S4method{poplin_reduce_tsne}{matrix}(x, ...)
                     +\item{ncomp}{Output dimensionality.}
                     -\S4method{poplin_reduce_tsne}{poplin}(x, poplin_in, poplin_out, ...)
                     +\item{...}{Argument passed to a specific dimension reduction method.}
                     -\S4method{poplin_reduce_plsda}{matrix}(x, ...)
                     +\item{poplin_in}{Name of a data matrix to retrieve.}
                     -\S4method{poplin_reduce_plsda}{poplin}(x, poplin_in, poplin_out, ...)
                     +\item{poplin_out}{Name of a data matrix to store.}
                     +}
                     +\value{
                     +A matrix or \linkS4class{poplin} object with the same number of rows
                     +as \code{ncol(x)} containing the dimension reduction result.
+                     }
                      \description{
                     -Dimension reduction methods
                     +In metabolomics, dimension reduction methods are often used for modeling
                     +and visualization.
                     +\link{poplin_reduce} is a wrapper for the following set of functions:
                     +\describe{
                     +\item{\code{\link{poplin_reduce_pca}}:}{
                     +principal component analysis (PCA)
                     +}
                     +\item{\code{\link{poplin_reduce_plsda}}:}{
                     +partial least squares-discriminant analysis (PLS-DA)
                     +}
                     +\item{\code{\link{poplin_reduce_tsne}}:}{
                     +t-distributed stochastic neighbor embedding
                     +}
                     +}
                     +}
                     +\seealso{
                     +Other data reduction methods:
                     +\code{\link{poplin_reduce_pca}()},
                     +\code{\link{poplin_reduce_plsda}()},
                     +\code{\link{poplin_reduce_tsne}()}
+                     }
                     +\concept{data reduction methods}

man/poplin_reduce_pca.Rd

History View file @ ecaba5d

                     new file mode 100644
@@ -0,0 +1,59 @@
                     +% Generated by roxygen2: do not edit by hand
                     +% Please edit documentation in R/reduction-methods.R
                     +\name{poplin_reduce_pca}
                     +\alias{poplin_reduce_pca}
                     +\alias{poplin_reduce_pca,poplin-method}
                     +\title{Principal component analysis (PCA)}
                     +\usage{
                     +\S4method{poplin_reduce_pca}{matrix}(x, ncomp = 2, center = TRUE, scale = FALSE, ...)
+                    +
                     +\S4method{poplin_reduce_pca}{poplin}(
                     +  x,
                     +  poplin_in,
                     +  poplin_out,
                     +  ncomp = 2,
                     +  center = 2,
                     +  scale = FALSE,
                     +  ...
                     +)
                     +}
                     +\arguments{
                     +\item{x}{A matrix or \linkS4class{poplin} object.}
+                    +
                     +\item{ncomp}{Output dimensionality.}
+                    +
                     +\item{center}{A logical indicating mean-centering prior to PCA.}
+                    +
                     +\item{scale}{A logical indicating unit variance scaling prior to PCA.}
+                    +
                     +\item{...}{Additional arguments passed to \link[pcaMethods:bpca]{pcaMethods::bpca}.}
+                    +
                     +\item{poplin_in}{Name of a data matrix to retrieve.}
+                    +
                     +\item{poplin_out}{Name of a data matrix to store.}
                     +}
                     +\value{
                     +A poplin.pca matrix or \linkS4class{poplin} object with the same
                     +number of rows as \code{ncol(x)} containing the dimension reduction
                     +result.
                     +}
                     +\description{
                     +Apply PCA to a matrix or \linkS4class{poplin} object. For the data without
                     +missing values, PCA is performed via a singular value decomposition.
                     +Otherwise, Bayesian PCA is performed using \link[pcaMethods:bpca]{pcaMethods::bpca} from the
                     +\pkg{pcaMethods} package. Note that Bayesian PCA does not force
                     +orthogonality between factor loadings.
                     +}
                     +\references{
                     +Shigeyuki Oba, Masa-aki Sato, Ichiro Takemasa, Morito Monden, Ken-ichi
                     +Matsubara, Shin Ishii, A Bayesian missing value estimation method for gene
                     +expression profile data, Bioinformatics, Volume 19, Issue 16, 1 November
                     +2003, Pages 2088–2096, https://doi.org/10.1093/bioinformatics/btg287
                     +}
                     +\seealso{
                     +Other data reduction methods:
                     +\code{\link{poplin_reduce_plsda}()},
                     +\code{\link{poplin_reduce_tsne}()},
                     +\code{\link{poplin_reduce}()}
                     +}
                     +\concept{data reduction methods}

man/poplin_reduce_plsda.Rd

History View file @ ecaba5d

                     new file mode 100644
@@ -0,0 +1,61 @@
                     +% Generated by roxygen2: do not edit by hand
                     +% Please edit documentation in R/reduction-methods.R
                     +\name{poplin_reduce_plsda}
                     +\alias{poplin_reduce_plsda}
                     +\alias{poplin_reduce_plsda,poplin-method}
                     +\title{Partial least squares-discriminant analysis (PLS-DA)}
                     +\usage{
                     +\S4method{poplin_reduce_plsda}{matrix}(x, y, ncomp = 2, center = TRUE, scale = FALSE, ...)
+                    +
                     +\S4method{poplin_reduce_plsda}{poplin}(
                     +  x,
                     +  poplin_in,
                     +  poplin_out,
                     +  y,
                     +  ncomp = 2,
                     +  center = TRUE,
                     +  scale = FALSE,
                     +  ...
                     +)
                     +}
                     +\arguments{
                     +\item{x}{A matrix or \linkS4class{poplin} object.}
+                    +
                     +\item{y}{A factor vector for discrete outcome.}
+                    +
                     +\item{ncomp}{Output dimensionality.}
+                    +
                     +\item{center}{A logical indicating mean-centering prior to PLS-DA.}
+                    +
                     +\item{scale}{A logical indicating unit variance scaling prior to PLS-DA.}
+                    +
                     +\item{...}{Additional argument passed to \link[pls:mvr]{pls::plsr}.}
+                    +
                     +\item{poplin_in}{Name of a data matrix to retrieve.}
+                    +
                     +\item{poplin_out}{Name of a data matrix to store.}
+                    +
                     +\item{method}{A dimension reduction method. Default is 'pca'.}
                     +}
                     +\value{
                     +A poplin.plsda matrix or \linkS4class{poplin} object with the same
                     +number of rows as \code{ncol(x)} containing the dimension reduction
                     +result.
                     +}
                     +\description{
                     +Apply PLS-DA to a matrix or \linkS4class{poplin} object. It performs
                     +standard PLS for classification using \link[pls:mvr]{pls::plsr}. If the \pkg{pls} package
                     +is not installed, this function will stop with a note about installing it.
                     +}
                     +\references{
                     +Kristian Hovde Liland, Bjørn-Helge Mevik and Ron Wehrens (2021). pls:
                     +Partial Least Squares and Principal Component Regression. R package version
                     +2.8-0. https://CRAN.R-project.org/package=pls
                     +}
                     +\seealso{
                     +Other data reduction methods:
                     +\code{\link{poplin_reduce_pca}()},
                     +\code{\link{poplin_reduce_tsne}()},
                     +\code{\link{poplin_reduce}()}
                     +}
                     +\concept{data reduction methods}

man/poplin_reduce_tsne.Rd

History View file @ ecaba5d

                     new file mode 100644
@@ -0,0 +1,54 @@
                     +% Generated by roxygen2: do not edit by hand
                     +% Please edit documentation in R/reduction-methods.R
                     +\name{poplin_reduce_tsne}
                     +\alias{poplin_reduce_tsne}
                     +\alias{poplin_reduce_tsne,poplin-method}
                     +\title{t-distributed stochastic neighbor embedding (t-SNE)}
                     +\usage{
                     +\S4method{poplin_reduce_tsne}{matrix}(x, ncomp = 2, normalize = TRUE, ...)
+                    +
                     +\S4method{poplin_reduce_tsne}{poplin}(x, poplin_in, poplin_out, ncomp = 2, normalize = TRUE, ...)
                     +}
                     +\arguments{
                     +\item{x}{A matrix or \linkS4class{poplin} object.}
+                    +
                     +\item{ncomp}{Number of components to calculate.}
+                    +
                     +\item{normalize}{If \code{TRUE}, the input matrix is mean-centered and
                     +scaled so that the largest absolute value of the centered matrix is equal
                     +to unity. See \link[Rtsne:normalize_input]{Rtsne::normalize_input} for details.}
+                    +
                     +\item{...}{Additional argument passed to \link[Rtsne:Rtsne]{Rtsne::Rtsne}.}
+                    +
                     +\item{poplin_in}{Name of a data matrix to retrieve.}
+                    +
                     +\item{poplin_out}{Name of a data matrix to store.}
                     +}
                     +\value{
                     +A poplin.tsne matrix or \linkS4class{poplin} object with the same
                     +number of rows as \code{ncol(x)} containing the dimension reduction
                     +result.
                     +}
                     +\description{
                     +Apply t-SNE to a matrix or \linkS4class{poplin} object. This is an interface
                     +to the \link[Rtsne:Rtsne]{Rtsne::Rtsne} from the \pkg{Rtsne} package. t-SNE is well-suited for
                     +visualizing high-dimensional data by giving each data point a location in a
                     +two or three-dimensional map.
                     +}
                     +\references{
                     +L.J.P. van der Maaten and G.E. Hinton. Visualizing High-Dimensional Data
                     +Using t-SNE. Journal of Machine Learning Research 9(Nov):2579-2605, 2008.
+                    +
                     +L.J.P. van der Maaten. Accelerating t-SNE using Tree-Based Algorithms.
                     +Journal of Machine Learning Research 15(Oct):3221-3245, 2014.
+                    +
                     +Jesse H. Krijthe (2015). Rtsne: T-Distributed Stochastic Neighbor Embedding
                     +using a Barnes-Hut Implementation, URL: https://github.com/jkrijthe/Rtsne
                     +}
                     +\seealso{
                     +Other data reduction methods:
                     +\code{\link{poplin_reduce_pca}()},
                     +\code{\link{poplin_reduce_plsda}()},
                     +\code{\link{poplin_reduce}()}
                     +}
                     +\concept{data reduction methods}