Bioconductor Code: qmtools

Browse code

Added manual for poplin_impute.

Jaehyun Joo authored on 29/11/2021 05:59:07
Showing 12 changed files

NAMESPACE index 6f819ab..940bd66 100644
R/AllGenerics.R index be2db66..3b8f71b 100644
R/imputation-functions.R index d871e12..3fe299b 100644
R/imputation-methods.R index 371fc92..595ecc5 100644
R/normalization-functions.R index 2af2a22..da0a81a 100644
R/normalization-methods.R index c2477a6..a999298 100644
man/poplin_impute.Rd index 8392947..fb898da 100644
man/poplin_impute_knn.Rd index 0000000..cd25fe8
man/poplin_impute_pca.Rd index 0000000..d099d45
man/poplin_impute_randomforest.Rd index 0000000..ede6a9f
man/poplin_impute_simple.Rd index 0000000..538674a
man/poplin_normalize_pqn.Rd index c8dc607..950c8e5 100644

History View file @ 492d166

@@ -64,6 +64,7 @@ export(poplin_impute_mean)
                      export(poplin_impute_median)
                      export(poplin_impute_pca)
                      export(poplin_impute_randomforest)
                     +export(poplin_impute_simple)
                      export(poplin_naplot)
                      export(poplin_normalize)
                      export(poplin_normalize_auto)

R/AllGenerics.R

History View file @ 492d166

@@ -231,6 +231,12 @@ setGeneric(
                        function(x, ...) standardGeneric("poplin_impute_mean")
+                     )
                     +##' @export
                     +setGeneric(
                     +  "poplin_impute_simple",
                     +  function(x, ...) standardGeneric("poplin_impute_simple")
                     +)
+                    +
                      ##' @export
                      setGeneric(
                        "poplin_impute_pca",

R/imputation-functions.R

History View file @ 492d166

@@ -1,19 +1,64 @@
                      .poplin_impute <- function(x,
                     -                           method = c("knn", "halfmin", "median",
                     -                                      "mean", "pca", "randomforest"),
                     +                           method = c("knn", "pca", "randomforest", "simple"),
                                                 ...) {
                        method <- match.arg(method)
                        switch(
                          method,
                          knn = .poplin_impute_knn(x, ...),
                     -    halfmin = .poplin_impute_halfmin(x, ...),
                     -    median = .poplin_impute_median(x, ...),
                     -    mean = .poplin_impute_mean(x, ...),
                     -    pca = .poplin_impute_pca(x, ...),
                          randomforest = .poplin_impute_randomforest(x, ...),
                     +    pca = .poplin_impute_pca(x, ...),
                     +    ## halfmin = .poplin_impute_halfmin(x, ...),
                     +    ## median = .poplin_impute_median(x, ...),
                     +    ## mean = .poplin_impute_mean(x, ...),
                     +    simple = .poplin_impute_simple(x, ...)
+                         )
+                     }
                     +## Knn imputation
                     +.poplin_impute_knn <- function(x, by = c("feature", "sample"), ...) {
                     +  if (!requireNamespace("VIM", quietly = TRUE)) {
                     +    stop("Package 'VIM' is required. Please install and try again.")
                     +  }
                     +  by <- match.arg(by)
                     +  if (by == "feature") {
                     +    out <- VIM::kNN(x, ...)[, 1:ncol(x)]
                     +    ## VIM package internally converts x as data.table, which drops rownames
                     +    rownames(out) <- rownames(x)
                     +  } else {
                     +    out <- t(VIM::kNN(t(x), ...))[1:nrow(x), ]
                     +    colnames(out) <- colnames(x)
                     +  }
                     +  as.matrix(out)
                     +}
+                    +
                     +## Random forest imputation
                     +.poplin_impute_randomforest <- function(x, ...) {
                     +  if (!requireNamespace("missForest", quietly = TRUE)) {
                     +    stop("Package 'missForest' is required. Please install and try again.")
                     +  }
                     +  t(missForest::missForest(t(x), ...)$ximp)
                     +}
+                    +
                     +## PCA-based imputation (Bayesian PCA by default)
                     +.poplin_impute_pca <- function(x, type = c("bpca", "ppca", "nipals", "svdImpute"), ...) {
                     +  if (!requireNamespace("pcaMethods", quietly = TRUE)) {
                     +    stop("Package 'pcaMethods' is required. Please install and try again.")
                     +  }
                     +  type <- match.arg(type)
                     +  t(pcaMethods::pca(t(x), method = type, ...)@completeObs)
                     +}
+                    +
                     +## Simple univariate imputation
                     +.poplin_impute_simple <- function(x, type = c("halfmin", "median", "mean")) {
                     +  type <- match.arg(type)
                     +  switch(
                     +    type,
                     +    halfmin = .poplin_impute_halfmin(x),
                     +    median = .poplin_impute_median(x),
                     +    mean = .poplin_impute_mean(x)
                     +  )
                     +}
+                    +
                      .poplin_impute_halfmin <- function(x) {
                        out <- apply(x, 1, function(x) {
                          if (anyNA(x)) {
@@ -46,33 +91,3 @@
                        })
                        t(out)
+                     }
+                    -
                     -.poplin_impute_knn <- function(x, by = c("feature", "sample"), ...) {
                     -  if (!requireNamespace("VIM", quietly = TRUE)) {
                     -    stop("Package 'VIM' is required. Please install and try again.")
                     -  }
                     -  by <- match.arg(by)
                     -  if (by == "feature") {
                     -    out <- VIM::kNN(x, ...)[, 1:ncol(x)]
                     -    ## VIM package internally converts x as data.table, which drops rownames
                     -    rownames(out) <- rownames(x)
                     -  } else {
                     -    out <- t(VIM::kNN(t(x), ...))[1:nrow(x), ]
                     -    colnames(out) <- colnames(x)
                     -  }
                     -  as.matrix(out)
                     -}
+                    -
                     -.poplin_impute_pca <- function(x, ...) {
                     -  if (!requireNamespace("pcaMethods", quietly = TRUE)) {
                     -    stop("Package 'pcaMethods' is required. Please install and try again.")
                     -  }
                     -  t(pcaMethods::pca(t(x), method = "bpca", ...)@completeObs)
                     -}
+                    -
                     -.poplin_impute_randomforest <- function(x, ...) {
                     -  if (!requireNamespace("missForest", quietly = TRUE)) {
                     -    stop("Package 'missForest' is required. Please install and try again.")
                     -  }
                     -  t(missForest::missForest(t(x), ...)$ximp)
                     -}

R/imputation-methods.R

History View file @ 492d166

@@ -2,12 +2,34 @@
                      ##'
                      ##' Missing values are frequently found in metabolomics data. The \pkg{poplin}
                      ##' package provides a few options to handle them.
                     -##'
                     +##' [poplin_impute] is a wrapper for the following set of functions:
                     +##' \describe{
                     +##' \item{\code{\link{poplin_impute_knn}}:}{
                     +##' k-nearest neighbor (KNN) imputation
                     +##' }
                     +##' \item{\code{\link{poplin_impute_pca}}:}{
                     +##' principal component analysis (PCA) imputation
                     +##' }
                     +##' \item{\code{\link{poplin_impute_randomforest}}:}{
                     +##' random forest imputation
                     +##' }
                     +##' \item{\code{\link{poplin_impute_simple}}:}{
                     +##' simple univariate imputation (e.g., half-minimum, mean, median)
                     +##' }
                     +##' }
                     +##' @param x A matrix or \linkS4class{poplin} object.
                     +##' @param method An imputation method. Default is 'knn'.
                     +##' @param poplin_in Name of a data matrix to retrieve.
                     +##' @param poplin_out Name of a data matrix to store.
                     +##' @param ... Argument passed to a specific imputation method.
                     +##' @return A matrix or \linkS4class{poplin} object of the same dimension as
                     +##'   \code{x} containing the imputed intensities.
                      ##' @name poplin_impute
                     +##' @family imputation methods
                      setMethod(
                        "poplin_impute",
                        "matrix",
                     -  function(x, method, ...) {
                     +  function(x, method = c("knn", "pca", "randomforest", "simple"), ...) {
                          .poplin_impute(x, method = method, ...)
+                       }
+                     )
@@ -16,123 +38,233 @@ setMethod(
                      setMethod(
                        "poplin_impute",
                        "poplin",
                     -  function(x, method, poplin_in, poplin_out, ...) {
                     +  function(x, method = c("knn", "pca", "randomforest", "simple"),
                     +           poplin_in, poplin_out, ...) {
                          m <- .verify_and_extract_input(x, poplin_in)
                          poplin_data(x, poplin_out) <- .poplin_impute(m, method = method, ...)
+                         x
+                       }
+                     )
                     -##' @rdname poplin_impute
                     +##' K-nearest neighbor (KNN) imputation
                     +##'
                     +##' Apply k-nearest neighbor (KNN) imputation to a matrix or
                     +##' \linkS4class{poplin} object. This is an interface to the [VIM::kNN] from the
                     +##' \pkg{VIM} package. Since it is based on Gower's distance, standardization of
                     +##' input data prior to KNN imputation would not affect the result.
                     +##'
                     +##' @references
                     +##' Alexander Kowarik, Matthias Templ (2016). Imputation with the R Package VIM.
                     +##' Journal of Statistical Software, 74(7), 1-16. doi:10.18637/jss.v074.i07
                     +##'
                     +##' Gower, J. C. (1971). A General Coefficient of Similarity and Some of Its
                     +##' Properties. Biometrics, 27(4), 857–871. https://doi.org/10.2307/2528823
                     +##'
                     +##' @param x A matrix or \linkS4class{poplin} object.
                     +##' @param poplin_in Name of a data matrix to retrieve.
                     +##' @param poplin_out Name of a data matrix to store.
                     +##' @param by Imputation by k-nearest features or by k-nearest samples.
                     +##' @param ... Additional argument passed to [VIM::kNN].
                     +##' @return A matrix or \linkS4class{poplin} object of the same dimension as
                     +##'   \code{x} containing the imputed intensities.
                     +##' @name poplin_impute_knn
                     +##' @family imputation methods
                      setMethod(
                        "poplin_impute_knn",
                        "matrix",
                     -  function(x, ...) {
                     -    .poplin_impute_knn(x, ...)
                     +  function(x, by = c("feature", "sample"),  ...) {
                     +    .poplin_impute_knn(x, by = by, ...)
+                       }
+                     )
                     -##' @rdname poplin_impute
                     +##' @rdname poplin_impute_knn
                      setMethod(
                        "poplin_impute_knn",
                        "poplin",
                     -  function(x, poplin_in, poplin_out, ...) {
                     +  function(x, poplin_in, poplin_out, by = c("feature", "sample"), ...) {
                          .poplin_extract_and_assign(x, .poplin_impute_knn,
                     -                               poplin_in, poplin_out, ...)
                     +                               poplin_in, poplin_out,
                     +                               by = by, ...)
+                       }
+                     )
                     -##' @rdname poplin_impute
                     +##' Random forest imputation
                     +##'
                     +##' Apply random forest imputation to a matrix or \linkS4class{poplin} object.
                     +##' This is an interface to the [missForest::missForest] from the
                     +##' \pkg{missForest} package. Since random forest is a tree-based method, it can
                     +##' be performed with raw intensities - invariant to monotonic transformations
                     +##' (However, statistical analysis could be affected because, for example,
                     +##' log(mean(predicted values)) != mean(log(predicted values))).
                     +##'
                     +##' @references
                     +##'
                     +##' Daniel J. Stekhoven (2013). missForest: Nonparametric Missing Value
                     +##' Imputation using Random Forest. R package version 1.4.
                     +##'
                     +##' Stekhoven D. J., & Buehlmann, P. (2012). MissForest - non-parametric missing
                     +##' value imputation for mixed-type data. Bioinformatics, 28(1), 112-118.
                     +##'
                     +##' @param x A matrix or \linkS4class{poplin} object.
                     +##' @param poplin_in Name of a data matrix to retrieve.
                     +##' @param poplin_out Name of a data matrix to store.
                     +##' @param ... Additional argument passed to [missForest::missForest].
                     +##' @return A matrix or \linkS4class{poplin} object of the same dimension as
                     +##'   \code{x} containing the imputed intensities.
                     +##' @name poplin_impute_randomforest
                     +##' @family imputation methods
                      setMethod(
                     -  "poplin_impute_halfmin",
                     +  "poplin_impute_randomforest",
                        "matrix",
                        function(x, ...) {
                     -    .poplin_impute_halfmin(x, ...)
                     +    .poplin_impute_randomforest(x, ...)
+                       }
+                     )
                     -##' @rdname poplin_impute
                     +##' @rdname poplin_impute_randomforest
                      setMethod(
                     -  "poplin_impute_halfmin",
                     +  "poplin_impute_randomforest",
                        "poplin",
                        function(x, poplin_in, poplin_out, ...) {
                     -    .poplin_extract_and_assign(x, .poplin_impute_halfmin,
                     +    .poplin_extract_and_assign(x, .poplin_impute_randomforest,
                                                     poplin_in, poplin_out, ...)
+                       }
+                     )
                     -##' @rdname poplin_impute
                     +##' Principal component analysis (PCA) imputation
                     +##'
                     +##' Apply PCA imputation to a matrix or \linkS4class{poplin} object. This is an
                     +##' interface to the [pcaMethods::pca] from the \pkg{pcaMethods} package. Here,
                     +##' features are interpreted as variables and samples as observations.
                     +##' Pre-processing of input (centering, scaling) may be necessary. See the
                     +##' documentation of [pcaMethods::pca] and [pcaMethods::prep]. Note that the PCA
                     +##' imputation could yield negative feature values that need to be
                     +##' post-processed.
                     +##'
                     +##' @references
                     +##' Stacklies, W., Redestig, H., Scholz, M., Walther, D. and Selbig, J.
                     +##' pcaMethods -- a Bioconductor package providing PCA methods for incomplete
                     +##' data. Bioinformatics, 2007, 23, 1164-1167
                     +##'
                     +##' @param x A matrix or \linkS4class{poplin} object.
                     +##' @param poplin_in Name of a data matrix to retrieve.
                     +##' @param poplin_out Name of a data matrix to store.
                     +##' @param type A method for performing PCA.
                     +##' @param ... Additional argument passed to [pcaMethods::pca].
                     +##' @return A matrix or \linkS4class{poplin} object of the same dimension as
                     +##'   \code{x} containing the imputed intensities.
                     +##' @name poplin_impute_pca
                     +##' @family imputation methods
                      setMethod(
                     -  "poplin_impute_median",
                     +  "poplin_impute_pca",
                        "matrix",
                     -  function(x, ...) {
                     -    .poplin_impute_median(x, ...)
                     +  function(x, type = c("bpca", "ppca", "nipals", "svdImpute"), ...) {
                     +    .poplin_impute_pca(x, type = type, ...)
+                       }
+                     )
                     -##' @rdname poplin_impute
                     +##' @rdname poplin_impute_pca
                      setMethod(
                     -  "poplin_impute_median",
                     +  "poplin_impute_pca",
                        "poplin",
                     -  function(x, poplin_in, poplin_out, ...) {
                     -    .poplin_extract_and_assign(x, .poplin_impute_median,
                     -                               poplin_in, poplin_out, ...)
                     +  function(x, poplin_in, poplin_out,
                     +           type = c("bpca", "ppca", "nipals", "svdImpute"), ...) {
                     +    .poplin_extract_and_assign(x, .poplin_impute_pca,
                     +                               poplin_in, poplin_out,
                     +                               type = type, ...)
+                       }
+                     )
                     -##' @rdname poplin_impute
                     +##' Simple univariate imputation
                     +##'
                     +##' Apply univariate imputation to a matrix or \linkS4class{poplin} object. The
                     +##' supported methods include
                     +##' \itemize{
                     +##' \item Half-minimum imputation: for each feature, missing values are replaced
                     +##' with half the observed minimum.
                     +##' \item Median imputation: for each feature, missing values are replaced with
                     +##' the median of non-missing values.
                     +##' \item Mean imputation: for each feature, missing values are replaced with
                     +##' the mean of non-missing values.
                     +##' }
                     +##' @references
                     +##' Wei, R., Wang, J., Su, M. et al. Missing Value Imputation Approach for Mass
                     +##' Spectrometry-based Metabolomics Data. Sci Rep 8, 663 (2018).
                     +##' https://doi.org/10.1038/s41598-017-19120-0
                     +##'
                     +##' @param x A matrix or \linkS4class{poplin} object.
                     +##' @param poplin_in Name of a data matrix to retrieve.
                     +##' @param poplin_out Name of a data matrix to store.
                     +##' @param type A method for doing univariate imputation.
                     +##' @return A matrix or \linkS4class{poplin} object of the same dimension as
                     +##'   \code{x} containing the imputed intensities.
                     +##' @name poplin_impute_simple
                     +##' @family imputation methods
                      setMethod(
                     -  "poplin_impute_mean",
                     +  "poplin_impute_simple",
                        "matrix",
                     -  function(x, ...) {
                     -    .poplin_impute_mean(x, ...)
                     +  function(x, type = c("halfmin", "median", "mean")) {
                     +    .poplin_impute_simple(x, type = type)
+                       }
+                     )
                     -##' @rdname poplin_impute
                     +##' @rdname poplin_impute_simple
                      setMethod(
                     -  "poplin_impute_mean",
                     +  "poplin_impute_simple",
                        "poplin",
                     -  function(x, poplin_in, poplin_out, ...) {
                     -    .poplin_extract_and_assign(x, .poplin_impute_mean,
                     -                               poplin_in, poplin_out, ...)
                     +  function(x, poplin_in, poplin_out, type = c("halfmin", "median", "mean")) {
                     +    .poplin_extract_and_assign(x, .poplin_impute_simple,
                     +                               poplin_in, poplin_out, type = type)
+                       }
+                     )
                     -##' @rdname poplin_impute
                      setMethod(
                     -  "poplin_impute_pca",
                     +  "poplin_impute_halfmin",
                     +  "matrix",
                     +  function(x) {
                     +    .poplin_impute_halfmin(x)
                     +  }
                     +)
+                    +
                     +setMethod(
                     +  "poplin_impute_halfmin",
                     +  "poplin",
                     +  function(x, poplin_in, poplin_out) {
                     +    .poplin_extract_and_assign(x, .poplin_impute_halfmin,
                     +                               poplin_in, poplin_out)
                     +  }
                     +)
+                    +
                     +setMethod(
                     +  "poplin_impute_median",
                        "matrix",
                        function(x, ...) {
                     -    .poplin_impute_pca(x, ...)
                     +    .poplin_impute_median(x, ...)
+                       }
+                     )
                     -##' @rdname poplin_impute
                      setMethod(
                     -  "poplin_impute_pca",
                     +  "poplin_impute_median",
                        "poplin",
                        function(x, poplin_in, poplin_out, ...) {
                     -    .poplin_extract_and_assign(x, .poplin_impute_pca,
                     +    .poplin_extract_and_assign(x, .poplin_impute_median,
                                                     poplin_in, poplin_out, ...)
+                       }
+                     )
                     -##' @rdname poplin_impute
                      setMethod(
                     -  "poplin_impute_randomforest",
                     +  "poplin_impute_mean",
                        "matrix",
                        function(x, ...) {
                     -    .poplin_impute_randomforest(x, ...)
                     +    .poplin_impute_mean(x, ...)
+                       }
+                     )
                     -##' @rdname poplin_impute
                      setMethod(
                     -  "poplin_impute_randomforest",
                     +  "poplin_impute_mean",
                        "poplin",
                        function(x, poplin_in, poplin_out, ...) {
                     -    .poplin_extract_and_assign(x, .poplin_impute_randomforest,
                     +    .poplin_extract_and_assign(x, .poplin_impute_mean,
                                                     poplin_in, poplin_out, ...)
+                       }
+                     )

R/normalization-functions.R

History View file @ 492d166

@@ -394,7 +394,7 @@
     range = .poplin_normalize_range(x),
     pareto = .poplin_normalize_pareto(x),
     vast = .poplin_normalize_vast(x),
-    level = .poplin_normalize_level(x),
+    level = .poplin_normalize_level(x)
   )
 }
 

R/normalization-methods.R

History View file @ 492d166

@@ -63,13 +63,13 @@ setMethod(
                      ##' Probabilistic quotient normalization (PQN)
                      ##'
                     -##' Apply probabilistic quotient normalization to a matrix or
                     +##' Apply probabilistic quotient normalization (PQN) to a matrix or
                      ##' \linkS4class{poplin} object. For the calculation of quotients, a reference
                      ##' spectrum needs to be obtained from a mean or median spectrum based on all
                      ##' spectra of the study or a subset of the study. Feature intensities are
                      ##' normalized by the median of quotients. See Dieterle et al. (2006) for
                      ##' details.
                     -##'
                     +##'
                      ##' @param x A matrix or \linkS4class{poplin} object.
                      ##' @param poplin_in Name of a data matrix to retrieve.
                      ##' @param poplin_out Name of a data matrix to store.
@@ -116,7 +116,7 @@ setMethod(
                      ##' Apply sum normalization to a matrix or \linkS4class{poplin} object. For each
                      ##' sample, feature intensities are divided by its Total Ion Current (TIC),
                      ##' i.e., every feature is divided by the sum of all intensity values.
                     -##'
                     +##'
                      ##' @param x A matrix or \linkS4class{poplin} object.
                      ##' @param poplin_in Name of a data matrix to retrieve.
                      ##' @param poplin_out Name of a data matrix to store.
@@ -153,7 +153,7 @@ setMethod(
                      ##' Apply mean normalization to a matrix or \linkS4class{poplin} object. For
                      ##' each sample, feature intensities are divided by its mean. The mean of
                      ##' intensity values for individual samples will be one as a result.
                     -##'
                     +##'
                      ##' @param x A matrix or \linkS4class{poplin} object.
                      ##' @param poplin_in Name of a data matrix to retrieve.
                      ##' @param poplin_out Name of a data matrix to store.
@@ -190,7 +190,7 @@ setMethod(
                      ##' Apply median normalization to a matrix or \linkS4class{poplin} object. For
                      ##' each sample, feature intensities are divided by its median. The median of
                      ##' intensity values for individual samples will be one as a result.
                     -##'
                     +##'
                      ##' @param x A matrix or \linkS4class{poplin} object.
                      ##' @param poplin_in Name of a data matrix to retrieve.
                      ##' @param poplin_out Name of a data matrix to store.
@@ -228,7 +228,7 @@ setMethod(
                      ##' \linkS4class{poplin} object. For each sample, feature intensities are scaled
                      ##' by its MAD. The MAD of intensity values for individual samples will be one
                      ##' as a result.
                     -##'
                     +##'
                      ##' @param x A matrix or \linkS4class{poplin} object.
                      ##' @param poplin_in Name of a data matrix to retrieve.
                      ##' @param poplin_out Name of a data matrix to store.
@@ -347,7 +347,7 @@ setMethod(
                      ##' from the \pkg{vsn} package (see [vsn::vsn2] for help). The vsn produces
                      ##' normalized intensities based on a glog (generalized logarithm) scale to base
                      ##' 2. See Huber et al. (2002) for details.
                     -##'
                     +##'
                      ##' @references
                      ##' Huber W, von Heydebreck A, Sültmann H, Poustka A, Vingron M. Variance
                      ##' stabilization applied to microarray data calibration and to the
@@ -384,7 +384,7 @@ setMethod(
+                     )
                      ##' Feature-based scaling
                     -##'
                     +##'
                      ##' Apply feature-based scaling to a matrix or \linkS4class{poplin} object. The
                      ##' supported methods include
                      ##' \itemize{

man/poplin_impute.Rd

History View file @ 492d166

@@ -3,49 +3,57 @@
                      \name{poplin_impute}
                      \alias{poplin_impute}
                      \alias{poplin_impute,poplin-method}
                     -\alias{poplin_impute_knn,matrix-method}
                     -\alias{poplin_impute_knn,poplin-method}
                     -\alias{poplin_impute_halfmin,matrix-method}
                     -\alias{poplin_impute_halfmin,poplin-method}
                     -\alias{poplin_impute_median,matrix-method}
                     -\alias{poplin_impute_median,poplin-method}
                     -\alias{poplin_impute_mean,matrix-method}
                     -\alias{poplin_impute_mean,poplin-method}
                     -\alias{poplin_impute_pca,matrix-method}
                     -\alias{poplin_impute_pca,poplin-method}
                     -\alias{poplin_impute_randomforest,matrix-method}
                     -\alias{poplin_impute_randomforest,poplin-method}
                      \title{Imputation methods}
                      \usage{
                     -\S4method{poplin_impute}{matrix}(x, method, ...)
+                    -
                     -\S4method{poplin_impute}{poplin}(x, method, poplin_in, poplin_out, ...)
+                    -
                     -\S4method{poplin_impute_knn}{matrix}(x, ...)
+                    -
                     -\S4method{poplin_impute_knn}{poplin}(x, poplin_in, poplin_out, ...)
+                    -
                     -\S4method{poplin_impute_halfmin}{matrix}(x, ...)
+                    -
                     -\S4method{poplin_impute_halfmin}{poplin}(x, poplin_in, poplin_out, ...)
+                    -
                     -\S4method{poplin_impute_median}{matrix}(x, ...)
+                    -
                     -\S4method{poplin_impute_median}{poplin}(x, poplin_in, poplin_out, ...)
+                    -
                     -\S4method{poplin_impute_mean}{matrix}(x, ...)
+                    -
                     -\S4method{poplin_impute_mean}{poplin}(x, poplin_in, poplin_out, ...)
                     +\S4method{poplin_impute}{matrix}(x, method = c("knn", "pca", "randomforest", "simple"), ...)
+                    +
                     +\S4method{poplin_impute}{poplin}(
                     +  x,
                     +  method = c("knn", "pca", "randomforest", "simple"),
                     +  poplin_in,
                     +  poplin_out,
                     +  ...
                     +)
                     +}
                     +\arguments{
                     +\item{x}{A matrix or \linkS4class{poplin} object.}
                     -\S4method{poplin_impute_pca}{matrix}(x, ...)
                     +\item{method}{An imputation method. Default is 'knn'.}
                     -\S4method{poplin_impute_pca}{poplin}(x, poplin_in, poplin_out, ...)
                     +\item{...}{Argument passed to a specific imputation method.}
                     -\S4method{poplin_impute_randomforest}{matrix}(x, ...)
                     +\item{poplin_in}{Name of a data matrix to retrieve.}
                     -\S4method{poplin_impute_randomforest}{poplin}(x, poplin_in, poplin_out, ...)
                     +\item{poplin_out}{Name of a data matrix to store.}
                     +}
                     +\value{
                     +A matrix or \linkS4class{poplin} object of the same dimension as
                     +\code{x} containing the imputed intensities.
+                     }
                      \description{
                      Missing values are frequently found in metabolomics data. The \pkg{poplin}
                      package provides a few options to handle them.
                     +\link{poplin_impute} is a wrapper for the following set of functions:
                     +\describe{
                     +\item{\code{\link{poplin_impute_knn}}:}{
                     +k-nearest neighbor (KNN) imputation
                     +}
                     +\item{\code{\link{poplin_impute_pca}}:}{
                     +principal component analysis (PCA) imputation
                     +}
                     +\item{\code{\link{poplin_impute_randomforest}}:}{
                     +random forest imputation
                     +}
                     +\item{\code{\link{poplin_impute_simple}}:}{
                     +simple univariate imputation (e.g., half-minimum, mean, median)
                     +}
                     +}
                     +}
                     +\seealso{
                     +Other imputation methods:
                     +\code{\link{poplin_impute_knn}()},
                     +\code{\link{poplin_impute_pca}()},
                     +\code{\link{poplin_impute_randomforest}()},
                     +\code{\link{poplin_impute_simple}()}
+                     }
                     +\concept{imputation methods}

man/poplin_impute_knn.Rd

History View file @ 492d166

                     new file mode 100644
@@ -0,0 +1,47 @@
                     +% Generated by roxygen2: do not edit by hand
                     +% Please edit documentation in R/imputation-methods.R
                     +\name{poplin_impute_knn}
                     +\alias{poplin_impute_knn}
                     +\alias{poplin_impute_knn,poplin-method}
                     +\title{K-nearest neighbor (KNN) imputation}
                     +\usage{
                     +\S4method{poplin_impute_knn}{matrix}(x, by = c("feature", "sample"), ...)
+                    +
                     +\S4method{poplin_impute_knn}{poplin}(x, poplin_in, poplin_out, by = c("feature", "sample"), ...)
                     +}
                     +\arguments{
                     +\item{x}{A matrix or \linkS4class{poplin} object.}
+                    +
                     +\item{by}{Imputation by k-nearest features or by k-nearest samples.}
+                    +
                     +\item{...}{Additional arguments passed to \link[VIM:kNN]{VIM::kNN}.}
+                    +
                     +\item{poplin_in}{Name of a data matrix to retrieve.}
+                    +
                     +\item{poplin_out}{Name of a data matrix to store.}
                     +}
                     +\value{
                     +A matrix or \linkS4class{poplin} object of the same dimension as
                     +\code{x} containing the imputed intensities.
                     +}
                     +\description{
                     +Apply k-nearest neighbor (KNN) imputation to a matrix or
                     +\linkS4class{poplin} object. This is an interface to the \link[VIM:kNN]{VIM::kNN} from the
                     +\pkg{VIM} package. Since it is based on Gower's distance, standardization of
                     +input data prior to KNN imputation would not affect the result.
                     +}
                     +\references{
                     +Alexander Kowarik, Matthias Templ (2016). Imputation with the R Package VIM.
                     +Journal of Statistical Software, 74(7), 1-16. doi:10.18637/jss.v074.i07
+                    +
                     +Gower, J. C. (1971). A General Coefficient of Similarity and Some of Its
                     +Properties. Biometrics, 27(4), 857–871. https://doi.org/10.2307/2528823
                     +}
                     +\seealso{
                     +Other imputation methods:
                     +\code{\link{poplin_impute_pca}()},
                     +\code{\link{poplin_impute_randomforest}()},
                     +\code{\link{poplin_impute_simple}()},
                     +\code{\link{poplin_impute}()}
                     +}
                     +\concept{imputation methods}

man/poplin_impute_pca.Rd

History View file @ 492d166

                     new file mode 100644
@@ -0,0 +1,54 @@
                     +% Generated by roxygen2: do not edit by hand
                     +% Please edit documentation in R/imputation-methods.R
                     +\name{poplin_impute_pca}
                     +\alias{poplin_impute_pca}
                     +\alias{poplin_impute_pca,poplin-method}
                     +\title{Principal component analysis (PCA) imputation}
                     +\usage{
                     +\S4method{poplin_impute_pca}{matrix}(x, type = c("bpca", "ppca", "nipals", "svdImpute"), ...)
+                    +
                     +\S4method{poplin_impute_pca}{poplin}(
                     +  x,
                     +  poplin_in,
                     +  poplin_out,
                     +  type = c("bpca", "ppca", "nipals", "svdImpute"),
                     +  ...
                     +)
                     +}
                     +\arguments{
                     +\item{x}{A matrix or \linkS4class{poplin} object.}
+                    +
                     +\item{type}{A method for performing PCA.}
+                    +
                     +\item{...}{Additional arguments passed to \link[pcaMethods:pca]{pcaMethods::pca}.}
+                    +
                     +\item{poplin_in}{Name of a data matrix to retrieve.}
+                    +
                     +\item{poplin_out}{Name of a data matrix to store.}
                     +}
                     +\value{
                     +A matrix or \linkS4class{poplin} object of the same dimension as
                     +\code{x} containing the imputed intensities.
                     +}
                     +\description{
                     +Apply PCA imputation to a matrix or \linkS4class{poplin} object. This is an
                     +interface to the \link[pcaMethods:pca]{pcaMethods::pca} from the \pkg{pcaMethods} package. Here,
                     +features are interpreted as variables and samples as observations.
                     +Pre-processing of input (centering, scaling) may be necessary. See the
                     +documentation of \link[pcaMethods:pca]{pcaMethods::pca} and \link[pcaMethods:prep]{pcaMethods::prep}. Note that the PCA
                     +imputation could yield negative feature values that need to be
                     +post-processed.
                     +}
                     +\references{
                     +Stacklies, W., Redestig, H., Scholz, M., Walther, D. and Selbig, J.
                     +pcaMethods -- a Bioconductor package providing PCA methods for incomplete
                     +data. Bioinformatics, 2007, 23, 1164-1167
                     +}
                     +\seealso{
                     +Other imputation methods:
                     +\code{\link{poplin_impute_knn}()},
                     +\code{\link{poplin_impute_randomforest}()},
                     +\code{\link{poplin_impute_simple}()},
                     +\code{\link{poplin_impute}()}
                     +}
                     +\concept{imputation methods}

man/poplin_impute_randomforest.Rd

History View file @ 492d166

                     new file mode 100644
@@ -0,0 +1,47 @@
                     +% Generated by roxygen2: do not edit by hand
                     +% Please edit documentation in R/imputation-methods.R
                     +\name{poplin_impute_randomforest}
                     +\alias{poplin_impute_randomforest}
                     +\alias{poplin_impute_randomforest,poplin-method}
                     +\title{Random forest imputation}
                     +\usage{
                     +\S4method{poplin_impute_randomforest}{matrix}(x, ...)
+                    +
                     +\S4method{poplin_impute_randomforest}{poplin}(x, poplin_in, poplin_out, ...)
                     +}
                     +\arguments{
                     +\item{x}{A matrix or \linkS4class{poplin} object.}
+                    +
                     +\item{...}{Additional arguments passed to \link[missForest:missForest]{missForest::missForest}.}
+                    +
                     +\item{poplin_in}{Name of a data matrix to retrieve.}
+                    +
                     +\item{poplin_out}{Name of a data matrix to store.}
                     +}
                     +\value{
                     +A matrix or \linkS4class{poplin} object of the same dimension as
                     +\code{x} containing the imputed intensities.
                     +}
                     +\description{
                     +Apply random forest imputation to a matrix or \linkS4class{poplin} object.
                     +This is an interface to the \link[missForest:missForest]{missForest::missForest} from the
                     +\pkg{missForest} package. Since random forest is a tree-based method, it can
                     +be performed with raw intensities - invariant to monotonic transformations
                     +(However, statistical analysis could be affected because, for example,
                     +log(mean(predicted values)) != mean(log(predicted values))).
                     +}
                     +\references{
                     +Daniel J. Stekhoven (2013). missForest: Nonparametric Missing Value
                     +Imputation using Random Forest. R package version 1.4.
+                    +
                     +Stekhoven D. J., & Buehlmann, P. (2012). MissForest - non-parametric missing
                     +value imputation for mixed-type data. Bioinformatics, 28(1), 112-118.
                     +}
                     +\seealso{
                     +Other imputation methods:
                     +\code{\link{poplin_impute_knn}()},
                     +\code{\link{poplin_impute_pca}()},
                     +\code{\link{poplin_impute_simple}()},
                     +\code{\link{poplin_impute}()}
                     +}
                     +\concept{imputation methods}

man/poplin_impute_simple.Rd

History View file @ 492d166

                     new file mode 100644
@@ -0,0 +1,54 @@
                     +% Generated by roxygen2: do not edit by hand
                     +% Please edit documentation in R/imputation-methods.R
                     +\name{poplin_impute_simple}
                     +\alias{poplin_impute_simple}
                     +\alias{poplin_impute_simple,poplin-method}
                     +\title{Simple univariate imputation}
                     +\usage{
                     +\S4method{poplin_impute_simple}{matrix}(x, type = c("halfmin", "median", "mean"))
+                    +
                     +\S4method{poplin_impute_simple}{poplin}(
                     +  x,
                     +  poplin_in,
                     +  poplin_out,
                     +  type = c("halfmin", "median", "mean")
                     +)
                     +}
                     +\arguments{
                     +\item{x}{A matrix or \linkS4class{poplin} object.}
+                    +
                     +\item{type}{A method for doing univariate imputation.}
+                    +
                     +\item{poplin_in}{Name of a data matrix to retrieve.}
+                    +
                     +\item{poplin_out}{Name of a data matrix to store.}
                     +}
                     +\value{
                     +A matrix or \linkS4class{poplin} object of the same dimension as
                     +\code{x} containing the imputed intensities.
                     +}
                     +\description{
                     +Apply univariate imputation to a matrix or \linkS4class{poplin} object. The
                     +supported methods include
                     +\itemize{
                     +\item Half-minimum imputation: for each feature, missing values are replaced
                     +with half the observed minimum.
                     +\item Median imputation: for each feature, missing values are replaced with
                     +the median of non-missing values.
                     +\item Mean imputation: for each feature, missing values are replaced with
                     +the mean of non-missing values.
                     +}
                     +}
                     +\references{
                     +Wei, R., Wang, J., Su, M. et al. Missing Value Imputation Approach for Mass
                     +Spectrometry-based Metabolomics Data. Sci Rep 8, 663 (2018).
                     +https://doi.org/10.1038/s41598-017-19120-0
                     +}
                     +\seealso{
                     +Other imputation methods:
                     +\code{\link{poplin_impute_knn}()},
                     +\code{\link{poplin_impute_pca}()},
                     +\code{\link{poplin_impute_randomforest}()},
                     +\code{\link{poplin_impute}()}
                     +}
                     +\concept{imputation methods}

man/poplin_normalize_pqn.Rd

History View file @ 492d166

@@ -43,7 +43,7 @@ A matrix or \linkS4class{poplin} object of the same dimension as
                      \code{x} containing the normalized intensities.
+                     }
                      \description{
                     -Apply probabilistic quotient normalization to a matrix or
                     +Apply probabilistic quotient normalization (PQN) to a matrix or
                      \linkS4class{poplin} object. For the calculation of quotients, a reference
                      spectrum needs to be obtained from a mean or median spectrum based on all
                      spectra of the study or a subset of the study. Feature intensities are

...	...	@@ -394,7 +394,7 @@
394	394	range = .poplin_normalize_range(x),
395	395	pareto = .poplin_normalize_pareto(x),
396	396	vast = .poplin_normalize_vast(x),
397		- level = .poplin_normalize_level(x),
	397	+ level = .poplin_normalize_level(x)
398	398	)
399	399	}
400	400