Bioconductor Code: GSVA

Browse code

Added gsvaEnrichment() method, gsvaRanks() returns a new class gsvaRanksParam object, which is now input for gsvaScores(). Added unit tests and documentation

Robert Castelo authored on 20/10/2024 19:09:26
Showing 11 changed files

NAMESPACE index 3b786256b..556b4e08f 100644
R/AllClasses.R index 6b59a53a9..56ae72251 100644
R/AllGenerics.R index b32219638..bc4b4b048 100644
R/gsva.R index 0559f717c..c3a1384e8 100644
R/gsvaNewAPI.R index 0b1051446..4f39700a8 100644
R/gsvaParam.R index f6e361848..976300112 100644
R/utils.R index 942db51e5..29d80c3d1 100644
inst/unitTests/test_gsvaRanks.R index d85117548..ccf594334 100644
man/gsvaEnrichment.Rd index 000000000..6b4e48469
man/gsvaParam-class.Rd index 6aedc1dd7..e82f698c7 100644
man/gsvaRanks.Rd index 76d829341..174911a90 100644

History View file @ 1d874ee01

@@ -1,5 +1,6 @@
                      # Generated by roxygen2: do not edit by hand
                     +export("geneSets<-")
                      export("gsvaAnnotation<-")
                      export(computeGeneSetsOverlap)
                      export(deduplicateGeneSets)
@@ -9,6 +10,7 @@ export(geneSetSizes)
                      export(geneSets)
                      export(gsva)
                      export(gsvaAnnotation)
                     +export(gsvaEnrichment)
                      export(gsvaParam)
                      export(gsvaRanks)
                      export(gsvaScores)
@@ -23,6 +25,7 @@ exportClasses(GsvaExprData)
                      exportClasses(GsvaGeneSets)
                      exportClasses(GsvaMethodParam)
                      exportClasses(gsvaParam)
                     +exportClasses(gsvaRanksParam)
                      exportClasses(plageParam)
                      exportClasses(ssgseaParam)
                      exportClasses(zscoreParam)
@@ -84,13 +87,18 @@ importFrom(SpatialExperiment,SpatialExperiment)
                      importFrom(SummarizedExperiment,SummarizedExperiment)
                      importFrom(SummarizedExperiment,assay)
                      importFrom(cli,cli_abort)
                     +importFrom(cli,cli_alert_danger)
                      importFrom(cli,cli_alert_info)
                      importFrom(cli,cli_alert_success)
                      importFrom(cli,cli_alert_warning)
                      importFrom(cli,cli_progress_bar)
                      importFrom(cli,cli_progress_done)
                      importFrom(cli,cli_progress_update)
                     +importFrom(graphics,abline)
                     +importFrom(graphics,grid)
                     +importFrom(graphics,lines)
                      importFrom(graphics,plot)
                     +importFrom(graphics,segments)
                      importFrom(methods,new)
                      importFrom(parallel,splitIndices)
                      importFrom(sparseMatrixStats,colRanks)
@@ -103,6 +111,7 @@ importFrom(stats,rnorm)
                      importFrom(stats,rpois)
                      importFrom(stats,sd)
                      importFrom(utils,capture.output)
                     +importFrom(utils,globalVariables)
                      importFrom(utils,head)
                      importFrom(utils,installed.packages)
                      importFrom(utils,packageDescription)

R/AllClasses.R

History View file @ 1d874ee01

@@ -336,3 +336,21 @@ setClass("gsvaParam",
                                              maxDiff=NA,
                                              absRanking=NA,
                                              sparse=FALSE))
+                    +
                     +#' @name gsvaRanksParam-class
                     +#' @rdname gsvaParam-class
                     +#' @exportClass gsvaRanksParam
                     +setClass("gsvaRanksParam",  ## parameter class returned by gsvaRanks() and consumed by gsvaScores()/gsvaEnrichment()
                     +         contains="gsvaParam",  ## extends gsvaParam; no additional slots are declared here
                     +         prototype=list(exprData=NULL,  ## gsvaRanks() stores the wrapped rank data in this slot
                     +                        geneSets=NULL,
                     +                        assay=NA_character_,  ## gsvaRanks() sets this slot to "gsvaranks"
                     +                        annotation=NULL,
                     +                        minSize=NA_integer_,
                     +                        maxSize=NA_integer_,
                     +                        kcdf=NA_character_,
                     +                        kcdfNoneMinSampleSize=NA_integer_,
                     +                        tau=NA_real_,
                     +                        maxDiff=NA,
                     +                        absRanking=NA,
                     +                        sparse=FALSE))  ## NOTE(review): prototype looks identical to the parent's; confirm whether it is needed

R/AllGenerics.R

History View file @ 1d874ee01

@@ -9,7 +9,11 @@ setGeneric("gsvaRanks",
                      #' @export
                      setGeneric("gsvaScores",
                     -           function(param, ranks, ...) standardGeneric("gsvaScores"))
                     +           function(param, ...) standardGeneric("gsvaScores"))
+                    +
                     +## Generic for extracting/plotting GSVA enrichment data. Dispatch is on
                     +## 'param' only; method-specific arguments such as 'column', 'geneSet' and
                     +## 'plot' are accepted through '...', so no 'ranks' formal is declared.
                     +#' @export
                     +setGeneric("gsvaEnrichment",
                     +           function(param, ...) standardGeneric("gsvaEnrichment"))
                      #' @export
                      setGeneric("filterGeneSets",
@@ -23,6 +27,10 @@ setGeneric("computeGeneSetsOverlap",
                      setGeneric("geneSets",
                                 function(obj, ...) standardGeneric("geneSets"))
                     +#' @export
                     +setGeneric("geneSets<-",  ## replacement generic, called as geneSets(x) <- value
                     +           function(object, value) standardGeneric("geneSets<-"))  ## NOTE(review): formal is 'object' whereas the geneSets() getter uses 'obj'
+                    +
                      #' @export
                      setGeneric("geneSetSizes",
                                 function(obj, ...) standardGeneric("geneSetSizes"))

R/gsva.R

History View file @ 1d874ee01

@@ -301,8 +301,8 @@ compute.geneset.es <- function(expr, gset.idx.list, sample.idxs, kcdf,
                      #' ranks; and (2) calculate GSVA scores using the previously calculated
                      #' ranks.
                      #'
                     -#' @param param A [`gsvaParam`] object built using the constructor function
                     -#' [`gsvaParam`].
                     +#' @param param A [`gsvaParam-class`] object built using the constructor
                     +#' function [`gsvaParam`].
                      #'
                      #' @param verbose Gives information about each calculation step. Default: `TRUE`.
                      #'
@@ -310,10 +310,10 @@ compute.geneset.es <- function(expr, gset.idx.list, sample.idxs, kcdf,
                      #'   related to the parallel execution of some of the tasks and calculations
                      #'   within this function.
                      #'
                     -#' @return In the case of the `gsvaRanks()` method, a matrix of GSVA rank
                     -#' values per column.
                     +#' @return In the case of the `gsvaRanks()` method, an object of class
                     +#' [`gsvaRanksParam-class`].
                      #'
                     -#' @seealso [`gsvaParam`], [`gsva`]
                     +#' @seealso [`gsvaParam-class`], [`gsvaRanksParam-class`], [`gsva`]
                      #'
                      #' @aliases gsvaRanks,gsvaParam-method
                      #' @name gsvaRanks
@@ -341,14 +341,17 @@ compute.geneset.es <- function(expr, gset.idx.list, sample.idxs, kcdf,
                      #' y <- matrix(rnorm(n*p), nrow=p, ncol=n,
                      #'             dimnames=list(paste("g", 1:p, sep="") , paste("s", 1:n, sep="")))
                      #'
                     +#' ## genes in set1 are expressed at higher levels in the last 'nGrp1+1' to 'n' samples
                     +#' y[geneSets$set1, (nGrp1+1):n] <- y[geneSets$set1, (nGrp1+1):n] + 2
                     +#'
                      #' ## build GSVA parameter object
                      #' gsvapar <- gsvaParam(y, geneSets)
                      #'
                      #' ## calculate GSVA ranks
                     -#' gsva_ranks <- gsvaRanks(gsvapar)
                     -#' gsva_ranks
                     +#' gsvarankspar <- gsvaRanks(gsvapar)
                     +#' gsvarankspar
                      #' ## calculate GSVA scores
                     -#' gsva_es <- gsvaScores(gsvapar, gsva_ranks)
                     +#' gsva_es <- gsvaScores(gsvarankspar)
                      #' gsva_es
                      #'
                      #' ## calculate now GSVA scores in a single step
@@ -362,7 +365,8 @@ compute.geneset.es <- function(expr, gset.idx.list, sample.idxs, kcdf,
                      #'                   gset2=paste0("g", c(1, 2, 7, 8)))
                      #'
                      #' ## note that there is no need to calculate the GSVA ranks again
                     -#' gsvaScores(gsvapar, gsva_ranks, geneSets2)
                     +#' geneSets(gsvarankspar) <- geneSets2
                     +#' gsvaScores(gsvarankspar)
                      #'
                      #' @importFrom cli cli_alert_info cli_alert_success
                      #' @importFrom BiocParallel bpnworkers
@@ -393,20 +397,30 @@ setMethod("gsvaRanks", signature(param="gsvaParam"),
                                    psz <- if(inherits(BPPARAM, "SerialParam")) 1L else bpnworkers(BPPARAM)
                     -              gsva_rnk <- .compute_gsva_ranks(expr=filteredDataMatrix,
                     +              gsvarnks <- .compute_gsva_ranks(expr=filteredDataMatrix,
                                                                    kcdf=get_kcdf(param),
                                                                    kcdf.min.ssize=get_kcdfNoneMinSampleSize(param),
                                                                    sparse=get_sparse(param),
                                                                    verbose=verbose,
                                                                    BPPARAM=BPPARAM)
                     -              rownames(gsva_rnk) <- rownames(filteredDataMatrix)
                     -              colnames(gsva_rnk) <- colnames(filteredDataMatrix)
                     +              rownames(gsvarnks) <- rownames(filteredDataMatrix)
                     +              colnames(gsvarnks) <- colnames(filteredDataMatrix)
+                    +
                     +              rnkcontainer <- wrapData(get_exprData(param), gsvarnks)
                     +              rval <- new("gsvaRanksParam",
                     +                          exprData=rnkcontainer, geneSets=get_geneSets(param),
                     +                          assay="gsvaranks", annotation=get_annotation(param),
                     +                          minSize=get_minSize(param), maxSize=get_maxSize(param),
                     +                          kcdf=get_kcdf(param),
                     +                          kcdfNoneMinSampleSize=get_kcdfNoneMinSampleSize(param),
                     +                          tau=get_tau(param), maxDiff=get_maxDiff(param),
                     +                          absRanking=get_absRanking(param), sparse=get_sparse(param))
                                    if (verbose)
                                        cli_alert_success("Calculations finished")
                     -              return(gsva_rnk)
                     +              return(rval)
                                })
                      .check_geneSets_minSize_maxSize_tau <- function(geneSets, minSize, maxSize, tau) {
@@ -467,56 +481,24 @@ setMethod("gsvaRanks", signature(param="gsvaParam"),
+                     }
                     -#' @param ranks A matrix-like object storing GSVA ranks calculated with the
                     -#' method [`gsvaRanks`].
                     -#'
                     -#' @param geneSets A collection of gene sets. Must be one of the classes
                     -#' supported by [`GsvaGeneSets-class`]. For a list of these classes, see its
                     -#' help page using `help(GsvaGeneSets)`. By default, this parameter is set to
                     -#' the `NA` missing value, which means that GSVA scores will be calculated
                     -#' using the gene sets specified in the `param` argument. If this parameter is
                     -#' set to a non-missing value corresponding to an object of the classes
                     -#' supported by [`GsvaGeneSets-class`], then GSVA scores will be calculated
                     -#' using the gene sets in this argument, instead of the ones specified in the
                     -#' `param` argument.
                     -#'
                     -#' @param minSize Numeric vector of length 1.  Minimum size of the resulting gene
                     -#' sets after gene identifier mapping. Its default value is `NA`, indicating that
                     -#' this minimum value will be taken from the input `param` argument, otherwise,
                     -#' non-`NA` values override those from the input `param` argument.
                     -#'
                     -#' @param maxSize Numeric vector of length 1.  Minimum size of the resulting gene
                     -#' sets after gene identifier mapping. Its default value is `NA`, indicating that
                     -#' this minimum value will be taken from the input `param` argument, otherwise,
                     -#' non-`NA` values override those from the input `param` argument.
                     -#'
                     -#' @param tau Numeric vector of length 1.  The exponent defining the weight of
                     -#' the tail in the random walk performed by the `GSVA` (Hänzelmann et al.,
                     -#' 2013) method.  The default value is 1 as described in the paper.
                     -#'
                     -#' @param maxDiff Logical vector of length 1 which offers two approaches to
                     -#' calculate the enrichment statistic (ES) from the KS random walk statistic.
                     -#' * `FALSE`: ES is calculated as the maximum distance of the random walk
                     -#' from 0. This approach produces a distribution of enrichment scores that is
                     -#' bimodal, but it can give large enrichment scores to gene sets whose genes
                     -#' are not concordantly activated in one direction only.
                     -#' * `TRUE` (the default): ES is calculated as the magnitude difference between
                     -#' the largest positive and negative random walk deviations. This default value
                     -#' gives larger enrichment scores to gene sets whose genes are concordantly
                     -#' activated in one direction only.
                     -#'
                     -#' @param absRanking Logical vector of length 1 used only when `maxDiff=TRUE`.
                     -#' When `absRanking=FALSE` (default) a modified Kuiper statistic is used to
                     -#' calculate enrichment scores, taking the magnitude difference between the
                     -#' largest positive and negative random walk deviations. When
                     -#' `absRanking=TRUE` the original Kuiper statistic that sums the largest
                     -#' positive and negative random walk deviations is used.
                     +#' @param param A parameter object of the [`gsvaRanksParam-class`] class.
                      #'
                      #' @return In the case of the `gsvaScores()` method, a gene-set by sample matrix
                     -#' of GSVA enrichment scores stored in a ocntainer object of the same type as
                     -#' the input expression data container in the `param` argument.
                     +#' of GSVA enrichment scores stored in a container object of the same type as
                     +#' the input ranks data container. If
                     +#' the input was a base matrix or a [`dgCMatrix-class`] object, then the output will
                     +#' be a base matrix object with the gene sets employed in the calculations
                     +#' stored in an attribute called `geneSets`. If the input was an
                     +#' [`ExpressionSet`] object, then the output will be also an [`ExpressionSet`]
                     +#' object with the gene sets employed in the calculations stored in an
                     +#' attribute called `geneSets`. If the input was an object of one of the
                     +#' classes described in [`GsvaExprData`], such as a [`SingleCellExperiment`],
                     +#' then the output will be of the same class, where enrichment scores will be
                     +#' stored in an assay called `es` and the gene sets employed in the
                     +#' calculations will be stored in the `rowData` slot of the object under the
                     +#' column name `gs`.
                      #'
                     -#' @aliases gsvaScores,gsvaParam,GsvaExprData-method
                     +#' @aliases gsvaScores,gsvaRanksParam-method
                      #' @name gsvaScores
                      #' @rdname gsvaRanks
                      #'
@@ -524,42 +506,20 @@ setMethod("gsvaRanks", signature(param="gsvaParam"),
                      #' @importFrom BiocParallel bpnworkers
                      #' @importFrom utils packageDescription
                      #' @exportMethod gsvaScores
                     -setMethod("gsvaScores", signature(param="gsvaParam", ranks="GsvaExprData"),
                     -          function(param, ranks, geneSets=NA, minSize=NA, maxSize=NA,
                     -                   tau=NA, maxDiff=NA, absRanking=NA,
                     -                   verbose=TRUE, BPPARAM=SerialParam(progressbar=verbose))
                     +setMethod("gsvaScores", signature(param="gsvaRanksParam"),
                     +          function(param, verbose=TRUE,
                     +                   BPPARAM=SerialParam(progressbar=verbose))
+                               {
                                    if (verbose)
                                        cli_alert_info(sprintf("GSVA version %s",
                                                               packageDescription("GSVA")[["Version"]]))
                     -              .check_geneSets_minSize_maxSize_tau(geneSets, minSize, maxSize, tau)
+                    -
                     -              .check_maxDiff_absRanking(maxDiff, absRanking)
+                    -
                     -              tau <- ifelse(is.na(tau), get_tau(param), tau)
                     -              maxDiff <- ifelse(is.na(maxDiff), get_maxDiff(param), maxDiff)
                     -              absRanking <- ifelse(is.na(absRanking), get_absRanking(param),
                     -                                   absRanking)
                     -              sparse <- get_sparse(param) ## sparse regime from parameter obj
+                    -
                     +              ## assuming rows in the rank data have been already filtered
                                    exprData <- get_exprData(param)
                     -              dataMatrix <- unwrapData(exprData, get_assay(param))
                     -              filteredDataMatrix <- .filterGenes(dataMatrix,
                     -                                                 removeConstant=TRUE,
                     -                                                 removeNzConstant=TRUE)
+                    -
                     -              if (!identical(rownames(filteredDataMatrix),
                     -                             rownames(unwrapData(ranks)))) {
                     -                  msg <- paste("Rownames in ranks don't match those from the",
                     -                               "input expression data in 'param'")
                     -                  cli_abort(c("x"=msg))
                     -              }
+                    -
                     -              filteredMappedGeneSets <- .filterAndMapGeneSets(param, geneSets,
                     -                                                              minSize, maxSize,
                     -                                                              filteredDataMatrix,
                     -                                                              verbose)
                     +              filteredDataMatrix <- unwrapData(exprData, get_assay(param))
                     +              filteredMappedGeneSets <- .filterAndMapGeneSets(param=param,
                     +                                                              filteredDataMatrix=filteredDataMatrix,
                     +                                                              verbose=verbose)
                                    if (!inherits(BPPARAM, "SerialParam") && verbose) {
                                        msg <- sprintf("Using a %s parallel back-end with %d workers",
@@ -570,12 +530,13 @@ setMethod("gsvaScores", signature(param="gsvaParam", ranks="GsvaExprData"),
                                    if (verbose)
                                        cli_alert_info(sprintf("Calculating GSVA scores"))
                     -              gsva_es <- .compute_gsva_scores(R=unwrapData(ranks),
                     +              gsva_es <- .compute_gsva_scores(R=filteredDataMatrix,
                                                                    geneSetsIdx=filteredMappedGeneSets,
                     -                                              tau=tau, maxDiff=maxDiff,
                     -                                              absRanking=absRanking,
                     -                                              sparse=sparse, verbose=verbose,
                     -                                              BPPARAM=BPPARAM)
                     +                                              tau=get_tau(param),
                     +                                              maxDiff=get_maxDiff(param),
                     +                                              absRanking=get_absRanking(param),
                     +                                              sparse=get_sparse(param),
                     +                                              verbose=verbose, BPPARAM=BPPARAM)
                                    rownames(gsva_es) <- names(filteredMappedGeneSets)
                                    colnames(gsva_es) <- colnames(filteredDataMatrix)
@@ -590,9 +551,144 @@ setMethod("gsvaScores", signature(param="gsvaParam", ranks="GsvaExprData"),
                                    return(rval)
                                })
                     +#' @title GSVA enrichment data and visualization
                     +#'
                     +#' @description Extract and plot enrichment data from GSVA scores.
                     +#'
                     +#' @param param A [`gsvaRanksParam-class`] object obtained with the method
                     +#' [`gsvaRanks`].
                     +#'
                     +#' @param column The column for which we want to retrieve the enrichment data.
                     +#' This parameter is only available in the `gsvaEnrichment()` method.
                     +#'
                     +#' @param geneSet Either a positive integer number between 1 and the number of
                     +#' available gene sets in `param`, or a character string with the name of
                     +#' one of the gene sets available in `param`.
                     +#'
                     +#' @param plot A character string indicating whether an enrichment plot should
                     +#' be produced using either base R graphics (`plot="base"`) or the ggplot2 package
                     +#' (`plot="ggplot"`), or not (`plot="no"`). In the latter case, the enrichment
                     +#' data will be returned. By default `plot="auto"`, which implies that if this
                     +#' method is called from an interactive session, a plot using base R graphics
                     +#' will be produced and, otherwise, the enrichment data is returned.
                     +#'
                     +#' @param ... Further arguments passed to the `plot()` function when the
                     +#' previous parameter `plot="base"`.
                     +#'
                     +#' @return When `plot="no"`, this method returns the enrichment data. When
                     +#' `plot="ggplot"`, this method returns a `ggplot` object. When `plot="base"`
                     +#' no value is returned.
                     +#'
                     +#' @aliases gsvaEnrichment,gsvaRanksParam-method
                     +#' @name gsvaEnrichment
                     +#' @rdname gsvaEnrichment
                     +#'
                     +#' @references Hänzelmann, S., Castelo, R. and Guinney, J. GSVA: Gene set
                     +#' variation analysis for microarray and RNA-Seq data.
                     +#' *BMC Bioinformatics*, 14:7, 2013.
                     +#' [DOI](https://doi.org/10.1186/1471-2105-14-7)
                     +#'
                     +#' @examples
                     +#' library(GSVA)
                     +#'
                     +#' p <- 10 ## number of genes
                     +#' n <- 30 ## number of samples
                     +#' nGrp1 <- 15 ## number of samples in group 1
                     +#' nGrp2 <- n - nGrp1 ## number of samples in group 2
                     +#'
                     +#' ## consider three disjoint gene sets
                     +#' geneSets <- list(gset1=paste0("g", 1:3),
                     +#'                  gset2=paste0("g", 4:6),
                     +#'                  gset3=paste0("g", 7:10))
                     +#'
                     +#' ## sample data from a normal distribution with mean 0 and st.dev. 1
                     +#' y <- matrix(rnorm(n*p), nrow=p, ncol=n,
                     +#'             dimnames=list(paste("g", 1:p, sep="") , paste("s", 1:n, sep="")))
                     +#'
                     +#' ## genes in gset1 are expressed at higher levels in the last 'nGrp1+1' to 'n' samples
                     +#' y[geneSets$gset1, (nGrp1+1):n] <- y[geneSets$gset1, (nGrp1+1):n] + 2
                     +#'
                     +#' ## build GSVA parameter object
                     +#' gsvapar <- gsvaParam(y, geneSets)
                     +#'
                     +#' ## calculate GSVA ranks
                     +#' gsvarankspar <- gsvaRanks(gsvapar)
                     +#' gsvarankspar
                     +#'
                     +#' ## by default the enrichment data for the first column and the first
                     +#' ## gene set are retrieved
                     +#' gsvaEnrichment(gsvarankspar)
                     +#'
                     +#' @importFrom cli cli_alert_info cli_abort cli_alert_danger
                     +#' @exportMethod gsvaEnrichment
                     +setMethod("gsvaEnrichment", signature(param="gsvaRanksParam"),
                     +          function(param, column=1, geneSet=1,
                     +                   plot=c("auto", "base", "ggplot", "no"), ...)
                     +          {
                     +              plot <- match.arg(plot)
+                    +
                     +              ## 'geneSet' must identify exactly one of the gene sets
                     +              ## stored in 'param', either by name or by position;
                     +              ## zero-length input is rejected here too, so that the
                     +              ## scalar conditions below never see an empty vector
                     +              geneSets <- get_geneSets(param)
                     +              if (length(geneSet) != 1) {
                     +                  msg <- paste("Please provide only the name or position of a",
                     +                               "single gene set.")
                     +                  cli_abort(c("x"=msg))
                     +              }
                     +              if (is.character(geneSet)) {
                     +                  if (!geneSet %in% names(geneSets)) {
                     +                      msg <- paste("Gene set %s is missing from the input",
                     +                                   "parameter object")
                     +                      cli_abort(c("x"=sprintf(msg, geneSet)))
                     +                  }
                     +              } else if (is.numeric(geneSet)) {
                     +                  ## is.numeric() is also TRUE for integer vectors; an
                     +                  ## NA position is reported as out of range
                     +                  if (is.na(geneSet) || geneSet < 1 ||
                     +                      geneSet > length(geneSets)) {
                     +                       msg <- paste("When 'geneSet' is numeric, it should be a",
                     +                                    "number between 1 and the number of gene",
                     +                                    "sets (%d).")
                     +                       cli_abort(c("x"=sprintf(msg, length(geneSets))))
                     +                  }
                     +              } else {
                     +                  msg <- paste("'geneSet' should be either numeric or",
                     +                               "character.")
                     +                  cli_abort(c("x"=msg))
                     +              }
+                    +
                     +              ## scoring parameters are taken from the parameter object
                     +              tau <- get_tau(param)
                     +              maxDiff <- get_maxDiff(param)
                     +              absRanking <- get_absRanking(param)
                     +              sparse <- get_sparse(param)
+                    +
                     +              ## the assay of a gsvaRanksParam object holds the GSVA ranks
                     +              exprData <- get_exprData(param)
                     +              filteredDataMatrix <- unwrapData(exprData, get_assay(param))
+                    +
                     +              ## no need for verbosity when mapping a single gene set
                     +              filteredMappedGeneSets <- .filterAndMapGeneSets(param=param,
                     +                                                              wgset=geneSet,
                     +                                                              filteredDataMatrix=filteredDataMatrix,
                     +                                                              verbose=FALSE)
+                    +
                     +              ## only the requested gene set was mapped, so it is the
                     +              ## first (and only) element
                     +              geneSetIdx <- filteredMappedGeneSets[[1]]
                     +              edata <- .gsva_enrichment_data(R=filteredDataMatrix,
                     +                                             column=column,
                     +                                             geneSetIdx=geneSetIdx,
                     +                                             tau=tau, maxDiff=maxDiff,
                     +                                             absRanking=absRanking,
                     +                                             sparse=sparse)
+                    +
                     +              ## return the data instead of plotting when asked to, or
                     +              ## when 'auto' is used outside an interactive session
                     +              if (plot == "no" || (plot == "auto" && !interactive()))
                     +                  return(edata)
+                    +
                     +              if (plot == "auto" || plot == "base")
                     +                  .plot_enrichment_base(edata, ...)
                     +              else { ## plot == "ggplot"
                     +                  ## requireNamespace() is the recommended, cheap test
                     +                  ## for an optional package; installed.packages()
                     +                  ## scans every installed package
                     +                  if (!requireNamespace("ggplot2", quietly=TRUE))
                     +                      cli_alert_danger("Please install the ggplot2 package")
                     +                  else
                     +                      .plot_enrichment_ggplot(edata)
                     +              }
                     +          })
                     -## END exported methods (to be moved to 'gsvaNewAPI.R')
                     +## END exported methods (to be moved to 'gsvaNewAPI.R')
                      #' @importFrom cli cli_progress_update
                      #' @importFrom parallel splitIndices
@@ -799,6 +895,125 @@ setMethod("gsvaScores", signature(param="gsvaParam", ranks="GsvaExprData"),
                          return(es)
+                     }
                     +## Collect the random-walk enrichment data of one gene set in one column of
                     +## the rank matrix 'R': the running statistic, its extreme deviations, the
                     +## leading-edge members and the resulting enrichment score.
                     +##
                     +## R           matrix of ranks with features in rows; when it is not a
                     +##             'dgCMatrix' the sparse code path is disabled
                     +## column      column of 'R' whose ranks are analyzed
                     +## geneSetIdx  indices of the gene set members (presumably row positions
                     +##             in 'R' -- confirm against the caller)
                     +## tau         forwarded to .gsvaRndWalk2()
                     +## maxDiff     TRUE: score is the sum of both deviations; FALSE: score is
                     +##             the deviation with the largest magnitude
                     +## absRanking  with maxDiff=TRUE, flips the sign of the negative deviation
                     +##             before summing (the flipped value is also what is returned
                     +##             as 'maxNeg')
                     +## sparse      forwarded to .ranks2stats()
                     +##
                     +## Returns a list with the walk ('stats', a data.frame with columns 'rank'
                     +## and 'stat'), the rank positions of the gene set members ('gsetrnk'), the
                     +## deviations and their positions ('maxPos', 'whichMaxPos', 'maxNeg',
                     +## 'whichMaxNeg'; a position is NA when its deviation is zero), the
                     +## leading-edge members ('leadingEdgePos', 'leadingEdgeNeg'), the 'score',
                     +## and the settings used ('tau', 'maxDiff', 'absRanking', 'sparse').
                     +.gsva_enrichment_data <- function(R, column, geneSetIdx, tau=1, maxDiff=TRUE,
                     +                                  absRanking=FALSE, sparse=TRUE) {
                     +    if (!is(R, "dgCMatrix"))
                     +        sparse <- FALSE
                     +
                     +    rnkstats <- .ranks2stats(R[, column], sparse)
                     +    walkStat <- .gsvaRndWalk2(geneSetIdx, rnkstats$dos, rnkstats$srs, tau)
                     +    ## deviations are floored/capped at zero, so a walk that never goes
                     +    ## above (below) zero has a zero positive (negative) deviation
                     +    maxDev <- c(max(c(0, max(walkStat))), min(c(0, min(walkStat))))
                     +    whMaxDev <- c(which.max(walkStat), which.min(walkStat))
                     +    whMaxDev[maxDev == 0] <- NA
                     +
                     +    if (maxDiff && absRanking)
                     +        maxDev[2] <- -1 * maxDev[2]
                     +    sco <- sum(maxDev)
                     +    if (!maxDiff) {
                     +        sco <- maxDev[1]
                     +        if (abs(maxDev[2]) > maxDev[1])
                     +            sco <- maxDev[2]
                     +    }
                     +
                     +    edat <- data.frame(rank=seq.int(nrow(R)),
                     +                       stat=walkStat)
                     +    ## label each walk position with the feature placed there by 'dos'
                     +    rownames(edat)[rnkstats$dos] <- rownames(R)
                     +
                     +    gsetrnk <- rnkstats$dos[geneSetIdx]
                     +    lepos <- leneg <- NA
                     +    if (!is.na(whMaxDev[1]))
                     +        lepos <- geneSetIdx[gsetrnk <= whMaxDev[1]]
                     +    if (!is.na(whMaxDev[2])) {
                     +        if (!is.na(whMaxDev[1]) && whMaxDev[2] < whMaxDev[1]) {
                     +            ## the minimum precedes the maximum: both leading edges are
                     +            ## the members located between the two extremes
                     +            mask <- gsetrnk >= whMaxDev[2] & gsetrnk <= whMaxDev[1]
                     +            lepos <- leneg <- geneSetIdx[mask]
                     +        } else
                     +            leneg <- geneSetIdx[gsetrnk >= whMaxDev[2]]
                     +    }
                     +    res <- list(stats=edat,
                     +                gsetrnk=gsetrnk,
                     +                maxPos=maxDev[1],
                     +                whichMaxPos=whMaxDev[1],
                     +                maxNeg=maxDev[2],
                     +                whichMaxNeg=whMaxDev[2],
                     +                leadingEdgePos=lepos,
                     +                leadingEdgeNeg=leneg,
                     +                score=sco,
                     +                tau=tau,
                     +                maxDiff=maxDiff,
                     +                absRanking=absRanking,
                     +                sparse=sparse)
                     +
                     +    return(res)
                     +}
+                    +
                     +#' @importFrom graphics abline grid lines segments
                     +.plot_enrichment_base <- function(edata, ...) {
                     +    ## Base-graphics enrichment plot: the random walk as a green line, a
                     +    ## dashed grey zero line, one tick per gene set member and dashed dark
                     +    ## red markers for the deviation(s) that enter the score. Arguments in
                     +    ## '...' are forwarded to plot().
                     +    walk <- edata$stats
                     +    memberPos <- edata$gsetrnk
                     +    ## ticks span 10% of the walk's range, centred on zero
                     +    tickHalf <- diff(range(walk$stat)) * 0.1 / 2
                     +
                     +    ## vertical dashed marker from zero up/down to a deviation
                     +    markDeviation <- function(at, height)
                     +        segments(at, 0, at, height, lwd=2, lty=2, col="darkred")
                     +
                     +    plot(walk, type="l", lwd=2, las=1, panel.first=grid(),
                     +         xlab="Gene Ranking", ylab="Random Walk Statistic", col="green", ...)
                     +    abline(h=0, lwd=2, lty=2, col="grey")
                     +    lines(walk, lwd=2, col="green")
                     +    segments(memberPos, -tickHalf, memberPos, tickHalf, lwd=2)
                     +
                     +    ## with maxDiff both deviations are shown, otherwise only the larger one
                     +    showPos <- !is.na(edata$whichMaxPos) &&
                     +        (edata$maxDiff || edata$maxPos >= abs(edata$maxNeg))
                     +    if (showPos)
                     +        markDeviation(edata$whichMaxPos, edata$maxPos)
                     +
                     +    showNeg <- !is.na(edata$whichMaxNeg) &&
                     +        (edata$maxDiff || edata$maxPos < abs(edata$maxNeg))
                     +    if (showNeg)
                     +        markDeviation(edata$whichMaxNeg, edata$maxNeg)
                     +}
+                    +
                     +#' @importFrom cli cli_abort
                     +#' @importFrom utils globalVariables
                     +.plot_enrichment_ggplot <- function(edata, ...) {
                     +    ## ggplot2 counterpart of .plot_enrichment_base(): builds and returns a
                     +    ## ggplot object showing the random walk (green line), a dashed grey
                     +    ## zero line, one tick per gene set member and dashed dark red markers
                     +    ## for the deviation(s) that enter the score. Aborts when ggplot2
                     +    ## cannot be loaded. Arguments in '...' are currently not used.
                     +    if (!.isPackageLoaded("ggplot2")) {
                     +        loaded <- suppressPackageStartupMessages(requireNamespace("ggplot2"))
                     +        if (!loaded)
                     +            cli_abort("x"="ggplot2 could not be loaded")
                     +    }
                     +
                     +    ylim <- range(edata$stats$stat)
                     +    ## ticks span 10% of the walk's range, centred on zero
                     +    hgsetticks <- (ylim[2] - ylim[1]) * 0.1
                     +    gsetticks <- data.frame(gsetrnk=edata$gsetrnk)
                     +    ## from https://stackoverflow.com/a/39877048
                     +    fintticks <- function(x) unique(floor(pretty(seq(min(x),
                     +                                    (max(x) + 1) * 1.1))))
                     +    ggplot2::ggplot(data=edata$stats) +
                     +        ggplot2::scale_x_continuous(breaks=fintticks) +
                     +        ggplot2::geom_line(ggplot2::aes_string(x="rank", y="stat"), color="green") +
                     +        ggplot2::geom_segment(data=gsetticks,
                     +                     mapping=ggplot2::aes_string(x="gsetrnk", y=-hgsetticks/2,
                     +                                 xend="gsetrnk", yend=hgsetticks/2),
                     +                     linewidth=1) +
                     +        ggplot2::geom_hline(yintercept=0, colour="grey", linetype="dashed") +
                     +        ## positive deviation marker; the braces yield NULL (no layer)
                     +        ## when the condition does not hold
                     +        { if (!is.na(edata$whichMaxPos) &&
                     +              (edata$maxDiff || edata$maxPos >= abs(edata$maxNeg)))
                     +              ggplot2::geom_segment(data=data.frame(whichMaxPos=edata$whichMaxPos,
                     +                                           maxPos=edata$maxPos),
                     +                           mapping=ggplot2::aes_string(x="whichMaxPos", y=0,
                     +                                       xend="whichMaxPos", yend="maxPos"),
                     +                           colour="darkred", linetype="dashed") } +
                     +        ## negative deviation marker; it must be guarded by the position of
                     +        ## the negative deviation, as in .plot_enrichment_base()
                     +        { if (!is.na(edata$whichMaxNeg) &&
                     +              (edata$maxDiff || edata$maxPos < abs(edata$maxNeg)))
                     +              ggplot2::geom_segment(data=data.frame(whichMaxNeg=edata$whichMaxNeg,
                     +                                           maxNeg=edata$maxNeg),
                     +                           mapping=ggplot2::aes_string(x="whichMaxNeg", y=0,
                     +                                       xend="whichMaxNeg", yend="maxNeg"),
                     +                           colour="darkred", linetype="dashed") } +
                     +        ggplot2::theme(panel.background=ggplot2::element_blank(),
                     +              panel.grid.major=ggplot2::element_line(colour="grey", linetype="dotted"),
                     +              panel.grid.minor=ggplot2::element_line(colour=NA),
                     +              axis.text=ggplot2::element_text(size=12),
                     +              axis.title=ggplot2::element_text(size=14),
                     +              panel.border=ggplot2::element_rect(colour="black", fill=NA)) +
                     +        ggplot2::labs(x="Gene Ranking", y="Random Walk Statistic")
                     +}
+                    +
                      ##
                      ## functions interfacing C code
                      ##

R/gsvaNewAPI.R

History View file @ 1d874ee01

@@ -1094,13 +1094,15 @@ setMethod("unwrapData", signature("SpatialExperiment"),
                      ## wrapData: put the resulting data and gene sets into the original data container type
                      setMethod("wrapData", signature(container="matrix"),
                                function(container, dataMatrix, geneSets) {
                     -              attr(dataMatrix, "geneSets") <- geneSets
                     +              if (!missing(geneSets))
                     +                  attr(dataMatrix, "geneSets") <- geneSets
                                    return(dataMatrix)
                                })
                      setMethod("wrapData", signature(container="dgCMatrix"),
                                function(container, dataMatrix, geneSets) {
                     -              attr(dataMatrix, "geneSets") <- geneSets
                     +              if (!missing(geneSets))
                     +                  attr(dataMatrix, "geneSets") <- geneSets
                                    return(dataMatrix)
                                })
@@ -1110,45 +1112,79 @@ setMethod("wrapData", signature(container="ExpressionSet"),
                                                phenoData=phenoData(container),
                                                experimentData=experimentData(container),
                                                annotation="")
                     -              attr(rval, "geneSets") <- geneSets
                     +              if (!missing(geneSets))
                     +                  attr(rval, "geneSets") <- geneSets
                                    return(rval)
                                })
                      setMethod("wrapData", signature(container="SummarizedExperiment"),
                                function(container, dataMatrix, geneSets) {
                     +              rdata <- adata <- NULL
                     +              if (!missing(geneSets)) {
                     +                  adata <- SimpleList(es=dataMatrix)
                     +                  rdata <- DataFrame(gs=CharacterList(geneSets))
                     +              } else { ## assume missing geneSets implies dataMatrix are ranks
                     +                  mask <- rownames(container) %in% rownames(dataMatrix)
                     +                  adata <- c(assays(container[mask, ]),
                     +                             SimpleList(gsvaranks=dataMatrix))
                     +                  rdata <- rowData(container)[mask, ]
                     +              }
                                    rval <- SummarizedExperiment(
                     -                  assays=SimpleList(es=dataMatrix),
                     +                  assays=adata,
                                        colData=colData(container),
                     -                  rowData=DataFrame(gs=CharacterList(geneSets)),
                     +                  rowData=rdata,
                                        metadata=metadata(container))
                     -              metadata(rval)$annotation <- NULL
                     +              if (!missing(geneSets))
                     +                  metadata(rval)$annotation <- NULL
                                    return(rval)
                                })
                      setMethod("wrapData", signature(container="SingleCellExperiment"),
                                function(container, dataMatrix, geneSets) {
                     +              rdata <- adata <- NULL
                     +              if (!missing(geneSets)) {
                     +                  adata <- SimpleList(es=dataMatrix)
                     +                  rdata <- DataFrame(gs=CharacterList(geneSets))
                     +              } else { ## assume missing geneSets implies dataMatrix are ranks
                     +                  mask <- rownames(container) %in% rownames(dataMatrix)
                     +                  adata <- c(assays(container[mask, ]),
                     +                             SimpleList(gsvaranks=dataMatrix))
                     +                  rdata <- rowData(container)[mask, ]
                     +              }
                                    rval <- SingleCellExperiment(
                     -                  assays=SimpleList(es=dataMatrix),
                     +                  assays=adata,
                                        colData=colData(container),
                     -                  rowData=DataFrame(gs=CharacterList(geneSets)),
                     +                  rowData=rdata,
                                        metadata=metadata(container))
                     -              metadata(rval)$annotation <- NULL
                     +              if (!missing(geneSets))
                     +                  metadata(rval)$annotation <- NULL
                                    return(rval)
                                })
                      setMethod("wrapData", signature(container="SpatialExperiment"),
                                function(container, dataMatrix, geneSets) {
                     +              rdata <- adata <- NULL
                     +              if (!missing(geneSets)) {
                     +                  adata <- SimpleList(es=dataMatrix)
                     +                  rdata <- DataFrame(gs=CharacterList(geneSets))
                     +              } else { ## assume missing geneSets implies dataMatrix are ranks
                     +                  mask <- rownames(container) %in% rownames(dataMatrix)
                     +                  adata <- c(assays(container[mask, ]),
                     +                             SimpleList(gsvaranks=dataMatrix))
                     +                  rdata <- rowData(container)[mask, ]
                     +              }
                                    rval <- SpatialExperiment(
                     -                  assays=SimpleList(es=dataMatrix),
                     +                  assays=adata,
                                        colData=colData(container),
                     -                  rowData=DataFrame(gs=CharacterList(geneSets)),
                     +                  rowData=rdata,
                                        metadata=metadata(container),
                     -                  imgData = imgData(container),
                     -                  spatialCoords = spatialCoords(container))
                     -              metadata(rval)$annotation <- NULL
                     +                  imgData=imgData(container),
                     +                  spatialCoords=spatialCoords(container))
                     +              if (!missing(geneSets))
                     +                  metadata(rval)$annotation <- NULL
                                    return(rval)
                                })

R/gsvaParam.R

History View file @ 1d874ee01

@@ -287,3 +287,22 @@ setMethod("show",
                                    if ("dgCMatrix" %in% class(unwrapData(get_exprData(object), get_assay(object))))
                                        cat("sparse: ", get_sparse(object), "\n")
                                })
+                    +
                     +## ----- setters for gsvaRanksParam -----
+                    +
                     +#' @param object For the replacement method, an object of class
                     +#' [`gsvaRanksParam-class`].
                     +#'
                     +#' @param value For the replacement method, an object of the classes supported by
                     +#' [`GsvaGeneSets-class`].
                     +#'
                     +#' @aliases geneSets<-
                     +#' @aliases geneSets<-,gsvaRanksParam,GsvaGeneSets-method
                     +#' @rdname gsvaParam-class
                     +#' @exportMethod geneSets
                     +setReplaceMethod("geneSets", signature=signature(object="gsvaRanksParam",
                     +                                                 value="GsvaGeneSets"),
                     +                 function(object, value) { ## enables: geneSets(object) <- value
                     +                   object@geneSets <- value ## only the 'geneSets' slot is overwritten
                     +                   object ## a replacement method must return the modified object
                     +                 })

R/utils.R

History View file @ 1d874ee01

@@ -68,32 +68,35 @@
                      ## is a 'list' object with character string vectors as elements,
                      ## and 'features' is a character string vector object. it assumes
                      ## features in both input objects follow the same nomenclature,
+                    +
                     +#' @importFrom cli cli_abort
                      .mapGeneSetsToFeatures <- function(gsets, features) {
                     -  ## Aaron Lun's suggestion at
                     -  ## https://github.com/rcastelo/GSVA/issues/39#issuecomment-765549620
                     -  gsets2 <- CharacterList(gsets)
                     -  mt <- match(gsets2, features)
                     -  mapdgenesets <- as.list(mt[!is.na(mt)])
                     +    ## Aaron Lun's suggestion at
                     +    ## https://github.com/rcastelo/GSVA/issues/39#issuecomment-765549620
                     +    gsets2 <- CharacterList(gsets)
                     +    mt <- match(gsets2, features)
                     +    mapdgenesets <- as.list(mt[!is.na(mt)])
                     -  if (length(unlist(mapdgenesets, use.names=FALSE)) == 0)
                     -    stop("No identifiers in the gene sets could be matched to the identifiers in the expression data.")
                     +    if (length(unlist(mapdgenesets, use.names=FALSE)) == 0) {
                     +      msg <- paste("No identifiers in the gene sets could be matched to the",
                     +                   "identifiers in the expression data.")
                     +      cli_abort("x"=msg)
                     +    }
                     -  mapdgenesets
                     +    mapdgenesets
+                     }
                      ## it assumes that all arguments have been already checked for correctness
                     -.filterAndMapGeneSets <- function(param, geneSets, minSize, maxSize,
                     -                                  filteredDataMatrix, verbose) {
+                    -
                     -    ## if geneSets, minSize and maxSize are non-NA values, then they
                     -    ## override those coming from 'param' (b/c are provided by gsvaScores())
                     -    if (any(is.na(geneSets)))
                     -        geneSets <- get_geneSets(param)
                     -    if (is.na(minSize))
                     -        minSize <- get_minSize(param)
                     -    if (is.na(maxSize))
                     -        maxSize <- get_maxSize(param)
                     +#' @importFrom cli cli_abort
                     +.filterAndMapGeneSets <- function(param, wgset=NA, filteredDataMatrix, verbose) {
+                    +
                     +    geneSets <- get_geneSets(param)
                     +    if (!is.na(wgset))
                     +        geneSets <- geneSets[wgset]
+                    +
                     +    minSize <- get_minSize(param)
                     +    maxSize <- get_maxSize(param)
                          ## note that the method for 'GeneSetCollection' calls geneIds(), i.e.,
                          ## whatever the input, from here on we have a list of character vectors
@@ -113,11 +116,11 @@
                                                                   maxSize=maxSize)
                          if (length(filteredMappedGeneSets) == 0)
                     -        stop("The gene set list is empty! Filter may be too stringent.")
                     +        cli_abort("x"="The gene set list is empty! Filter may be too stringent.")
                          ## this should NEVER happen -- just to make sure it doesn't...
                          if (anyDuplicated(names(filteredMappedGeneSets)) > 0)
                     -        stop("The gene set list contains duplicated gene set names.")
                     +        cli_abort("x"="The gene set list contains duplicated gene set names.")
                          if (any(lengths(filteredMappedGeneSets) == 1)) {
                              msg <- "Some gene sets have size one. Consider setting minSize > 1"
@@ -141,9 +144,9 @@
                                                             removeConstant=removeConstant,
                                                             removeNzConstant=removeNzConstant)
                     -    filteredMappedGeneSets <- .filterAndMapGeneSets(param, NA, NA, NA,
                     -                                                    filteredDataMatrix,
                     -                                                    verbose)
                     +    filteredMappedGeneSets <- .filterAndMapGeneSets(param=param,
                     +                                                    filteredDataMatrix=filteredDataMatrix,
                     +                                                    verbose=verbose)
                          return(list(filteredDataMatrix=filteredDataMatrix,
                                      filteredMappedGeneSets=filteredMappedGeneSets))

inst/unitTests/test_gsvaRanks.R

History View file @ 1d874ee01

@@ -25,10 +25,10 @@ test_gsvaRanks <- function() {
                          ## calculate GSVA scores in two steps
                          ## first calculate GSVA ranks
                     -    gsva_ranks <- gsvaRanks(gsvapar, verbose=FALSE)
                     +    gsvarankspar <- gsvaRanks(gsvapar, verbose=FALSE)
                          ## second calculate GSVA scores using GSVA ranks
                     -    gsva_es2 <- gsvaScores(gsvapar, gsva_ranks, verbose=FALSE)
                     +    gsva_es2 <- gsvaScores(gsvarankspar, verbose=FALSE)
                          ## both approaches to calculate GSVA scores must give
                          ## the same result with the same input gene sets

man/gsvaEnrichment.Rd

History View file @ 1d874ee01

                     new file mode 100644
@@ -0,0 +1,82 @@
                     +% Generated by roxygen2: do not edit by hand
                     +% Please edit documentation in R/gsva.R
                     +\name{gsvaEnrichment}
                     +\alias{gsvaEnrichment}
                     +\alias{gsvaEnrichment,gsvaRanksParam-method}
                     +\title{GSVA enrichment data and visualization}
                     +\usage{
                     +\S4method{gsvaEnrichment}{gsvaRanksParam}(
                     +  param,
                     +  column = 1,
                     +  geneSet = 1,
                     +  plot = c("auto", "base", "ggplot", "no"),
                     +  ...
                     +)
                     +}
                     +\arguments{
                     +\item{param}{A \code{\linkS4class{gsvaRanksParam}} object obtained with the method
                     +\code{\link{gsvaRanks}}.}
+                    +
                     +\item{column}{The column for which we want to retrieve the enrichment data.
                     +This parameter is only available in the \code{gsvaEnrichment()} method.}
+                    +
                     +\item{geneSet}{Either a positive integer number between 1 and the number of
                     +available gene sets in \code{param}, or a character string with the name of
                     +one of the gene sets available in \code{param}.}
+                    +
                     +\item{plot}{A character string indicating whether an enrichment plot should
                     +be produced using either base R graphics (\code{plot="base"}) or the ggplot2 package
                     +(\code{plot="ggplot"}), or not (\code{plot="no"}). In the latter case, the enrichment
                     +data will be returned. By default \code{plot="auto"}, which implies that if this
                     +method is called from an interactive session, a plot using base R graphics
                     +will be produced and, otherwise, the enrichment data is returned.}
+                    +
                     +\item{...}{Further arguments passed to the \code{plot()} function when the
                     +previous parameter \code{plot="base"}.}
                     +}
                     +\value{
                     +When \code{plot="no"}, this method returns the enrichment data. When
                     +\code{plot="ggplot"}, this method returns a \code{ggplot} object. When \code{plot="base"}
                     +no value is returned.
                     +}
                     +\description{
                     +Extract and plot enrichment data from GSVA scores.
                     +}
                     +\examples{
                     +library(GSVA)
+                    +
                     +p <- 10 ## number of genes
                     +n <- 30 ## number of samples
                     +nGrp1 <- 15 ## number of samples in group 1
                     +nGrp2 <- n - nGrp1 ## number of samples in group 2
+                    +
                     +## consider three disjoint gene sets
                     +geneSets <- list(gset1=paste0("g", 1:3),
                     +                 gset2=paste0("g", 4:6),
                     +                 gset3=paste0("g", 7:10))
+                    +
                     +## sample data from a normal distribution with mean 0 and st.dev. 1
                     +y <- matrix(rnorm(n*p), nrow=p, ncol=n,
                     +            dimnames=list(paste("g", 1:p, sep="") , paste("s", 1:n, sep="")))
+                    +
                     +## genes in gset1 are expressed at higher levels in the last 'nGrp1+1' to 'n' samples
                     +y[geneSets$gset1, (nGrp1+1):n] <- y[geneSets$gset1, (nGrp1+1):n] + 2
+                    +
                     +## build GSVA parameter object
                     +gsvapar <- gsvaParam(y, geneSets)
+                    +
                     +## calculate GSVA ranks
                     +gsvarankspar <- gsvaRanks(gsvapar)
                     +gsvarankspar
+                    +
                     +## by default the enrichment data for the first column and the first
                     +## gene set are retrieved
                     +gsvaEnrichment(gsvarankspar)
+                    +
                     +}
                     +\references{
                     +Hänzelmann, S., Castelo, R. and Guinney, J. GSVA: Gene set
                     +variation analysis for microarray and RNA-Seq data.
                     +\emph{BMC Bioinformatics}, 14:7, 2013.
                     +\href{https://doi.org/10.1186/1471-2105-14-7}{DOI}
                     +}

man/gsvaParam-class.Rd

History View file @ 1d874ee01

@@ -3,7 +3,10 @@
                      \docType{class}
                      \name{gsvaParam-class}
                      \alias{gsvaParam-class}
                     +\alias{gsvaRanksParam-class}
                      \alias{gsvaParam}
                     +\alias{geneSets<-,gsvaRanksParam,GsvaGeneSets-method}
                     +\alias{geneSets<-}
                      \title{\code{gsvaParam} class}
                      \usage{
                      gsvaParam(
@@ -20,6 +23,8 @@ gsvaParam(
                        absRanking = FALSE,
                        sparse = TRUE
+                     )
+                    +
                     +\S4method{geneSets}{gsvaRanksParam,GsvaGeneSets}(object) <- value
+                     }
                      \arguments{
                      \item{exprData}{The expression data set.  Must be one of the classes
@@ -101,6 +106,12 @@ data in \code{exprData} is stored in a sparse matrix (e.g., a \code{dgCMatrix} o
                      In such a case, when \code{sparse=TRUE} (default), a sparse version of the GSVA
                      algorithm will be applied. Otherwise, when \code{sparse=FALSE}, the classical
                      version of the GSVA algorithm will be used.}
+                    +
                     +\item{object}{For the replacement method, an object of class
                     +\code{\linkS4class{gsvaRanksParam}}.}
+                    +
                     +\item{value}{For the replacement method, an object of the classes supported by
                     +\code{\linkS4class{GsvaGeneSets}}.}
+                     }
                      \value{
                      A new \code{\linkS4class{gsvaParam}} object.

man/gsvaRanks.Rd

History View file @ 1d874ee01

@@ -4,88 +4,40 @@
                      \alias{gsvaRanks}
                      \alias{gsvaRanks,gsvaParam-method}
                      \alias{gsvaScores}
                     -\alias{gsvaScores,gsvaParam,GsvaExprData-method}
                     +\alias{gsvaScores,gsvaRanksParam-method}
                      \title{GSVA ranks and scores}
                      \usage{
                      \S4method{gsvaRanks}{gsvaParam}(param, verbose = TRUE, BPPARAM = SerialParam(progressbar = verbose))
                     -\S4method{gsvaScores}{gsvaParam,GsvaExprData}(
                     -  param,
                     -  ranks,
                     -  geneSets = NA,
                     -  minSize = NA,
                     -  maxSize = NA,
                     -  tau = NA,
                     -  maxDiff = NA,
                     -  absRanking = NA,
                     -  verbose = TRUE,
                     -  BPPARAM = SerialParam(progressbar = verbose)
                     -)
                     +\S4method{gsvaScores}{gsvaRanksParam}(param, verbose = TRUE, BPPARAM = SerialParam(progressbar = verbose))
+                     }
                      \arguments{
                     -\item{param}{A \code{\link{gsvaParam}} object built using the constructor function
                     -\code{\link{gsvaParam}}.}
                     +\item{param}{A parameter object of the \code{\linkS4class{gsvaParam}} class for \code{gsvaRanks()}, or of the \code{\linkS4class{gsvaRanksParam}} class for \code{gsvaScores()}.}
                      \item{verbose}{Gives information about each calculation step. Default: \code{TRUE}.}
                      \item{BPPARAM}{An object of class \code{\link{BiocParallelParam}} specifying parameters
                      related to the parallel execution of some of the tasks and calculations
                      within this function.}
+                    -
                     -\item{ranks}{A matrix-like object storing GSVA ranks calculated with the
                     -method \code{\link{gsvaRanks}}.}
+                    -
                     -\item{geneSets}{A collection of gene sets. Must be one of the classes
                     -supported by \code{\linkS4class{GsvaGeneSets}}. For a list of these classes, see its
                     -help page using \code{help(GsvaGeneSets)}. By default, this parameter is set to
                     -the \code{NA} missing value, which means that GSVA scores will be calculated
                     -using the gene sets specified in the \code{param} argument. If this parameter is
                     -set to a non-missing value corresponding to an object of the classes
                     -supported by \code{\linkS4class{GsvaGeneSets}}, then GSVA scores will be calculated
                     -using the gene sets in this argument, instead of the ones specified in the
                     -\code{param} argument.}
+                    -
                     -\item{minSize}{Numeric vector of length 1.  Minimum size of the resulting gene
                     -sets after gene identifier mapping. Its default value is \code{NA}, indicating that
                     -this minimum value will be taken from the input \code{param} argument, otherwise,
                     -non-\code{NA} values override those from the input \code{param} argument.}
+                    -
                     -\item{maxSize}{Numeric vector of length 1.  Minimum size of the resulting gene
                     -sets after gene identifier mapping. Its default value is \code{NA}, indicating that
                     -this minimum value will be taken from the input \code{param} argument, otherwise,
                     -non-\code{NA} values override those from the input \code{param} argument.}
+                    -
                     -\item{tau}{Numeric vector of length 1.  The exponent defining the weight of
                     -the tail in the random walk performed by the \code{GSVA} (Hänzelmann et al.,
                     -2013) method.  The default value is 1 as described in the paper.}
+                    -
                     -\item{maxDiff}{Logical vector of length 1 which offers two approaches to
                     -calculate the enrichment statistic (ES) from the KS random walk statistic.
                     -\itemize{
                     -\item \code{FALSE}: ES is calculated as the maximum distance of the random walk
                     -from 0. This approach produces a distribution of enrichment scores that is
                     -bimodal, but it can give large enrichment scores to gene sets whose genes
                     -are not concordantly activated in one direction only.
                     -\item \code{TRUE} (the default): ES is calculated as the magnitude difference between
                     -the largest positive and negative random walk deviations. This default value
                     -gives larger enrichment scores to gene sets whose genes are concordantly
                     -activated in one direction only.
                     -}}
+                    -
                     -\item{absRanking}{Logical vector of length 1 used only when \code{maxDiff=TRUE}.
                     -When \code{absRanking=FALSE} (default) a modified Kuiper statistic is used to
                     -calculate enrichment scores, taking the magnitude difference between the
                     -largest positive and negative random walk deviations. When
                     -\code{absRanking=TRUE} the original Kuiper statistic that sums the largest
                     -positive and negative random walk deviations is used.}
+                     }
                      \value{
                     -In the case of the \code{gsvaRanks()} method, a matrix of GSVA rank
                     -values per column.
                     +In the case of the \code{gsvaRanks()} method, an object of class
                     +\code{\linkS4class{gsvaRanksParam}}.
                      In the case of the \code{gsvaScores()} method, a gene-set by sample matrix
                     -of GSVA enrichment scores stored in a ocntainer object of the same type as
                     -the input expression data container in the \code{param} argument.
                     +of GSVA enrichment scores stored in a container object of the same type as
                     +the input ranks data container. If
                     +the input was a base matrix or a \code{\linkS4class{dgCMatrix}} object, then the output will
                     +be a base matrix object with the gene sets employed in the calculations
                     +stored in an attribute called \code{geneSets}. If the input was an
                     +\code{\link{ExpressionSet}} object, then the output will also be an \code{\link{ExpressionSet}}
                     +object with the gene sets employed in the calculations stored in an
                     +attribute called \code{geneSets}. If the input was an object of one of the
                     +classes described in \code{\link{GsvaExprData}}, such as a \code{\link{SingleCellExperiment}},
                     +then the output will be of the same class, where enrichment scores will be
                     +stored in an assay called \code{es} and the gene sets employed in the
                     +calculations will be stored in the \code{rowData} slot of the object under the
                     +column name \code{gs}.
+                     }
                      \description{
                      Calculate GSVA scores in two steps: (1) calculate GSVA
@@ -109,14 +61,17 @@ geneSets <- list(gset1=paste0("g", 1:3),
                      y <- matrix(rnorm(n*p), nrow=p, ncol=n,
                                  dimnames=list(paste("g", 1:p, sep="") , paste("s", 1:n, sep="")))
                     +## genes in gset1 are expressed at higher levels in the last 'nGrp1+1' to 'n' samples
                     +y[geneSets$gset1, (nGrp1+1):n] <- y[geneSets$gset1, (nGrp1+1):n] + 2
+                    +
                      ## build GSVA parameter object
                      gsvapar <- gsvaParam(y, geneSets)
                      ## calculate GSVA ranks
                     -gsva_ranks <- gsvaRanks(gsvapar)
                     -gsva_ranks
                     +gsvarankspar <- gsvaRanks(gsvapar)
                     +gsvarankspar
                      ## calculate GSVA scores
                     -gsva_es <- gsvaScores(gsvapar, gsva_ranks)
                     +gsva_es <- gsvaScores(gsvarankspar)
                      gsva_es
                      ## calculate now GSVA scores in a single step
@@ -130,7 +85,8 @@ geneSets2 <- list(gset1=paste0("g", 3:6),
                                        gset2=paste0("g", c(1, 2, 7, 8)))
                      ## note that there is no need to calculate the GSVA ranks again
                     -gsvaScores(gsvapar, gsva_ranks, geneSets2)
                     +geneSets(gsvarankspar) <- geneSets2
                     +gsvaScores(gsvarankspar)
+                     }
                      \references{
@@ -140,5 +96,5 @@ variation analysis for microarray and RNA-Seq data.
                      \href{https://doi.org/10.1186/1471-2105-14-7}{DOI}
+                     }
                      \seealso{
                     -\code{\link{gsvaParam}}, \code{\link{gsva}}
                     +\code{\linkS4class{gsvaParam}}, \code{\linkS4class{gsvaRanksParam}}, \code{\link{gsva}}
+                     }