Bioconductor Code: singleCellTK

Browse code

Use subsetSCECols to subset data in example

Yusuke Koga authored on 15/10/2020 17:11:54
Showing 36 changed files

R/celda_decontX.R index 42d43c38..3cd474d8 100644
R/doubletFinder_doubletDetection.R index e4607097..d7238fe1 100644
R/getUMAP.R index 0e7b942b..1f01c69f 100644
R/htmlReports.R index 859f342d..73d1e583 100644
R/plotDEAnalysis.R index d6ad1c2f..69f2a1db 100644
R/plotSCEHeatmap.R index dcd81799..3be94eb9 100644
R/plotUMAP.R index 90369534..f6a2a3c7 100644
R/runDEAnalysis.R index b4ceb7d3..dcb2ebb4 100644
R/runQC.R index fc8df910..74c86643 100644
R/sampleSummaryStats.R index 1b06dc17..13c4ce40 100644
R/scds_doubletdetection.R index 1aa1ddb7..c7696ed1 100644
R/scran_doubletCells.R index 81651929..b83fa4d8 100644
R/scrublet_doubletDetection.R index 77f40c37..308bc101 100644
man/getUMAP.Rd index a309686a..e13da336 100644
man/plotSCEHeatmap.Rd index 489620d4..746e18b5 100644
man/plotUMAP.Rd index 1a99ab8e..c697e8b7 100644
man/reportCellQC.Rd index 8fe2b083..12b2413c 100644
man/reportDiffExp.Rd index 29845c30..aa7abcd8 100644
man/reportQCTool.Rd index e73db029..e1d30a1f 100644
man/runANOVA.Rd index ea4ff50c..f5cf6b76 100644
man/runBcds.Rd index c5db1ad7..02ad220d 100644
man/runCxds.Rd index 76e21db8..d82dfaf5 100644
man/runCxdsBcdsHybrid.Rd index a6b040f0..e417c376 100644
man/runDEAnalysis.Rd index 716aa760..5e382870 100644
man/runDESeq2.Rd index b09c406b..4c3da784 100644
man/runDecontX.Rd index e9781c3e..7c3052a4 100644
man/runDoubletCells.Rd index 4e3fc4a3..1f7b2b52 100644
man/runDoubletFinder.Rd index 9456d69c..0f87c89c 100644
man/runLimmaDE.Rd index 39be5fd0..76cf5747 100644
man/runMAST.Rd index 329a80e1..97605050 100644
man/runScrublet.Rd index b5c272bc..8449810f 100644
man/sampleSummaryStats.Rd index a71ade98..7c36b93f 100644
tests/testthat/test-decontX.R index e808f243..5fa61f9a 100644
tests/testthat/test-mergeColData.R index 3ce2dffa..a7745635 100644
tests/testthat/test-misc.R index f364a6ed..fb58c43c 100644
tests/testthat/test-qc.R index d8da26c3..71c525c3 100644

History View file @ c06bc73b

@@ -49,14 +49,14 @@
                      #' @param logfile Character. Messages will be redirected to a file named
                      #'  `logfile`. If NULL, messages will be printed to stdout.  Default NULL.
                      #' @param verbose Logical. Whether to print log messages. Default TRUE.
                     -#'
                     +#'
                      #' @return A \link[SingleCellExperiment]{SingleCellExperiment} object with
                      #'  'decontX_Contamination' and 'decontX_Clusters' added to the
                      #'  \link[SummarizedExperiment]{colData} slot. Additionally, the
                      #' decontaminated counts will be added as an assay called 'decontXCounts'.
                      #' @examples
                      #' data(scExample, package = "singleCellTK")
                     -#' sce <- sce[, colData(sce)$type != 'EmptyDroplet']
                     +#' sce <- subsetSCECols(sce, colData = "type != 'EmptyDroplet'")
                      #' sce <- runDecontX(sce)
                      #' @export
                      runDecontX <- function(inSCE,
@@ -84,8 +84,8 @@ runDecontX <- function(inSCE,
                        message(paste0(date(), " ... Running 'DecontX'"))
                     -  inSCE <- celda::decontX(x = inSCE,
                     -                          batch = sample,
                     +  inSCE <- celda::decontX(x = inSCE,
                     +                          batch = sample,
                                                assayName = useAssay,
                                                z = z,
                                                maxIter = maxIter,
@@ -100,7 +100,7 @@ runDecontX <- function(inSCE,
                                                verbose = verbose)
                        #argsList <- argsList[!names(argsList) %in% ("...")]
+                    -
+                    +
                        inSCE@metadata$runDecontX <- argsList[-1]
                        inSCE@metadata$runDecontX$packageVersion <- utils::packageDescription("celda")$Version

R/doubletFinder_doubletDetection.R

History View file @ c06bc73b

@@ -330,7 +330,7 @@
                      #'  'doublet_finder_doublet_score'.
                      #' @examples
                      #' data(scExample, package = "singleCellTK")
                     -#' sce <- sce[, colData(sce)$type != 'EmptyDroplet']
                     +#' sce <- subsetSCECols(sce, colData = "type != 'EmptyDroplet'")
                      #' sce <- runDoubletFinder(sce)
                      #' @export
                      #' @importFrom SummarizedExperiment colData colData<-

R/getUMAP.R

History View file @ c06bc73b

@@ -1,115 +1,115 @@
                     -#' Uniform Manifold Approximation and Projection(UMAP) algorithm for
                     -#' dimension reduction.
                     -#'
                     -#' @param inSCE Input \linkS4class{SingleCellExperiment} object.
                     -#' @param useAssay Indicate which assay to use. The default is "counts".
                     -#' @param sample Character vector. Indicates which sample each cell belongs to.
                     -#' @param reducedDimName a name to store the results of the dimension reduction
                     -#' coordinates obtained from this method. This is stored in the SingleCellExperiment
                     -#' object in the reducedDims slot. Default "UMAP".
                     -#' @param logNorm Whether the counts will need to be log-normalized prior to
                     -#' generating the UMAP via scater::logNormCounts. Default TRUE.
                     -#' @param nNeighbors The size of local neighborhood used for
                     -#'   manifold approximation. Larger values result in more global
                     -#'   views of the manifold, while smaller values result in more
                     -#'   local data being preserved. Default 30.
                     -#'    See `?uwot::umap` for more information.
                     -#' @param nIterations number of iterations performed during layout optimization.
                     -#' Default is 200.
                     -#' @param alpha initial value of "learning rate" of layout optimization. Default is 1.
                     -#' @param minDist The effective minimum distance between embedded points.
                     -#'    Smaller values will result in a more clustered/clumped
                     -#'    embedding where nearby points on the manifold are drawn
                     -#'    closer together, while larger values will result on a more
                     -#'    even dispersal of points. Default 0.01.
                     -#'    See `?uwot::umap` for more information.
                     -#' @param spread The effective scale of embedded points. In combination with
                     -#'    ‘min_dist’, this determines how clustered/clumped the
                     -#'    embedded points are. Default 1.
                     -#'    See `?uwot::umap` for more information.
                     -#' @param pca Logical. Whether to perform dimensionality reduction with PCA
                     -#' before UMAP.
                     -#' @param initialDims  Number of dimensions from PCA to use as
                     -#' input in UMAP. Default 50.
                     -#'
                     -#' @return A \linkS4class{SingleCellExperiment} object with the reduced
                     -#' dimensions updated under reducedDimName specified.
                     -#' @export
                     -#'
                     -#' @examples
                     -#' data(scExample, package = "singleCellTK")
                     -#' sce <- sce[, colData(sce)$type != 'EmptyDroplet']
                     -#' umap_res <- getUMAP(inSCE = sce, useAssay = "counts",
                     -#'                     reducedDimName = "UMAP", logNorm = TRUE,
                     -#'                     nNeighbors = 30, alpha = 1,
                     -#'                     nIterations = 200, spread = 1, pca = TRUE,
                     -#'                     initialDims = 50)
                     -#' reducedDims(umap_res)
+                    -
                     -getUMAP <- function(inSCE, useAssay = "counts",
                     -                    sample = NULL,
                     -                    reducedDimName = "UMAP",
                     -                    logNorm = TRUE,
                     -                    nNeighbors = 30,
                     -                    nIterations = 200,
                     -                    alpha = 1,
                     -                    minDist = 0.01,
                     -                    spread = 1,
                     -                    pca = TRUE,
                     -                    initialDims = 50) {
                     -  if (!inherits(inSCE, "SingleCellExperiment")){
                     -    stop("Please use a SingleCellExperiment object")
                     -  }
                     -  #test for assay existing
                     -    if (!all(useAssay %in% names(assays(inSCE)))){
                     -        stop("assay '", useAssay, "' does not exist.")
                     -    }
+                    -
                     -    if(!is.null(sample)) {
                     -        if(length(sample) != ncol(inSCE)) {
                     -            stop("'sample' must be the same length as the number of columns in 'inSCE'")
                     -        }
                     -    } else {
                     -        sample = rep(1, ncol(inSCE))
                     -    }
                     -    samples <- unique(sample)
                     -    umapDims = matrix(nrow = ncol(inSCE), ncol = 2)
                     -    for (i in seq_len(length(samples))){
                     -        useAssayTemp = useAssay
                     -	sceSampleInd <- sample == samples[i]
                     -        sceSample <- inSCE[, sceSampleInd]
                     -        if(logNorm){
                     -	    sceSample <- scater_logNormCounts(sceSample, useAssay = useAssay)
                     -            useAssayTemp = "ScaterLogNormCounts"
                     -        }
+                    -
                     -        matColData <- SummarizedExperiment::assay(sceSample, useAssayTemp)
                     -        matColData <- as.matrix(matColData)
+                    -
                     -        if (isTRUE(pca)) {
                     -          if(initialDims > ncol(matColData)){
                     -            doPCA <- ncol(matColData)
                     -          }else{
                     -            doPCA <- initialDims
                     -          }
                     -        } else {
                     -            doPCA <- NULL
                     -        }
                     -        if(nNeighbors > ncol(matColData)){
                     -          nNeighbors <- ncol(matColData)
                     -        }
+                    -
                     -        umapRes <- uwot::umap(t(matColData), n_neighbors = nNeighbors,
                     -                              learning_rate = alpha,
                     -                              min_dist = minDist, spread = spread,
                     -                              n_sgd_threads = 1, pca = doPCA,
                     -                              n_epochs = nIterations)
                     -        if (is.null(rownames(sceSample))) {
                     -            rownames(umapRes) <- colnames(sceSample)
                     -        }
                     -        umapDims[sceSampleInd, ] = umapRes
                     -    }
                     -    colnames(umapDims) <- c("UMAP1", "UMAP2")
                     -    SingleCellExperiment::reducedDim(inSCE, reducedDimName) <- umapDims
                     -    return(inSCE)
                     -}
                     +#' Uniform Manifold Approximation and Projection (UMAP) algorithm for
                     +#' dimension reduction.
                     +#'
                     +#' @param inSCE Input \linkS4class{SingleCellExperiment} object.
                     +#' @param useAssay Indicate which assay to use. The default is "counts".
                     +#' @param sample Character vector. Indicates which sample each cell belongs to.
                     +#' @param reducedDimName a name to store the results of the dimension reduction
                     +#' coordinates obtained from this method. This is stored in the SingleCellExperiment
                     +#' object in the reducedDims slot. Default "UMAP".
                     +#' @param logNorm Whether the counts will need to be log-normalized prior to
                     +#' generating the UMAP via scater::logNormCounts. Default TRUE.
                     +#' @param nNeighbors The size of local neighborhood used for
                     +#'   manifold approximation. Larger values result in more global
                     +#'   views of the manifold, while smaller values result in more
                     +#'   local data being preserved. Default 30.
                     +#'    See `?uwot::umap` for more information.
                     +#' @param nIterations number of iterations performed during layout optimization.
                     +#' Default is 200.
                     +#' @param alpha initial value of "learning rate" of layout optimization. Default is 1.
                     +#' @param minDist The effective minimum distance between embedded points.
                     +#'    Smaller values will result in a more clustered/clumped
                     +#'    embedding where nearby points on the manifold are drawn
                     +#'    closer together, while larger values will result in a more
                     +#'    even dispersal of points. Default 0.01.
                     +#'    See `?uwot::umap` for more information.
                     +#' @param spread The effective scale of embedded points. In combination with
                     +#'    \code{min_dist}, this determines how clustered/clumped the
                     +#'    embedded points are. Default 1.
                     +#'    See `?uwot::umap` for more information.
                     +#' @param pca Logical. Whether to perform dimensionality reduction with PCA
                     +#' before UMAP. Default TRUE.
                     +#' @param initialDims  Number of dimensions from PCA to use as
                     +#' input in UMAP. Default 50.
                     +#'
                     +#' @return A \linkS4class{SingleCellExperiment} object with the reduced
                     +#' dimensions updated under reducedDimName specified.
                     +#' @export
                     +#'
                     +#' @examples
                     +#' data(scExample, package = "singleCellTK")
                     +#' sce <- subsetSCECols(sce, colData = "type != 'EmptyDroplet'")
                     +#' umap_res <- getUMAP(inSCE = sce, useAssay = "counts",
                     +#'                     reducedDimName = "UMAP", logNorm = TRUE,
                     +#'                     nNeighbors = 30, alpha = 1,
                     +#'                     nIterations = 200, spread = 1, pca = TRUE,
                     +#'                     initialDims = 50)
                     +#' reducedDims(umap_res)
+                    +
                     +getUMAP <- function(inSCE, useAssay = "counts",
                     +                    sample = NULL,
                     +                    reducedDimName = "UMAP",
                     +                    logNorm = TRUE,
                     +                    nNeighbors = 30,
                     +                    nIterations = 200,
                     +                    alpha = 1,
                     +                    minDist = 0.01,
                     +                    spread = 1,
                     +                    pca = TRUE,
                     +                    initialDims = 50) {
                     +  # Runs uwot::umap separately on the cells of each sample and stores the
                     +  # combined two-column embedding in reducedDim(inSCE, reducedDimName).
                     +  if (!inherits(inSCE, "SingleCellExperiment")) {
                     +    stop("Please use a SingleCellExperiment object")
                     +  }
                     +  # The requested assay must exist before any per-sample work starts.
                     +  if (!all(useAssay %in% names(assays(inSCE)))) {
                     +    stop("assay '", useAssay, "' does not exist.")
                     +  }
                     +
                     +  if (!is.null(sample)) {
                     +    if (length(sample) != ncol(inSCE)) {
                     +      stop("'sample' must be the same length as the number of columns in 'inSCE'")
                     +    }
                     +  } else {
                     +    # No sample labels supplied: treat all cells as a single sample.
                     +    sample <- rep(1, ncol(inSCE))
                     +  }
                     +  samples <- unique(sample)
                     +  # One row per cell of inSCE; rows are filled in sample by sample below.
                     +  umapDims <- matrix(nrow = ncol(inSCE), ncol = 2)
                     +  for (i in seq_along(samples)) {
                     +    useAssayTemp <- useAssay
                     +    sceSampleInd <- sample == samples[i]
                     +    sceSample <- inSCE[, sceSampleInd]
                     +    if (logNorm) {
                     +      sceSample <- scater_logNormCounts(sceSample, useAssay = useAssay)
                     +      useAssayTemp <- "ScaterLogNormCounts"
                     +    }
                     +
                     +    matColData <- SummarizedExperiment::assay(sceSample, useAssayTemp)
                     +    matColData <- as.matrix(matColData)
                     +
                     +    # Never request more PCA dimensions than there are cells in the sample.
                     +    if (isTRUE(pca)) {
                     +      doPCA <- min(initialDims, ncol(matColData))
                     +    } else {
                     +      doPCA <- NULL
                     +    }
                     +    # Cap the neighbourhood size per sample in a local variable. Overwriting
                     +    # 'nNeighbors' itself would let one small sample permanently shrink the
                     +    # value used for every later, larger sample.
                     +    nNeighborsSample <- min(nNeighbors, ncol(matColData))
                     +
                     +    umapRes <- uwot::umap(t(matColData), n_neighbors = nNeighborsSample,
                     +                          learning_rate = alpha,
                     +                          min_dist = minDist, spread = spread,
                     +                          n_sgd_threads = 1, pca = doPCA,
                     +                          n_epochs = nIterations)
                     +    # NOTE(review): this tests the row (feature) names of 'sceSample' but
                     +    # assigns its column names, and the names are not carried into
                     +    # 'umapDims' by the assignment below. Left as-is; confirm intent.
                     +    if (is.null(rownames(sceSample))) {
                     +      rownames(umapRes) <- colnames(sceSample)
                     +    }
                     +    umapDims[sceSampleInd, ] <- umapRes
                     +  }
                     +  colnames(umapDims) <- c("UMAP1", "UMAP2")
                     +  SingleCellExperiment::reducedDim(inSCE, reducedDimName) <- umapDims
                     +  return(inSCE)
                     +}

R/htmlReports.R

History View file @ c06bc73b

@@ -47,7 +47,7 @@ reportDropletQC <- function(inSCE, output_file = NULL,
                      #' @return .html file
                      #' @examples
                      #' data(scExample, package = "singleCellTK")
                     -#' sce <- sce[, colData(sce)$type != 'EmptyDroplet']
                     +#' sce <- subsetSCECols(sce, colData = "type != 'EmptyDroplet'")
                      #' \dontrun{
                      #' sce <- runCellQC(sce)
                      #' reportCellQC(inSCE = sce)
@@ -84,7 +84,7 @@ reportCellQC <- function(inSCE, output_file = NULL,
                      #' @return .html file
                      #' @examples
                      #' data(scExample, package = "singleCellTK")
                     -#' sce <- sce[, colData(sce)$type != 'EmptyDroplet']
                     +#' sce <- subsetSCECols(sce, colData = "type != 'EmptyDroplet'")
                      #' \donttest{
                      #' sce <- runDecontX(sce)
                      #' sce <- getUMAP(sce)
@@ -165,12 +165,6 @@ reportQCTool <- function(inSCE, algorithm=c("BarcodeRankDrops",
                      #' @param output_dir name of the output directory to save the rendered file. If
                      #' \code{NULL} the file is stored to the current working directory.
                      #' Default \code{NULL}.
                     -#' @examples
                     -#' data(scExample, package = "singleCellTK")
                     -#' sce <- sce[, colData(sce)$type != 'EmptyDroplet']
                     -#' sce <- runDEAnalysis(inSCE = sce, groupName1 = "Sample1", method = "DESeq2",
                     -#'  groupName2 = "Sample2", index1 = 1:20, index2 = 21:40, analysisName = "DESeq2")
                     -#' reportDiffExp(sce, study = "DESeq2", output_file = "DESeq2_res")
                      #' @return .html file
                      #' @export
                      reportDiffExp <- function(inSCE, study,

R/plotDEAnalysis.R

History View file @ c06bc73b

@@ -262,7 +262,7 @@ plotDEGRegression <- function(inSCE, useResult, threshP = FALSE, labelBy = NULL,
                      #' @examples
                      #' data(scExample, package = "singleCellTK")
                      #' \dontrun{
                     -#' sce <- sce[, colData(sce)$type != 'EmptyDroplet']
                     +#' sce <- subsetSCECols(sce, colData = "type != 'EmptyDroplet'")
                      #' sce <- runDEAnalysis(inSCE = sce, groupName1 = "Sample1", method = "DESeq2",
                      #'  groupName2 = "Sample2", index1 = 1:100, index2 = 101:190, analysisName = "DESeq2")
                      #' plotDEGHeatmap(sce, useResult = "DESeq2", fdrThreshold = 1)

R/plotSCEHeatmap.R

History View file @ c06bc73b

@@ -177,7 +177,7 @@ dataAnnotationColor <- function(inSCE, axis = NULL,
                      #' @param ... Other arguments passed to \code{\link[ComplexHeatmap]{Heatmap}}.
                      #' @examples
                      #' data(scExample, package = "singleCellTK")
                     -#' plotSCEHeatmap(sce[1:3,1:3])
                     +#' plotSCEHeatmap(sce[1:3,1:3], useAssay = "counts")
                      #' @return A \code{\link[ComplexHeatmap]{Heatmap}} object
                      #' @export
                      #' @author Yichen Wang

R/plotUMAP.R

History View file @ c06bc73b

@@ -15,7 +15,7 @@
                      #'
                      #' @examples
                      #' data(scExample, package = "singleCellTK")
                     -#' sce <- sce[, colData(sce)$type != 'EmptyDroplet']
                     +#' sce <- subsetSCECols(sce, colData = "type != 'EmptyDroplet'")
                      #' sce <- getUMAP(inSCE = sce, useAssay = "counts", reducedDimName = "UMAP")
                      #' plotUMAP(sce, shape = "No Shape", reducedDimName = "UMAP",
                      #'          runUMAP = TRUE, useAssay = "counts")

R/runDEAnalysis.R

History View file @ c06bc73b

@@ -127,7 +127,7 @@
                      #' \code{\link{runANOVA}}
                      #' @examples
                      #' data(scExample, package = "singleCellTK")
                     -#' sce <- sce[, colData(sce)$type != 'EmptyDroplet']
                     +#' sce <- subsetSCECols(sce, colData = "type != 'EmptyDroplet'")
                      #' sce <- runDEAnalysis(inSCE = sce, groupName1 = "Sample1", method = "DESeq2",
                      #'  groupName2 = "Sample2", index1 = 1:20, index2 = 21:40, analysisName = "DESeq2")
                      #' @return Input SCE object with \code{metadata(inSCE)} updated with name
@@ -190,7 +190,7 @@ runDEAnalysis <- function(method = 'MAST', ...){
                      #' Default \code{FALSE}.
                      #' @examples
                      #' data(scExample, package = "singleCellTK")
                     -#' sce <- sce[, colData(sce)$type != 'EmptyDroplet']
                     +#' sce <- subsetSCECols(sce, colData = "type != 'EmptyDroplet'")
                      #' sce <- runDESeq2(inSCE = sce, groupName1 = "Sample1",
                      #'  groupName2 = "Sample2", index1 = 1:20, index2 = 21:40, analysisName = "DESeq2")
                      #'
@@ -317,7 +317,7 @@ runDESeq2 <- function(inSCE, useAssay = 'counts', index1 = NULL,
                      #' Default \code{FALSE}.
                      #' @examples
                      #' data(scExample, package = "singleCellTK")
                     -#' sce <- sce[, colData(sce)$type != 'EmptyDroplet']
                     +#' sce <- subsetSCECols(sce, colData = "type != 'EmptyDroplet'")
                      #' sce@assays@data$logcounts <- log10(counts(sce) + 1)
                      #' sce <- runLimmaDE(inSCE = sce, groupName1 = "Sample1",
                      #'  groupName2 = "Sample2", index1 = 1:20, index2 = 21:40, analysisName = "Limma")
@@ -440,7 +440,7 @@ runLimmaDE <- function(inSCE, useAssay = 'logcounts', index1 = NULL,
                      #' Default \code{FALSE}.
                      #' @examples
                      #' data(scExample, package = "singleCellTK")
                     -#' sce <- sce[, colData(sce)$type != 'EmptyDroplet']
                     +#' sce <- subsetSCECols(sce, colData = "type != 'EmptyDroplet'")
                      #' sce@assays@data$logcounts <- log10(counts(sce) + 1)
                      #' sce <- runANOVA(inSCE = sce, groupName1 = "Sample1",
                      #'  groupName2 = "Sample2", index1 = 1:20, index2 = 21:40,
@@ -586,7 +586,7 @@ runANOVA <- function(inSCE, useAssay = 'logcounts', index1 = NULL,
                      #' Default \code{FALSE}.
                      #' @examples
                      #' data(scExample, package = "singleCellTK")
                     -#' sce <- sce[, colData(sce)$type != 'EmptyDroplet']
                     +#' sce <- subsetSCECols(sce, colData = "type != 'EmptyDroplet'")
                      #' sce@assays@data$logcounts <- log10(counts(sce) + 1)
                      #' sce <- runMAST(inSCE = sce, groupName1 = "Sample1",
                      #'  groupName2 = "Sample2", index1 = 1:20, index2 = 21:40, analysisName = "MAST")

R/runQC.R

History View file @ c06bc73b

@@ -20,7 +20,7 @@
                      #' of \code{inSCE}.
                      #' @examples
                      #' data(scExample, package = "singleCellTK")
                     -#' sce <- sce[, colData(sce)$type != 'EmptyDroplet']
                     +#' sce <- subsetSCECols(sce, colData = "type != 'EmptyDroplet'")
                      #' \donttest{
                      #' sce <- runCellQC(sce)
                      #' }

R/sampleSummaryStats.R

History View file @ c06bc73b

@@ -118,7 +118,7 @@
                      #' QC stats stored in the inSCE.
                      #' @examples
                      #' data(scExample, package = "singleCellTK")
                     -#' sce <- sce[, colData(sce)$type != 'EmptyDroplet']
                     +#' sce <- subsetSCECols(sce, colData = "type != 'EmptyDroplet'")
                      #' sampleSummaryStats(sce, simple = TRUE)
                      #' @importFrom magrittr %>%
                      #' @export

R/scds_doubletdetection.R

History View file @ c06bc73b

@@ -23,7 +23,7 @@
                      #'  Please refer to the documentation of \link[scds]{cxds} for details.
                      #' @examples
                      #' data(scExample, package = "singleCellTK")
                     -#' sce <- sce[, colData(sce)$type != 'EmptyDroplet']
                     +#' sce <- subsetSCECols(sce, colData = "type != 'EmptyDroplet'")
                      #' sce <- runCxds(sce)
                      #' @export
                      #' @importFrom SummarizedExperiment colData colData<-
@@ -31,9 +31,9 @@
                      runCxds <- function(inSCE,
                          sample = NULL,
                          seed = 12345,
                     -    ntop = 500,
                     +    ntop = 500,
                          binThresh = 0,
                     -    verb = FALSE,
                     +    verb = FALSE,
                          retRes = FALSE,
                          estNdbl = FALSE,
                          useAssay = "counts") {
@@ -48,7 +48,7 @@ runCxds <- function(inSCE,
+                         }
                          message(paste0(date(), " ... Running 'cxds'"))
+                    -
+                    +
                          ## Getting current arguments
                          #argsList <- as.list(formals(fun = sys.function(sys.parent()), envir = parent.frame()))
                          argsList <- mget(names(formals()),sys.frame(sys.nframe()))
@@ -71,19 +71,19 @@ runCxds <- function(inSCE,
                              mat <- SummarizedExperiment::assay(sceSample, i = useAssay)
                              counts(sceSample) <- .convertToMatrix(mat)
+                    -
+                    +
                              result <- NULL
                              nGene <- 500
                              while(!inherits(result, "SingleCellExperiment") & nGene > 0) {
                                try({result <- withr::with_seed(seed, scds::cxds(sce = sceSample,
                     -                                                           ntop = nGene,
                     -                                                           binThresh = binThresh,
                     -                                                           verb = verb,
                     +                                                           ntop = nGene,
                     +                                                           binThresh = binThresh,
                     +                                                           verb = verb,
                                                                                 retRes = retRes,
                                                                                 estNdbl = estNdbl))}, silent = TRUE)
                                nGene <- nGene - 100
                     -        }
+                    -
                     +        }
+                    +
                              if (!inherits(result, "try-error") & !is.null(result)) {
                                if ("cxds_call" %in% colnames(SummarizedExperiment::colData(result))) {
                                    output[sceSampleInd, ] <- SummarizedExperiment::colData(result)[,
@@ -95,12 +95,12 @@ runCxds <- function(inSCE,
                              } else {
                                output[sceSampleInd, ] <- NA
                                warning(paste0("'cxds' from package 'scds' did not complete successfully for sample", samples[i]))
                     -        }
                     +        }
+                         }
                          colnames(output) <- paste0("scds_", colnames(output))
                          colData(inSCE) = cbind(colData(inSCE), output)
+                    -
+                    +
                          inSCE@metadata$runCxds <- argsList[-1]
                          inSCE@metadata$runCxds$packageVersion <- utils::packageDescription("scds")$Version
@@ -120,7 +120,7 @@ runCxds <- function(inSCE,
                      #'  separately. If NULL, then all cells will be processed together.
                      #'  Default NULL.
                      #' @param seed Seed for the random number generator. Default 12345.
                     -#' @param ntop See \link[scds]{bcds} for more information. Default \code{500}.
                     +#' @param ntop See \link[scds]{bcds} for more information. Default \code{500}.
                      #' @param srat See \link[scds]{bcds} for more information. Default \code{1}.
                      #' @param verb See \link[scds]{bcds} for more information. Default \code{FALSE}.
                      #' @param retRes See \link[scds]{bcds} for more information. Default \code{FALSE}.
@@ -135,7 +135,7 @@ runCxds <- function(inSCE,
                      #'  Please refer to the documentation of \link[scds]{bcds} for details.
                      #' @examples
                      #' data(scExample, package = "singleCellTK")
                     -#' sce <- sce[, colData(sce)$type != 'EmptyDroplet']
                     +#' sce <- subsetSCECols(sce, colData = "type != 'EmptyDroplet'")
                      #' sce <- runBcds(sce)
                      #' @export
                      #' @importFrom SummarizedExperiment colData colData<-
@@ -143,11 +143,11 @@ runCxds <- function(inSCE,
                      runBcds <- function(inSCE,
                          sample = NULL,
                          seed = 12345,
                     -    ntop = 500,
                     -    srat = 1,
                     +    ntop = 500,
                     +    srat = 1,
                          verb = FALSE,
                          retRes = FALSE,
                     -    nmax = "tune",
                     +    nmax = "tune",
                          varImp = FALSE,
                          estNdbl = FALSE,
                          useAssay = "counts"
@@ -163,7 +163,7 @@ runBcds <- function(inSCE,
+                         }
                          message(paste0(date(), " ... Running 'bcds'"))
+                    -
+                    +
                          ## Getting current arguments
                          #argsList <- as.list(formals(fun = sys.function(sys.parent()), envir = parent.frame()))
                          argsList <- mget(names(formals()),sys.frame(sys.nframe()))
@@ -186,22 +186,22 @@ runBcds <- function(inSCE,
                              mat <- SummarizedExperiment::assay(sceSample, i = useAssay)
                              counts(sceSample) <- .convertToMatrix(mat)
+                    -
+                    +
                              result <- NULL
                              nGene <- 500
                              while(!inherits(result, "SingleCellExperiment") & nGene > 0) {
                                try({result <- withr::with_seed(seed,
                                  scds::bcds(sce = sceSample,
                                             ntop = nGene,
                     -                       srat = srat,
                     +                       srat = srat,
                                             verb = verb,
                                             retRes = retRes,
                     -                       nmax = nmax,
                     +                       nmax = nmax,
                                             varImp = varImp,
                                             estNdbl = estNdbl
                                  ))}, silent = TRUE)
                                nGene <- nGene - 100
                     -        }
                     +        }
                              if (!inherits(result, "try-error") & !is.null(result)) {
                                if ("bcds_call" %in% colnames(SummarizedExperiment::colData(result))) {
@@ -214,13 +214,13 @@ runBcds <- function(inSCE,
                              } else {
                                output[sceSampleInd, ] <- NA
                                warning(paste0("'bcds' from package 'scds' did not complete successfully for sample", samples[i]))
                     -        }
+                    -
                     +        }
+                    +
+                         }
                          colnames(output) <- paste0("scds_", colnames(output))
                          colData(inSCE) = cbind(colData(inSCE), output)
+                    -
+                    +
                          inSCE@metadata$runBcds <- argsList[-1]
                          inSCE@metadata$runBcds$packageVersion <- utils::packageDescription("scds")$Version
@@ -241,7 +241,7 @@ runBcds <- function(inSCE,
                      #'  Default NULL.
                      #' @param seed Seed for the random number generator. Default 12345.
                      #' @param nTop The number of top variable genes to consider. Used in both \code{cxds}
                     -#' and \code{bcds}. Default \code{500}.
                     +#' and \code{bcds}. Default \code{500}.
                      #' @param cxdsArgs See \link[scds]{cxds_bcds_hybrid} for more information. Default \code{NULL}.
                      #' @param bcdsArgs See \link[scds]{cxds_bcds_hybrid} for more information. Default \code{NULL}.
                      #' @param verb See \link[scds]{cxds_bcds_hybrid} for more information. Default \code{FALSE}.
@@ -256,7 +256,7 @@ runBcds <- function(inSCE,
                      #'  details.
                      #' @examples
                      #' data(scExample, package = "singleCellTK")
                     -#' sce <- sce[, colData(sce)$type != 'EmptyDroplet']
                     +#' sce <- subsetSCECols(sce, colData = "type != 'EmptyDroplet'")
                      #' sce <- runCxdsBcdsHybrid(sce)
                      #' @export
                      #' @importFrom SummarizedExperiment colData colData<-
@@ -266,7 +266,7 @@ runCxdsBcdsHybrid <- function(inSCE,
                          seed = 12345,
                          nTop = 500,
                          cxdsArgs = list(),
                     -    bcdsArgs = list(),
                     +    bcdsArgs = list(),
                          verb = FALSE,
                          estNdbl = FALSE,
                          force = FALSE,
@@ -309,14 +309,14 @@ runCxdsBcdsHybrid <- function(inSCE,
                              result <- NULL
                              nGene <- 500
                              while(!inherits(result, "SingleCellExperiment") & nGene > 0) {
                     -          try({result <- withr::with_seed(seed, scds::cxds_bcds_hybrid(sce = sceSample,
                     -                                                                       cxdsArgs=c(list(ntop = nGene), cxdsArgs),
                     -                                                                       bcdsArgs=c(list(ntop = nGene), bcdsArgs),
                     +          try({result <- withr::with_seed(seed, scds::cxds_bcds_hybrid(sce = sceSample,
                     +                                                                       cxdsArgs=c(list(ntop = nGene), cxdsArgs),
                     +                                                                       bcdsArgs=c(list(ntop = nGene), bcdsArgs),
                                                                                             verb = verb,
                                                                                             estNdbl = estNdbl,
                                                                                             force = force))}, silent = TRUE)
                                nGene <- nGene - 100
                     -        }
                     +        }
                              if (!inherits(result, "try-error") & !is.null(result)) {
                                if ("hybrid_call" %in% colnames(SummarizedExperiment::colData(result))) {
@@ -329,12 +329,12 @@ runCxdsBcdsHybrid <- function(inSCE,
                              } else {
                                output[sceSampleInd, ] <- NA
                                warning(paste0("'cxds_bcds_hybrid' from package 'scds' did not complete successfully for sample", samples[i]))
                     -        }
                     +        }
+                         }
                          colnames(output) <- paste0("scds_", colnames(output))
                          colData(inSCE) = cbind(colData(inSCE), output)
+                    -
+                    +
                          inSCE@metadata$runCxdsBcdsHybrid <- argsList[-1]
                          inSCE@metadata$runCxdsBcdsHybrid$packageVersion <- utils::packageDescription("scds")$Version

R/scran_doubletCells.R

History View file @ c06bc73b

@@ -88,7 +88,7 @@
                      #' @seealso \link[scran]{doubletCells}
                      #' @examples
                      #' data(scExample, package = "singleCellTK")
                     -#' sce <- sce[, colData(sce)$type != 'EmptyDroplet']
                     +#' sce <- subsetSCECols(sce, colData = "type != 'EmptyDroplet'")
                      #' sce <- runDoubletCells(sce)
                      #' @export
                      #' @importFrom SummarizedExperiment colData colData<-

R/scrublet_doubletDetection.R

History View file @ c06bc73b

@@ -1,231 +1,231 @@
                     -#' @title Find doublets using \code{scrublet}.
                     -#' @description A wrapper function that calls \code{scrub_doublets} from python
                     -#'  module \code{scrublet}. Simulates doublets from the observed data and uses
                     -#'  a k-nearest-neighbor classifier to calculate a continuous
                     -#'  \code{scrublet_score} (between 0 and 1) for each transcriptome. The score
                     -#'  is automatically thresholded to generate \code{scrublet_call}, a boolean
                     -#'  array that is \code{TRUE} for predicted doublets and \code{FALSE}
                     -#'  otherwise.
                     -#' @param inSCE A \link[SingleCellExperiment]{SingleCellExperiment} object.
                     -#'  Needs \code{counts} in assays slot.
                     -#' @param sample Character vector. Indicates which sample each cell belongs to.
                     -#'  Scrublet will be run on cells from each sample separately. If NULL, then
                     -#'  all cells will be processed together. Default \code{NULL}.
                     -#' @param useAssay  A string specifying which assay in the SCE to use. Default
                     -#'  'counts'.
                     -#' @param simDoubletRatio Numeric. Number of doublets to simulate relative to
                     -#'  the number of observed transcriptomes. Default 2.0.
                     -#' @param nNeighbors Integer. Number of neighbors used to construct the KNN
                     -#'  graph of observed transcriptomes and simulated doublets. If \code{NULL},
                     -#'  this is set to \code{round(0.5 * sqrt(n_cells))}. Default \code{NULL}.
                     -#' @param minDist Float Determines how tightly UMAP packs points together. If \code{NULL},
                     -#'  this is set to 0.1. Default \code{NULL}.
                     -#' @param expectedDoubletRate The estimated doublet rate for the experiment.
                     -#'  Default 0.1.
                     -#' @param stdevDoubletRate Uncertainty in the expected doublet rate.
                     -#'  Default 0.02.
                     -#' @param syntheticDoubletUmiSubsampling Numeric. Rate for sampling UMIs
                     -#'  when creating synthetic doublets. If 1.0, each doublet is created by simply
                     -#'  adding the UMIs from two randomly sampled observed transcriptomes. For
                     -#'  values less than 1, the UMI counts are added and then randomly sampled at
                     -#'  the specified rate. Defuault: 1.0.
                     -#' @param useApproxNeighbors Boolean. Use approximate nearest neighbor method
                     -#'  (\code{annoy}) for the KNN classifier. Default \code{TRUE}.
                     -#' @param distanceMetric Character. Distance metric used when finding nearest
                     -#'  neighbors.
                     -#'  For list of valid values, see the documentation for \code{annoy} (if
                     -#'  \code{useApproxNeighbors} is \code{TRUE}) or
                     -#'  \code{sklearn.neighbors.NearestNeighbors} (if \code{useApproxNeighbors} is
                     -#'  \code{FALSE}). Default "euclidean".
                     -#' @param getDoubletNeighborParents Boolean. If \code{TRUE}, return the
                     -#'  parent transcriptomes that generated the doublet neighbors of each
                     -#'  observed transcriptome. This information can be used to infer the cell
                     -#'  states that generated a given doublet state. Default \code{FALSE}.
                     -#' @param minCounts Numeric. Used for gene filtering prior to PCA. Genes
                     -#'  expressed at fewer than \code{minCounts} in fewer than \code{minCells}
                     -#'  (see below) are excluded. Default 3.
                     -#' @param minCells Integer. Used for gene filtering prior to PCA. Genes
                     -#'  expressed at fewer than \code{minCounts} (see above) in fewer than
                     -#'  \code{minCells} are excluded. Default 3.
                     -#' @param minGeneVariabilityPctl Numeric. Used for gene filtering prior to
                     -#'  PCA. Keep the most highly variable genes (in the top
                     -#'  minGeneVariabilityPctl percentile), as measured by the v-statistic
                     -#'  (\emph{Klein et al., Cell 2015}). Default 85.
                     -#' @param logTransform Boolean. If \code{TRUE}, log-transform the counts matrix
                     -#'  (log10(1+TPM)). \code{sklearn.decomposition.TruncatedSVD} will be used for
                     -#'  dimensionality reduction, unless \code{meanCenter} is \code{TRUE}.
                     -#'  Default \code{FALSE}.
                     -#' @param meanCenter If \code{TRUE}, center the data such that each gene has a
                     -#'  mean of 0. \code{sklearn.decomposition.PCA} will be used for
                     -#'  dimensionality reduction. Default \code{TRUE}.
                     -#' @param normalizeVariance Boolean. If \code{TRUE}, normalize the data such
                     -#'  that each gene has a variance of 1.
                     -#'  \code{sklearn.decomposition.TruncatedSVD} will be used for dimensionality
                     -#'  reduction, unless \code{meanCenter} is \code{TRUE}. Default \code{TRUE}.
                     -#' @param nPrinComps Integer. Number of principal components used to embed
                     -#'  the transcriptomes prior to k-nearest-neighbor graph construction.
                     -#'  Default 30.
                     -#' @param tsneAngle Float. Determines angular size of a distant node as measured
                     -#'  from a point in the t-SNE plot. If default, it is set to 0.5 Default \code{NULL}.
                     -#' @param tsnePerplexity Integer. The number of nearest neighbors that
                     -#'  is used in other manifold learning algorithms.
                     -#'  If default, it is set to 30. Default \code{NULL}.
                     -#' @param verbose Boolean. If \code{TRUE}, print progress updates. Default
                     -#'  \code{TRUE}.
                     -#' @param seed Seed for the random number generator. Default 12345.
                     -#' @return A \link[SingleCellExperiment]{SingleCellExperiment} object with
                     -#'  \code{scrub_doublets} output appended to the
                     -#'  \link[SummarizedExperiment]{colData} slot. The columns include
                     -#'  \emph{scrublet_score} and \emph{scrublet_call}.
                     -#' @examples
                     -#' data(scExample, package = "singleCellTK")
                     -#' sce <- sce[, colData(sce)$type != 'EmptyDroplet']
                     -#' sce <- runScrublet(sce)
                     -#' @export
                     -#' @importFrom reticulate py_module_available py_set_seed import
                     -#' @importFrom SummarizedExperiment colData colData<-
                     -#' @importFrom SingleCellExperiment reducedDim
                     -runScrublet <- function(inSCE,
                     -  sample = NULL,
                     -  useAssay = "counts",
                     -  simDoubletRatio = 2.0,
                     -  nNeighbors = NULL,
                     -  minDist = NULL,
                     -  expectedDoubletRate = 0.1,
                     -  stdevDoubletRate = 0.02,
                     -  syntheticDoubletUmiSubsampling = 1.0,
                     -  useApproxNeighbors = TRUE,
                     -  distanceMetric = "euclidean",
                     -  getDoubletNeighborParents = FALSE,
                     -  minCounts = 3,
                     -  minCells = 3L,
                     -  minGeneVariabilityPctl = 85,
                     -  logTransform = FALSE,
                     -  meanCenter = TRUE,
                     -  normalizeVariance = TRUE,
                     -  nPrinComps = 30L,
                     -  tsneAngle = NULL,
                     -  tsnePerplexity = NULL,
                     -  verbose = TRUE,
                     -  seed = 12345) {
+                    -
                     -  if (!reticulate::py_module_available(module = "scrublet")) {
                     -    warning("Cannot find python module 'scrublet', please install Conda and",
                     -      " run sctkPythonInstallConda() or run sctkPythonInstallVirtualEnv().",
                     -      "If one of these have been previously run to install the modules,",
                     -      "make sure to run selectSCTKConda() or selectSCTKVirtualEnvironment(),",
                     -      " respectively, if R has been restarted since the module installation.",
                     -      " Alternatively, Scrublet can be installed on the local machine",
                     -      "with pip (e.g. pip install scrublet) and then the 'use_python()'",
                     -      " function from the 'reticulate' package can be used to select the",
                     -      " correct Python environment.")
                     -    return(inSCE)
                     -  }
+                    -
                     -  if (!is.null(seed)) {
                     -    reticulate::py_set_seed(seed = seed)
                     -  }
+                    -
                     -  if (!is.null(sample)) {
                     -    if (length(sample) != ncol(inSCE)) {
                     -      stop("'sample' must be the same length as the number of",
                     -        " columns in 'inSCE'")
                     -    }
                     -  } else {
                     -    sample = rep(1, ncol(inSCE))
                     -  }
+                    -
                     -  message(paste0(date(), " ... Running 'scrublet'"))
+                    -
                     -  ##  Getting current arguments values
                     -  #argsList <- as.list(formals(fun = sys.function(sys.parent()), envir = parent.frame()))
                     -  argsList <- mget(names(formals()),sys.frame(sys.nframe()))
+                    -
                     -  ## Define result matrix for all samples
                     -  output <- S4Vectors::DataFrame(row.names = colnames(inSCE),
                     -    scrublet_score = numeric(ncol(inSCE)),
                     -    scrublet_call = logical(ncol(inSCE)))
+                    -
                     -  ## Loop through each sample and run scrublet
                     -  error <- try({
                     -    samples <- unique(sample)
                     -    umapDims <- matrix(ncol = 2,
                     -                       nrow = ncol(inSCE))
                     -    rownames(umapDims) = colnames(inSCE)
                     -    colnames(umapDims) = c("UMAP_1", "UMAP_2")
+                    -
                     -    tsneDims <- matrix(ncol = 2,
                     -                       nrow = ncol(inSCE))
                     -    rownames(tsneDims) = colnames(inSCE)
                     -    colnames(tsneDims) = c("TSNE_1", "TSNE_2")
+                    -
                     -    for (i in seq_len(length(samples))) {
                     -      sceSampleInd <- sample == samples[i]
                     -      sceSample <- inSCE[, sceSampleInd]
+                    -
                     -      mat <- SummarizedExperiment::assay(sceSample, i = useAssay)
                     -      mat <- .convertToMatrix(mat)
+                    -
                     -      scr <- scrublet$Scrublet(counts_matrix = t(mat),
                     -        sim_doublet_ratio = simDoubletRatio,
                     -        n_neighbors = nNeighbors,
                     -        expected_doublet_rate = expectedDoubletRate,
                     -        stdev_doublet_rate = stdevDoubletRate)
+                    -
                     -      result <- scr$scrub_doublets(
                     -        synthetic_doublet_umi_subsampling = syntheticDoubletUmiSubsampling,
                     -        use_approx_neighbors = useApproxNeighbors,
                     -        distance_metric = distanceMetric,
                     -        get_doublet_neighbor_parents = getDoubletNeighborParents,
                     -        min_counts = minCounts,
                     -        min_cells = as.integer(minCells),
                     -        min_gene_variability_pctl = minGeneVariabilityPctl,
                     -        log_transform = logTransform,
                     -        mean_center = meanCenter,
                     -        normalize_variance = normalizeVariance,
                     -        n_prin_comps = as.integer(nPrinComps),
                     -        verbose = verbose)
+                    -
                     -      output[sceSampleInd, "scrublet_score"] <- result[[1]]
                     -      output[sceSampleInd, "scrublet_call"] <- result[[2]]
+                    -
                     -      ## Extract UMAP and TSNE coordinates
                     -      if (is.null(nNeighbors) && is.null(minDist)){
                     -        umap_coordinates <- scrublet$get_umap(scr$manifold_obs_)
                     -      }else {
                     -        umap_coordinates <- scrublet$get_umap(scr$manifold_obs_,
                     -                                              n_neighbors=as.integer(nNeighbors),
                     -                                              min_dist=minDist)
                     -      }
                     -      umapDims[sceSampleInd, ] <- umap_coordinates
+                    -
                     -    if (is.null(tsneAngle) && is.null(tsnePerplexity)){
                     -      tsne_coordinates <- scrublet$get_tsne(scr$manifold_obs_)
                     -    }else {
                     -      tsne_coordinates <- scrublet$get_tsne(scr$manifold_obs_,
                     -                                            angle=tsneAngle,
                     -                                            perplexity=as.integer(tsnePerplexity))
                     -    }
                     -    tsneDims[sceSampleInd, ] <- tsne_coordinates
+                    -
                     -  }
+                    -
                     -    colData(inSCE) = cbind(colData(inSCE), output)
                     -  }, silent = TRUE)
+                    -
                     -  if (inherits(error, "try-error")) {
                     -    warning("Scrublet did not complete successfully. Returning SCE without",
                     -      " making any changes. Error given by Scrublet: \n\n", error)
                     -  }
+                    -
                     -  inSCE@metadata$runScrublet <- argsList[-1]
+                    -
                     -  ## add scrublet version to metadata
                     -  version <- pkg_resources$require("scrublet")[[1]]
                     -  inSCE@metadata$scrublet$packageVersion <- version
                     -  reducedDim(inSCE,'scrublet_TSNE') <- tsneDims
                     -  reducedDim(inSCE,'scrublet_UMAP') <- umapDims
+                    -
                     -  return(inSCE)
                     -}
+                    -
                     +#' @title Find doublets using \code{scrublet}.
                     +#' @description A wrapper function that calls \code{scrub_doublets} from python
                     +#'  module \code{scrublet}. Simulates doublets from the observed data and uses
                     +#'  a k-nearest-neighbor classifier to calculate a continuous
                     +#'  \code{scrublet_score} (between 0 and 1) for each transcriptome. The score
                     +#'  is automatically thresholded to generate \code{scrublet_call}, a boolean
                     +#'  array that is \code{TRUE} for predicted doublets and \code{FALSE}
                     +#'  otherwise.
                     +#' @param inSCE A \link[SingleCellExperiment]{SingleCellExperiment} object.
                     +#'  Needs \code{counts} in assays slot.
                     +#' @param sample Character vector. Indicates which sample each cell belongs to.
                     +#'  Scrublet will be run on cells from each sample separately. If NULL, then
                     +#'  all cells will be processed together. Default \code{NULL}.
                     +#' @param useAssay  A string specifying which assay in the SCE to use. Default
                     +#'  'counts'.
                     +#' @param simDoubletRatio Numeric. Number of doublets to simulate relative to
                     +#'  the number of observed transcriptomes. Default 2.0.
                     +#' @param nNeighbors Integer. Number of neighbors used to construct the KNN
                     +#'  graph of observed transcriptomes and simulated doublets. If \code{NULL},
                     +#'  this is set to \code{round(0.5 * sqrt(n_cells))}. Default \code{NULL}.
                     +#' @param minDist Float. Determines how tightly UMAP packs points together. If \code{NULL},
                     +#'  this is set to 0.1. Default \code{NULL}.
                     +#' @param expectedDoubletRate The estimated doublet rate for the experiment.
                     +#'  Default 0.1.
                     +#' @param stdevDoubletRate Uncertainty in the expected doublet rate.
                     +#'  Default 0.02.
                     +#' @param syntheticDoubletUmiSubsampling Numeric. Rate for sampling UMIs
                     +#'  when creating synthetic doublets. If 1.0, each doublet is created by simply
                     +#'  adding the UMIs from two randomly sampled observed transcriptomes. For
                     +#'  values less than 1, the UMI counts are added and then randomly sampled at
                     +#'  the specified rate. Default: 1.0.
                     +#' @param useApproxNeighbors Boolean. Use approximate nearest neighbor method
                     +#'  (\code{annoy}) for the KNN classifier. Default \code{TRUE}.
                     +#' @param distanceMetric Character. Distance metric used when finding nearest
                     +#'  neighbors.
                     +#'  For list of valid values, see the documentation for \code{annoy} (if
                     +#'  \code{useApproxNeighbors} is \code{TRUE}) or
                     +#'  \code{sklearn.neighbors.NearestNeighbors} (if \code{useApproxNeighbors} is
                     +#'  \code{FALSE}). Default "euclidean".
                     +#' @param getDoubletNeighborParents Boolean. If \code{TRUE}, return the
                     +#'  parent transcriptomes that generated the doublet neighbors of each
                     +#'  observed transcriptome. This information can be used to infer the cell
                     +#'  states that generated a given doublet state. Default \code{FALSE}.
                     +#' @param minCounts Numeric. Used for gene filtering prior to PCA. Genes
                     +#'  expressed at fewer than \code{minCounts} in fewer than \code{minCells}
                     +#'  (see below) are excluded. Default 3.
                     +#' @param minCells Integer. Used for gene filtering prior to PCA. Genes
                     +#'  expressed at fewer than \code{minCounts} (see above) in fewer than
                     +#'  \code{minCells} are excluded. Default 3.
                     +#' @param minGeneVariabilityPctl Numeric. Used for gene filtering prior to
                     +#'  PCA. Keep the most highly variable genes (in the top
                     +#'  minGeneVariabilityPctl percentile), as measured by the v-statistic
                     +#'  (\emph{Klein et al., Cell 2015}). Default 85.
                     +#' @param logTransform Boolean. If \code{TRUE}, log-transform the counts matrix
                     +#'  (log10(1+TPM)). \code{sklearn.decomposition.TruncatedSVD} will be used for
                     +#'  dimensionality reduction, unless \code{meanCenter} is \code{TRUE}.
                     +#'  Default \code{FALSE}.
                     +#' @param meanCenter If \code{TRUE}, center the data such that each gene has a
                     +#'  mean of 0. \code{sklearn.decomposition.PCA} will be used for
                     +#'  dimensionality reduction. Default \code{TRUE}.
                     +#' @param normalizeVariance Boolean. If \code{TRUE}, normalize the data such
                     +#'  that each gene has a variance of 1.
                     +#'  \code{sklearn.decomposition.TruncatedSVD} will be used for dimensionality
                     +#'  reduction, unless \code{meanCenter} is \code{TRUE}. Default \code{TRUE}.
                     +#' @param nPrinComps Integer. Number of principal components used to embed
                     +#'  the transcriptomes prior to k-nearest-neighbor graph construction.
                     +#'  Default 30.
                     +#' @param tsneAngle Float. Determines angular size of a distant node as measured
                     +#'  from a point in the t-SNE plot. If default, it is set to 0.5. Default \code{NULL}.
                     +#' @param tsnePerplexity Integer. The number of nearest neighbors that
                     +#'  is used in other manifold learning algorithms.
                     +#'  If default, it is set to 30. Default \code{NULL}.
                     +#' @param verbose Boolean. If \code{TRUE}, print progress updates. Default
                     +#'  \code{TRUE}.
                     +#' @param seed Seed for the random number generator. Default 12345.
                     +#' @return A \link[SingleCellExperiment]{SingleCellExperiment} object with
                     +#'  \code{scrub_doublets} output appended to the
                     +#'  \link[SummarizedExperiment]{colData} slot. The columns include
                     +#'  \emph{scrublet_score} and \emph{scrublet_call}.
                     +#' @examples
                     +#' data(scExample, package = "singleCellTK")
                     +#' sce <- subsetSCECols(sce, colData = "type != 'EmptyDroplet'")
                     +#' sce <- runScrublet(sce)
                     +#' @export
                     +#' @importFrom reticulate py_module_available py_set_seed import
                     +#' @importFrom SummarizedExperiment colData colData<-
                     +#' @importFrom SingleCellExperiment reducedDim
                     +runScrublet <- function(inSCE,
                     +  sample = NULL,
                     +  useAssay = "counts",
                     +  simDoubletRatio = 2.0,
                     +  nNeighbors = NULL,
                     +  minDist = NULL,
                     +  expectedDoubletRate = 0.1,
                     +  stdevDoubletRate = 0.02,
                     +  syntheticDoubletUmiSubsampling = 1.0,
                     +  useApproxNeighbors = TRUE,
                     +  distanceMetric = "euclidean",
                     +  getDoubletNeighborParents = FALSE,
                     +  minCounts = 3,
                     +  minCells = 3L,
                     +  minGeneVariabilityPctl = 85,
                     +  logTransform = FALSE,
                     +  meanCenter = TRUE,
                     +  normalizeVariance = TRUE,
                     +  nPrinComps = 30L,
                     +  tsneAngle = NULL,
                     +  tsnePerplexity = NULL,
                     +  verbose = TRUE,
                     +  seed = 12345) {
                     +
                     +  ## Scrublet is called through reticulate; if the Python module is not
                     +  ## available, warn and hand the input back untouched.
                     +  if (!reticulate::py_module_available(module = "scrublet")) {
                     +    warning("Cannot find python module 'scrublet', please install Conda and",
                     +      " run sctkPythonInstallConda() or run sctkPythonInstallVirtualEnv().",
                     +      " If one of these have been previously run to install the modules,",
                     +      " make sure to run selectSCTKConda() or selectSCTKVirtualEnvironment(),",
                     +      " respectively, if R has been restarted since the module installation.",
                     +      " Alternatively, Scrublet can be installed on the local machine",
                     +      " with pip (e.g. pip install scrublet) and then the 'use_python()'",
                     +      " function from the 'reticulate' package can be used to select the",
                     +      " correct Python environment.")
                     +    return(inSCE)
                     +  }
                     +
                     +  ## Seed the Python session unless the caller disabled it with NULL
                     +  if (!is.null(seed)) {
                     +    reticulate::py_set_seed(seed = seed)
                     +  }
                     +
                     +  ## Without a 'sample' vector all cells are processed as a single sample
                     +  if (!is.null(sample)) {
                     +    if (length(sample) != ncol(inSCE)) {
                     +      stop("'sample' must be the same length as the number of",
                     +        " columns in 'inSCE'")
                     +    }
                     +  } else {
                     +    sample <- rep(1, ncol(inSCE))
                     +  }
                     +
                     +  message(paste0(date(), " ... Running 'scrublet'"))
                     +
                     +  ## Snapshot of the current argument values; stored in the metadata below
                     +  argsList <- mget(names(formals()),sys.frame(sys.nframe()))
                     +
                     +  ## Optional arguments are forwarded to Python only when the caller set
                     +  ## them. Supplying just one of a pair (e.g. only 'minDist') therefore
                     +  ## keeps the Python-side default for the other instead of sending an
                     +  ## empty value. 'nNeighbors' is coerced so an R double is not handed
                     +  ## over as a Python float.
                     +  nNeighborsInt <- if (is.null(nNeighbors)) NULL else as.integer(nNeighbors)
                     +  umapArgs <- list()
                     +  if (!is.null(nNeighborsInt)) {
                     +    umapArgs$n_neighbors <- nNeighborsInt
                     +  }
                     +  if (!is.null(minDist)) {
                     +    umapArgs$min_dist <- minDist
                     +  }
                     +  tsneArgs <- list()
                     +  if (!is.null(tsneAngle)) {
                     +    tsneArgs$angle <- tsneAngle
                     +  }
                     +  if (!is.null(tsnePerplexity)) {
                     +    tsneArgs$perplexity <- as.integer(tsnePerplexity)
                     +  }
                     +
                     +  ## Define result matrix for all samples
                     +  output <- S4Vectors::DataFrame(row.names = colnames(inSCE),
                     +    scrublet_score = numeric(ncol(inSCE)),
                     +    scrublet_call = logical(ncol(inSCE)))
                     +
                     +  ## Loop through each sample and run scrublet. Everything that can fail
                     +  ## on the Python side lives inside try(); 'inSCE' is only modified by
                     +  ## the last statement of the block.
                     +  error <- try({
                     +    samples <- unique(sample)
                     +
                     +    ## One row per cell; rows are filled in sample by sample
                     +    umapDims <- matrix(nrow = ncol(inSCE), ncol = 2,
                     +      dimnames = list(colnames(inSCE), c("UMAP_1", "UMAP_2")))
                     +    tsneDims <- matrix(nrow = ncol(inSCE), ncol = 2,
                     +      dimnames = list(colnames(inSCE), c("TSNE_1", "TSNE_2")))
                     +
                     +    for (i in seq_along(samples)) {
                     +      sceSampleInd <- sample == samples[i]
                     +      sceSample <- inSCE[, sceSampleInd]
                     +
                     +      mat <- SummarizedExperiment::assay(sceSample, i = useAssay)
                     +      mat <- .convertToMatrix(mat)
                     +
                     +      ## The assay is transposed before it is passed as 'counts_matrix'
                     +      scr <- scrublet$Scrublet(counts_matrix = t(mat),
                     +        sim_doublet_ratio = simDoubletRatio,
                     +        n_neighbors = nNeighborsInt,
                     +        expected_doublet_rate = expectedDoubletRate,
                     +        stdev_doublet_rate = stdevDoubletRate)
                     +
                     +      result <- scr$scrub_doublets(
                     +        synthetic_doublet_umi_subsampling = syntheticDoubletUmiSubsampling,
                     +        use_approx_neighbors = useApproxNeighbors,
                     +        distance_metric = distanceMetric,
                     +        get_doublet_neighbor_parents = getDoubletNeighborParents,
                     +        min_counts = minCounts,
                     +        min_cells = as.integer(minCells),
                     +        min_gene_variability_pctl = minGeneVariabilityPctl,
                     +        log_transform = logTransform,
                     +        mean_center = meanCenter,
                     +        normalize_variance = normalizeVariance,
                     +        n_prin_comps = as.integer(nPrinComps),
                     +        verbose = verbose)
                     +
                     +      ## First element is stored as the score, second as the call
                     +      output[sceSampleInd, "scrublet_score"] <- result[[1]]
                     +      output[sceSampleInd, "scrublet_call"] <- result[[2]]
                     +
                     +      ## Extract UMAP and TSNE coordinates
                     +      umapDims[sceSampleInd, ] <- do.call(scrublet$get_umap,
                     +        c(list(scr$manifold_obs_), umapArgs))
                     +      tsneDims[sceSampleInd, ] <- do.call(scrublet$get_tsne,
                     +        c(list(scr$manifold_obs_), tsneArgs))
                     +    }
                     +
                     +    colData(inSCE) <- cbind(colData(inSCE), output)
                     +  }, silent = TRUE)
                     +
                     +  ## Honour the message: on failure return the input without attaching
                     +  ## metadata or partially filled embeddings.
                     +  if (inherits(error, "try-error")) {
                     +    warning("Scrublet did not complete successfully. Returning SCE without",
                     +      " making any changes. Error given by Scrublet: \n\n", error)
                     +    return(inSCE)
                     +  }
                     +
                     +  ## The first formal ('inSCE') is dropped from the stored arguments
                     +  inSCE@metadata$runScrublet <- argsList[-1]
                     +
                     +  ## add scrublet version to metadata
                     +  version <- pkg_resources$require("scrublet")[[1]]
                     +  inSCE@metadata$scrublet$packageVersion <- version
                     +  reducedDim(inSCE,'scrublet_TSNE') <- tsneDims
                     +  reducedDim(inSCE,'scrublet_UMAP') <- umapDims
                     +
                     +  return(inSCE)
                     +}
+                    +

man/getUMAP.Rd

History View file @ c06bc73b

@@ -73,7 +73,7 @@ dimension reduction.
+                     }
                      \examples{
                      data(scExample, package = "singleCellTK")
                     -sce <- sce[, colData(sce)$type != 'EmptyDroplet']
                     +sce <- subsetSCECols(sce, colData = "type != 'EmptyDroplet'")
                      umap_res <- getUMAP(inSCE = sce, useAssay = "counts",
                                          reducedDimName = "UMAP", logNorm = TRUE,
                                          nNeighbors = 30, alpha = 1,

man/plotSCEHeatmap.Rd

History View file @ c06bc73b

@@ -141,7 +141,7 @@ Plot heatmap of using data stored in SingleCellExperiment Object
 }
 \examples{
 data(scExample, package = "singleCellTK")
-plotSCEHeatmap(sce[1:3,1:3])
+plotSCEHeatmap(sce[1:3,1:3], useAssay = "counts")
 }
 \author{
 Yichen Wang

man/plotUMAP.Rd

History View file @ c06bc73b

@@ -37,7 +37,7 @@ Plot UMAP results either on already run results or run first and then plot.
+                     }
                      \examples{
                      data(scExample, package = "singleCellTK")
                     -sce <- sce[, colData(sce)$type != 'EmptyDroplet']
                     +sce <- subsetSCECols(sce, colData = "type != 'EmptyDroplet'")
                      sce <- getUMAP(inSCE = sce, useAssay = "counts", reducedDimName = "UMAP")
                      plotUMAP(sce, shape = "No Shape", reducedDimName = "UMAP",
                               runUMAP = TRUE, useAssay = "counts")

man/reportCellQC.Rd

History View file @ c06bc73b

@@ -32,7 +32,7 @@ A  function to generate .html Rmarkdown report containing the visualizations of
+                     }
                      \examples{
                      data(scExample, package = "singleCellTK")
                     -sce <- sce[, colData(sce)$type != 'EmptyDroplet']
                     +sce <- subsetSCECols(sce, colData = "type != 'EmptyDroplet'")
                      \dontrun{
                      sce <- runCellQC(sce)
                      reportCellQC(inSCE = sce)

man/reportDiffExp.Rd

History View file @ c06bc73b

@@ -28,10 +28,3 @@ Default \code{NULL}.}
                      A  function to generate .html Rmarkdown report containing the
                      visualizations of the \code{\link{runDEAnalysis}} function output
+                     }
                     -\examples{
                     -data(scExample, package = "singleCellTK")
                     -sce <- sce[, colData(sce)$type != 'EmptyDroplet']
                     -sce <- runDEAnalysis(inSCE = sce, groupName1 = "Sample1", method = "DESeq2",
                     - groupName2 = "Sample2", index1 = 1:20, index2 = 21:40, analysisName = "DESeq2")
                     -reportDiffExp(sce, study = "DESeq2", output_file = "DESeq2_res")
                     -}

man/reportQCTool.Rd

History View file @ c06bc73b

@@ -32,7 +32,7 @@ A  function to generate .html Rmarkdown report for the specified QC algorithm ou
+                     }
                      \examples{
                      data(scExample, package = "singleCellTK")
                     -sce <- sce[, colData(sce)$type != 'EmptyDroplet']
                     +sce <- subsetSCECols(sce, colData = "type != 'EmptyDroplet'")
                      \donttest{
                      sce <- runDecontX(sce)
                      sce <- getUMAP(sce)

man/runANOVA.Rd

History View file @ c06bc73b

@@ -94,7 +94,7 @@ only.
+                     }
                      \examples{
                      data(scExample, package = "singleCellTK")
                     -sce <- sce[, colData(sce)$type != 'EmptyDroplet']
                     +sce <- subsetSCECols(sce, colData = "type != 'EmptyDroplet'")
                      sce@assays@data$logcounts <- log10(counts(sce) + 1)
                      sce <- runANOVA(inSCE = sce, groupName1 = "Sample1",
                       groupName2 = "Sample2", index1 = 1:20, index2 = 21:40,

man/runBcds.Rd

History View file @ c06bc73b

@@ -60,6 +60,6 @@ A wrapper function for \link[scds]{bcds}. Annotate
 }
 \examples{
 data(scExample, package = "singleCellTK")
-sce <- sce[, colData(sce)$type != 'EmptyDroplet']
+sce <- subsetSCECols(sce, colData = "type != 'EmptyDroplet'")
 sce <- runBcds(sce)
 }

man/runCxds.Rd

History View file @ c06bc73b

@@ -53,6 +53,6 @@ A wrapper function for \link[scds]{cxds}. Annotate
 }
 \examples{
 data(scExample, package = "singleCellTK")
-sce <- sce[, colData(sce)$type != 'EmptyDroplet']
+sce <- subsetSCECols(sce, colData = "type != 'EmptyDroplet'")
 sce <- runCxds(sce)
 }

man/runCxdsBcdsHybrid.Rd

History View file @ c06bc73b

@@ -59,6 +59,6 @@ A wrapper function for \link[scds]{cxds_bcds_hybrid}. Annotate
 }
 \examples{
 data(scExample, package = "singleCellTK")
-sce <- sce[, colData(sce)$type != 'EmptyDroplet']
+sce <- subsetSCECols(sce, colData = "type != 'EmptyDroplet'")
 sce <- runCxdsBcdsHybrid(sce)
 }

man/runDEAnalysis.Rd

History View file @ c06bc73b

@@ -26,7 +26,7 @@ Method supported: 'MAST', 'DESeq2', 'Limma', 'ANOVA'
 }
 \examples{
 data(scExample, package = "singleCellTK")
-sce <- sce[, colData(sce)$type != 'EmptyDroplet']
+sce <- subsetSCECols(sce, colData = "type != 'EmptyDroplet'")
 sce <- runDEAnalysis(inSCE = sce, groupName1 = "Sample1", method = "DESeq2",
  groupName2 = "Sample2", index1 = 1:20, index2 = 21:40, analysisName = "DESeq2")
 }

man/runDESeq2.Rd

History View file @ c06bc73b

@@ -94,7 +94,7 @@ used.
+                     }
                      \examples{
                      data(scExample, package = "singleCellTK")
                     -sce <- sce[, colData(sce)$type != 'EmptyDroplet']
                     +sce <- subsetSCECols(sce, colData = "type != 'EmptyDroplet'")
                      sce <- runDESeq2(inSCE = sce, groupName1 = "Sample1",
                       groupName2 = "Sample2", index1 = 1:20, index2 = 21:40, analysisName = "DESeq2")

man/runDecontX.Rd

History View file @ c06bc73b

@@ -96,6 +96,6 @@ A wrapper function for \link[celda]{decontX}. Identify
 }
 \examples{
 data(scExample, package = "singleCellTK")
-sce <- sce[, colData(sce)$type != 'EmptyDroplet']
+sce <- subsetSCECols(sce, colData = "type != 'EmptyDroplet'")
 sce <- runDecontX(sce)
 }

man/runDoubletCells.Rd

History View file @ c06bc73b

@@ -93,7 +93,7 @@ This function is a wrapper function for \link[scran]{doubletCells}.
 }
 \examples{
 data(scExample, package = "singleCellTK")
-sce <- sce[, colData(sce)$type != 'EmptyDroplet']
+sce <- subsetSCECols(sce, colData = "type != 'EmptyDroplet'")
 sce <- runDoubletCells(sce)
 }
 \references{

man/runDoubletFinder.Rd

History View file @ c06bc73b

@@ -54,6 +54,6 @@ Uses doubletFinder to determine cells within the dataset
 }
 \examples{
 data(scExample, package = "singleCellTK")
-sce <- sce[, colData(sce)$type != 'EmptyDroplet']
+sce <- subsetSCECols(sce, colData = "type != 'EmptyDroplet'")
 sce <- runDoubletFinder(sce)
 }

man/runLimmaDE.Rd

History View file @ c06bc73b

@@ -90,7 +90,7 @@ used.
+                     }
                      \examples{
                      data(scExample, package = "singleCellTK")
                     -sce <- sce[, colData(sce)$type != 'EmptyDroplet']
                     +sce <- subsetSCECols(sce, colData = "type != 'EmptyDroplet'")
                      sce@assays@data$logcounts <- log10(counts(sce) + 1)
                      sce <- runLimmaDE(inSCE = sce, groupName1 = "Sample1",
                       groupName2 = "Sample2", index1 = 1:20, index2 = 21:40, analysisName = "Limma")

man/runMAST.Rd

History View file @ c06bc73b

@@ -90,7 +90,7 @@ used.
+                     }
                      \examples{
                      data(scExample, package = "singleCellTK")
                     -sce <- sce[, colData(sce)$type != 'EmptyDroplet']
                     +sce <- subsetSCECols(sce, colData = "type != 'EmptyDroplet'")
                      sce@assays@data$logcounts <- log10(counts(sce) + 1)
                      sce <- runMAST(inSCE = sce, groupName1 = "Sample1",
                       groupName2 = "Sample2", index1 = 1:20, index2 = 21:40, analysisName = "MAST")

man/runScrublet.Rd

History View file @ c06bc73b

@@ -138,6 +138,6 @@ A wrapper function that calls \code{scrub_doublets} from python
 }
 \examples{
 data(scExample, package = "singleCellTK")
-sce <- sce[, colData(sce)$type != 'EmptyDroplet']
+sce <- subsetSCECols(sce, colData = "type != 'EmptyDroplet'")
 sce <- runScrublet(sce)
 }

man/sampleSummaryStats.Rd

History View file @ c06bc73b

@@ -24,6 +24,6 @@ Plot QC metrics generated from QC algorithms via either kable or csv file.
 }
 \examples{
 data(scExample, package = "singleCellTK")
-sce <- sce[, colData(sce)$type != 'EmptyDroplet']
+sce <- subsetSCECols(sce, colData = "type != 'EmptyDroplet'")
 sampleSummaryStats(sce, simple = TRUE)
 }

tests/testthat/test-decontX.R

History View file @ c06bc73b

@@ -2,7 +2,7 @@
                      library(singleCellTK)
                      context("Testing decontamination algorithms")
                      data(scExample, package = "singleCellTK")
                     -sce <- sce[, colData(sce)$type != 'EmptyDroplet']
                     +sce <- subsetSCECols(sce, colData = "type != 'EmptyDroplet'")
                      test_that(desc = "Testing runDecontX", {
                              sceres <- runDecontX(sce)

tests/testthat/test-mergeColData.R

History View file @ c06bc73b

@@ -3,16 +3,16 @@ context("Testing mergeSCColData")
                      data(scExample, package = "singleCellTK")
                     -sce <- sce[, colData(sce)$type != 'EmptyDroplet']
                     +sce <- subsetSCECols(sce, colData = "type != 'EmptyDroplet'")
                      colData(sce)$column_name = rownames(colData(sce))
                      test_that(desc = "Testing mergeSCEColData", {
                          sce2 <- sce
                          colData(sce2)$test <- 0
+                    -
+                    +
                          #test again
                          mergedsce <- mergeSCEColData(sce, sce2)
+                    -
+                    +
                          expect_equal(ncol(colData(sce)) + 1, ncol(colData(mergedsce)))
                      })

tests/testthat/test-misc.R

History View file @ c06bc73b

@@ -1,7 +1,7 @@
                      context("misc functions")
                      data(scExample, package = "singleCellTK")
                     -sce <- sce[, colData(sce)$type != 'EmptyDroplet']
                     +sce <- subsetSCECols(sce, colData = "type != 'EmptyDroplet'")
                      test_that("summarizeSCE", {
                        ta <- summarizeSCE(sce, sample = NULL)

tests/testthat/test-qc.R

History View file @ c06bc73b

@@ -3,7 +3,7 @@ library(singleCellTK)
                      context("Testing dimensionality reduction algorithms")
                      data(scExample, package = "singleCellTK")
                      sceDroplet <- sce
                     -sce <- sce[, colData(sce)$type != 'EmptyDroplet']
                     +sce <- subsetSCECols(sce, colData = "type != 'EmptyDroplet'")
                      sampleVector <- c(rep("Sample1", 100), rep("Sample2", 95))
                      sceres <- getUMAP(inSCE = sce, useAssay = "counts", logNorm = TRUE, sample = sampleVector, nNeighbors = 10, reducedDimName = "UMAP",
                                      nIterations = 20, alpha = 1, minDist = 0.01, pca = TRUE, initialDims = 20)

...	...	@@ -141,7 +141,7 @@ Plot heatmap of using data stored in SingleCellExperiment Object
141	141	}
142	142	\examples{
143	143	data(scExample, package = "singleCellTK")
144		-plotSCEHeatmap(sce[1:3,1:3])
	144	+plotSCEHeatmap(sce[1:3,1:3], useAssay = "counts")
145	145	}
146	146	\author{
147	147	Yichen Wang

...	...	@@ -60,6 +60,6 @@ A wrapper function for \link[scds]{bcds}. Annotate
60	60	}
61	61	\examples{
62	62	data(scExample, package = "singleCellTK")
63		-sce <- sce[, colData(sce)$type != 'EmptyDroplet']
	63	+sce <- subsetSCECols(sce, colData = "type != 'EmptyDroplet'")
64	64	sce <- runBcds(sce)
65	65	}

...	...	@@ -53,6 +53,6 @@ A wrapper function for \link[scds]{cxds}. Annotate
53	53	}
54	54	\examples{
55	55	data(scExample, package = "singleCellTK")
56		-sce <- sce[, colData(sce)$type != 'EmptyDroplet']
	56	+sce <- subsetSCECols(sce, colData = "type != 'EmptyDroplet'")
57	57	sce <- runCxds(sce)
58	58	}

...	...	@@ -59,6 +59,6 @@ A wrapper function for \link[scds]{cxds_bcds_hybrid}. Annotate
59	59	}
60	60	\examples{
61	61	data(scExample, package = "singleCellTK")
62		-sce <- sce[, colData(sce)$type != 'EmptyDroplet']
	62	+sce <- subsetSCECols(sce, colData = "type != 'EmptyDroplet'")
63	63	sce <- runCxdsBcdsHybrid(sce)
64	64	}

...	...	@@ -26,7 +26,7 @@ Method supported: 'MAST', 'DESeq2', 'Limma', 'ANOVA'
26	26	}
27	27	\examples{
28	28	data(scExample, package = "singleCellTK")
29		-sce <- sce[, colData(sce)$type != 'EmptyDroplet']
	29	+sce <- subsetSCECols(sce, colData = "type != 'EmptyDroplet'")
30	30	sce <- runDEAnalysis(inSCE = sce, groupName1 = "Sample1", method = "DESeq2",
31	31	groupName2 = "Sample2", index1 = 1:20, index2 = 21:40, analysisName = "DESeq2")
32	32	}

...	...	@@ -96,6 +96,6 @@ A wrapper function for \link[celda]{decontX}. Identify
96	96	}
97	97	\examples{
98	98	data(scExample, package = "singleCellTK")
99		-sce <- sce[, colData(sce)$type != 'EmptyDroplet']
	99	+sce <- subsetSCECols(sce, colData = "type != 'EmptyDroplet'")
100	100	sce <- runDecontX(sce)
101	101	}

...	...	@@ -93,7 +93,7 @@ This function is a wrapper function for \link[scran]{doubletCells}.
93	93	}
94	94	\examples{
95	95	data(scExample, package = "singleCellTK")
96		-sce <- sce[, colData(sce)$type != 'EmptyDroplet']
	96	+sce <- subsetSCECols(sce, colData = "type != 'EmptyDroplet'")
97	97	sce <- runDoubletCells(sce)
98	98	}
99	99	\references{

...	...	@@ -54,6 +54,6 @@ Uses doubletFinder to determine cells within the dataset
54	54	}
55	55	\examples{
56	56	data(scExample, package = "singleCellTK")
57		-sce <- sce[, colData(sce)$type != 'EmptyDroplet']
	57	+sce <- subsetSCECols(sce, colData = "type != 'EmptyDroplet'")
58	58	sce <- runDoubletFinder(sce)
59	59	}

...	...	@@ -138,6 +138,6 @@ A wrapper function that calls \code{scrub_doublets} from python
138	138	}
139	139	\examples{
140	140	data(scExample, package = "singleCellTK")
141		-sce <- sce[, colData(sce)$type != 'EmptyDroplet']
	141	+sce <- subsetSCECols(sce, colData = "type != 'EmptyDroplet'")
142	142	sce <- runScrublet(sce)
143	143	}

...	...	@@ -24,6 +24,6 @@ Plot QC metrics generated from QC algorithms via either kable or csv file.
24	24	}
25	25	\examples{
26	26	data(scExample, package = "singleCellTK")
27		-sce <- sce[, colData(sce)$type != 'EmptyDroplet']
	27	+sce <- subsetSCECols(sce, colData = "type != 'EmptyDroplet'")
28	28	sampleSummaryStats(sce, simple = TRUE)
29	29	}