Bioconductor Code: TDbasedUFEadv

Browse code

Modification due to the usage of RTCGA.clinical

tagtag authored on 16/02/2023 06:54:26
Showing 9 changed files

DESCRIPTION index 0d5f497..458e0a0 100644
NAMESPACE index 3802af2..c27c394 100644
R/prepareCondTCGA.R index 0000000..8c68d74
man/prepareCondTCGA.Rd index 0000000..d484e2f
vignettes/Enrichment.Rmd index 1658d53..c346500 100644
vignettes/QuickStart.Rmd index 3941cfe..5169555 100644
vignettes/QuickStart2.Rmd index e82c637..04b3b13 100644
vignettes/fig21.jpg index 83cb710..01cb38f 100644
vignettes/fig22.jpg index 6b918bf..1b2c366 100644

History View file @ 70f2697

@@ -38,7 +38,7 @@ Imports:
                          RITAN,
                          STRINGdb,
                          enrichR
                     -RoxygenNote: 7.2.0
                     +RoxygenNote: 7.2.3
                      Suggests:
                          knitr,
                          rmarkdown,

NAMESPACE

History View file @ 70f2697

@@ -3,6 +3,7 @@
                      export(PrepareSummarizedExperimentTensorRect)
                      export(computeSVD)
                      export(prepareCondDrugandDisease)
                     +export(prepareCondTCGA)
                      export(prepareTensorfromList)
                      export(prepareTensorfromMatrix)
                      export(prepareexpDrugandDisease)

R/prepareCondTCGA.R

History View file @ 70f2697

                     new file mode 100644
@@ -0,0 +1,33 @@
                     +#' Prepare sample labels for TCGA data
                     +#'
                     +#' Matches the lowercased first 12 characters of each sample id against
                     +#' column j[i] of Clinical[[i]] and returns column k[i] of the matched rows.
                     +#'
                     +#' @param Multi_sample List of tables whose first column holds sample ids
                     +#' @param Clinical List of clinical data tables from RTCGA.clinical
                     +#' @param k Column numbers in the clinical data used for conditions
                     +#' @param j Column numbers in the clinical data that hold the sample ids
                     +#' @return List of sample labels, one element per element of Multi_sample
                     +#' @export
                     +#' @examples
                     +#' require(RTCGA.clinical)
                     +#' require(RTCGA.rnaseq)
                     +#' Clinical <- list(BLCA.clinical,BRCA.clinical,CESC.clinical,COAD.clinical)
                     +#' Multi_sample <- list(BLCA.rnaseq[seq_len(100),1,drop=F],
                     +#'                     BRCA.rnaseq[seq_len(100),1,drop=F],
                     +#'                     CESC.rnaseq[seq_len(100),1,drop=F],
                     +#'                     COAD.rnaseq[seq_len(100),1,drop=F])
                     +#' k <- c(770,1482,773,791)
                     +#' j <- c(20,20,12,14)
                     +#' cond <- prepareCondTCGA(Multi_sample,Clinical,k,j)
                     +prepareCondTCGA <- function(Multi_sample,Clinical,k,j)
                     +{
                     +    Cond <- rep(list(NA),length(Multi_sample))
                     +    for (i in seq_len(length(Multi_sample)))
                     +    {
                     +        index <- match(tolower(substring(Multi_sample[[i]][,1],1,12)),
                     +                       Clinical[[i]][,j[i]])
                     +        Cond[[i]]<- Clinical[[i]][index,k[i]]
                     +    }
                     +    return(Cond)
                     +}
                     \ No newline at end of file

man/prepareCondTCGA.Rd

History View file @ 70f2697

                     new file mode 100644
@@ -0,0 +1,36 @@
                     +% Generated by roxygen2: do not edit by hand
                     +% Please edit documentation in R/prepareCondTCGA.R
                     +\name{prepareCondTCGA}
                     +\alias{prepareCondTCGA}
                     +\title{Title Prepare Sample label for TCGA data}
                     +\usage{
                     +prepareCondTCGA(Multi_sample, Clinical, k, j)
                     +}
                     +\arguments{
                     +\item{Multi_sample}{list of sample ids}
+                    +
                     +\item{Clinical}{List of clinical data matrix from RTCGA.clinical}
+                    +
                     +\item{k}{Column numbers used for conditions}
+                    +
                     +\item{j}{Column numbers that include corresponding sample ids
                     +in clinical data}
                     +}
                     +\value{
                     +list of sample labels
                     +}
                     +\description{
                     +Title Prepare Sample label for TCGA data
                     +}
                     +\examples{
                     +require(RTCGA.clinical)
                     +require(RTCGA.rnaseq)
                     +Clinical <- list(BLCA.clinical,BRCA.clinical,CESC.clinical,COAD.clinical)
                     +Multi_sample <- list(BLCA.rnaseq[seq_len(100),1,drop=F],
                     +                    BRCA.rnaseq[seq_len(100),1,drop=F],
                     +                    CESC.rnaseq[seq_len(100),1,drop=F],
                     +                    COAD.rnaseq[seq_len(100),1,drop=F])
                     +k <- c(770,1482,773,791)
                     +j <- c(20,20,12,14)
                     +cond <- prepareCondTCGA(Multi_sample,Clinical,k,j)
                     +}

vignettes/Enrichment.Rmd

History View file @ 70f2697

@@ -39,17 +39,28 @@ In order to do this, we reproduce one example in QuickStart2 as follows.
                      ``` {r}
                      require(RTCGA.rnaseq)
                     -Multi <- list(ACC.rnaseq[seq_len(100),1+seq_len(1000)],
                     -             BLCA.rnaseq[seq_len(100),1+seq_len(1000)],
                     -             BRCA.rnaseq[seq_len(100),1+seq_len(1000)],
                     -             CESC.rnaseq[seq_len(100),1+seq_len(1000)])
                     +Multi <- list(BLCA.rnaseq[seq_len(100),1+seq_len(1000)],
                     +              BRCA.rnaseq[seq_len(100),1+seq_len(1000)],
                     +              CESC.rnaseq[seq_len(100),1+seq_len(1000)],
                     +              COAD.rnaseq[seq_len(100),1+seq_len(1000)])
                      Z <- prepareTensorfromList(Multi,10)
                      Z <- aperm(Z,c(2,1,3))
                     +require(RTCGA.clinical)
                     +Clinical <- list(BLCA.clinical,BRCA.clinical,CESC.clinical,COAD.clinical)
                     +Multi_sample <- list(BLCA.rnaseq[seq_len(100),1,drop=F],
                     +              BRCA.rnaseq[seq_len(100),1,drop=F],
                     +              CESC.rnaseq[seq_len(100),1,drop=F],
                     +              COAD.rnaseq[seq_len(100),1,drop=F])
                     +#patient.stage_event.tnm_categories.pathologic_categories.pathologic_m
                     +k <- c(770,1482,773,791)
                     +#patient.bcr_patient_barcode
                     +j <- c(20,20,12,14)
                      Z <- PrepareSummarizedExperimentTensor(
                          feature =colnames(ACC.rnaseq)[1+seq_len(1000)],
                     -                                       sample=array("",1),value=Z)
                     +    sample=array("",1),value=Z,
                     +    sampleData=prepareCondTCGA(Multi_sample,Clinical,k,j))
                      HOSVD <- computeHosvd(Z)
                     -cond<- rep(list(rep(seq_len(2),each=50)),4)
                     +cond<- attr(Z,"sampleData")
                      index <- selectFeatureProj(HOSVD,Multi,cond,de=1e-3,input_all=2) #Batch mode
                      head(tableFeatures(Z,index))
                      genes <-unlist(lapply(strsplit(tableFeatures(Z,index)[,1],"|",fixed=T),"[",1))

vignettes/QuickStart.Rmd

History View file @ 70f2697

@@ -394,7 +394,7 @@ Pressing enter we can get these two plots as well.
                      Since the package does not allow interactive mode, we use batch mode here.
                      ```{r, fig.keep='none'}
                     -index_all <- selectFeatureRect(SVD,cond,de=c(0.5,0.5),input_all=6)
                     +index_all <- selectFeatureRect(SVD,cond,de=c(0.5,0.5),input_all=6) #batch mode
                      ```
                      Then we can list the Drugs and Methylation sites selected as being distinct
                      between male and female.

vignettes/QuickStart2.Rmd

History View file @ 70f2697

@@ -122,8 +122,10 @@ Now we discuss what to do when multiple omics data share not samples but feature
                      We prepare a data set from RTCGA.rnaseq as follows, retrieving reduced partial sets from four of its data sets.
                      ```{r}
                      require(RTCGA.rnaseq)
                     -Multi <- list(ACC.rnaseq[seq_len(100),1+seq_len(1000)],BLCA.rnaseq[seq_len(100),1+seq_len(1000)],
                     -             BRCA.rnaseq[seq_len(100),1+seq_len(1000)],CESC.rnaseq[seq_len(100),1+seq_len(1000)])
                     +Multi <- list(BLCA.rnaseq[seq_len(100),1+seq_len(1000)],
                     +              BRCA.rnaseq[seq_len(100),1+seq_len(1000)],
                     +              CESC.rnaseq[seq_len(100),1+seq_len(1000)],
                     +              COAD.rnaseq[seq_len(100),1+seq_len(1000)])
                      ```
                      Multi includes four objects, each of which is a matrix that represents 100 samples (rows) and 1000 features (columns). Please note that this differs from the usual case, where rows and columns are features and samples, respectively. They are merged into a tensor as follows
                      ```{r}
@@ -132,22 +134,33 @@ Z <- aperm(Z,c(2,1,3))
                      ```
                      The function prepareTensorfromList, which was used in the previous subsection where samples are shared, can be used as it is. However, the first and second modes of the tensor must be exchanged by the aperm function for the later analyses, because of the difference mentioned above. Then a tensor object associated with various information is generated as usual as follows, and HOSVD is applied to it.
                      ``` {r}
                     -Z <- PrepareSummarizedExperimentTensor(feature =colnames(ACC.rnaseq)[1+seq_len(1000)],
                     -                                       sample=array("",1),value=Z)
                     +require(RTCGA.clinical)
                     +Clinical <- list(BLCA.clinical,BRCA.clinical,CESC.clinical,COAD.clinical)
                     +Multi_sample <- list(BLCA.rnaseq[seq_len(100),1,drop=F],
                     +              BRCA.rnaseq[seq_len(100),1,drop=F],
                     +              CESC.rnaseq[seq_len(100),1,drop=F],
                     +              COAD.rnaseq[seq_len(100),1,drop=F])
                     +#patient.stage_event.tnm_categories.pathologic_categories.pathologic_m
                     +k <- c(770,1482,773,791)
                     +#patient.bcr_patient_barcode
                     +j <- c(20,20,12,14)
                     +Z <- PrepareSummarizedExperimentTensor(
                     +    feature =colnames(ACC.rnaseq)[1+seq_len(1000)],
                     +    sample=array("",1),value=Z,
                     +    sampleData=prepareCondTCGA(Multi_sample,Clinical,k,j))
                      HOSVD <- computeHosvd(Z)
                      ```
                     -In order to see which sibgular value vectors attributed to samples are used for the selection of signular value vectors attributed to features, we need to assign sample conditions.
                     -Since we do not have any information about samples, we simply assume that they are devided into half and half as follows.
                     +In order to see which singular value vectors attributed to samples are used for the selection of singular value vectors attributed to features, we need to assign sample conditions.
                      ```{r}
                     -cond<- rep(list(rep(seq_len(2),each=50)),4)
                     +cond<- attr(Z,"sampleData")
                      ```
                      Then perform this
                      ```
                     -par(mai=c(0.1,0.2,0.2,0.2))
                     +par(mai=c(0.3,0.2,0.2,0.2))
                      index <- selectFeatureProj(HOSVD,Multi,cond,de=1e-3)
                      ```
                      Although we do not intend to explain how to use menu interactively,
                     -we select the second singular value vectors as shown in below
                     +we select the third singular value vectors as shown in below
                      ![The third singular value vectors](./fig21.jpg)
                      and we get the following plot, too.
@@ -156,7 +169,7 @@ and we get the following plot, too.
                      Since the package does not allow us to include interactive mode, we use batch mode here as follows.
                      Finally, selected feature are listed as follows.
                      ``` {r, fig.keep="none"}
                     -index <- selectFeatureProj(HOSVD,Multi,cond,de=1e-3,input_all=2) #Batch mode
                     +index <- selectFeatureProj(HOSVD,Multi,cond,de=1e-3,input_all=3) #Batch mode
                      head(tableFeatures(Z,index))
                      ```

vignettes/fig21.jpg

History View file @ 70f2697

163

176

Binary files a/vignettes/fig21.jpg and b/vignettes/fig21.jpg differ

vignettes/fig22.jpg

History View file @ 70f2697

164

177

Binary files a/vignettes/fig22.jpg and b/vignettes/fig22.jpg differ