GoekeLab
diff --git a/‎.Rbuildignore‎
Lines changed: 3 additions & 0 deletions b/‎.Rbuildignore‎
Lines changed: 3 additions & 0 deletions
diff --git a/‎.gitignore‎
Lines changed: 0 additions & 3 deletions b/‎.gitignore‎
Lines changed: 0 additions & 3 deletions
diff --git a/‎DESCRIPTION‎
Lines changed: 2 additions & 2 deletions b/‎DESCRIPTION‎
Lines changed: 2 additions & 2 deletions
diff --git a/‎NAMESPACE‎
Lines changed: 0 additions & 6 deletions b/‎NAMESPACE‎
Lines changed: 0 additions & 6 deletions
diff --git a/‎R/PromoterAnnotation-class.R‎
Lines changed: 3 additions & 3 deletions b/‎R/PromoterAnnotation-class.R‎
Lines changed: 3 additions & 3 deletions
diff --git a/‎R/annotation-data.R‎
Lines changed: 2 additions & 2 deletions b/‎R/annotation-data.R‎
Lines changed: 2 additions & 2 deletions
diff --git a/‎R/data.R‎
Lines changed: 12 additions & 71 deletions b/‎R/data.R‎
Lines changed: 12 additions & 71 deletions
diff --git a/‎R/estimate-promoter-activity.R‎
Lines changed: 1 addition & 45 deletions b/‎R/estimate-promoter-activity.R‎
Lines changed: 1 addition & 45 deletions
diff --git a/‎R/junction-read-count.R‎
Lines changed: 1 addition & 38 deletions b/‎R/junction-read-count.R‎
Lines changed: 1 addition & 38 deletions
diff --git a/‎R/plot-proActiv.R‎
Lines changed: 22 additions & 17 deletions b/‎R/plot-proActiv.R‎
Lines changed: 22 additions & 17 deletions
@@ -2,3 +2,6 @@
 ^\.Rproj\.user$
 ^LICENSE\.md$
 ^README\.Rmd$
+^_pkgdown\.yml$
+^docs$
+^pkgdown$
@@ -38,9 +38,6 @@ vignettes/*.pdf
 # R Environment Variables
 .Renviron
 
-# pkgdown site
-docs/
-
 .Rproj.user
 
 proActiv.Rproj
 
@@ -53,8 +53,8 @@ Suggests:
     DEXSeq,
     Rtsne,
     ggplot2,
-    TxDb.Hsapiens.UCSC.hg38.knownGene,
-    tidyr
+    tidyr,
+    vdiffr
 URL: https://github.com/GoekeLab/proActiv
 biocViews:
     RNASeq,
 
@@ -5,19 +5,13 @@ export(PromoterAnnotation)
 export(arrange)
 export(as_tibble)
 export(assays)
-export(calculateJunctionReadCounts)
-export(calculatePromoterReadCounts)
 export(colData)
 export(filter)
-export(getAbsolutePromoterActivity)
-export(getGeneExpression)
-export(getRelativePromoterActivity)
 export(group_by)
 export(loadDb)
 export(metadata)
 export(mutate)
 export(n)
-export(normalizePromoterReadCounts)
 export(plotPromoters)
 export(preparePromoterAnnotation)
 export(proActiv)
 
@@ -49,11 +49,11 @@ setClass(
 #' 
 #' promoterAnnotation <- PromoterAnnotation()
 #' intronRanges(promoterAnnotation) <- intronRanges(
-#'                                             promoterAnnotation.gencode.v19)
+#'                                     promoterAnnotation.gencode.v34.subset)
 #' promoterIdMapping(promoterAnnotation) <- promoterIdMapping(
-#'                                             promoterAnnotation.gencode.v19)
+#'                                     promoterAnnotation.gencode.v34.subset)
 #' promoterCoordinates(promoterAnnotation) <- promoterCoordinates(
-#'                                             promoterAnnotation.gencode.v19)
+#'                                     promoterAnnotation.gencode.v34.subset)
 #' 
 
 PromoterAnnotation <-
 
@@ -1,4 +1,4 @@
-#' Prepare promoter annotation data for the user specified txdb object
+#' Prepares promoter annotation from a gtf or txdb 
 #'
 #' @param txdb A txdb object. The txdb of the annotation version for which
 #'   promoters will be identified. Either `txdb` or `file` argument must be 
@@ -18,7 +18,7 @@
 #' @examples
 #' 
 #' txdbPath <- system.file('extdata/vignette/annotations/',
-#'                             'gencode.v34.annotation.chr22.sqlite', 
+#'                             'gencode.v34.annotation.subset.sqlite', 
 #'                              package = 'proActiv')
 #' txdb <- AnnotationDbi::loadDb(txdbPath)
 #' promoterAnnotation <- preparePromoterAnnotation(txdb = txdb,
 
@@ -1,75 +1,16 @@
-#' Promoter annotation data for Gencode.v19 including all the annotation objects
-#' required for promoter activity estimation
-#'
-#' A GRanges object containing the tss coordinate for each promoter for Gencode
-#' v19
-#'
-#' @format A PromoterAnnotation (S4 Class) object containing all the promoter
-#'   annotation objects for Gencode.v19. The object has 3 slots: \describe{
-#'   \item{intronRanges}{A GRanges object of 344,651 ranges corresponding
-#'   to introns, annotated with the associated transcript.} 
-#'   \item{promoterIdMapping}{The id mapping between transcript names, 
-#'   promoter ids and gene ids for Gencode v19.} 
-#'   \item{promoterCoordinates}{A GRanges object of 113,076 ranges
-#'   showing the tss coordinate for each promoter of Gencode v19,
-#'   annotated with the associated gene id, coordinate of the 3' end of the first
-#'   reduced exon, and intron id.} }
-#'
-"promoterAnnotation.gencode.v19"
-
-#' Promoter annotation data for Gencode.v34 including all the annotation objects
-#' required for promoter activity estimation
-#'
-#' A GRanges object containing the tss coordinate for each promoter for Gencode
-#' v34
-#'
-#' @format A PromoterAnnotation (S4 Class) object containing all the promoter
-#'   annotation objects for Gencode.v34. The object has 3 slots: \describe{
-#'   \item{intronRanges}{A GRanges object of 383,654 ranges corresponding
+#' @title Promoter annotation for Gencode.v34 (subset) 
+#' @description Promoter annotation for Gencode.v34 
+#'   (chr1:10,000,000 - 30,000,000) 
+#' @format A PromoterAnnotation (S4 Class) object containing all promoter
+#'   annotation objects for Gencode.v34 chr1:10,000,000-30,000,000. 
+#'   The object has 3 slots: \describe{
+#'   \item{intronRanges}{A GRanges object of 4,523 ranges corresponding
 #'   to introns, annotated with the associated transcript.} 
 #'   \item{promoterIdMapping}{The id mapping between transcript names, 
 #'   promoter ids and gene ids for Gencode v34.} 
-#'   \item{promoterCoordinates}{A GRanges object of 122,635 ranges
-#'   showing the tss coordinate for each promoter of Gencode v34,
-#'   annotated with the associated gene id, coordinate of the 3' end of the first
-#'   reduced exon, and intron id.} }
-#'
-"promoterAnnotation.gencode.v34"
-
-#' Promoter annotation data for Gencode.vM1 including all the annotation objects
-#' required for promoter activity estimation
-#'
-#' A GRanges object containing the tss coordinate for each promoter for Gencode
-#' vM1
-#'
-#' @format A PromoterAnnotation (S4 Class) object containing all the promoter
-#'   annotation objects for Gencode.vM1. The object has 3 slots: \describe{
-#'   \item{intronRanges}{A GRanges object of 243,332 ranges corresponding
-#'   to introns, annotated with the associated transcript.} 
-#'   \item{promoterIdMapping}{The id mapping between transcript names, 
-#'   promoter ids and gene ids for Gencode vM1.} 
-#'   \item{promoterCoordinates}{A GRanges object of 60,768 ranges
-#'   showing the tss coordinate for each promoter of Gencode vM1,
-#'   annotated with the associated gene id, coordinate of the 3' end of the first
-#'   reduced exon, and intron id.} }
-#'
-"promoterAnnotation.gencode.vM1"
-
-#' Promoter annotation data for Gencode.vM25 including all the annotation objects
-#' required for promoter activity estimation
-#'
-#' A GRanges object containing the tss coordinate for each promoter for Gencode
-#' vM25
-#'
-#' @format A PromoterAnnotation (S4 Class) object containing all the promoter
-#'   annotation objects for Gencode.vM25. The object has 3 slots: \describe{
-#'   \item{intronRanges}{A GRanges object of 285,067 ranges corresponding
-#'   to introns, annotated with the associated transcript.} 
-#'   \item{promoterIdMapping}{The id mapping between transcript names, 
-#'   promoter ids and gene ids for Gencode vM25.} 
-#'   \item{promoterCoordinates}{A GRanges object of 91,902 ranges
-#'   showing the tss coordinate for each promoter of Gencode vM25,
-#'   annotated with the associated gene id, coordinate of the 3' end of the first
-#'   reduced exon, and intron id.} }
+#'   \item{promoterCoordinates}{A GRanges object of 1,380 ranges
+#'   showing the tss coordinate for each promoter of Gencode v34 
+#'   chr1:10,000,000-30,000,000, annotated with the associated gene id, 
+#'   coordinate of the 3' end of the first reduced exon, and intron id.} }
 #'
-"promoterAnnotation.gencode.vM25"
+"promoterAnnotation.gencode.v34.subset"
@@ -10,23 +10,6 @@
 #' @param pseudocount Number to be used for log2 as pseudocount if log2 is TRUE
 #'
 #' @return data.frame of absolute promoter activity with promoter and gene ids
-#' @export
-#'
-#' @examples
-#' 
-#' ## junctionReadCounts is an object returned from normalizePromoterReadCounts
-#' junctionReadCounts <- readRDS(system.file('extdata/testdata/tophat2',
-#'                                             'normalizedPromoterCounts.rds', 
-#'                                              package = 'proActiv'))
-#' absolutePromoterActivity <- getAbsolutePromoterActivity(junctionReadCounts,
-#'                                              promoterAnnotation.gencode.v19,
-#'                                              log2 = TRUE,
-#'                                              pseudocount = 1)
-#'
-#' @seealso \code{\link{preparePromoterAnnotation}} for preparing the mapping
-#'   between promoters and genes, \code{\link{calculatePromoterReadCounts}} and
-#'   \code{\link{normalizePromoterReadCounts}} for obtaining junction read
-#'   counts
 #'
 getAbsolutePromoterActivity <- function(junctionReadCounts, promoterAnnotation,
                                         log2 = TRUE, pseudocount = 1) {
@@ -50,18 +33,7 @@ getAbsolutePromoterActivity <- function(junctionReadCounts, promoterAnnotation,
 #' @param absolutePromoterActivity data.frame of absolute promoter activity 
 #'   with promoter and gene ids
 #'
-#' @return data.frame of gene expression with gene ids
-#' @export
-#'
-#' @examples
-#' 
-#' ## absolutePromoterActivity is an object returned 
-#' ## from getAbsolutePromoterActivity
-#' absolutePromoterActivity <- readRDS(system.file('extdata/testdata/tophat2', 
-#'                                              'absolutePromoterActivity.rds', 
-#'                                               package = 'proActiv')) 
-#' geneExpression <- getGeneExpression(absolutePromoterActivity)
-#' 
+#' @return data.frame of gene expression with gene ids
 #'
 getGeneExpression <- function(absolutePromoterActivity) {
     print('Calculating gene expression...')
@@ -88,22 +60,6 @@ getGeneExpression <- function(absolutePromoterActivity) {
 #' @param geneExpression data.frame of gene expression with gene ids
 #'
 #' @return data.frame of relative promoter activity with promoter and gene ids
-#' @export
-#'
-#' @examples
-#' 
-#' ## absolutePromoterActivity is an object returned 
-#' ## from getAbsolutePromoterActivity
-#' ## geneExpression is an object returned from getGeneExpression
-#' absolutePromoterActivity <- readRDS(system.file('extdata/testdata/tophat2', 
-#'                                             'absolutePromoterActivity.rds', 
-#'                                             package = 'proActiv'))
-#' geneExpression <- readRDS(system.file('extdata/testdata/tophat2', 
-#'                                         'geneExpression.rds', 
-#'                                          package = 'proActiv'))
-#' relativePromoterActivity <- getRelativePromoterActivity(
-#'                                          absolutePromoterActivity,
-#'                                          geneExpression)
 #'
 getRelativePromoterActivity <- function(absolutePromoterActivity, 
                                         geneExpression) {
 
@@ -10,21 +10,8 @@
 #'   'star' or 'bam'
 #' @param genome character genome version
 #'
-#' @export
 #' @return The total number of junction reads overlapping with each promoter for
 #'   the input annotated intron ranges
-#'
-#' @examples
-#' 
-#' file <- list.files(system.file('extdata/testdata/tophat2', 
-#'                    package = 'proActiv'), 
-#'                    full.names = TRUE, pattern = 'sample1')
-#' promoterCoordinates <- promoterCoordinates(promoterAnnotation.gencode.v19)
-#' intronRanges <- intronRanges(promoterAnnotation.gencode.v19)
-#' junctionCounts <- calculateJunctionReadCounts(promoterCoordinates,
-#'                                                intronRanges,
-#'                                                file,
-#'                                                fileType = 'tophat')
 #' 
 #' @importFrom GenomeInfoDb seqlevelsStyle
 #' @importFrom S4Vectors queryHits
@@ -100,22 +87,8 @@ calculateJunctionReadCounts <- function(promoterCoordinates, intronRanges,
 #'
 #' @return A data.frame object. The number of junction reads per promoter (rows)
 #'   for each sample (cols)
-#' @export
-#'
-#' @examples
-#' 
-#' files <- list.files(system.file('extdata/testdata/tophat2', 
-#'                     package = 'proActiv'), 
-#'                     full.names = TRUE, pattern = 'sample')
-#' fileLabels <- c('sample1', 'sample2')
-#' promoterAnnotation <- promoterAnnotation.gencode.v19
-#' promoterReadCounts <- calculatePromoterReadCounts(promoterAnnotation,
-#'                                                    files,
-#'                                                    fileLabels,
-#'                                                    fileType = 'tophat',
-#'                                                    genome = NULL,
-#'                                                    numberOfCores = 1)
 #' @importFrom BiocParallel bpparam bplapply
+#' 
 calculatePromoterReadCounts <- function(promoterAnnotation, files = NULL, 
                                         fileLabels = NULL, fileType = NULL , 
                                         genome = NULL, numberOfCores = 1) {
@@ -160,16 +133,6 @@ calculatePromoterReadCounts <- function(promoterAnnotation, files = NULL,
 #' @return A data.frame object. The normalized number of junction reads per
 #'   promoter (rows) for each sample (cols) using DESeq2 counts function.
 #'   Requires 'DESeq2' package to be installed
-#' @export
-#'
-#' @examples
-#' 
-#' ## promoterReadCounts is an object returned from calculatePromoterReadCounts
-#' promoterReadCounts <- readRDS(system.file('extdata/testdata/tophat2',
-#'                                           'promoterCounts.rds', 
-#'                                            package = 'proActiv'))
-#' normalizedPromoterReadCounts <- normalizePromoterReadCounts(
-#'                                            promoterReadCounts)
 #' 
 #' @importFrom DESeq2 DESeqDataSetFromMatrix estimateSizeFactors counts
 normalizePromoterReadCounts <- function(promoterReadCounts) {
 
@@ -1,5 +1,4 @@
-#' Wrapper function returning Summarized Experiment object giving promoter 
-#' counts and activity
+#' Visualizes promoter activity and transcript model for a gene of interest
 #'
 #' @param result A SummarizedExperiment object with assays giving promoter 
 #'   counts and activity with gene expression stored as column data and 
@@ -39,17 +38,23 @@
 #'   
 #' @examples 
 #'  
-#'  gene <- 'ENSG00000076864.19'
-#'  ## Genomic Ranges giving exons by transcripts of gene 
-#'  ranges <- readRDS(system.file('extdata/vignette/annotations', 
-#'                                'exonsBy.rap1gap.rds',
-#'                                package = 'proActiv'))
-#'  ## summarizedExperiment returned by proActiv (subsetted to gene RAP1GAP)
-#'  result <- readRDS(system.file('extdata/vignette/annotations',
-#'                                'result.rap1gap.rds',
-#'                                package ='proActiv'))
-#'  plotPromoters(result = result, gene = gene, ranges = ranges)
-#'   
+#' ## First, run proActiv to generate a SummarizedExperiment result
+#' files <- list.files(system.file('extdata/vignette/junctions', 
+#'                        package = 'proActiv'), 
+#'                        full.names = TRUE)
+#' promoterAnnotation <- promoterAnnotation.gencode.v34.subset
+#' result <- proActiv(files = files,
+#'                        promoterAnnotation  = promoterAnnotation,
+#'                        condition = rep(c('A549','HepG2'), each=3),
+#'                        ncores = 1)
+#' ## Load the txdb annotation from the packaged sqlite file
+#' txdb <- AnnotationDbi::loadDb(system.file('extdata/vignette/annotations',
+#'                                    'gencode.v34.annotation.rap1gap.sqlite',
+#'                                    package = 'proActiv'))
+#' ## Declare a gene of interest
+#' gene <- 'ENSG00000076864.19'
+#' ## Call plot 
+#' plotPromoters(result = result, gene = gene, txdb = txdb)
 #'                            
 #' @importFrom Gviz plotTracks GenomeAxisTrack
 #' @importFrom SummarizedExperiment rowData colData
@@ -61,16 +66,16 @@ plotPromoters <- function(result, gene, txdb, ranges,
                             label.col = 'black', label.size = 0.7,
                             arrow.width = NULL, arrow.fill = 'transparent', 
                             arrow.border = 'grey') {
-    print(paste0('Plotting ', gene))
     result.gene <- result[rowData(result)$geneId == gene, ]
     rdata <- rowData(result.gene)[complete.cases(rowData(result.gene)),]
     groups <- unique(colData(result.gene)$condition)
 
     if (nrow(rdata) == 0) {
-        stop('Gene selected has only one transcript which is a single-exon
-            transcript. proActiv does not estimate promoter activity in 
-            such cases.')
+        stop('Gene ID selected is either not present or has only one transcript 
+            which is a single-exon transcript. proActiv does not estimate 
+            promoter activity in such cases.')
     }
+    print(paste0('Plotting ', gene))
 
     grtrack <- getGeneRegionTrack(rdata, gene, txdb, ranges)
     dtracklist <- getDataTrack(rdata, groups, blk.width = blk.width,