showteeth
diff --git a/‎DESCRIPTION‎
Lines changed: 6 additions & 3 deletions b/‎DESCRIPTION‎
Lines changed: 6 additions & 3 deletions
diff --git a/‎NAMESPACE‎
Lines changed: 8 additions & 0 deletions b/‎NAMESPACE‎
Lines changed: 8 additions & 0 deletions
diff --git a/‎NEWS.md‎
Lines changed: 15 additions & 7 deletions b/‎NEWS.md‎
Lines changed: 15 additions & 7 deletions
diff --git a/‎R/LoadTrack.R‎
Lines changed: 82 additions & 41 deletions b/‎R/LoadTrack.R‎
Lines changed: 82 additions & 41 deletions
@@ -1,7 +1,7 @@
 Package: ggcoverage
 Type: Package
 Title: Visualize Genome Coverage with Various Annotations
-Version: 0.6.0
+Version: 0.7.0
 Authors@R: 
     person(given = "Yabing",
            family = "Song",
@@ -10,7 +10,7 @@ Authors@R:
 Maintainer: Yabing Song <[email protected]>
 Description: The goal of 'ggcoverage' is to simplify the process of visualizing genome coverage. It contains functions to 
     load data from 'BAM', 'BigWig' or 'BedGraph' files, create genome coverage plot, add various annotations to 
-    the coverage plot, including GC annotation, gene annotation, transcript annotation, ideogram annotation and peak annotation.
+    the coverage plot, including base and amino acid annotation, GC annotation, gene annotation, transcript annotation, ideogram annotation and peak annotation.
 License: MIT + file LICENSE
 Encoding: UTF-8
 RoxygenNote: 7.1.1
@@ -37,7 +37,10 @@ Imports:
     GenomeInfoDb,
     S4Vectors,
     Biostrings,
-    BSgenome
+    BSgenome,
+    GenomicAlignments,
+    reshape2,
+    seqinr
 Suggests: 
     rmarkdown,
     knitr,
 
@@ -1,12 +1,14 @@
 # Generated by roxygen2: do not edit by hand
 
+S3method(ggplot_add,base)
 S3method(ggplot_add,gc)
 S3method(ggplot_add,gene)
 S3method(ggplot_add,ideogram)
 S3method(ggplot_add,peak)
 S3method(ggplot_add,transcript)
 export(FormatTrack)
 export(LoadTrackFile)
+export(geom_base)
 export(geom_coverage)
 export(geom_gc)
 export(geom_gene)
@@ -22,6 +24,7 @@ importFrom(Biostrings,readDNAStringSet)
 importFrom(GenomeInfoDb,"seqlengths<-")
 importFrom(GenomeInfoDb,seqlengths)
 importFrom(GenomeInfoDb,seqnames)
+importFrom(GenomicAlignments,alphabetFrequencyFromBam)
 importFrom(GenomicRanges,GRanges)
 importFrom(GenomicRanges,makeGRangesFromDataFrame)
 importFrom(GenomicRanges,setdiff)
@@ -51,12 +54,15 @@ importFrom(ggplot2,element_blank)
 importFrom(ggplot2,element_rect)
 importFrom(ggplot2,element_text)
 importFrom(ggplot2,expansion)
+importFrom(ggplot2,geom_bar)
 importFrom(ggplot2,geom_hline)
+importFrom(ggplot2,geom_label)
 importFrom(ggplot2,geom_line)
 importFrom(ggplot2,geom_polygon)
 importFrom(ggplot2,geom_rect)
 importFrom(ggplot2,geom_segment)
 importFrom(ggplot2,geom_text)
+importFrom(ggplot2,geom_tile)
 importFrom(ggplot2,ggplot)
 importFrom(ggplot2,ggplot_add)
 importFrom(ggplot2,labs)
@@ -74,10 +80,12 @@ importFrom(grDevices,colorRampPalette)
 importFrom(magrittr,"%>%")
 importFrom(methods,extends)
 importFrom(patchwork,wrap_plots)
+importFrom(reshape2,melt)
 importFrom(rlang,.data)
 importFrom(rlang,as_label)
 importFrom(rtracklayer,import)
 importFrom(scales,comma)
+importFrom(seqinr,translate)
 importFrom(stats,as.formula)
 importFrom(utils,menu)
 importFrom(utils,read.csv)
 
@@ -1,22 +1,30 @@
-# ggcoverage 0.6.0
+# ggcoverage 0.7.0
 ## New features
-* Add `geom_gc` to annotate genome coverage with GC content. 
+* Added `geom_base` to annotate genome coverage with base and amino acids.
+
+## Minor changes
+* `LoadTrackFile` now supports visualization at single-nucleotide level.
+* Added `rect.color` for `geom_coverage` to control the rect border color.
+* Fixed bug in track file format identification.
 
 -------------
 
-# ggcoverage 0.5.0
+# ggcoverage 0.6.0
 ## New features
-* First CRAN release.
+* Added `geom_gc` to annotate genome coverage with GC content. 
+
+-------------
 
+# ggcoverage 0.5.0
 ## Minor changes
-* Fix bug in `getIdeogram`.
+* Fixed bug in `getIdeogram`.
 
 -------------
 
 # ggcoverage 0.4.0
 ## New features
 * Added `geom_peak` to enhance its usage in ChIP-seq or ATAC-seq data.
-* Change Y axis theme.
+* Changed Y axis theme.
 
 -------------
 
@@ -25,7 +33,7 @@
 * Added `geom_transcript`, `geom_ideogram`.
 
 ## Minor changes
-* Fix bug in `GetGeneGroup`.
+* Fixed bug in `GetGeneGroup`.
 
 -------------
 
 
@@ -10,13 +10,18 @@
 #' @param bamcoverage.path The path to \code{bamCoverage}, used when \code{format} is bam. Default: NULL (auto-detect).
 #' @param norm.method Methods to normalize the number of reads per bin, chosen from "RPKM", "CPM", "BPM", "RPGC", "None".
 #' Default: RPKM.
+#' @param single.nuc Logical value, whether to visualize at single nucleotide level. Default: FALSE.
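+#' @param single.nuc.region Region for \code{single.nuc}, given as "chr:start-end" (commas in the coordinates are removed). Required when \code{single.nuc} is TRUE. Default: NULL.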
 #' @param bin.size Size of the bins, in bases. Default: 10.
 #' @param bc.extra.para Extra parameters for \code{bamCoverage}, eg: "--effectiveGenomeSize 2700000000 --ignoreForNormalization chrX"
 #'
 #' @return A dataframe.
 #' @importFrom rtracklayer import
 #' @importFrom Rsamtools indexBam
 #' @importFrom utils read.csv
+#' @importFrom GenomicAlignments alphabetFrequencyFromBam
+#' @importFrom magrittr %>%
+#' @importFrom dplyr select
 #' @export
 #'
 #' @examples
@@ -35,37 +40,32 @@
 #' )
 LoadTrackFile <- function(track.file, track.folder = NULL, format = c("bam", "wig", "bw", "bedgraph"), meta.info = NULL, meta.file = "",
                           bamcoverage.path = NULL, norm.method = c("RPKM", "CPM", "BPM", "RPGC", "None"),
-                          bin.size = 10, bc.extra.para = NULL) {
+                          single.nuc = FALSE, single.nuc.region = NULL, bin.size = 10, bc.extra.para = NULL) {
   # check parameters
   format <- match.arg(arg = format)
   norm.method <- match.arg(arg = norm.method)
 
   # prepare track files
   if (!is.null(track.folder)) {
-    track.file <- list.files(path = track.folder, full.names = TRUE, pattern = format)
+    track.file <- list.files(path = track.folder, full.names = TRUE, pattern = paste0(format, "$"))
   }
 
   # get track dataframe
   if (format %in% c("wig", "bw", "bedgraph")) {
-    # read track file
-    track.list <- lapply(track.file, function(x) {
-      # get basename
-      track.file.base <- basename(x)
-      # import wig, bigwig and bedgraph file
-      single.track.df <- as.data.frame(rtracklayer::import(x))
-      single.track.df$TrackFile <- track.file.base
-      return(single.track.df)
-    })
-  } else if (format == "bam") {
-    # require deeptools
-    if (is.null(bamcoverage.path)) {
-      bamcoverage.path <- Sys.which("bamCoverage")
-      if (bamcoverage.path == "") {
-        stop("Can not find bamCoverage automatically, please specify the path!")
-      }
+    if (single.nuc) {
+      stop("To visualize single nucleotide, please use bam file!")
     } else {
-      bamcoverage.path <- bamcoverage.path
+      # read track file
+      track.list <- lapply(track.file, function(x) {
+        # get basename
+        track.file.base <- basename(x)
+        # import wig, bigwig and bedgraph file
+        single.track.df <- as.data.frame(rtracklayer::import(x))
+        single.track.df$TrackFile <- track.file.base
+        return(single.track.df)
+      })
     }
+  } else if (format == "bam") {
     # create index
     for (bam in track.file) {
       bam.index.file <- paste(bam, "bai", sep = ".")
@@ -74,29 +74,70 @@ LoadTrackFile <- function(track.file, track.folder = NULL, format = c("bam", "wi
         Rsamtools::indexBam(bam)
       }
     }
-    # read track file
-    track.list <- lapply(track.file, function(x) {
-      # get basename
-      track.file.base <- basename(x)
-      # bigwig file
-      out.bw.file <- tempfile(fileext = c(".bw"))
-      # prepare bamCoverage cmd
-      bamcoverage.cmd <- paste(
-        bamcoverage.path, "-b", x, "-o", out.bw.file,
-        "--binSize", bin.size, "--normalizeUsing", norm.method, bc.extra.para
-      )
-      # run command
-      message(paste("Calling bamCoverage: ", bamcoverage.cmd))
-      bamcoverage.status <- system(bamcoverage.cmd, intern = TRUE)
-      bamcoverage.status.code <- attr(bamcoverage.status, "status")
-      if (!is.null(bamcoverage.status.code)) {
-        stop("Run bamCoverage error!")
+    if (single.nuc) {
+      if (!is.null(single.nuc.region)) {
+        single.nuc.region <- gsub(pattern = ",", replacement = "", x = single.nuc.region)
+        single.nuc.region.chr <- unlist(strsplit(x = single.nuc.region, split = ":"))[1]
+        single.nuc.region.se <- unlist(strsplit(x = single.nuc.region, split = ":"))[2]
+        single.nuc.region.start <- unlist(strsplit(x = single.nuc.region.se, split = "-"))[1]
+        single.nuc.region.end <- unlist(strsplit(x = single.nuc.region.se, split = "-"))[2]
+        track.list <- lapply(track.file, function(x) {
+          single.track.df <- GenomicAlignments::alphabetFrequencyFromBam(x, param = single.nuc.region, baseOnly = TRUE) %>% as.data.frame()
+          single.track.df <- single.track.df[, c("A", "G", "C", "T")]
+          single.track.df$score <- rowSums(single.track.df)
+          single.track.df$seqnames <- single.nuc.region.chr
+          single.track.df$start <- single.nuc.region.start:single.nuc.region.end
+          single.track.df$end <- single.track.df$start + 1
+          single.track.df$width <- 1
+          single.track.df$strand <- "*"
+          single.track.df <- single.track.df %>% dplyr::select(-c("A", "G", "C", "T"))
+          # get basename
+          track.file.base <- basename(x)
+          single.track.df$TrackFile <- track.file.base
+          single.track.df <- single.track.df[c(
+            "seqnames", "start", "end", "width",
+            "strand", "score", "TrackFile"
+          )]
+          return(single.track.df)
+        })
+      } else {
+        stop("Please provide region for visualizing single nucleotide!")
       }
-      # import wig, bigwig and bedgraph file
-      single.track.df <- as.data.frame(rtracklayer::import(out.bw.file))
-      single.track.df$TrackFile <- track.file.base
-      return(single.track.df)
-    })
+    } else {
+      # require deeptools
+      if (is.null(bamcoverage.path)) {
+        bamcoverage.path <- Sys.which("bamCoverage")
+        if (bamcoverage.path == "") {
+          stop("Can not find bamCoverage automatically, please specify the path!")
+        }
+      } else {
+        bamcoverage.path <- bamcoverage.path
+      }
+
+      # read track file
+      track.list <- lapply(track.file, function(x) {
+        # get basename
+        track.file.base <- basename(x)
+        # bigwig file
+        out.bw.file <- tempfile(fileext = c(".bw"))
+        # prepare bamCoverage cmd
+        bamcoverage.cmd <- paste(
+          bamcoverage.path, "-b", x, "-o", out.bw.file,
+          "--binSize", bin.size, "--normalizeUsing", norm.method, bc.extra.para
+        )
+        # run command
+        message(paste("Calling bamCoverage: ", bamcoverage.cmd))
+        bamcoverage.status <- system(bamcoverage.cmd, intern = TRUE)
+        bamcoverage.status.code <- attr(bamcoverage.status, "status")
+        if (!is.null(bamcoverage.status.code)) {
+          stop("Run bamCoverage error!")
+        }
+        # import wig, bigwig and bedgraph file
+        single.track.df <- as.data.frame(rtracklayer::import(out.bw.file))
+        single.track.df$TrackFile <- track.file.base
+        return(single.track.df)
+      })
+    }
   }
   # get track dataframe
   track.df <- do.call(rbind, track.list)