Skip to content

Commit

Permalink
Address #34
Browse files Browse the repository at this point in the history
  • Loading branch information
PoisonAlien committed Oct 28, 2024
1 parent 2a6681f commit 8c4aaa1
Show file tree
Hide file tree
Showing 6 changed files with 147 additions and 69 deletions.
2 changes: 1 addition & 1 deletion DESCRIPTION
Original file line number Diff line number Diff line change
@@ -1,6 +1,6 @@
Package: trackplot
Title: Generate IGV style track plots and profile plots from bigWig files
Version: 1.5.10
Version: 1.6.00
Authors@R: person("Anand", "Mayakonda", , "[email protected]", role = c("aut", "cre"))
Description: trackplot is an ultra-fast, simple, and minimal dependency R script to generate IGV style track plots (aka locus plots), profile plots and heatmaps from bigWig files.
License: MIT
Expand Down
146 changes: 88 additions & 58 deletions R/trackplot.R
Original file line number Diff line number Diff line change
Expand Up @@ -6,6 +6,9 @@
# Copyright (c) 2020 Anand Mayakonda <[email protected]>
#
# Change log:
# Version: 1.6.00 [2024-10-28]
# * Added argument `track_overlay` for a single track with line plot. #14
# * Bug fix: color alpha differs between tracks. Issue: #34
# Version: 1.5.10 [2024-02-14]
# * Added argument `layout_ord` and `bw_ord` to `track_plot()` re-order the overall tracks and bigWig tracks
# * Added `xlab` and `ylab` arguments to `profile_plot()`
Expand Down Expand Up @@ -300,6 +303,7 @@ track_summarize = function(summary_list = NULL, condition = NULL, stat = "mean")
#' @param track_names Default NULL
#' @param track_names_pos Default 0 (corresponds to left corner)
#' @param track_names_to_left If TRUE, track names are shown to the left of the margin. Default FALSE, plots on top as a title
#' @param track_overlay Draws all bigWigs in a single track as a line plot
#' @param regions genomic regions to highlight. A data.frame with at-least three columns containing chr, start and end positions.
#' @param boxcol color for highlighted region. Default "#192A561A"
#' @param boxcolalpha Default 0.5
Expand Down Expand Up @@ -339,10 +343,11 @@ track_plot = function(summary_list = NULL,
track_names = NULL,
track_names_pos = 0,
track_names_to_left = FALSE,
track_overlay = FALSE,
regions = NULL,
collapse_txs = TRUE,
boxcol = "#192A561A",
boxcolalpha = 0.2,
boxcol = "#ffc41a",
boxcolalpha = 0.4,
chromHMM = NULL,
chromHMM_cols = NULL,
chromHMM_names = NULL,
Expand Down Expand Up @@ -469,7 +474,11 @@ track_plot = function(summary_list = NULL,
plot_height_min = round(plot_height_min, digits = 2)
}

ntracks = length(summary_list)
if(is_bw & track_overlay){
ntracks = 1
}else{
ntracks = length(summary_list)
}

lo = .make_layout(ntracks = ntracks, ntracks_h = bw_track_height, cytoband = show_ideogram, cytoband_h = cytoband_track_height, genemodel = draw_gene_track,
genemodel_h = gene_track_height, chrHMM = any(!is.null(ucscChromHMM), !is.null(chromHMM)), chrHMM_h = chromHMM_track_height, loci = !is.null(peaks),
Expand Down Expand Up @@ -526,61 +535,85 @@ track_plot = function(summary_list = NULL,
}

#Draw bigWig signals
boxcol = grDevices::adjustcolor(boxcol, alpha.f = boxcolalpha)
if(is_bw){
for(idx in 1:length(summary_list)){
x = summary_list[[idx]]
if(track_overlay){

if(show_axis){
par(mar = c(0.5, left_mar, 2, 1))
}else{
par(mar = c(0.5, left_mar, 2, 1))
}

plot(NA, xlim = c(start, end), ylim = c(plot_height_min[idx], plot_height[idx]), frame.plot = FALSE, axes = FALSE, xlab = NA, ylab = NA)
#If there is no signal, just add the track names and go to next
if(nrow(x) == 0){
if(track_names_to_left){
text(x = start, y = 0.5, labels = names(summary_list)[idx], adj = 1, cex = gene_fsize, xpd = TRUE)
#mtext(text = names(summary_list)[idx], side = 2, line = -2, outer = TRUE, xpd = TRUE, las = 2, adj = 0)
#title(main = , adj = track_names_pos, font.main = 3)
}else{
title(main = names(summary_list)[idx], adj = track_names_pos, font.main = 3)
plot(NA, xlim = c(start, end), ylim = c(min(plot_height_min), max(plot_height)), frame.plot = FALSE, axes = FALSE, xlab = NA, ylab = NA)
for(idx in 1:length(summary_list)){
x = summary_list[[idx]]
if(nrow(x) == 0){
if(track_names_to_left){
text(x = start, y = 0.5, labels = names(summary_list)[idx], adj = 1, cex = gene_fsize, xpd = TRUE)
#mtext(text = names(summary_list)[idx], side = 2, line = -2, outer = TRUE, xpd = TRUE, las = 2, adj = 0)
#title(main = , adj = track_names_pos, font.main = 3)
}else{
title(main = names(summary_list)[idx], adj = track_names_pos, font.main = 3)
}
next
}
next
points(x = x$start, y = x$max, col = col[idx], type = "l")
}
rect(xleft = x$start, ybottom = 0, xright = x$end, ytop = x$max, col = col[idx], border = col[idx])
if(show_axis){
axis(side = 2, at = c(plot_height_min[idx], plot_height[idx]), las = 2)
}else{
text(x = start, y = plot_height[idx], labels = paste0("[", plot_height_min[idx], "-", plot_height[idx], "]"), adj = 0, xpd = TRUE)
}
#plot(NA, xlim = c(start, end), ylim = c(0, nrow(regions)), frame.plot = FALSE, axes = FALSE, xlab = NA, ylab = NA)

if(plot_regions){
# boxcol = "#192a56"
boxcol = grDevices::adjustcolor(boxcol, alpha.f = boxcolalpha)
if(nrow(regions) > 0){
for(i in 1:nrow(regions)){
if(idx == length(summary_list)){
#If its a last plot, draw rectangle till 0
rect(xleft = regions[i, startpos], ybottom = 0, xright = regions[i, endpos], ytop = plot_height[idx]+10, col = boxcol, border = NA, xpd = TRUE)
}else if (idx == 1){
if(ncol(regions) > 3){
text(x = mean(c(regions[i, startpos], regions[i, endpos])), y = plot_height[idx]+(plot_height[idx]*0.1), labels = regions[i, 4], adj = 0.5, xpd = TRUE, font = 1, cex = 1.2)
}else{
text(x = mean(c(regions[i, startpos], regions[i, endpos])), y = plot_height[idx]+(plot_height[idx]*0.1), labels = paste0(regions[i, startpos], "-", regions[i, endpos]), adj = 0.5, xpd = TRUE, font = 1, cex = 1.2)
}
rect(xleft = regions[i, startpos], ybottom = -10, xright = regions[i, endpos], ytop = plot_height[idx], col = boxcol, border = NA, xpd = TRUE)
}else{
rect(xleft = regions[i, startpos], ybottom = -10, xright = regions[i, endpos], ytop = plot_height[idx]+10, col = boxcol, border = NA, xpd = TRUE)
}
}
if(nrow(x) > 0){
rect(xleft = regions[, startpos], ybottom = 0, xright = regions[, endpos], ytop = max(plot_height), col = boxcol, border = NA, xpd = TRUE)
}
}

if(track_names_to_left){
text(x = start, y = (plot_height_min[idx] + plot_height[idx])/2, labels = names(summary_list)[idx], adj = 1.1, cex = gene_fsize, xpd = TRUE)
}else{
title(main = names(summary_list)[idx], adj = track_names_pos, font.main = 3)
if(show_axis){
axis(side = 2, at = c(min(plot_height_min), max(plot_height)), las = 2)
}
legend(x = "topright", legend = names(summary_list), col = col, pch = "-")
}else{
for(idx in 1:length(summary_list)){
x = summary_list[[idx]]
if(show_axis){
par(mar = c(0.5, left_mar, 2, 1))
}else{
par(mar = c(0.5, left_mar, 2, 1))
}

plot(NA, xlim = c(start, end), ylim = c(plot_height_min[idx], plot_height[idx]), frame.plot = FALSE, axes = FALSE, xlab = NA, ylab = NA)
#If there is no signal, just add the track names and go to next
if(nrow(x) == 0){
if(track_names_to_left){
text(x = start, y = 0.5, labels = names(summary_list)[idx], adj = 1, cex = gene_fsize, xpd = TRUE)
#mtext(text = names(summary_list)[idx], side = 2, line = -2, outer = TRUE, xpd = TRUE, las = 2, adj = 0)
#title(main = , adj = track_names_pos, font.main = 3)
}else{
title(main = names(summary_list)[idx], adj = track_names_pos, font.main = 3)
}
next
}
rect(xleft = x$start, ybottom = 0, xright = x$end, ytop = x$max, col = col[idx], border = col[idx])

if(show_axis){
axis(side = 2, at = c(plot_height_min[idx], plot_height[idx]), las = 2)
}else{
text(x = start, y = plot_height[idx], labels = paste0("[", plot_height_min[idx], "-", plot_height[idx], "]"), adj = 0, xpd = TRUE)
}
#plot(NA, xlim = c(start, end), ylim = c(0, nrow(regions)), frame.plot = FALSE, axes = FALSE, xlab = NA, ylab = NA)

if(plot_regions){
# boxcol = "#192a56"
if(nrow(x) > 0){
rect(xleft = regions[, startpos], ybottom = 0, xright = regions[, endpos], ytop = max(plot_height), col = boxcol, border = NA, xpd = TRUE)
}
}

if(track_names_to_left){
text(x = start, y = (plot_height_min[idx] + plot_height[idx])/2, labels = names(summary_list)[idx], adj = 1.1, cex = gene_fsize, xpd = TRUE)
}else{
title(main = names(summary_list)[idx], adj = track_names_pos, font.main = 3)
}
}
}
}else{
Expand Down Expand Up @@ -613,20 +646,8 @@ track_plot = function(summary_list = NULL,
# boxcol = "#192a56"
boxcol = grDevices::adjustcolor(boxcol, alpha.f = boxcolalpha)
if(nrow(regions) > 0){
for(i in 1:nrow(regions)){
if(idx == length(summary_list)){
#If its a last plot, draw rectangle till 0
rect(xleft = regions[i, startpos], ybottom = 0, xright = regions[i, endpos], ytop = plot_height[idx]+10, col = boxcol, border = NA, xpd = TRUE)
}else if (idx == 1){
if(ncol(regions) > 3){
text(x = mean(c(regions[i, startpos], regions[i, endpos])), y = plot_height[idx]+(plot_height[idx]*0.1), labels = regions[i, 4], adj = 0.5, xpd = TRUE, font = 1, cex = 1.2)
}else{
text(x = mean(c(regions[i, startpos], regions[i, endpos])), y = plot_height[idx]+(plot_height[idx]*0.1), labels = paste0(regions[i, startpos], "-", regions[i, endpos]), adj = 0.5, xpd = TRUE, font = 1, cex = 1.2)
}
rect(xleft = regions[i, startpos], ybottom = -10, xright = regions[i, endpos], ytop = plot_height[idx], col = boxcol, border = NA, xpd = TRUE)
}else{
rect(xleft = regions[i, startpos], ybottom = -10, xright = regions[i, endpos], ytop = plot_height[idx]+10, col = boxcol, border = NA, xpd = TRUE)
}
if(nrow(x) > 0){
rect(xleft = regions[, startpos], ybottom = 0, xright = regions[, endpos], ytop = max(plot_height), col = boxcol, border = NA, xpd = TRUE)
}
}
}
Expand Down Expand Up @@ -1622,8 +1643,11 @@ summarize_homer_annots = function(anno, sample_names = NULL, legend_font_size =

### Re-organize the layout by user specification
dt = data.table::data.table(name = plot_ord$name, ord = plot_ord$ord, ord_req = plot_ord$ord_req)

dt$n_tracks = ifelse(test = dt$name == 'b', yes = ntracks, no = 1)
#print(dt)
dt_s = split(dt, dt$n_tracks)
#print(dt_s)
if(length(dt_s) > 1){
dt_mult = dt_s[[2]]
dt_sing = dt_s[[1]]
Expand All @@ -1639,7 +1663,11 @@ summarize_homer_annots = function(anno, sample_names = NULL, legend_font_size =
dt = dt[order(ord_req)]
data = dt$ord_req4
}else{
dt = data.table::data.table(name = rep(dt$name, dt$n_tracks), ord = dt$ord, ord_req = dt$ord_req, ord_req2 = seq(dt$ord_req, dt$ord_req + dt$n_tracks -1 , 1), n_tracks = dt$n_tracks)
#ifelse(test = dt$n_tracks > 1, )
#print(dt)
dt = data.table::data.table(name = rep(dt$name, dt$n_tracks), ord = dt$ord, ord_req = dt$ord_req, ord_req2 = dt$ord_req, n_tracks = dt$n_tracks)
#print(dt)

dt = split(dt, dt$ord) |> data.table::rbindlist()
dt[, ord_req4 := 1:nrow(dt)]
dt = dt[order(ord_req)]
Expand Down Expand Up @@ -1686,6 +1714,8 @@ summarize_homer_annots = function(anno, sample_names = NULL, legend_font_size =
window_dat$chr = chr
window_dat = window_dat[, .(chr, start, end)]

print(window_dat)

op_dir = paste0(op_dir, "/")

if(!dir.exists(paths = op_dir)){
Expand Down
27 changes: 19 additions & 8 deletions README.md
Original file line number Diff line number Diff line change
Expand Up @@ -48,6 +48,14 @@ Why `trackplot`?

* For centOS or debian: Follow these [compilation instructions](https://gist.github.com/PoisonAlien/e19b482ac6146bfb03142a0de1c4fbc8).

### Citation

If you find the script useful consider citing [trackplot](https://academic.oup.com/bioinformaticsadvances/article/4/1/vbae031/7616126) and [bwtool](https://academic.oup.com/bioinformatics/article/30/11/1618/282756)

**_Mayakonda A, and Frank Westermann. Trackplot: a fast and lightweight R script for epigenomic enrichment plots. Bioinformatics advances vol. 4,1 vbae031. 28 Feb. 2024. PMID: [38476298](https://pubmed.ncbi.nlm.nih.gov/38476298/)_**

**_Pohl A, Beato M. bwtool: a tool for bigWig files. Bioinformatics. 2014 Jun 1;30(11):1618-9. doi: 10.1093/bioinformatics/btu056. Epub 2014 Jan 30. PMID: [24489365](https://pubmed.ncbi.nlm.nih.gov/24489365/)_**

## Usage

Simple usage - Make a table of all the bigWig files to be analysed with `read_coldata()` and pass it to the downstream functions.
Expand Down Expand Up @@ -113,6 +121,17 @@ track_plot(summary_list = t,

![](https://github.com/PoisonAlien/trackplot/assets/8164062/a0911998-aae8-4de1-96f5-18e278d19d80)

#### Collapse all tracks into a single track

Use `track_overlay = TRUE` to overlay all tracks into a single line track

```r
track_plot(summary_list = t, col = track_cols, show_ideogram = FALSE, track_overlay = TRUE)
```

![](https://github.com/user-attachments/assets/d286f159-8950-4209-a985-fa3ba7103c53)


#### Heighilight regions of interest (any bed files would do)

```r
Expand Down Expand Up @@ -292,14 +311,6 @@ profile_heatmap(mat_list = pe_bed, top_profile = TRUE, zmaxs = 0.8)
* Windows OS is not supported


### Citation

If you find the script useful consider citing [trackplot](https://academic.oup.com/bioinformaticsadvances/article/4/1/vbae031/7616126) and [bwtool](https://academic.oup.com/bioinformatics/article/30/11/1618/282756)

**_Mayakonda, Anand, and Frank Westermann. Trackplot: a fast and lightweight R script for epigenomic enrichment plots. Bioinformatics advances vol. 4,1 vbae031. 28 Feb. 2024. PMID: [38476298](https://pubmed.ncbi.nlm.nih.gov/38476298/)_**

**_Pohl A, Beato M. bwtool: a tool for bigWig files. Bioinformatics. 2014 Jun 1;30(11):1618-9. doi: 10.1093/bioinformatics/btu056. Epub 2014 Jan 30. PMID: [24489365](https://pubmed.ncbi.nlm.nih.gov/24489365/)_**

### Acknowledgements

[Joschka Hey](https://github.com/HeyLifeHD) for all the cool suggestions :)
10 changes: 10 additions & 0 deletions inst/CITATION
Original file line number Diff line number Diff line change
@@ -0,0 +1,10 @@
bibentry(
bibtype = "Article",
title = "Trackplot: a fast and lightweight R script for epigenomic enrichment plots",
author = personList(as.person("Anand Mayakonda"),
as.person("Frank Westermann")),
journal = "Bioinformatics Advances",
year = "2024",
volume = "4",
doi = "doi.org/10.1093/bioadv/vbae031"
)
7 changes: 5 additions & 2 deletions man/track_plot.Rd

Some generated files are not rendered by default. Learn more about how customized files appear on GitHub.

24 changes: 24 additions & 0 deletions vignettes/trackplot.Rmd
Original file line number Diff line number Diff line change
Expand Up @@ -115,6 +115,13 @@ track_cols = c("#d35400","#d35400","#2980b9","#2980b9","#2980b9", "#27ae60","#27
track_plot(summary_list = t_loci, col = track_cols)
```

### Collapse all tracks into a single track

```{r}
track_plot(summary_list = t_loci, track_overlay = T, col = track_cols, show_ideogram = FALSE, genename = c("POU5F1", "TCF19"), gene_track_height = 1)
```


### Heighlight sites at the top

Using BED files or data.frame in BED format to heightlight target regions of interest
Expand All @@ -130,6 +137,8 @@ track_plot(
)
```



### Show only specific genes

Use `genename` argument to show only specific genes in the gene track
Expand Down Expand Up @@ -192,6 +201,21 @@ track_plot(
)
```

## Overlay tracks

```{r}
#Re-organize the layout in the order chromHMM track, gene track, cytoband track, bigWig tracks and peak track.
track_plot(
summary_list = t_loci,
col = track_cols,
peaks = tf_beds,
peaks_track_names = c("NANOG", "OCT4"),
genename = c("POU5F1", "TCF19"),
chromHMM = h1_chrHMM,
chromHMM_names = "H1", layout_ord = c("h", "g", "c", "b", "p"), track_overlay = TRUE
)
```

## Peak files as input

All of the above plots can also be generated with [narrowPeak](https://genome.ucsc.edu/FAQ/FAQformat.html#format12) or [broadPeak](https://genome.ucsc.edu/FAQ/FAQformat.html#format13) files as input. Here, 5th column containing scores are plotted as intensity. Color coding and binning of scores are as per [UCSC convention](https://genome.ucsc.edu/FAQ/FAQformat.html#format1)
Expand Down

0 comments on commit 8c4aaa1

Please sign in to comment.