Mercurial > repos > mingchen0919 > aurora_fastqc_site
annotate 09_sequence_duplication_levels.Rmd @ 2:c64267b9f754 draft default tip
planemo upload commit 841d8b22bf9f1aaed6bfe8344b60617f45b275b2-dirty
| author | mingchen0919 |
|---|---|
| date | Sun, 30 Dec 2018 12:48:14 -0500 |
| parents | b7c115edd970 |
| children |
| rev | line source |
|---|---|
| 0 | 1 --- |
| 2 output: html_document | |
| 3 --- | |
| 4 | |
```{r setup, include=FALSE, warning=FALSE, message=FALSE}
# Document-wide knitr configuration; this chunk itself produces no output
# (include=FALSE).

# Chunk defaults: hide the source code of every chunk (echo = FALSE) and keep
# rendering when a chunk raises an error, showing the error in the report
# instead of aborting (error = TRUE).
knitr::opts_chunk$set(echo = FALSE, error = TRUE)

# Package option: do not print the knitting progress bar.
knitr::opts_knit$set(progress = FALSE)
```
| 9 | |
| 10 | |
|
2
c64267b9f754
planemo upload commit 841d8b22bf9f1aaed6bfe8344b60617f45b275b2-dirty
mingchen0919
parents:
0
diff
changeset
|
11 ### Sequence Duplication Levels |
| 0 | 12 |
```{r 'Sequence Duplication Levels', fig.width=10}
# Plot the "Sequence Duplication Levels" module of two FastQC reports as line
# charts, one facet per report.
#
# Names used here but defined outside this chunk: `opt$X_d` (prefix of the
# paths to the FastQC result folders), `extract_data_module()`, `melt()` and
# the ggplot2 functions.
# NOTE(review): read_1 is labelled 'before' and read_2 'after' -- presumably
# before/after trimming; confirm against the tool that fills `opt$X_d`.

# Column names assigned to the extracted module table (shared by both reads).
sdl_columns <- c('Duplication_Level', 'Percentage_of_deduplicated', 'Percentage_of_total')

## reads 1
sdl_1 <- extract_data_module(paste0(opt$X_d, '/read_1_fastqc/fastqc_data.txt'), 'Sequence Duplication Levels', header = FALSE, comment.char = '#')
names(sdl_1) <- sdl_columns
# Numeric position of each duplication level, used as the x coordinate.
# seq_along() (rather than 1:length()) stays a valid, empty index when the
# module has no rows instead of producing c(1, 0).
sdl_1$id <- seq_along(sdl_1$Duplication_Level)

# Long format: one row per (duplication level, percentage column).
melt_sdl_1 <- melt(sdl_1, id = c('Duplication_Level', 'id'))
melt_sdl_1$trim <- 'before'


## reads 2
sdl_2 <- extract_data_module(paste0(opt$X_d, '/read_2_fastqc/fastqc_data.txt'), 'Sequence Duplication Levels', header = FALSE, comment.char = '#')
names(sdl_2) <- sdl_columns
sdl_2$id <- seq_along(sdl_2$Duplication_Level)

melt_sdl_2 <- melt(sdl_2, id = c('Duplication_Level', 'id'))
melt_sdl_2$trim <- 'after'

# Stack both reads; the explicit level order puts the 'before' facet first.
comb_sdl <- rbind(melt_sdl_1, melt_sdl_2)
comb_sdl$trim <- factor(comb_sdl$trim, levels = c('before', 'after'))

# NOTE(review): the x-axis ticks and labels are taken from read 2 only; this
# assumes both reports list the same duplication levels in the same order --
# TODO confirm.
p <- ggplot(data = comb_sdl) +
  geom_line(mapping = aes(x = id, y = value, color = variable)) +
  scale_x_continuous(breaks = sdl_2$id, labels = sdl_2$Duplication_Level) +
  facet_grid(. ~ trim) +
  xlab('Sequence Duplication Level') +
  ylab('') +
  scale_color_discrete(name = '') +
  theme(axis.text.x = element_text(size = 5),
        panel.background = element_rect(fill = NA),
        axis.line = element_line())
p
```
