Mercurial > repos > mingchen0919 > aurora_fastqc_site
annotate 09_sequence_duplication_levels.Rmd @ 2:c64267b9f754 draft default tip
planemo upload commit 841d8b22bf9f1aaed6bfe8344b60617f45b275b2-dirty
author | mingchen0919 |
---|---|
date | Sun, 30 Dec 2018 12:48:14 -0500 |
parents | b7c115edd970 |
children |
rev | line source |
---|---|
0 | 1 --- |
2 output: html_document | |
3 --- | |
4 | |
```{r setup, include=FALSE, warning=FALSE, message=FALSE}
# Document-wide knitr configuration for this report page.

# Package-level option: turn off knitr's progress output while rendering.
knitr::opts_knit$set(progress = FALSE)

# Chunk defaults: hide the source code of every chunk (echo = FALSE) and keep
# rendering when a chunk raises an error (error = TRUE) instead of aborting.
knitr::opts_chunk$set(echo = FALSE, error = TRUE)
```
9 | |
10 | |
2
c64267b9f754
planemo upload commit 841d8b22bf9f1aaed6bfe8344b60617f45b275b2-dirty
mingchen0919
parents:
0
diff
changeset
|
11 ### Sequence Duplication Levels |
0 | 12 |
```{r 'Sequence Duplication Levels', fig.width=10}
# Plots the FastQC 'Sequence Duplication Levels' module of two reports
# (read_1_fastqc and read_2_fastqc under opt$X_d) side by side.
# NOTE(review): read_1 is labelled 'before' and read_2 'after' in the facet
# strip -- presumably before/after trimming; confirm against the tool wrapper.

# Load the 'Sequence Duplication Levels' module from one FastQC report folder.
#   report_dir: sub-directory of opt$X_d that holds fastqc_data.txt.
# Returns the module table with named columns plus an `id` column holding the
# row position, which serves as a numeric x coordinate for the line plot.
read_sdl_module = function(report_dir) {
  sdl = extract_data_module(file.path(opt$X_d, report_dir, 'fastqc_data.txt'),
                            'Sequence Duplication Levels',
                            header = FALSE, comment.char = '#')
  names(sdl) = c('Duplication_Level',
                 'Percentage_of_deduplicated',
                 'Percentage_of_total')
  # seq_along() instead of 1:length(): an empty module gives an empty id
  # vector rather than c(1, 0), which would fail on assignment.
  sdl$id = seq_along(sdl$Duplication_Level)
  sdl
}

# Reshape one module table to long format (one row per level and percentage
# column) and tag every row with the facet label `trim_label`.
melt_sdl_module = function(sdl, trim_label) {
  long = melt(sdl, id = c('Duplication_Level', 'id'))
  # rep() keeps the assignment valid even when `long` has zero rows.
  long$trim = rep(trim_label, nrow(long))
  long
}

## reads 1
sdl_1 = read_sdl_module('read_1_fastqc')
melt_sdl_1 = melt_sdl_module(sdl_1, 'before')

## reads 2
sdl_2 = read_sdl_module('read_2_fastqc')
melt_sdl_2 = melt_sdl_module(sdl_2, 'after')

comb_sdl = rbind(melt_sdl_1, melt_sdl_2)
# Explicit level order so the 'before' panel is drawn left of 'after'.
comb_sdl$trim = factor(comb_sdl$trim, levels = c('before', 'after'))

# One line per percentage column, one panel per `trim` level. The x axis is
# the row position, relabelled with the duplication-level names taken from
# the read_2 table.
p = ggplot(data = comb_sdl) +
  geom_line(mapping = aes(x = id, y = value, color = variable)) +
  scale_x_continuous(breaks = sdl_2$id, labels = sdl_2$Duplication_Level) +
  facet_grid(. ~ trim) +
  xlab('Sequence Duplication Level') +
  ylab('') +
  scale_color_discrete(name = '') +
  theme(axis.text.x = element_text(size = 5),
        panel.background = element_rect(fill = NA),
        axis.line = element_line())
p
```