Mercurial > repos > mingchen0919 > aurora_skewer_site

diff 01_skewer_analysis.Rmd @ 0:a42e58c71e5b draft default tip
planemo upload commit 841d8b22bf9f1aaed6bfe8344b60617f45b275b2-dirty
author: mingchen0919
date: Sun, 30 Dec 2018 12:55:49 -0500
--- /dev/null	Thu Jan 01 00:00:00 1970 +0000
+++ b/01_skewer_analysis.Rmd	Sun Dec 30 12:55:49 2018 -0500
@@ -0,0 +1,65 @@
+---
+title: 'Skewer Analysis'
+output:
+    html_document:
+      highlight: pygments
+---
+
+```{r setup, include=FALSE, warning=FALSE, message=FALSE}
+# Chunk defaults for the whole report: echo = FALSE and error = TRUE.
+# Individual chunks can still override either option in their header.
+knitr::opts_chunk$set(echo = FALSE, error = TRUE)
+```
+
+
+## Job script
+
+```{bash echo=FALSE}
+# Run build-and-run-job-scripts.sh from the tool install directory.
+# The path is quoted so a directory containing spaces stays a single argument.
+sh "${TOOL_INSTALL_DIR}/build-and-run-job-scripts.sh"
+```
+
+```{r echo=FALSE,warning=FALSE,results='asis'}
+# Print job-1-script.sh from REPORT_FILES_PATH inside a fenced bash block
+# (the chunk uses results='asis', so the fence is interpreted as markdown).
+# Read the file first: if reading fails, no opening fence has been emitted yet,
+# so the report is not left with an unterminated code block.
+job_script = readLines(paste0(Sys.getenv('REPORT_FILES_PATH'), '/job-1-script.sh'))
+cat('```bash\n')
+cat(job_script, sep = '\n')
+cat('\n```')
+```
+
+
+# Results summary
+
+## Reads processing summary
+
+```{r echo=TRUE}
+# Build a table from the read-processing section of trim-trimmed.log: one row
+# per log line, split at the tab inserted after each number.
+# `log` is reused by the length-distribution chunk further down.
+log = readLines(paste0(Sys.getenv('REPORT_FILES_PATH'), '/trim-trimmed.log'))
+start_line = grep('read.+processed; of these:', log)
+end_line = grep('untrimmed.+available after processing', log)
+# Replace the space that follows each run of digits with a tab, then split on it.
+processing_summary = gsub('(\\d+) ', '\\1\t', log[start_line:end_line])
+processing_summary_df = do.call(rbind, strsplit(processing_summary, '\t'))
+# The first row is used only for the header: its first cell becomes the name
+# of the second column, next to the fixed 'Total reads:' label.
+colnames(processing_summary_df) = c('Total reads:', processing_summary_df[1, 1])
+# drop = FALSE keeps a matrix (and therefore the headers) even when only one
+# row remains after removing the first.
+knitr::kable(processing_summary_df[-1, , drop = FALSE])
+```
+
+## Length distribution of reads after trimming
+
+```{r echo=TRUE, message=FALSE, warning=FALSE}
+# Parse the tab-separated table that starts at the 'length count percentage'
+# header of `log` (read in the previous chunk) and runs to the end of the log,
+# then plot count per length as an interactive line chart.
+start_line = grep('length\tcount\tpercentage', log)
+len_dist = log[start_line:length(log)]
+len_dist = do.call(rbind, strsplit(len_dist, '\t'))
+columns = len_dist[1, ]
+# stringsAsFactors = FALSE keeps the cells as character: if they became factors
+# (the default before R 4.0), as.numeric() below would return level codes
+# instead of the counts. drop = FALSE keeps a matrix when one data row is left.
+len_dist = as.data.frame(len_dist[-1, , drop = FALSE], stringsAsFactors = FALSE)
+colnames(len_dist) = columns
+
+library(plotly)
+library(ggplot2)
+len_dist$count = as.numeric(len_dist$count)
+# Plot against row positions and show the original length values as tick labels.
+labels = as.character(len_dist$length)
+len_dist$length = seq_len(nrow(len_dist))
+pp = ggplot(data = len_dist, aes(length, count)) +
+  geom_line(color = 'red') +
+  scale_x_continuous(name = 'Length',
+                     breaks = len_dist$length,
+                     labels = labels) +
+  theme(axis.text.x = element_text(angle = 90, hjust = 1)) +
+  ylab('Count') +
+  ggtitle('Length distribution')
+ggplotly(pp)
+```
\ No newline at end of file
author	mingchen0919
date	Sun, 30 Dec 2018 12:55:49 -0500
parents
children