annotate 08_sequence_length_distribution.Rmd @ 1:92e3de11b9f8 draft

remove fastqc_report.Rmd
author mingchen0919
date Tue, 27 Feb 2018 10:40:20 -0500
parents b7c115edd970
children c64267b9f754
Ignore whitespace changes - Everywhere: Within whitespace: At end of lines:
rev   line source
0
b7c115edd970 planemo upload
mingchen0919
parents:
diff changeset
1 ---
b7c115edd970 planemo upload
mingchen0919
parents:
diff changeset
2 output: html_document
b7c115edd970 planemo upload
mingchen0919
parents:
diff changeset
3 ---
b7c115edd970 planemo upload
mingchen0919
parents:
diff changeset
4
b7c115edd970 planemo upload
mingchen0919
parents:
diff changeset
5 ```{r setup, include=FALSE, warning=FALSE, message=FALSE}
b7c115edd970 planemo upload
mingchen0919
parents:
diff changeset
6 knitr::opts_chunk$set(
b7c115edd970 planemo upload
mingchen0919
parents:
diff changeset
7 echo = as.logical(opt$X_e),
b7c115edd970 planemo upload
mingchen0919
parents:
diff changeset
8 error = TRUE,
b7c115edd970 planemo upload
mingchen0919
parents:
diff changeset
9 eval = TRUE
b7c115edd970 planemo upload
mingchen0919
parents:
diff changeset
10 )
b7c115edd970 planemo upload
mingchen0919
parents:
diff changeset
11 ```
b7c115edd970 planemo upload
mingchen0919
parents:
diff changeset
12
b7c115edd970 planemo upload
mingchen0919
parents:
diff changeset
13 # Sequence Length Distribution
b7c115edd970 planemo upload
mingchen0919
parents:
diff changeset
14
b7c115edd970 planemo upload
mingchen0919
parents:
diff changeset
15 ```{r 'Sequence Length Distribution', fig.width=10}
b7c115edd970 planemo upload
mingchen0919
parents:
diff changeset
16 ## reads 1
b7c115edd970 planemo upload
mingchen0919
parents:
diff changeset
17 sld_1 = extract_data_module(paste0(opt$X_d, '/read_1_fastqc/fastqc_data.txt'), 'Sequence Length Distribution')
b7c115edd970 planemo upload
mingchen0919
parents:
diff changeset
18 sld_1$id = 1:length(sld_1$X.Length)
b7c115edd970 planemo upload
mingchen0919
parents:
diff changeset
19 sld_1$trim = 'before'
b7c115edd970 planemo upload
mingchen0919
parents:
diff changeset
20
b7c115edd970 planemo upload
mingchen0919
parents:
diff changeset
21 ## reads 2
b7c115edd970 planemo upload
mingchen0919
parents:
diff changeset
22 sld_2 = extract_data_module(paste0(opt$X_d, '/read_2_fastqc/fastqc_data.txt'), 'Sequence Length Distribution')
b7c115edd970 planemo upload
mingchen0919
parents:
diff changeset
23 sld_2$id = 1:length(sld_2$X.Length)
b7c115edd970 planemo upload
mingchen0919
parents:
diff changeset
24 sld_2$trim = 'after'
b7c115edd970 planemo upload
mingchen0919
parents:
diff changeset
25
b7c115edd970 planemo upload
mingchen0919
parents:
diff changeset
26 comb_sld = rbind(sld_1, sld_2)
b7c115edd970 planemo upload
mingchen0919
parents:
diff changeset
27 comb_sld$trim = factor(levels = c('before', 'after'), comb_sld$trim)
b7c115edd970 planemo upload
mingchen0919
parents:
diff changeset
28
b7c115edd970 planemo upload
mingchen0919
parents:
diff changeset
29 p = ggplot(data = comb_sld, aes(x = id, y = Count)) +
b7c115edd970 planemo upload
mingchen0919
parents:
diff changeset
30 geom_line(color = 'red') +
b7c115edd970 planemo upload
mingchen0919
parents:
diff changeset
31 scale_x_continuous(breaks = sld_2$id, labels = sld_2$X.Length) +
b7c115edd970 planemo upload
mingchen0919
parents:
diff changeset
32 facet_grid(. ~ trim) +
b7c115edd970 planemo upload
mingchen0919
parents:
diff changeset
33 xlab('Sequence Length (bp)') +
b7c115edd970 planemo upload
mingchen0919
parents:
diff changeset
34 ylab('') +
b7c115edd970 planemo upload
mingchen0919
parents:
diff changeset
35 theme(axis.text.x = element_text(angle=45))
b7c115edd970 planemo upload
mingchen0919
parents:
diff changeset
36 ggplotly(p)
b7c115edd970 planemo upload
mingchen0919
parents:
diff changeset
37 ```