comparison 02_per_base_sequence_quality.Rmd @ 11:507eec497730 draft

update fastqc site
author mingchen0919
date Tue, 07 Nov 2017 16:52:24 -0500
parents
children 68ea2ebbf866
comparison
equal deleted inserted replaced
10:600c39b11913 11:507eec497730
1 ---
2 title: 'Per base sequence quality'
3 output:
4 html_document:
5 number_sections: true
6 toc: true
7 theme: cosmo
8 highlight: tango
9 ---
10
11 ```{r setup, include=FALSE, warning=FALSE, message=FALSE}
12 knitr::opts_chunk$set(
13 echo = ECHO,
14 error = TRUE
15 )
16 ```
17
18 ### Per base sequence quality
19
20 ```{r 'per base sequence quality', fig.width=10}
21 ## reads 1
22 pbsq_1 = extract_data_module('REPORT_DIR/reads_1_fastqc_data.txt', 'Per base sequence quality')
23 pbsq_1$id = 1:length(pbsq_1$X.Base)
24
25 melt_pbsq_1 = filter(melt(pbsq_1, id=c('X.Base', 'id')), variable == 'Mean')
26 melt_pbsq_1$trim = 'before'
27
28
29 ## reads 2
30 pbsq_2 = extract_data_module('REPORT_DIR/reads_2_fastqc_data.txt', 'Per base sequence quality')
31 pbsq_2$id = 1:length(pbsq_2$X.Base)
32
33 melt_pbsq_2 = filter(melt(pbsq_2, id=c('X.Base', 'id')), variable == 'Mean')
34 melt_pbsq_2$trim = 'after'
35
36 comb_pbsq = rbind(melt_pbsq_1, melt_pbsq_2)
37 comb_pbsq$trim = factor(levels = c('before', 'after'), comb_pbsq$trim)
38
39 p = ggplot(data = comb_pbsq) +
40 geom_line(mapping = aes(x = id, y = value, group = variable, color = variable)) +
41 scale_x_continuous(breaks = pbsq_2$id, labels = pbsq_2$X.Base) +
42 facet_grid(. ~ trim) +
43 ylim(0, max(comb_pbsq$value) + 5) +
44 theme(axis.text.x = element_text(angle=45))
45 ggplotly(p)
46
47 ```