Repository 'rmarkdown_fastqc_site'
hg clone https://toolshed.g2.bx.psu.edu/repos/mingchen0919/rmarkdown_fastqc_site

Changeset 12:68ea2ebbf866 (2017-11-09)
Previous changeset 11:507eec497730 (2017-11-07) Next changeset 13:6faa68239cd7 (2017-11-09)
Commit message:
add boxplot for per base sequence quality
modified:
02_per_base_sequence_quality.Rmd
diff -r 507eec497730 -r 68ea2ebbf866 02_per_base_sequence_quality.Rmd
--- a/02_per_base_sequence_quality.Rmd Tue Nov 07 16:52:24 2017 -0500
+++ b/02_per_base_sequence_quality.Rmd Thu Nov 09 09:23:43 2017 -0500
@@ -21,27 +21,32 @@
 ## reads 1
 pbsq_1 = extract_data_module('REPORT_DIR/reads_1_fastqc_data.txt', 'Per base sequence quality')
 pbsq_1$id = 1:length(pbsq_1$X.Base)
-
-melt_pbsq_1 = filter(melt(pbsq_1, id=c('X.Base', 'id')), variable == 'Mean')
-melt_pbsq_1$trim = 'before'
-
+pbsq_1$trim = 'before'
 
 ## reads 2
 pbsq_2 = extract_data_module('REPORT_DIR/reads_2_fastqc_data.txt', 'Per base sequence quality')
 pbsq_2$id = 1:length(pbsq_2$X.Base)
+pbsq_2$trim = 'after'
 
-melt_pbsq_2 = filter(melt(pbsq_2, id=c('X.Base', 'id')), variable == 'Mean')
-melt_pbsq_2$trim = 'after'
-
-comb_pbsq = rbind(melt_pbsq_1, melt_pbsq_2)
+comb_pbsq = rbind(pbsq_1, pbsq_2)
 comb_pbsq$trim = factor(levels = c('before', 'after'), comb_pbsq$trim)
 
 p = ggplot(data = comb_pbsq) +
-  geom_line(mapping = aes(x = id, y = value, group = variable, color = variable)) +
-  scale_x_continuous(breaks = pbsq_2$id, labels = pbsq_2$X.Base) + 
-  facet_grid(. ~ trim) + 
-  ylim(0, max(comb_pbsq$value) + 5) +
+  geom_boxplot(mapping = aes(x = id, 
+                             lower = Lower.Quartile, 
+                             upper = Upper.Quartile, 
+                             middle = Median, 
+                             ymin = X10th.Percentile, 
+                             ymax = X90th.Percentile,
+                             fill = "yellow"),
+               stat = 'identity') +
+  geom_line(mapping = aes(x = id, y = Mean, color = "red")) +
+  scale_x_continuous(breaks = pbsq_2$id, labels = pbsq_2$X.Base) +
+  scale_fill_identity() +
+  scale_color_identity() + 
+  ylim(0, max(comb_pbsq$Upper.Quartile) + 5) +
+  facet_grid(. ~ trim) +
   theme(axis.text.x = element_text(angle=45))
-ggplotly(p)
+p
 
 ```
\ No newline at end of file