changeset 0:c1f718dd6c7a draft

planemo upload
author mingchen0919
date Sat, 30 Dec 2017 00:25:38 -0500
parents
children 629323b5fc0c
files rmarkdown_deseq2_count_matrix.Rmd rmarkdown_deseq2_count_matrix.xml rmarkdown_deseq2_count_matrix_render.R
diffstat 3 files changed, 195 insertions(+), 0 deletions(-) [+]
line wrap: on
line diff
--- /dev/null	Thu Jan 01 00:00:00 1970 +0000
+++ b/rmarkdown_deseq2_count_matrix.Rmd	Sat Dec 30 00:25:38 2017 -0500
@@ -0,0 +1,39 @@
+---
+title: 'DESeq2 analysis'
+output:
+    html_document:
+      number_sections: true
+      toc: true
+      theme: cosmo
+      highlight: tango
+---
+
+```{r setup, include=FALSE, warning=FALSE, message=FALSE}
+knitr::opts_chunk$set(
+  echo = opt$echo,
+  error = TRUE
+)
+```
+
+
+## User input
+
+```{r 'user input'}
+df = data.frame(name = names(opt)[-1],
+                value = unlist(opt))
+df
+```
+
+
+## Count Matrix
+
+```{r 'count matrix'}
+count_data = read.table(opt$count_data)
+head(count_data, 10)
+```
+
+```{r 'ste[ 2'}
+
+```
+
+
--- /dev/null	Thu Jan 01 00:00:00 1970 +0000
+++ b/rmarkdown_deseq2_count_matrix.xml	Sat Dec 30 00:25:38 2017 -0500
@@ -0,0 +1,73 @@
+<tool id="rmarkdown_deseq2_count_matrix" name="DESeq2 (count matrix)" version="1.0.0">
+    <requirements>
+        <requirement type="package" version="1.15.0.6-0">pandoc</requirement>
+        <requirement type="package" version="1.20.0">r-getopt</requirement>
+        <requirement type="package" version="1.3">r-rmarkdown</requirement>
+        <requirement type="package" version="0.3.5">r-htmltools</requirement>
+        <requirement type="package" version="0.5.0">r-dplyr</requirement>
+        <requirement type="package" version="1.14.1">bioconductor-deseq2</requirement>
+        <requirement type="package" version="0.2">r-dt</requirement>
+    </requirements>
+    <description>deseq2 analysis given a count matrix input</description>
+    <stdio>
+        <regex source="stderr" match="XXX" level="warning"
+               description="Check the warnings_and_errors.txt file for more details."/>
+    </stdio>
+    <command><![CDATA[
+Rscript '${__tool_directory__}/rmarkdown_deseq2_count_matrix_render.R'
+                        -e $echo
+                        -c $count_data
+                        -C $col_data
+                        -D '$design_formula'
+                        -k $contrast_condition
+                        -T $treatment
+                        -k $control
+                        -r $report
+                        -d $report.files_path
+                        -s $sink_message
+                        -t '${__tool_directory__}/rmarkdown_deseq2_count_matrix.Rmd'
+                    ]]></command>
+    <inputs>
+        <param type="boolean" name="echo" label="Display analysis code in report?" optional="False" checked="False"
+               truevalue="TRUE" falsevalue="FALSE"/>
+        <param type="data" name="count_data" label="count data" optional="False" format="txt,csv" multiple="False"/>
+        <param type="data" name="col_data" label="column data" optional="False" format="txt,csv" multiple="False"/>
+        <param type="text" name="design_formula" label="design formula"
+               help="The simplest design formula for differential expression would be ~ condition, where condition&#13;&#10;                     is a column in colData(dds) that specifies which of two (or more groups) the samples belong to"
+               optional="False" value="~ condition_1 + condition_2"/>
+        <param type="text" name="contrast_condition" label="condition"
+               help="A condition name specified in the design formula" optional="False" value="condition_1"/>
+        <param type="text" name="treatment" label="treatment" help="the name of the numerator level for the fold change"
+               optional="False"/>
+        <param type="text" name="control" label="control" help="the name of the denominator level for the fold change"
+               optional="False"/>
+    </inputs>
+    <outputs>
+        <data name="report" format="html" label="DESeq2 report" hidden="false"/>
+        <data name="differential_genes" format="csv" label="differential genes" from_work_dir="differential_genes.csv"
+              hidden="false"/>
+        <data name="sink_message" format="txt" label="Warnings and Errors" from_work_dir="warnings_and_errors.txt"
+              hidden="false"/>
+    </outputs>
+    <help><![CDATA[See http://bioconductor.org/packages/devel/bioc/vignettes/DESeq2/inst/doc/DESeq2.html]]></help>
+    <citations>
+        <citation type="bibtex"><![CDATA[            @article{love2014moderated,
+            title={Moderated estimation of fold change and dispersion for RNA-seq data with DESeq2},
+            author={Love, Michael I and Huber, Wolfgang and Anders, Simon},
+            journal={Genome biology},
+            volume={15},
+            number={12},
+            pages={550},
+            year={2014},
+            publisher={BioMed Central}
+            }]]></citation>
+        <citation type="bibtex"><![CDATA[            @article{allaire2016rmarkdown,
+            title={rmarkdown: Dynamic Documents for R, 2016},
+            author={Allaire, J and Cheng, Joe and Xie, Yihui and McPherson, Jonathan and Chang, Winston and Allen, Jeff
+            and Wickham, Hadley and Atkins, Aron and Hyndman, Rob},
+            journal={R package version 0.9},
+            volume={6},
+            year={2016}
+            }]]></citation>
+    </citations>
+</tool>
--- /dev/null	Thu Jan 01 00:00:00 1970 +0000
+++ b/rmarkdown_deseq2_count_matrix_render.R	Sat Dec 30 00:25:38 2017 -0500
@@ -0,0 +1,83 @@
+library(getopt)
+library(rmarkdown)
+library(htmltools)
+library(dplyr)
+
+##============ Sink warnings and errors to a file ==============
+## use the sink() function to wrap all code within it.
+##==============================================================
+zz = file('warnings_and_errors.txt')
+sink(zz)
+sink(zz, type = 'message')
+  ##---------below is the code for rendering .Rmd templates-----
+
+  ##=============STEP 1: handle command line arguments==========
+  ##
+  ##============================================================
+  # column 1: the long flag name
+  # column 2: the short flag alias. A SINGLE character string
+  # column 3: argument mask
+  #           0: no argument
+  #           1: argument required
+  #           2: argument is optional
+  # column 4: date type to which the flag's argument shall be cast.
+  #           possible values: logical, integer, double, complex, character.
+  #-------------------------------------------------------------
+  #++++++++++++++++++++ Best practice ++++++++++++++++++++++++++
+  # 1. short flag alias should match the flag in the command section in the XML file.
+  # 2. long flag name can be any legal R variable names
+  # 3. two names in args_list can have common string but one name should not be a part of another name.
+  #    for example, one name is "ECHO", if another name is "ECHO_XXX", it will cause problems.
+  #+++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++
+  args_list=list()
+  ##------- 1. input data ---------------------
+  args_list$ECHO = c('echo', 'e', '1', 'character')
+  args_list$c = c('count_data', 'c', '1', 'character')
+  args_list$C = c('col_data', 'C', '1', 'character')
+  args_list$D = c('design_formula', 'D', '1', 'character')
+  args_list$k = c('contrast_condition', 'k', '1', 'character')
+  args_list$T = c('treatment', 'T', '1', 'character')
+  args_list$K = c('control', 'K', '1', 'character')
+  ##--------2. output report and outputs --------------
+  args_list$REPORT_HTML = c('report_html', 'r', '1', 'character')
+  args_list$REPORT_DIR = c('report_dir', 'd', '1', 'character')
+  args_list$SINK_MESSAGE = c('sink_message', 's', '1', 'character')
+  ##--------3. .Rmd templates in the tool directory ----------
+  args_list$TOOL_TEMPLATE_RMD = c('tool_template_rmd', 't', '1', 'character')
+  ##-----------------------------------------------------------
+  opt = getopt(t(as.data.frame(args_list)))
+
+
+
+  ##=======STEP 2: create report directory (optional)==========
+  ##
+  ##===========================================================
+  dir.create(opt$report_dir)
+
+  ##=STEP 3: replace placeholders in .Rmd with argument values=
+  ##
+  ##===========================================================
+  #++ need to replace placeholders with args values one by one+
+  readLines(opt$tool_template_rmd) %>%
+    # (function(x) {
+    #   gsub('ECHO', opt$echo, x)
+    # }) %>%
+    # (function(x) {
+    #   gsub('REPORT_DIR', opt$report_dir, x)
+    # }) %>%
+    (function(x) {
+      fileConn = file('tool_template.Rmd')
+      writeLines(x, con=fileConn)
+      close(fileConn)
+    })
+
+
+  ##=============STEP 4: render .Rmd templates=================
+  ##
+  ##===========================================================
+  render('tool_template.Rmd', output_file = opt$report_html)
+
+
+  ##--------end of code rendering .Rmd templates----------------
+sink()
+##=========== End of sinking output=============================