rnaspades: rnaspades.xml comparison

comparison rnaspades.xml @ 6:b66de1e9abfb draft

"planemo upload for repository https://github.com/galaxyproject/tools-iuc/tree/master/tools/spades commit 8734db131db6f76697b500b30f18ee7723d61813"

author	iuc
date	Sun, 23 Jan 2022 21:32:25 +0000
parents	1035adb112c0
children	675ee1aa5952

comparison

equal deleted inserted replaced

-:1035adb112c0
+:b66de1e9abfb
-<tool id="rnaspades" name="rnaSPAdes" version="3.9.0.3">
+<tool id="rnaspades" name="rnaSPAdes" version="@TOOL_VERSION@+galaxy@VERSION_SUFFIX@" profile="20.01">
-<description>assembler for RNA-Seq data</description>
+<description>de novo transcriptome assembler</description>
-<xrefs>
+<macros>
-<xref type="bio.tools">rnaspades</xref>
+<import>macros.xml</import>
-</xrefs>
+</macros>
-<requirements>
+<expand macro="requirements"/>
-<requirement type="package" version="3.9.0">spades</requirement>
+<expand macro="stdio"/>
-</requirements>
+<expand macro="version_command"/>
-<command detect_errors="exit_code">
+<command detect_errors="exit_code"><![CDATA[
-<![CDATA[
+#set $library = 1
-if [ -n "\$GALAXY_MEMORY_MB" ]; then
-GALAXY_MEMORY_GB=\$(( GALAXY_MEMORY_MB / 1024 ));
+@PREPROCESS_INPUT_FILES_MAIN@
-fi &&
+#if $additional_reads.selector == 'true'
+@PREPROCESS_INPUT_FILES_ADDITIONAL@
-rnaspades.py -o .
+#end if
-## Forces unzipped output, faster
+@PREPROCESS_NANOPORE_PACBIO_FILES@
---disable-gzip-output
+@PREPROCESS_CONTIGS_FILES@
-$draft $onlyassembler -t \${GALAXY_SLOTS:-4} -m \${GALAXY_MEMORY_GB:-250} $iontorrent -k $kmer
+@PREPROCESS_FL_RNA_FILES@
-## Sequence files, libraries
-#for $i, $library in enumerate( $libraries, start=1 ):
-#if str( $library.lib_type ) == "paired_end":
+## run
-#set prefix = 'pe'
+rnaspades.py
-#elif str( $library.lib_type ) == "mate_paired":
+-o 'output'
-#set prefix = 'mp'
+@RESOURCES@
-#elif str( $library.lib_type ) == "nxmate_paired":
+@INPUT_READS_MAIN@
-#set prefix = 'nxmate'
+#if $additional_reads.selector == 'true'
-#else:
+@INPUT_READS_ADDITIONAL@
-#set prefix = 'hqmp'
+#end if
-#end if
+## additional reads
---$prefix$i-$library.orientation
+@FL_RNA@
-#for $file in $library.files
+@NANOPORE_PACBIO@
-#if $file.file_type.type == "separate":
+@CONTIGS@
---$prefix$i-1 fastq:$file.file_type.fwd_reads
+## parameter
---$prefix$i-2 fastq:$file.file_type.rev_reads
+@KMER@
-#elif $file.file_type.type == "interleaved":
+@PIPELINE_OPTIONS@
---$prefix$i-12 fastq:$file.file_type.interleaved_reads
+@PHREDOFFSET@
-#elif $file.file_type.type == "unpaired":
+#if $ss != 'no'
---$prefix$i-s fastq:$file.file_type.unpaired_reads
+--ss '$ss'
-#elif $file.file_type.type == "paired-collection":
+#end if
---$prefix$i-1 fastq:$file.file_type.fastq_collection.forward
+## postprocessing
---$prefix$i-2 fastq:$file.file_type.fastq_collection.reverse
+@CORRECTED@
-#end if
+]]></command>
-#end for
-#end for
-#for $contig in $trusted_contigs:
-#if $contig:
---trusted-contigs $contig.extension:$contig
-#end if
-#end for
-#for $contig in $untrusted_contigs:
-#if $contig:
---untrusted-contigs $contig.extension:$contig
-#end if
-#end for
-]]>
-</command>
 <inputs>
-<param argument="--draft-assembly" checked="False" falsevalue="" label="Draft assembly. Faster, but more error-prone" name="draft" truevalue="--draft-assembly" type="boolean" />
+<expand macro="input_files_all" format="fastq,fastq.gz,fastqsanger.gz,fasta,fasta.gz" label="FASTQ RNA-seq file(s)"/>
-<param argument="--only-assembler" checked="False" falsevalue="" label="Run only assembly? (without read error correction)" name="onlyassembler" truevalue="--only-assembler" type="boolean" />
+<expand macro="input_additional_files_all" format="fastq,fastq.gz,fastqsanger.gz,fasta,fasta.gz" label="FASTQ RNA-seq file(s)"/>
-<param argument="--iontorrent" checked="False" falsevalue="" label="Libraries are IonTorrent reads?" name="iontorrent" truevalue="--iontorrent" type="boolean" />
+<section name="arf" title="Additional read files">
-<param argument="-k" max="127" label="k-mer size (must be odd and less than 128)" name="kmer" type="integer" value="55" />
+<expand macro="flrna"/>
-<repeat help="It is not possible to specify only mate-pair libraries. Scaffolds are not produced if neither a paired-end nor a mate-pair library is provided." min="1" name="libraries" title="Libraries">
+<expand macro="nanopore_pacbio"/>
-<param label="Library type" name="lib_type" type="select">
+<expand macro="contigs"/>
-<option value="paired_end">Paired-end / Single reads</option>
+</section>
-<option value="mate_paired">Mate pairs</option>
+<expand macro="kmer" help="By default rnaSPAdes uses 2 k-mer sizes, which are automatically detected using read length (approximately one third and half of the maximal read length). We recommend not to change this parameter because smaller k-mer sizes typically result in multiple chimeric (misassembled) transcripts."/>
-<option value="high_mate_paired">High Quality Mate pairs</option>
+<expand macro="phred"/>
-<option value="nxmate_paired">Lucigen NxMate pairs</option>
+<param argument="--ss" type="select" label="Set strand specificity" help="rnaSPAdes supports strand-specific RNA-Seq datasets. Use 'RF' when first read in pair corresponds to reverse gene strand (antisense data, e.g. obtained via dUTP protocol) and 'FR' otherwise.  If the dataset is single-end use 'FR' option in case when reads correspond to gene strand and 'RF' otherwise. Note: strand-specificity is not related and should not be confused with FR and RF orientation of paired reads. RNA-Seq paired-end reads typically have forward-reverse orientation, which is assumed by default and no additional options are needed">
-</param>
+<option value="no" selected="true">Disabled</option>
-<param label="Orientation" name="orientation" type="select">
+<option value="fr">FR (normal)</option>
-<option selected="true" value="fr">-&gt; &lt;- (fr)</option>
+<option value="rf">RF (antisense)</option>
-<option value="rf"><![CDATA[<- -> (rf)]]></option>
+</param>
-<option value="ff"><![CDATA[-> -> (ff)]]></option>
+<expand macro="pipeline_options">
-</param>
+<option value="--iontorrent">Iontorrent: although rnaSPAdes supports IonTorrent reads, it was not sufficiently tested on such kind of data (--iontorrent)</option>
-<repeat min="1" name="files" title="Files">
+</expand>
-<conditional name="file_type">
+<param name="optional_output" type="select" multiple="true" optional="false" label="Select optional output file(s)" help="Only shown in history if selected here and generated by the specific run.">
-<param label="Select file format" name="type" type="select">
+<option value="hft">Hard filtered transcripts</option>
-<option value="separate">Separate input files</option>
+<option value="l">Log</option>
-<option value="interleaved">Interleaved files</option>
+<option value="sft">Soft filtered transcripts</option>
-<option value="unpaired">Unpaired/Single reads</option>
+<option value="tr" selected="true">Transcripts</option>
-<option value="paired-collection">Paired List Collection</option>
+<option value="tp">Transcripts paths</option>
 </param>
-<when value="separate">
-<param format="fastq,fastq.gz" help="FASTQ format" label="Forward reads" name="fwd_reads" type="data" />
-<param format="fastq,fastq.gz" help="FASTQ format" label="Reverse reads" name="rev_reads" type="data" />
-</when>
-<when value="interleaved">
-<param format="fastq,fastq.gz" help="FASTQ format" label="Interleaved paired reads" name="interleaved_reads" type="data" />
-</when>
-<when value="unpaired">
-<param format="fastq,fastq.gz" help="FASTQ format" label="Unpaired reads" name="unpaired_reads" type="data" />
-</when>
-<when value="paired-collection">
-<param name="fastq_collection" type="data_collection" collection_type="paired" format="fastq,fastq.gz" label="Paired-end reads collection" help="FASTQ format" />
-</when>
-</conditional>
-</repeat>
-</repeat>
-<param optional="true" format="fasta,fastq,fastq.gz" label="Trusted contigs" multiple="true" name="trusted_contigs" type="data" />
-<param optional="true" format="fasta,fastq,fastq.gz" label="Untrusted contigs" multiple="true" name="untrusted_contigs" type="data" />
 </inputs>
 <outputs>
-<data format="fasta" label="rnaSPAdes transcripts" name="output_transcripts" from_work_dir="transcripts.fasta" />
+<expand macro="out_cr"/>
+<data name="out_hft" format="fasta" from_work_dir="output/hard_filtered_transcripts.fasta" label="${tool.name} on ${on_string}: Hard filtered transcripts">
+<filter>'hft' in optional_output</filter>
+</data>
+<expand macro="out_l"/>
+<data name="out_sft" format="fasta" from_work_dir="output/soft_filtered_transcripts.fasta" label="${tool.name} on ${on_string}: Soft filtered transcripts">
+<filter>'sft' in optional_output</filter>
+</data>
+<data name="out_tr" format="fasta" from_work_dir="output/transcripts.fasta" label="${tool.name} on ${on_string}: Transcripts">
+<filter>'tr' in optional_output</filter>
+</data>
+<data name="out_tp" format="txt" from_work_dir="output/transcripts.paths" label="${tool.name} on ${on_string}: Transcripts paths">
+<filter>'tp' in optional_output</filter>
+</data>
 </outputs>
 <tests>
-<test>
+<!--
-<param name="lib_type" value="paired_end" />
+used in a test:
-<param name="type" value="separate" />
+single library: 12, 1, 2
-<param name="fwd_reads" value="rnaspades-in1-1.fq" ftype="fastq" />
+k, phred-offset, disablerr, iontorrent, only-assembler, ss
-<param name="rev_reads" value="rnaspades-in1-2.fq" ftype="fastq" />
-<output name="output_transcripts" file="rnaspades-out1.fa" ftype="fasta" compare="re_match" lines_diff="1" />
+not used in a test:
-</test>
+single library: merged, s
-<test>
+pacbio, nanopore, trusted-contigs, untrusted-contigs, fl-rna
-<param name="lib_type" value="paired_end" />
+-->
-<param name="type" value="separate" />
-<param name="fwd_reads" value="rnaspades-in1-1.fq.gz" ftype="fastq.gz" />
+<!-- #1 -->
-<param name="rev_reads" value="rnaspades-in1-2.fq.gz" ftype="fastq.gz" />
+<test expect_num_outputs="1">
-<output name="output_transcripts" file="rnaspades-out1.fa" ftype="fasta" compare="re_match" lines_diff="1" />
+<conditional name="singlePaired">
+<param name="sPaired" value="paired_interlaced"/>
+<param name="input1" value="ecoli_1K.fastq.gz"/>
+</conditional>
+<output name="out_tr">
+<assert_contents>
+<has_n_lines n="18"/>
+<has_text_matching expression=">NODE\_1\_length\_1000.+"/>
+</assert_contents>
+</output>
+</test>
+<!-- #2 single, separate, fastq, all outputs custom parameters-->
+<test expect_num_outputs="5">
+<conditional name="singlePaired">
+<param name="sPaired" value="paired"/>
+<param name="input1" value="ecoli_1K_1.fastq.gz"/>
+<param name="input2" value="ecoli_1K_2.fastq.gz"/>
+</conditional>
+<param name="phred_offset" value="33"/>
+<param name="ss" value="fr"/>
+<param name="optional_output" value="hft,l,sft,tr,tp"/>
+<output name="out_hft">
+<assert_contents>
+<has_n_lines n="18"/>
+</assert_contents>
+</output>
+<output name="out_sft">
+<assert_contents>
+<has_n_lines n="18"/>
+</assert_contents>
+</output>
+<output name="out_tr">
+<assert_contents>
+<has_n_lines n="18"/>
+</assert_contents>
+</output>
+<output name="out_tp">
+<assert_contents>
+<has_n_lines n="4"/>
+</assert_contents>
+</output>
+<output name="out_l">
+<assert_contents>
+<has_text_matching expression="Thank you for using SPAdes!"/>
+</assert_contents>
+</output>
+</test>
+<!-- #3 single, separate, fasta, default parameters -->
+<test expect_num_outputs="1">
+<conditional name="singlePaired">
+<param name="sPaired" value="paired"/>
+<param name="input1" value="ecoli_1K_1.fasta.gz"/>
+<param name="input2" value="ecoli_1K_2.fasta.gz"/>
+</conditional>
+<output name="out_tr">
+<assert_contents>
+<has_n_lines n="18"/>
+<has_text_matching expression=">NODE\_1\_length\_1000.+"/>
+</assert_contents>
+</output>
+</test>
+<!-- #3 Collection, default parameters -->
+<test expect_num_outputs="1">
+<conditional name="singlePaired">
+<param name="sPaired" value="paired_collection"/>
+<param name="input">
+<collection type="list:paired">
+<element name="ecoli.fastq">
+<collection type="paired">
+<element name="forward" value="ecoli_1K_1.fastq.gz" ftype="fastqsanger.gz"/>
+<element name="reverse" value="ecoli_1K_2.fastq.gz" ftype="fastqsanger.gz"/>
+</collection>
+</element>
+</collection>
+</param>
+</conditional>
+<output name="out_tr">
+<assert_contents>
+<has_n_lines n="18"/>
+<has_text_matching expression=">NODE\_1\_length\_1000.+"/>
+</assert_contents>
+</output>
+</test>
+<!-- #3 Hibryd assembly -->
+<test expect_num_outputs="1">
+<conditional name="singlePaired">
+<param name="sPaired" value="paired"/>
+<param name="input1" value="ecoli_1K_1.fasta.gz"/>
+<param name="input2" value="ecoli_1K_2.fasta.gz"/>
+</conditional>
+<section name="arf">
+<param name="nanopore" value="ecoli_1K.fastq.gz"/>
+<param name="pacbio" value="ecoli_1K.fastq.gz"/>
+<param name="trusted_contigs" value="ecoli_1K.fasta.gz"/>
+<param name="flrna" value="ecoli_1K.fasta.gz"/>
+</section>
+<assert_command>
+<has_text text="--nanopore"/>
+<has_text text="--pacbio"/>
+<has_text text="--trusted-contigs"/>
+<has_text text="--fl-rna"/>
+</assert_command>
+<output name="out_tr">
+<assert_contents>
+<has_n_lines n="18"/>
+<has_text_matching expression=">NODE\_1\_length\_1000.+"/>
+</assert_contents>
+</output>
 </test>
 </tests>
-<help>
+<help><![CDATA[
+.. class:: infomark
 **What it does**
-SPAdes – St. Petersburg genome assembler – is intended for both standard isolates and single-cell MDA bacteria assemblies. See http://bioinf.spbau.ru/en/spades for more details on SPAdes.
+@HELP_WID@
-This wrapper runs SPAdes 3.9.0, collects the output, and throws away all the temporary files.
+rnaSPAdes is a subtool for de novo transcriptome assembly from RNA-Seq data and is suitable for all kinds of organisms.
-**License**
+**Input**
-SPAdes is developed by and copyrighted to Saint-Petersburg Academic University, and is released under GPLv2.
+rnaSPAdes take as an input at least one paired-end or single-end library. For hybrid assembly you can use PacBio or Oxford Nanopore reads.
-The original wrapper was written by Lionel Guy, Philip Mabon and was released under the GNU General Public License as published by the Free Software Foundation. The rnaSPAdes extension was developed by the Galaxy team.
+In case you have sequenced several RNA-Seq libraries using the same protocol from different tissues / conditions, and the goal as to assemble a total transcriptome,
+we suggest to provide all files as a single library. Note, that sequencing using the same protocol implies that the resulting reads have the same length, insert size
-This program is distributed in the hope that it will be useful, but WITHOUT ANY WARRANTY; without even the implied warranty of MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU General Public License for more details.
+and strand-specificity. Transcript quantification for each sample can be done afterwards by separately mapping reads from each library to the assembled transcripts.
-You should have received a copy of the GNU General Public License along with this program.  If not, see http://www.gnu.org/licenses/.
+**Output**
-** Acknowledgments **
+@HELP_OUT_AG@
+@HELP_OUT_AGS@
-Anton Korobeynikov greatlty helped understanding how SPAdes work, and integrated handy features into SPAdes.
+@HELP_OUT_CR@
+- Hard filtered transcripts includes only long and reliable transcripts with rather high expression
-Nicola Soranzo fixed various bugs.
+@HELP_OUT_L@
-</help>
+- Soft filtered transcripts includes short and low-expressed transcipts, likely to contain junk sequences
-<citations>
+- Transcripts
-<citation type="doi">10.1089/cmb.2012.0021</citation>
+- Transcripts paths
-</citations>
+.. class:: infomark
+**References**
+More information can be found on on `github <https://github.com/ablab/spades>`_ and on the `project website <http://cab.spbu.ru/software/rnaspades>`_.
+]]></help>
+<expand macro="citations">
+<citation type="doi">10.1101/420208</citation>
+</expand>
 </tool>

Mercurial > repos > iuc > rnaspades

comparison rnaspades.xml @ 6:b66de1e9abfb draft