comparison check_strandedness.xml @ 0:0e1c639fc077 draft default tip

planemo upload for repository https://github.com/jj-umn/galaxytools/tree/master/check_strandedness commit e4c16166c27dff3e638817f7d6fc5fde0434edb7-dirty
author jjohnson
date Sat, 08 Oct 2022 17:00:18 +0000
parents
children
comparison
equal deleted inserted replaced
-1:000000000000 0:0e1c639fc077
1 <tool id="check_strandedness" name="Check Strandedness" version="@TOOL_VERSION@+galaxy@VERSION_SUFFIX@" python_template_version="3.5" profile="21.05">
2 <description>using how_are_we_stranded_here</description>
3 <macros>
4 <token name="@TOOL_VERSION@">1.0.1</token>
5 <token name="@VERSION_SUFFIX@">0</token>
6 </macros>
7 <requirements>
8 <!-- pandas in how_are_we_stranded_here 1.0.1 does work with python 3.8 + -->
9 <requirement type="package" version="3.7">python</requirement>
10 <requirement type="package" version="@TOOL_VERSION@">how_are_we_stranded_here</requirement>
11 </requirements>
12 <command detect_errors="exit_code"><![CDATA[
13 #if $reads.type == 'paired':
14 ln -s '$reads.input_read1' reads1.fq &&
15 ln -s '$reads.input_read2' reads2.fq &&
16 #elif $reads.type == 'paired_collection':
17 ln -s '$reads.input_readpair.forward' reads1.fq &&
18 ln -s '$reads.input_readpair.reverse' reads1.fq &&
19 #end if
20 #if $kallisto_index
21 ln -s '$kallisto_index' kallisto_index &&
22 #end if
23 check_strandedness
24 --gtf '$gtf'
25 --transcripts '$transcripts'
26 --kallisto_index kallisto_index
27 --reads_1 reads1.fq
28 --reads_2 reads1.fq
29 #if $nreads
30 --nreads $nreads
31 #end if
32 $print_commands
33 > $log
34 ]]></command>
35 <inputs>
36 <conditional name="reads">
37 <param name="type" type="select" label="Library type of FASTQ">
38 <option value="paired">Paired-end</option>
39 <option value="paired_collection">Paired-end Dataset Collection</option>
40 </param>
41 <when value="paired">
42 <param name="input_read1" argument="--reads_1" type="data" format="fastq,fastq.gz" label="Reads #1 in FASTQ format" />
43 <param name="input_read2" argument="--reads_2" type="data" format="fastq,fastq.gz" label="Reads #2 in FASTQ format" />
44 </when>
45 <when value="paired_collection">
46 <param name="input_readpair" type="data_collection" collection_type="paired" format="fastq,fastq.gz" label="Paired Reads in FASTQ format" />
47 </when>
48 </conditional>
49 <param argument="--gtf" type="data" format="gtf" label="Reference Genome GTF file" />
50 <param argument="--transcripts" type="data" format="fasta" label="Reference Genome Transcripts cdna FASTA" />
51 <param argument="--kallisto_index" type="data" format="binary" optional="true" label="kallisto_index from previous check_strandedness job" help="must be from the same Transcripts cdna fasta"/>
52 <param argument="--nreads" type="integer" value="" min="1" optional="true" label="Number of reads to sample" help="Default: 200000"/>
53 <param argument="--print_commands" type="boolean" truevalue="--print_commands" falsevalue="" checked="false" label="print commands"/>
54 </inputs>
55 <outputs>
56 <data name="log" format="txt" label="${tool.name} on ${on_string}: log" />
57 <data name="index" format="binary" label="${tool.name} $transcripts.name kallisto_index" from_work_dir="kallisto_index">
58 <filter>kallisto_index is None</filter>
59 </data>
60 <data name="output" format="txt" label="${tool.name} on ${on_string}: strandedness_check" from_work_dir="stranded_test_reads1/strandedness_check.txt"/>
61 </outputs>
62 <tests>
63 <test>
64 <conditional name="reads">
65 <param name="type" value="paired"/>
66 <param name="input_read1" ftype="fastq.gz" value="hg38_F.fq.gz"/>
67 <param name="input_read2" ftype="fastq.gz" value="hg38_R.fq.gz"/>
68 </conditional>
69 <param name="gtf" ftype="gtf" value="hg38.gtf"/>
70 <param name="transcripts" ftype="fasta" value="hg38_transcripts.fa"/>
71 <param name="nreads" value="700"/>
72 <output name="log">
73 <assert_contents>
74 <has_text_matching expression="This is PairEnd Data"/>
75 <has_text_matching expression="Fraction of reads .* of explainable reads"/>
76 </assert_contents>
77 </output>
78 </test>
79 </tests>
80 <help><![CDATA[
81 **check_strandedness**
82
83 The **how_are_we_stranded_here** check_strandedness_ provide a quick determination of RNA-Seq strandedness.
84
85 https://github.com/signalbash/how_are_we_stranded_here
86
87 check_strandedness runs a series of commands to check which direction reads align once mapped in transcripts.
88 It first creates a kallisto index of your organisms transcriptome.
89 It then maps a small subset of reads (default 200000) to the transcriptome, and uses kallisto's --genomebam argument to project pseudoalignments to genome sorted BAM file.
90 It finally runs RSeQC's infer_experiment.py to check which direction reads from the first and second pairs are aligned in relation to the transcript strand, and provides output with the likely strandedness of your data.
91
92
93 ** SAMPLE OUTPUT **
94
95 ::
96
97 This is PairEnd Data
98 Fraction of reads failed to determine: 0.0595
99 Fraction of reads explained by "1++,1--,2+-,2-+": 0.0073 (0.8% of explainable reads)
100 Fraction of reads explained by "1+-,1-+,2++,2--": 0.9332 (99.2% of explainable reads)
101 Over 90% of reads explained by "1+-,1-+,2++,2--"
102 Data is likely RF/fr-firststrand
103
104 .. _how_are_we_stranded_here: https://github.com/signalbash/how_are_we_stranded_here
105 .. _check_strandedness: https://github.com/signalbash/how_are_we_stranded_here
106 ]]></help>
107 <citations>
108 <citation type="doi">10.1186/s12859-022-04572-7</citation>
109 </citations>
110 </tool>