Mercurial > repos > jjohnson > check_strandedness
comparison check_strandedness.xml @ 0:0e1c639fc077 draft default tip
planemo upload for repository https://github.com/jj-umn/galaxytools/tree/master/check_strandedness commit e4c16166c27dff3e638817f7d6fc5fde0434edb7-dirty
author | jjohnson |
---|---|
date | Sat, 08 Oct 2022 17:00:18 +0000 |
parents | |
children |
comparison
equal
deleted
inserted
replaced
-1:000000000000 | 0:0e1c639fc077 |
---|---|
1 <tool id="check_strandedness" name="Check Strandedness" version="@TOOL_VERSION@+galaxy@VERSION_SUFFIX@" python_template_version="3.5" profile="21.05"> | |
2 <description>using how_are_we_stranded_here</description> | |
3 <macros> | |
4 <token name="@TOOL_VERSION@">1.0.1</token> | |
5 <token name="@VERSION_SUFFIX@">0</token> | |
6 </macros> | |
7 <requirements> | |
8 <!-- pandas in how_are_we_stranded_here 1.0.1 does work with python 3.8 + --> | |
9 <requirement type="package" version="3.7">python</requirement> | |
10 <requirement type="package" version="@TOOL_VERSION@">how_are_we_stranded_here</requirement> | |
11 </requirements> | |
12 <command detect_errors="exit_code"><![CDATA[ | |
13 #if $reads.type == 'paired': | |
14 ln -s '$reads.input_read1' reads1.fq && | |
15 ln -s '$reads.input_read2' reads2.fq && | |
16 #elif $reads.type == 'paired_collection': | |
17 ln -s '$reads.input_readpair.forward' reads1.fq && | |
18 ln -s '$reads.input_readpair.reverse' reads1.fq && | |
19 #end if | |
20 #if $kallisto_index | |
21 ln -s '$kallisto_index' kallisto_index && | |
22 #end if | |
23 check_strandedness | |
24 --gtf '$gtf' | |
25 --transcripts '$transcripts' | |
26 --kallisto_index kallisto_index | |
27 --reads_1 reads1.fq | |
28 --reads_2 reads1.fq | |
29 #if $nreads | |
30 --nreads $nreads | |
31 #end if | |
32 $print_commands | |
33 > $log | |
34 ]]></command> | |
35 <inputs> | |
36 <conditional name="reads"> | |
37 <param name="type" type="select" label="Library type of FASTQ"> | |
38 <option value="paired">Paired-end</option> | |
39 <option value="paired_collection">Paired-end Dataset Collection</option> | |
40 </param> | |
41 <when value="paired"> | |
42 <param name="input_read1" argument="--reads_1" type="data" format="fastq,fastq.gz" label="Reads #1 in FASTQ format" /> | |
43 <param name="input_read2" argument="--reads_2" type="data" format="fastq,fastq.gz" label="Reads #2 in FASTQ format" /> | |
44 </when> | |
45 <when value="paired_collection"> | |
46 <param name="input_readpair" type="data_collection" collection_type="paired" format="fastq,fastq.gz" label="Paired Reads in FASTQ format" /> | |
47 </when> | |
48 </conditional> | |
49 <param argument="--gtf" type="data" format="gtf" label="Reference Genome GTF file" /> | |
50 <param argument="--transcripts" type="data" format="fasta" label="Reference Genome Transcripts cdna FASTA" /> | |
51 <param argument="--kallisto_index" type="data" format="binary" optional="true" label="kallisto_index from previous check_strandedness job" help="must be from the same Transcripts cdna fasta"/> | |
52 <param argument="--nreads" type="integer" value="" min="1" optional="true" label="Number of reads to sample" help="Default: 200000"/> | |
53 <param argument="--print_commands" type="boolean" truevalue="--print_commands" falsevalue="" checked="false" label="print commands"/> | |
54 </inputs> | |
55 <outputs> | |
56 <data name="log" format="txt" label="${tool.name} on ${on_string}: log" /> | |
57 <data name="index" format="binary" label="${tool.name} $transcripts.name kallisto_index" from_work_dir="kallisto_index"> | |
58 <filter>kallisto_index is None</filter> | |
59 </data> | |
60 <data name="output" format="txt" label="${tool.name} on ${on_string}: strandedness_check" from_work_dir="stranded_test_reads1/strandedness_check.txt"/> | |
61 </outputs> | |
62 <tests> | |
63 <test> | |
64 <conditional name="reads"> | |
65 <param name="type" value="paired"/> | |
66 <param name="input_read1" ftype="fastq.gz" value="hg38_F.fq.gz"/> | |
67 <param name="input_read2" ftype="fastq.gz" value="hg38_R.fq.gz"/> | |
68 </conditional> | |
69 <param name="gtf" ftype="gtf" value="hg38.gtf"/> | |
70 <param name="transcripts" ftype="fasta" value="hg38_transcripts.fa"/> | |
71 <param name="nreads" value="700"/> | |
72 <output name="log"> | |
73 <assert_contents> | |
74 <has_text_matching expression="This is PairEnd Data"/> | |
75 <has_text_matching expression="Fraction of reads .* of explainable reads"/> | |
76 </assert_contents> | |
77 </output> | |
78 </test> | |
79 </tests> | |
80 <help><![CDATA[ | |
81 **check_strandedness** | |
82 | |
83 The **how_are_we_stranded_here** check_strandedness_ provide a quick determination of RNA-Seq strandedness. | |
84 | |
85 https://github.com/signalbash/how_are_we_stranded_here | |
86 | |
87 check_strandedness runs a series of commands to check which direction reads align once mapped in transcripts. | |
88 It first creates a kallisto index of your organisms transcriptome. | |
89 It then maps a small subset of reads (default 200000) to the transcriptome, and uses kallisto's --genomebam argument to project pseudoalignments to genome sorted BAM file. | |
90 It finally runs RSeQC's infer_experiment.py to check which direction reads from the first and second pairs are aligned in relation to the transcript strand, and provides output with the likely strandedness of your data. | |
91 | |
92 | |
93 ** SAMPLE OUTPUT ** | |
94 | |
95 :: | |
96 | |
97 This is PairEnd Data | |
98 Fraction of reads failed to determine: 0.0595 | |
99 Fraction of reads explained by "1++,1--,2+-,2-+": 0.0073 (0.8% of explainable reads) | |
100 Fraction of reads explained by "1+-,1-+,2++,2--": 0.9332 (99.2% of explainable reads) | |
101 Over 90% of reads explained by "1+-,1-+,2++,2--" | |
102 Data is likely RF/fr-firststrand | |
103 | |
104 .. _how_are_we_stranded_here: https://github.com/signalbash/how_are_we_stranded_here | |
105 .. _check_strandedness: https://github.com/signalbash/how_are_we_stranded_here | |
106 ]]></help> | |
107 <citations> | |
108 <citation type="doi">10.1186/s12859-022-04572-7</citation> | |
109 </citations> | |
110 </tool> |