annotate arriba.xml @ 0:5ebf2354cc9b draft

"planemo upload for repository https://github.com/jj-umn/tools-iuc/tree/arriba/tools/arriba commit 52c9f9825debe783339c13bd1da9a42b59747bd2"
author jjohnson
date Thu, 07 Oct 2021 11:47:02 +0000
parents
children 9f2665b32c45
Ignore whitespace changes - Everywhere: Within whitespace: At end of lines:
rev   line source
0
5ebf2354cc9b "planemo upload for repository https://github.com/jj-umn/tools-iuc/tree/arriba/tools/arriba commit 52c9f9825debe783339c13bd1da9a42b59747bd2"
jjohnson
parents:
diff changeset
1 <tool id="arriba" name="Arriba" version="@TOOL_VERSION@+galaxy@VERSION_SUFFIX@" python_template_version="3.5">
5ebf2354cc9b "planemo upload for repository https://github.com/jj-umn/tools-iuc/tree/arriba/tools/arriba commit 52c9f9825debe783339c13bd1da9a42b59747bd2"
jjohnson
parents:
diff changeset
2 <description>detect gene fusions from STAR aligned RNA-Seq data</description>
5ebf2354cc9b "planemo upload for repository https://github.com/jj-umn/tools-iuc/tree/arriba/tools/arriba commit 52c9f9825debe783339c13bd1da9a42b59747bd2"
jjohnson
parents:
diff changeset
3 <macros>
5ebf2354cc9b "planemo upload for repository https://github.com/jj-umn/tools-iuc/tree/arriba/tools/arriba commit 52c9f9825debe783339c13bd1da9a42b59747bd2"
jjohnson
parents:
diff changeset
4 <import>macros.xml</import>
5ebf2354cc9b "planemo upload for repository https://github.com/jj-umn/tools-iuc/tree/arriba/tools/arriba commit 52c9f9825debe783339c13bd1da9a42b59747bd2"
jjohnson
parents:
diff changeset
5 </macros>
5ebf2354cc9b "planemo upload for repository https://github.com/jj-umn/tools-iuc/tree/arriba/tools/arriba commit 52c9f9825debe783339c13bd1da9a42b59747bd2"
jjohnson
parents:
diff changeset
6 <expand macro="requirements" />
5ebf2354cc9b "planemo upload for repository https://github.com/jj-umn/tools-iuc/tree/arriba/tools/arriba commit 52c9f9825debe783339c13bd1da9a42b59747bd2"
jjohnson
parents:
diff changeset
7 <expand macro="version_command" />
5ebf2354cc9b "planemo upload for repository https://github.com/jj-umn/tools-iuc/tree/arriba/tools/arriba commit 52c9f9825debe783339c13bd1da9a42b59747bd2"
jjohnson
parents:
diff changeset
8 <command detect_errors="exit_code"><![CDATA[
5ebf2354cc9b "planemo upload for repository https://github.com/jj-umn/tools-iuc/tree/arriba/tools/arriba commit 52c9f9825debe783339c13bd1da9a42b59747bd2"
jjohnson
parents:
diff changeset
9 arriba
5ebf2354cc9b "planemo upload for repository https://github.com/jj-umn/tools-iuc/tree/arriba/tools/arriba commit 52c9f9825debe783339c13bd1da9a42b59747bd2"
jjohnson
parents:
diff changeset
10 -x '$input'
5ebf2354cc9b "planemo upload for repository https://github.com/jj-umn/tools-iuc/tree/arriba/tools/arriba commit 52c9f9825debe783339c13bd1da9a42b59747bd2"
jjohnson
parents:
diff changeset
11 #if $chimeric
5ebf2354cc9b "planemo upload for repository https://github.com/jj-umn/tools-iuc/tree/arriba/tools/arriba commit 52c9f9825debe783339c13bd1da9a42b59747bd2"
jjohnson
parents:
diff changeset
12 -c '$chimeric'
5ebf2354cc9b "planemo upload for repository https://github.com/jj-umn/tools-iuc/tree/arriba/tools/arriba commit 52c9f9825debe783339c13bd1da9a42b59747bd2"
jjohnson
parents:
diff changeset
13 #endif
5ebf2354cc9b "planemo upload for repository https://github.com/jj-umn/tools-iuc/tree/arriba/tools/arriba commit 52c9f9825debe783339c13bd1da9a42b59747bd2"
jjohnson
parents:
diff changeset
14 -a '$genome_assembly'
5ebf2354cc9b "planemo upload for repository https://github.com/jj-umn/tools-iuc/tree/arriba/tools/arriba commit 52c9f9825debe783339c13bd1da9a42b59747bd2"
jjohnson
parents:
diff changeset
15 -g '$gtf'
5ebf2354cc9b "planemo upload for repository https://github.com/jj-umn/tools-iuc/tree/arriba/tools/arriba commit 52c9f9825debe783339c13bd1da9a42b59747bd2"
jjohnson
parents:
diff changeset
16 -b '$blacklist'
5ebf2354cc9b "planemo upload for repository https://github.com/jj-umn/tools-iuc/tree/arriba/tools/arriba commit 52c9f9825debe783339c13bd1da9a42b59747bd2"
jjohnson
parents:
diff changeset
17 #if $protein_domains
5ebf2354cc9b "planemo upload for repository https://github.com/jj-umn/tools-iuc/tree/arriba/tools/arriba commit 52c9f9825debe783339c13bd1da9a42b59747bd2"
jjohnson
parents:
diff changeset
18 -p '$protein_domains'
5ebf2354cc9b "planemo upload for repository https://github.com/jj-umn/tools-iuc/tree/arriba/tools/arriba commit 52c9f9825debe783339c13bd1da9a42b59747bd2"
jjohnson
parents:
diff changeset
19 #endif
5ebf2354cc9b "planemo upload for repository https://github.com/jj-umn/tools-iuc/tree/arriba/tools/arriba commit 52c9f9825debe783339c13bd1da9a42b59747bd2"
jjohnson
parents:
diff changeset
20 #if $known_fusions
5ebf2354cc9b "planemo upload for repository https://github.com/jj-umn/tools-iuc/tree/arriba/tools/arriba commit 52c9f9825debe783339c13bd1da9a42b59747bd2"
jjohnson
parents:
diff changeset
21 -k '$known_fusions'
5ebf2354cc9b "planemo upload for repository https://github.com/jj-umn/tools-iuc/tree/arriba/tools/arriba commit 52c9f9825debe783339c13bd1da9a42b59747bd2"
jjohnson
parents:
diff changeset
22 #endif
5ebf2354cc9b "planemo upload for repository https://github.com/jj-umn/tools-iuc/tree/arriba/tools/arriba commit 52c9f9825debe783339c13bd1da9a42b59747bd2"
jjohnson
parents:
diff changeset
23 #if $tags
5ebf2354cc9b "planemo upload for repository https://github.com/jj-umn/tools-iuc/tree/arriba/tools/arriba commit 52c9f9825debe783339c13bd1da9a42b59747bd2"
jjohnson
parents:
diff changeset
24 -t '$tags'
5ebf2354cc9b "planemo upload for repository https://github.com/jj-umn/tools-iuc/tree/arriba/tools/arriba commit 52c9f9825debe783339c13bd1da9a42b59747bd2"
jjohnson
parents:
diff changeset
25 #endif
5ebf2354cc9b "planemo upload for repository https://github.com/jj-umn/tools-iuc/tree/arriba/tools/arriba commit 52c9f9825debe783339c13bd1da9a42b59747bd2"
jjohnson
parents:
diff changeset
26 -o fusions.tsv
5ebf2354cc9b "planemo upload for repository https://github.com/jj-umn/tools-iuc/tree/arriba/tools/arriba commit 52c9f9825debe783339c13bd1da9a42b59747bd2"
jjohnson
parents:
diff changeset
27 -O fusions.discarded.tsv
5ebf2354cc9b "planemo upload for repository https://github.com/jj-umn/tools-iuc/tree/arriba/tools/arriba commit 52c9f9825debe783339c13bd1da9a42b59747bd2"
jjohnson
parents:
diff changeset
28 ]]></command>
5ebf2354cc9b "planemo upload for repository https://github.com/jj-umn/tools-iuc/tree/arriba/tools/arriba commit 52c9f9825debe783339c13bd1da9a42b59747bd2"
jjohnson
parents:
diff changeset
29 <inputs>
5ebf2354cc9b "planemo upload for repository https://github.com/jj-umn/tools-iuc/tree/arriba/tools/arriba commit 52c9f9825debe783339c13bd1da9a42b59747bd2"
jjohnson
parents:
diff changeset
30 <param name="input" argument="-x" type="data" format="sam,bam,cram" label="STAR Aligned.out.sam"/>
5ebf2354cc9b "planemo upload for repository https://github.com/jj-umn/tools-iuc/tree/arriba/tools/arriba commit 52c9f9825debe783339c13bd1da9a42b59747bd2"
jjohnson
parents:
diff changeset
31 <param name="chimeric" argument="-c" type="data" format="sam,bam,cram" optional="true" label="STAR Chimeric.out.sam">
5ebf2354cc9b "planemo upload for repository https://github.com/jj-umn/tools-iuc/tree/arriba/tools/arriba commit 52c9f9825debe783339c13bd1da9a42b59747bd2"
jjohnson
parents:
diff changeset
32 <help><![CDATA[ Only required if STAR was run with the parameter '--chimOutType SeparateSAMold'. ]]></help>
5ebf2354cc9b "planemo upload for repository https://github.com/jj-umn/tools-iuc/tree/arriba/tools/arriba commit 52c9f9825debe783339c13bd1da9a42b59747bd2"
jjohnson
parents:
diff changeset
33 </param>
5ebf2354cc9b "planemo upload for repository https://github.com/jj-umn/tools-iuc/tree/arriba/tools/arriba commit 52c9f9825debe783339c13bd1da9a42b59747bd2"
jjohnson
parents:
diff changeset
34 <param name="genome_assembly" argument="-a" type="data" format="fasta" label="genome assembly fasta"/>
5ebf2354cc9b "planemo upload for repository https://github.com/jj-umn/tools-iuc/tree/arriba/tools/arriba commit 52c9f9825debe783339c13bd1da9a42b59747bd2"
jjohnson
parents:
diff changeset
35 <param name="gtf" argument="-g" type="data" format="gtf" label="GTF file with gene annotation"/>
5ebf2354cc9b "planemo upload for repository https://github.com/jj-umn/tools-iuc/tree/arriba/tools/arriba commit 52c9f9825debe783339c13bd1da9a42b59747bd2"
jjohnson
parents:
diff changeset
36 <param name="blacklist" argument="-b" type="data" format="tabular" label="File containing blacklisted ranges."/>
5ebf2354cc9b "planemo upload for repository https://github.com/jj-umn/tools-iuc/tree/arriba/tools/arriba commit 52c9f9825debe783339c13bd1da9a42b59747bd2"
jjohnson
parents:
diff changeset
37 <param name="protein_domains" argument="-p" type="data" format="gff3" optional="true" label="File containing protein domains"/>
5ebf2354cc9b "planemo upload for repository https://github.com/jj-umn/tools-iuc/tree/arriba/tools/arriba commit 52c9f9825debe783339c13bd1da9a42b59747bd2"
jjohnson
parents:
diff changeset
38 <param name="known_fusions" argument="-k" type="data" format="tabular" optional="true" label="File containing known fusions">
5ebf2354cc9b "planemo upload for repository https://github.com/jj-umn/tools-iuc/tree/arriba/tools/arriba commit 52c9f9825debe783339c13bd1da9a42b59747bd2"
jjohnson
parents:
diff changeset
39 <help><![CDATA[ File with two TAB-separated columns: five-prime region and three-prime region. ]]></help>
5ebf2354cc9b "planemo upload for repository https://github.com/jj-umn/tools-iuc/tree/arriba/tools/arriba commit 52c9f9825debe783339c13bd1da9a42b59747bd2"
jjohnson
parents:
diff changeset
40 </param>
5ebf2354cc9b "planemo upload for repository https://github.com/jj-umn/tools-iuc/tree/arriba/tools/arriba commit 52c9f9825debe783339c13bd1da9a42b59747bd2"
jjohnson
parents:
diff changeset
41 <param name="tags" argument="-t" type="data" format="tabular" optional="true" label="File containing tag names for a fusion."/>
5ebf2354cc9b "planemo upload for repository https://github.com/jj-umn/tools-iuc/tree/arriba/tools/arriba commit 52c9f9825debe783339c13bd1da9a42b59747bd2"
jjohnson
parents:
diff changeset
42 </inputs>
5ebf2354cc9b "planemo upload for repository https://github.com/jj-umn/tools-iuc/tree/arriba/tools/arriba commit 52c9f9825debe783339c13bd1da9a42b59747bd2"
jjohnson
parents:
diff changeset
43 <outputs>
5ebf2354cc9b "planemo upload for repository https://github.com/jj-umn/tools-iuc/tree/arriba/tools/arriba commit 52c9f9825debe783339c13bd1da9a42b59747bd2"
jjohnson
parents:
diff changeset
44 <data name="fusions" format="tabular" label="${tool.name} on ${on_string}: fusions.tsv" from_work_dir="fusions.tsv"/>
5ebf2354cc9b "planemo upload for repository https://github.com/jj-umn/tools-iuc/tree/arriba/tools/arriba commit 52c9f9825debe783339c13bd1da9a42b59747bd2"
jjohnson
parents:
diff changeset
45 <data name="discarded" format="tabular" label="${tool.name} on ${on_string}: fusions.discarded.tsv" from_work_dir="fusions.discarded.tsv"/>
5ebf2354cc9b "planemo upload for repository https://github.com/jj-umn/tools-iuc/tree/arriba/tools/arriba commit 52c9f9825debe783339c13bd1da9a42b59747bd2"
jjohnson
parents:
diff changeset
46 </outputs>
5ebf2354cc9b "planemo upload for repository https://github.com/jj-umn/tools-iuc/tree/arriba/tools/arriba commit 52c9f9825debe783339c13bd1da9a42b59747bd2"
jjohnson
parents:
diff changeset
47 <help><![CDATA[
5ebf2354cc9b "planemo upload for repository https://github.com/jj-umn/tools-iuc/tree/arriba/tools/arriba commit 52c9f9825debe783339c13bd1da9a42b59747bd2"
jjohnson
parents:
diff changeset
48
5ebf2354cc9b "planemo upload for repository https://github.com/jj-umn/tools-iuc/tree/arriba/tools/arriba commit 52c9f9825debe783339c13bd1da9a42b59747bd2"
jjohnson
parents:
diff changeset
49 arriba -h
5ebf2354cc9b "planemo upload for repository https://github.com/jj-umn/tools-iuc/tree/arriba/tools/arriba commit 52c9f9825debe783339c13bd1da9a42b59747bd2"
jjohnson
parents:
diff changeset
50 [2021-10-06T19:04:33] Launching Arriba 2.1.0
5ebf2354cc9b "planemo upload for repository https://github.com/jj-umn/tools-iuc/tree/arriba/tools/arriba commit 52c9f9825debe783339c13bd1da9a42b59747bd2"
jjohnson
parents:
diff changeset
51
5ebf2354cc9b "planemo upload for repository https://github.com/jj-umn/tools-iuc/tree/arriba/tools/arriba commit 52c9f9825debe783339c13bd1da9a42b59747bd2"
jjohnson
parents:
diff changeset
52 Arriba gene fusion detector
5ebf2354cc9b "planemo upload for repository https://github.com/jj-umn/tools-iuc/tree/arriba/tools/arriba commit 52c9f9825debe783339c13bd1da9a42b59747bd2"
jjohnson
parents:
diff changeset
53 ---------------------------
5ebf2354cc9b "planemo upload for repository https://github.com/jj-umn/tools-iuc/tree/arriba/tools/arriba commit 52c9f9825debe783339c13bd1da9a42b59747bd2"
jjohnson
parents:
diff changeset
54 Version: 2.1.0
5ebf2354cc9b "planemo upload for repository https://github.com/jj-umn/tools-iuc/tree/arriba/tools/arriba commit 52c9f9825debe783339c13bd1da9a42b59747bd2"
jjohnson
parents:
diff changeset
55
5ebf2354cc9b "planemo upload for repository https://github.com/jj-umn/tools-iuc/tree/arriba/tools/arriba commit 52c9f9825debe783339c13bd1da9a42b59747bd2"
jjohnson
parents:
diff changeset
56 Arriba is a fast tool to search for aberrant transcripts such as gene fusions.
5ebf2354cc9b "planemo upload for repository https://github.com/jj-umn/tools-iuc/tree/arriba/tools/arriba commit 52c9f9825debe783339c13bd1da9a42b59747bd2"
jjohnson
parents:
diff changeset
57 It is based on chimeric alignments found by the STAR RNA-Seq aligner.
5ebf2354cc9b "planemo upload for repository https://github.com/jj-umn/tools-iuc/tree/arriba/tools/arriba commit 52c9f9825debe783339c13bd1da9a42b59747bd2"
jjohnson
parents:
diff changeset
58
5ebf2354cc9b "planemo upload for repository https://github.com/jj-umn/tools-iuc/tree/arriba/tools/arriba commit 52c9f9825debe783339c13bd1da9a42b59747bd2"
jjohnson
parents:
diff changeset
59 Usage: arriba [-c Chimeric.out.sam] -x Aligned.out.bam \
5ebf2354cc9b "planemo upload for repository https://github.com/jj-umn/tools-iuc/tree/arriba/tools/arriba commit 52c9f9825debe783339c13bd1da9a42b59747bd2"
jjohnson
parents:
diff changeset
60 -g annotation.gtf -a assembly.fa [-b blacklists.tsv] [-k known_fusions.tsv] \
5ebf2354cc9b "planemo upload for repository https://github.com/jj-umn/tools-iuc/tree/arriba/tools/arriba commit 52c9f9825debe783339c13bd1da9a42b59747bd2"
jjohnson
parents:
diff changeset
61 [-t tags.tsv] [-p protein_domains.gff3] [-d structural_variants_from_WGS.tsv] \
5ebf2354cc9b "planemo upload for repository https://github.com/jj-umn/tools-iuc/tree/arriba/tools/arriba commit 52c9f9825debe783339c13bd1da9a42b59747bd2"
jjohnson
parents:
diff changeset
62 -o fusions.tsv [-O fusions.discarded.tsv] \
5ebf2354cc9b "planemo upload for repository https://github.com/jj-umn/tools-iuc/tree/arriba/tools/arriba commit 52c9f9825debe783339c13bd1da9a42b59747bd2"
jjohnson
parents:
diff changeset
63 [OPTIONS]
5ebf2354cc9b "planemo upload for repository https://github.com/jj-umn/tools-iuc/tree/arriba/tools/arriba commit 52c9f9825debe783339c13bd1da9a42b59747bd2"
jjohnson
parents:
diff changeset
64
5ebf2354cc9b "planemo upload for repository https://github.com/jj-umn/tools-iuc/tree/arriba/tools/arriba commit 52c9f9825debe783339c13bd1da9a42b59747bd2"
jjohnson
parents:
diff changeset
65 -c FILE File in SAM/BAM/CRAM format with chimeric alignments as generated by STAR
5ebf2354cc9b "planemo upload for repository https://github.com/jj-umn/tools-iuc/tree/arriba/tools/arriba commit 52c9f9825debe783339c13bd1da9a42b59747bd2"
jjohnson
parents:
diff changeset
66 (Chimeric.out.sam). This parameter is only required, if STAR was run with the
5ebf2354cc9b "planemo upload for repository https://github.com/jj-umn/tools-iuc/tree/arriba/tools/arriba commit 52c9f9825debe783339c13bd1da9a42b59747bd2"
jjohnson
parents:
diff changeset
67 parameter '--chimOutType SeparateSAMold'. When STAR was run with the parameter
5ebf2354cc9b "planemo upload for repository https://github.com/jj-umn/tools-iuc/tree/arriba/tools/arriba commit 52c9f9825debe783339c13bd1da9a42b59747bd2"
jjohnson
parents:
diff changeset
68 '--chimOutType WithinBAM', it suffices to pass the parameter -x to Arriba and -c
5ebf2354cc9b "planemo upload for repository https://github.com/jj-umn/tools-iuc/tree/arriba/tools/arriba commit 52c9f9825debe783339c13bd1da9a42b59747bd2"
jjohnson
parents:
diff changeset
69 can be omitted.
5ebf2354cc9b "planemo upload for repository https://github.com/jj-umn/tools-iuc/tree/arriba/tools/arriba commit 52c9f9825debe783339c13bd1da9a42b59747bd2"
jjohnson
parents:
diff changeset
70
5ebf2354cc9b "planemo upload for repository https://github.com/jj-umn/tools-iuc/tree/arriba/tools/arriba commit 52c9f9825debe783339c13bd1da9a42b59747bd2"
jjohnson
parents:
diff changeset
71 -x FILE File in SAM/BAM/CRAM format with main alignments as generated by STAR
5ebf2354cc9b "planemo upload for repository https://github.com/jj-umn/tools-iuc/tree/arriba/tools/arriba commit 52c9f9825debe783339c13bd1da9a42b59747bd2"
jjohnson
parents:
diff changeset
72 (Aligned.out.sam). Arriba extracts candidate reads from this file.
5ebf2354cc9b "planemo upload for repository https://github.com/jj-umn/tools-iuc/tree/arriba/tools/arriba commit 52c9f9825debe783339c13bd1da9a42b59747bd2"
jjohnson
parents:
diff changeset
73
5ebf2354cc9b "planemo upload for repository https://github.com/jj-umn/tools-iuc/tree/arriba/tools/arriba commit 52c9f9825debe783339c13bd1da9a42b59747bd2"
jjohnson
parents:
diff changeset
74 -g FILE GTF file with gene annotation. The file may be gzip-compressed.
5ebf2354cc9b "planemo upload for repository https://github.com/jj-umn/tools-iuc/tree/arriba/tools/arriba commit 52c9f9825debe783339c13bd1da9a42b59747bd2"
jjohnson
parents:
diff changeset
75
5ebf2354cc9b "planemo upload for repository https://github.com/jj-umn/tools-iuc/tree/arriba/tools/arriba commit 52c9f9825debe783339c13bd1da9a42b59747bd2"
jjohnson
parents:
diff changeset
76 -G GTF_FEATURES Comma-/space-separated list of names of GTF features.
5ebf2354cc9b "planemo upload for repository https://github.com/jj-umn/tools-iuc/tree/arriba/tools/arriba commit 52c9f9825debe783339c13bd1da9a42b59747bd2"
jjohnson
parents:
diff changeset
77 Default: gene_name=gene_name|gene_id gene_id=gene_id
5ebf2354cc9b "planemo upload for repository https://github.com/jj-umn/tools-iuc/tree/arriba/tools/arriba commit 52c9f9825debe783339c13bd1da9a42b59747bd2"
jjohnson
parents:
diff changeset
78 transcript_id=transcript_id feature_exon=exon feature_CDS=CDS
5ebf2354cc9b "planemo upload for repository https://github.com/jj-umn/tools-iuc/tree/arriba/tools/arriba commit 52c9f9825debe783339c13bd1da9a42b59747bd2"
jjohnson
parents:
diff changeset
79
5ebf2354cc9b "planemo upload for repository https://github.com/jj-umn/tools-iuc/tree/arriba/tools/arriba commit 52c9f9825debe783339c13bd1da9a42b59747bd2"
jjohnson
parents:
diff changeset
80 -a FILE FastA file with genome sequence (assembly). The file may be gzip-compressed. An
5ebf2354cc9b "planemo upload for repository https://github.com/jj-umn/tools-iuc/tree/arriba/tools/arriba commit 52c9f9825debe783339c13bd1da9a42b59747bd2"
jjohnson
parents:
diff changeset
81 index with the file extension .fai must exist only if CRAM files are processed.
5ebf2354cc9b "planemo upload for repository https://github.com/jj-umn/tools-iuc/tree/arriba/tools/arriba commit 52c9f9825debe783339c13bd1da9a42b59747bd2"
jjohnson
parents:
diff changeset
82
5ebf2354cc9b "planemo upload for repository https://github.com/jj-umn/tools-iuc/tree/arriba/tools/arriba commit 52c9f9825debe783339c13bd1da9a42b59747bd2"
jjohnson
parents:
diff changeset
83 -b FILE File containing blacklisted events (recurrent artifacts and transcripts
5ebf2354cc9b "planemo upload for repository https://github.com/jj-umn/tools-iuc/tree/arriba/tools/arriba commit 52c9f9825debe783339c13bd1da9a42b59747bd2"
jjohnson
parents:
diff changeset
84 observed in healthy tissue).
5ebf2354cc9b "planemo upload for repository https://github.com/jj-umn/tools-iuc/tree/arriba/tools/arriba commit 52c9f9825debe783339c13bd1da9a42b59747bd2"
jjohnson
parents:
diff changeset
85
5ebf2354cc9b "planemo upload for repository https://github.com/jj-umn/tools-iuc/tree/arriba/tools/arriba commit 52c9f9825debe783339c13bd1da9a42b59747bd2"
jjohnson
parents:
diff changeset
86 -k FILE File containing known/recurrent fusions. Some cancer entities are often
5ebf2354cc9b "planemo upload for repository https://github.com/jj-umn/tools-iuc/tree/arriba/tools/arriba commit 52c9f9825debe783339c13bd1da9a42b59747bd2"
jjohnson
parents:
diff changeset
87 characterized by fusions between the same pair of genes. In order to boost
5ebf2354cc9b "planemo upload for repository https://github.com/jj-umn/tools-iuc/tree/arriba/tools/arriba commit 52c9f9825debe783339c13bd1da9a42b59747bd2"
jjohnson
parents:
diff changeset
88 sensitivity, a list of known fusions can be supplied using this parameter. The list
5ebf2354cc9b "planemo upload for repository https://github.com/jj-umn/tools-iuc/tree/arriba/tools/arriba commit 52c9f9825debe783339c13bd1da9a42b59747bd2"
jjohnson
parents:
diff changeset
89 must contain two columns with the names of the fused genes, separated by tabs.
5ebf2354cc9b "planemo upload for repository https://github.com/jj-umn/tools-iuc/tree/arriba/tools/arriba commit 52c9f9825debe783339c13bd1da9a42b59747bd2"
jjohnson
parents:
diff changeset
90
5ebf2354cc9b "planemo upload for repository https://github.com/jj-umn/tools-iuc/tree/arriba/tools/arriba commit 52c9f9825debe783339c13bd1da9a42b59747bd2"
jjohnson
parents:
diff changeset
91 -o FILE Output file with fusions that have passed all filters.
5ebf2354cc9b "planemo upload for repository https://github.com/jj-umn/tools-iuc/tree/arriba/tools/arriba commit 52c9f9825debe783339c13bd1da9a42b59747bd2"
jjohnson
parents:
diff changeset
92
5ebf2354cc9b "planemo upload for repository https://github.com/jj-umn/tools-iuc/tree/arriba/tools/arriba commit 52c9f9825debe783339c13bd1da9a42b59747bd2"
jjohnson
parents:
diff changeset
93 -O FILE Output file with fusions that were discarded due to filtering.
5ebf2354cc9b "planemo upload for repository https://github.com/jj-umn/tools-iuc/tree/arriba/tools/arriba commit 52c9f9825debe783339c13bd1da9a42b59747bd2"
jjohnson
parents:
diff changeset
94
5ebf2354cc9b "planemo upload for repository https://github.com/jj-umn/tools-iuc/tree/arriba/tools/arriba commit 52c9f9825debe783339c13bd1da9a42b59747bd2"
jjohnson
parents:
diff changeset
95 -t FILE Tab-separated file containing fusions to annotate with tags in the 'tags' column.
5ebf2354cc9b "planemo upload for repository https://github.com/jj-umn/tools-iuc/tree/arriba/tools/arriba commit 52c9f9825debe783339c13bd1da9a42b59747bd2"
jjohnson
parents:
diff changeset
96 The first two columns specify the genes; the third column specifies the tag. The
5ebf2354cc9b "planemo upload for repository https://github.com/jj-umn/tools-iuc/tree/arriba/tools/arriba commit 52c9f9825debe783339c13bd1da9a42b59747bd2"
jjohnson
parents:
diff changeset
97 file may be gzip-compressed.
5ebf2354cc9b "planemo upload for repository https://github.com/jj-umn/tools-iuc/tree/arriba/tools/arriba commit 52c9f9825debe783339c13bd1da9a42b59747bd2"
jjohnson
parents:
diff changeset
98
5ebf2354cc9b "planemo upload for repository https://github.com/jj-umn/tools-iuc/tree/arriba/tools/arriba commit 52c9f9825debe783339c13bd1da9a42b59747bd2"
jjohnson
parents:
diff changeset
99 -p FILE File in GFF3 format containing coordinates of the protein domains of genes. The
5ebf2354cc9b "planemo upload for repository https://github.com/jj-umn/tools-iuc/tree/arriba/tools/arriba commit 52c9f9825debe783339c13bd1da9a42b59747bd2"
jjohnson
parents:
diff changeset
100 protein domains retained in a fusion are listed in the column
5ebf2354cc9b "planemo upload for repository https://github.com/jj-umn/tools-iuc/tree/arriba/tools/arriba commit 52c9f9825debe783339c13bd1da9a42b59747bd2"
jjohnson
parents:
diff changeset
101 'retained_protein_domains'. The file may be gzip-compressed.
5ebf2354cc9b "planemo upload for repository https://github.com/jj-umn/tools-iuc/tree/arriba/tools/arriba commit 52c9f9825debe783339c13bd1da9a42b59747bd2"
jjohnson
parents:
diff changeset
102
5ebf2354cc9b "planemo upload for repository https://github.com/jj-umn/tools-iuc/tree/arriba/tools/arriba commit 52c9f9825debe783339c13bd1da9a42b59747bd2"
jjohnson
parents:
diff changeset
103 -d FILE Tab-separated file with coordinates of structural variants found using
5ebf2354cc9b "planemo upload for repository https://github.com/jj-umn/tools-iuc/tree/arriba/tools/arriba commit 52c9f9825debe783339c13bd1da9a42b59747bd2"
jjohnson
parents:
diff changeset
104 whole-genome sequencing data. These coordinates serve to increase sensitivity
5ebf2354cc9b "planemo upload for repository https://github.com/jj-umn/tools-iuc/tree/arriba/tools/arriba commit 52c9f9825debe783339c13bd1da9a42b59747bd2"
jjohnson
parents:
diff changeset
105 towards weakly expressed fusions and to eliminate fusions with low evidence.
5ebf2354cc9b "planemo upload for repository https://github.com/jj-umn/tools-iuc/tree/arriba/tools/arriba commit 52c9f9825debe783339c13bd1da9a42b59747bd2"
jjohnson
parents:
diff changeset
106
5ebf2354cc9b "planemo upload for repository https://github.com/jj-umn/tools-iuc/tree/arriba/tools/arriba commit 52c9f9825debe783339c13bd1da9a42b59747bd2"
jjohnson
parents:
diff changeset
107 -D MAX_GENOMIC_BREAKPOINT_DISTANCE When a file with genomic breakpoints obtained via
5ebf2354cc9b "planemo upload for repository https://github.com/jj-umn/tools-iuc/tree/arriba/tools/arriba commit 52c9f9825debe783339c13bd1da9a42b59747bd2"
jjohnson
parents:
diff changeset
108 whole-genome sequencing is supplied via the -d
5ebf2354cc9b "planemo upload for repository https://github.com/jj-umn/tools-iuc/tree/arriba/tools/arriba commit 52c9f9825debe783339c13bd1da9a42b59747bd2"
jjohnson
parents:
diff changeset
109 parameter, this parameter determines how far a
5ebf2354cc9b "planemo upload for repository https://github.com/jj-umn/tools-iuc/tree/arriba/tools/arriba commit 52c9f9825debe783339c13bd1da9a42b59747bd2"
jjohnson
parents:
diff changeset
110 genomic breakpoint may be away from a
5ebf2354cc9b "planemo upload for repository https://github.com/jj-umn/tools-iuc/tree/arriba/tools/arriba commit 52c9f9825debe783339c13bd1da9a42b59747bd2"
jjohnson
parents:
diff changeset
111 transcriptomic breakpoint to consider it as a
5ebf2354cc9b "planemo upload for repository https://github.com/jj-umn/tools-iuc/tree/arriba/tools/arriba commit 52c9f9825debe783339c13bd1da9a42b59747bd2"
jjohnson
parents:
diff changeset
112 related event. For events inside genes, the
5ebf2354cc9b "planemo upload for repository https://github.com/jj-umn/tools-iuc/tree/arriba/tools/arriba commit 52c9f9825debe783339c13bd1da9a42b59747bd2"
jjohnson
parents:
diff changeset
113 distance is added to the end of the gene; for
5ebf2354cc9b "planemo upload for repository https://github.com/jj-umn/tools-iuc/tree/arriba/tools/arriba commit 52c9f9825debe783339c13bd1da9a42b59747bd2"
jjohnson
parents:
diff changeset
114 intergenic events, the distance threshold is
5ebf2354cc9b "planemo upload for repository https://github.com/jj-umn/tools-iuc/tree/arriba/tools/arriba commit 52c9f9825debe783339c13bd1da9a42b59747bd2"
jjohnson
parents:
diff changeset
115 applied as is. Default: 100000
5ebf2354cc9b "planemo upload for repository https://github.com/jj-umn/tools-iuc/tree/arriba/tools/arriba commit 52c9f9825debe783339c13bd1da9a42b59747bd2"
jjohnson
parents:
diff changeset
116
5ebf2354cc9b "planemo upload for repository https://github.com/jj-umn/tools-iuc/tree/arriba/tools/arriba commit 52c9f9825debe783339c13bd1da9a42b59747bd2"
jjohnson
parents:
diff changeset
117 -s STRANDEDNESS Whether a strand-specific protocol was used for library preparation,
5ebf2354cc9b "planemo upload for repository https://github.com/jj-umn/tools-iuc/tree/arriba/tools/arriba commit 52c9f9825debe783339c13bd1da9a42b59747bd2"
jjohnson
parents:
diff changeset
118 and if so, the type of strandedness (auto/yes/no/reverse). When
5ebf2354cc9b "planemo upload for repository https://github.com/jj-umn/tools-iuc/tree/arriba/tools/arriba commit 52c9f9825debe783339c13bd1da9a42b59747bd2"
jjohnson
parents:
diff changeset
119 unstranded data is processed, the strand can sometimes be inferred from
5ebf2354cc9b "planemo upload for repository https://github.com/jj-umn/tools-iuc/tree/arriba/tools/arriba commit 52c9f9825debe783339c13bd1da9a42b59747bd2"
jjohnson
parents:
diff changeset
120 splice-patterns. But in unclear situations, stranded data helps
5ebf2354cc9b "planemo upload for repository https://github.com/jj-umn/tools-iuc/tree/arriba/tools/arriba commit 52c9f9825debe783339c13bd1da9a42b59747bd2"
jjohnson
parents:
diff changeset
121 resolve ambiguities. Default: auto
5ebf2354cc9b "planemo upload for repository https://github.com/jj-umn/tools-iuc/tree/arriba/tools/arriba commit 52c9f9825debe783339c13bd1da9a42b59747bd2"
jjohnson
parents:
diff changeset
122
5ebf2354cc9b "planemo upload for repository https://github.com/jj-umn/tools-iuc/tree/arriba/tools/arriba commit 52c9f9825debe783339c13bd1da9a42b59747bd2"
jjohnson
parents:
diff changeset
123 -i CONTIGS Comma-/space-separated list of interesting contigs. Fusions between genes
5ebf2354cc9b "planemo upload for repository https://github.com/jj-umn/tools-iuc/tree/arriba/tools/arriba commit 52c9f9825debe783339c13bd1da9a42b59747bd2"
jjohnson
parents:
diff changeset
124 on other contigs are ignored. Contigs can be specified with or without the
5ebf2354cc9b "planemo upload for repository https://github.com/jj-umn/tools-iuc/tree/arriba/tools/arriba commit 52c9f9825debe783339c13bd1da9a42b59747bd2"
jjohnson
parents:
diff changeset
125 prefix "chr". Asterisks (*) are treated as wild-cards.
5ebf2354cc9b "planemo upload for repository https://github.com/jj-umn/tools-iuc/tree/arriba/tools/arriba commit 52c9f9825debe783339c13bd1da9a42b59747bd2"
jjohnson
parents:
diff changeset
126 Default: 1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 X Y AC_* NC_*
5ebf2354cc9b "planemo upload for repository https://github.com/jj-umn/tools-iuc/tree/arriba/tools/arriba commit 52c9f9825debe783339c13bd1da9a42b59747bd2"
jjohnson
parents:
diff changeset
127
5ebf2354cc9b "planemo upload for repository https://github.com/jj-umn/tools-iuc/tree/arriba/tools/arriba commit 52c9f9825debe783339c13bd1da9a42b59747bd2"
jjohnson
parents:
diff changeset
128 -v CONTIGS Comma-/space-separated list of viral contigs. Asterisks (*) are treated as
5ebf2354cc9b "planemo upload for repository https://github.com/jj-umn/tools-iuc/tree/arriba/tools/arriba commit 52c9f9825debe783339c13bd1da9a42b59747bd2"
jjohnson
parents:
diff changeset
129 wild-cards.
5ebf2354cc9b "planemo upload for repository https://github.com/jj-umn/tools-iuc/tree/arriba/tools/arriba commit 52c9f9825debe783339c13bd1da9a42b59747bd2"
jjohnson
parents:
diff changeset
130 Default: AC_* NC_*
5ebf2354cc9b "planemo upload for repository https://github.com/jj-umn/tools-iuc/tree/arriba/tools/arriba commit 52c9f9825debe783339c13bd1da9a42b59747bd2"
jjohnson
parents:
diff changeset
131
5ebf2354cc9b "planemo upload for repository https://github.com/jj-umn/tools-iuc/tree/arriba/tools/arriba commit 52c9f9825debe783339c13bd1da9a42b59747bd2"
jjohnson
parents:
diff changeset
132 -f FILTERS Comma-/space-separated list of filters to disable. By default all filters are
5ebf2354cc9b "planemo upload for repository https://github.com/jj-umn/tools-iuc/tree/arriba/tools/arriba commit 52c9f9825debe783339c13bd1da9a42b59747bd2"
jjohnson
parents:
diff changeset
133 enabled. Valid values: homologs, low_entropy, isoforms,
5ebf2354cc9b "planemo upload for repository https://github.com/jj-umn/tools-iuc/tree/arriba/tools/arriba commit 52c9f9825debe783339c13bd1da9a42b59747bd2"
jjohnson
parents:
diff changeset
134 top_expressed_viral_contigs, viral_contigs, non_coding_neighbors,
5ebf2354cc9b "planemo upload for repository https://github.com/jj-umn/tools-iuc/tree/arriba/tools/arriba commit 52c9f9825debe783339c13bd1da9a42b59747bd2"
jjohnson
parents:
diff changeset
135 mismatches, duplicates, no_genomic_support, genomic_support, intronic,
5ebf2354cc9b "planemo upload for repository https://github.com/jj-umn/tools-iuc/tree/arriba/tools/arriba commit 52c9f9825debe783339c13bd1da9a42b59747bd2"
jjohnson
parents:
diff changeset
136 end_to_end, relative_support, low_coverage_viral_contigs,
5ebf2354cc9b "planemo upload for repository https://github.com/jj-umn/tools-iuc/tree/arriba/tools/arriba commit 52c9f9825debe783339c13bd1da9a42b59747bd2"
jjohnson
parents:
diff changeset
137 merge_adjacent, mismappers, multimappers, same_gene, long_gap,
5ebf2354cc9b "planemo upload for repository https://github.com/jj-umn/tools-iuc/tree/arriba/tools/arriba commit 52c9f9825debe783339c13bd1da9a42b59747bd2"
jjohnson
parents:
diff changeset
138 internal_tandem_duplication, small_insert_size, read_through,
5ebf2354cc9b "planemo upload for repository https://github.com/jj-umn/tools-iuc/tree/arriba/tools/arriba commit 52c9f9825debe783339c13bd1da9a42b59747bd2"
jjohnson
parents:
diff changeset
139 inconsistently_clipped, uninteresting_contigs, intragenic_exonic,
5ebf2354cc9b "planemo upload for repository https://github.com/jj-umn/tools-iuc/tree/arriba/tools/arriba commit 52c9f9825debe783339c13bd1da9a42b59747bd2"
jjohnson
parents:
diff changeset
140 spliced, hairpin, blacklist, min_support, select_best, in_vitro,
5ebf2354cc9b "planemo upload for repository https://github.com/jj-umn/tools-iuc/tree/arriba/tools/arriba commit 52c9f9825debe783339c13bd1da9a42b59747bd2"
jjohnson
parents:
diff changeset
141 short_anchor, known_fusions, no_coverage, homopolymer, many_spliced
5ebf2354cc9b "planemo upload for repository https://github.com/jj-umn/tools-iuc/tree/arriba/tools/arriba commit 52c9f9825debe783339c13bd1da9a42b59747bd2"
jjohnson
parents:
diff changeset
142
5ebf2354cc9b "planemo upload for repository https://github.com/jj-umn/tools-iuc/tree/arriba/tools/arriba commit 52c9f9825debe783339c13bd1da9a42b59747bd2"
jjohnson
parents:
diff changeset
143 -E MAX_E-VALUE Arriba estimates the number of fusions with a given number of supporting
5ebf2354cc9b "planemo upload for repository https://github.com/jj-umn/tools-iuc/tree/arriba/tools/arriba commit 52c9f9825debe783339c13bd1da9a42b59747bd2"
jjohnson
parents:
diff changeset
144 reads which one would expect to see by random chance. If the expected number
5ebf2354cc9b "planemo upload for repository https://github.com/jj-umn/tools-iuc/tree/arriba/tools/arriba commit 52c9f9825debe783339c13bd1da9a42b59747bd2"
jjohnson
parents:
diff changeset
145 of fusions (e-value) is higher than this threshold, the fusion is
5ebf2354cc9b "planemo upload for repository https://github.com/jj-umn/tools-iuc/tree/arriba/tools/arriba commit 52c9f9825debe783339c13bd1da9a42b59747bd2"
jjohnson
parents:
diff changeset
146 discarded by the 'relative_support' filter. Note: Increasing this
5ebf2354cc9b "planemo upload for repository https://github.com/jj-umn/tools-iuc/tree/arriba/tools/arriba commit 52c9f9825debe783339c13bd1da9a42b59747bd2"
jjohnson
parents:
diff changeset
147 threshold can dramatically increase the number of false positives and may
5ebf2354cc9b "planemo upload for repository https://github.com/jj-umn/tools-iuc/tree/arriba/tools/arriba commit 52c9f9825debe783339c13bd1da9a42b59747bd2"
jjohnson
parents:
diff changeset
148 increase the runtime of resource-intensive steps. Fractional values are
5ebf2354cc9b "planemo upload for repository https://github.com/jj-umn/tools-iuc/tree/arriba/tools/arriba commit 52c9f9825debe783339c13bd1da9a42b59747bd2"
jjohnson
parents:
diff changeset
149 possible. Default: 0.300000
5ebf2354cc9b "planemo upload for repository https://github.com/jj-umn/tools-iuc/tree/arriba/tools/arriba commit 52c9f9825debe783339c13bd1da9a42b59747bd2"
jjohnson
parents:
diff changeset
150
5ebf2354cc9b "planemo upload for repository https://github.com/jj-umn/tools-iuc/tree/arriba/tools/arriba commit 52c9f9825debe783339c13bd1da9a42b59747bd2"
jjohnson
parents:
diff changeset
151 -S MIN_SUPPORTING_READS The 'min_support' filter discards all fusions with fewer than
5ebf2354cc9b "planemo upload for repository https://github.com/jj-umn/tools-iuc/tree/arriba/tools/arriba commit 52c9f9825debe783339c13bd1da9a42b59747bd2"
jjohnson
parents:
diff changeset
152 this many supporting reads (split reads and discordant mates
5ebf2354cc9b "planemo upload for repository https://github.com/jj-umn/tools-iuc/tree/arriba/tools/arriba commit 52c9f9825debe783339c13bd1da9a42b59747bd2"
jjohnson
parents:
diff changeset
153 combined). Default: 2
5ebf2354cc9b "planemo upload for repository https://github.com/jj-umn/tools-iuc/tree/arriba/tools/arriba commit 52c9f9825debe783339c13bd1da9a42b59747bd2"
jjohnson
parents:
diff changeset
154
5ebf2354cc9b "planemo upload for repository https://github.com/jj-umn/tools-iuc/tree/arriba/tools/arriba commit 52c9f9825debe783339c13bd1da9a42b59747bd2"
jjohnson
parents:
diff changeset
155 -m MAX_MISMAPPERS When more than this fraction of supporting reads turns out to be
5ebf2354cc9b "planemo upload for repository https://github.com/jj-umn/tools-iuc/tree/arriba/tools/arriba commit 52c9f9825debe783339c13bd1da9a42b59747bd2"
jjohnson
parents:
diff changeset
156 mismappers, the 'mismappers' filter discards the fusion. Default:
5ebf2354cc9b "planemo upload for repository https://github.com/jj-umn/tools-iuc/tree/arriba/tools/arriba commit 52c9f9825debe783339c13bd1da9a42b59747bd2"
jjohnson
parents:
diff changeset
157 0.800000
5ebf2354cc9b "planemo upload for repository https://github.com/jj-umn/tools-iuc/tree/arriba/tools/arriba commit 52c9f9825debe783339c13bd1da9a42b59747bd2"
jjohnson
parents:
diff changeset
158
5ebf2354cc9b "planemo upload for repository https://github.com/jj-umn/tools-iuc/tree/arriba/tools/arriba commit 52c9f9825debe783339c13bd1da9a42b59747bd2"
jjohnson
parents:
diff changeset
159 -L MAX_HOMOLOG_IDENTITY Genes with more than the given fraction of sequence identity are
5ebf2354cc9b "planemo upload for repository https://github.com/jj-umn/tools-iuc/tree/arriba/tools/arriba commit 52c9f9825debe783339c13bd1da9a42b59747bd2"
jjohnson
parents:
diff changeset
160 considered homologs and removed by the 'homologs' filter.
5ebf2354cc9b "planemo upload for repository https://github.com/jj-umn/tools-iuc/tree/arriba/tools/arriba commit 52c9f9825debe783339c13bd1da9a42b59747bd2"
jjohnson
parents:
diff changeset
161 Default: 0.300000
5ebf2354cc9b "planemo upload for repository https://github.com/jj-umn/tools-iuc/tree/arriba/tools/arriba commit 52c9f9825debe783339c13bd1da9a42b59747bd2"
jjohnson
parents:
diff changeset
162
5ebf2354cc9b "planemo upload for repository https://github.com/jj-umn/tools-iuc/tree/arriba/tools/arriba commit 52c9f9825debe783339c13bd1da9a42b59747bd2"
jjohnson
parents:
diff changeset
163 -H HOMOPOLYMER_LENGTH The 'homopolymer' filter removes breakpoints adjacent to
5ebf2354cc9b "planemo upload for repository https://github.com/jj-umn/tools-iuc/tree/arriba/tools/arriba commit 52c9f9825debe783339c13bd1da9a42b59747bd2"
jjohnson
parents:
diff changeset
164 homopolymers of the given length or more. Default: 6
5ebf2354cc9b "planemo upload for repository https://github.com/jj-umn/tools-iuc/tree/arriba/tools/arriba commit 52c9f9825debe783339c13bd1da9a42b59747bd2"
jjohnson
parents:
diff changeset
165
5ebf2354cc9b "planemo upload for repository https://github.com/jj-umn/tools-iuc/tree/arriba/tools/arriba commit 52c9f9825debe783339c13bd1da9a42b59747bd2"
jjohnson
parents:
diff changeset
166 -R READ_THROUGH_DISTANCE The 'read_through' filter removes read-through fusions
5ebf2354cc9b "planemo upload for repository https://github.com/jj-umn/tools-iuc/tree/arriba/tools/arriba commit 52c9f9825debe783339c13bd1da9a42b59747bd2"
jjohnson
parents:
diff changeset
167 where the breakpoints are less than the given distance away
5ebf2354cc9b "planemo upload for repository https://github.com/jj-umn/tools-iuc/tree/arriba/tools/arriba commit 52c9f9825debe783339c13bd1da9a42b59747bd2"
jjohnson
parents:
diff changeset
168 from each other. Default: 10000
5ebf2354cc9b "planemo upload for repository https://github.com/jj-umn/tools-iuc/tree/arriba/tools/arriba commit 52c9f9825debe783339c13bd1da9a42b59747bd2"
jjohnson
parents:
diff changeset
169
5ebf2354cc9b "planemo upload for repository https://github.com/jj-umn/tools-iuc/tree/arriba/tools/arriba commit 52c9f9825debe783339c13bd1da9a42b59747bd2"
jjohnson
parents:
diff changeset
170 -A MIN_ANCHOR_LENGTH Alignment artifacts are often characterized by split reads coming
5ebf2354cc9b "planemo upload for repository https://github.com/jj-umn/tools-iuc/tree/arriba/tools/arriba commit 52c9f9825debe783339c13bd1da9a42b59747bd2"
jjohnson
parents:
diff changeset
171 from only one gene and no discordant mates. Moreover, the split
5ebf2354cc9b "planemo upload for repository https://github.com/jj-umn/tools-iuc/tree/arriba/tools/arriba commit 52c9f9825debe783339c13bd1da9a42b59747bd2"
jjohnson
parents:
diff changeset
172 reads only align to a short stretch in one of the genes. The
5ebf2354cc9b "planemo upload for repository https://github.com/jj-umn/tools-iuc/tree/arriba/tools/arriba commit 52c9f9825debe783339c13bd1da9a42b59747bd2"
jjohnson
parents:
diff changeset
173 'short_anchor' filter removes these fusions. This parameter sets
5ebf2354cc9b "planemo upload for repository https://github.com/jj-umn/tools-iuc/tree/arriba/tools/arriba commit 52c9f9825debe783339c13bd1da9a42b59747bd2"
jjohnson
parents:
diff changeset
174 the threshold in bp for what the filter considers short. Default: 23
5ebf2354cc9b "planemo upload for repository https://github.com/jj-umn/tools-iuc/tree/arriba/tools/arriba commit 52c9f9825debe783339c13bd1da9a42b59747bd2"
jjohnson
parents:
diff changeset
175
5ebf2354cc9b "planemo upload for repository https://github.com/jj-umn/tools-iuc/tree/arriba/tools/arriba commit 52c9f9825debe783339c13bd1da9a42b59747bd2"
jjohnson
parents:
diff changeset
176 -M MANY_SPLICED_EVENTS The 'many_spliced' filter recovers fusions between genes that
5ebf2354cc9b "planemo upload for repository https://github.com/jj-umn/tools-iuc/tree/arriba/tools/arriba commit 52c9f9825debe783339c13bd1da9a42b59747bd2"
jjohnson
parents:
diff changeset
177 have at least this many spliced breakpoints. Default: 4
5ebf2354cc9b "planemo upload for repository https://github.com/jj-umn/tools-iuc/tree/arriba/tools/arriba commit 52c9f9825debe783339c13bd1da9a42b59747bd2"
jjohnson
parents:
diff changeset
178
5ebf2354cc9b "planemo upload for repository https://github.com/jj-umn/tools-iuc/tree/arriba/tools/arriba commit 52c9f9825debe783339c13bd1da9a42b59747bd2"
jjohnson
parents:
diff changeset
179 -K MAX_KMER_CONTENT The 'low_entropy' filter removes reads with repetitive 3-mers. If
5ebf2354cc9b "planemo upload for repository https://github.com/jj-umn/tools-iuc/tree/arriba/tools/arriba commit 52c9f9825debe783339c13bd1da9a42b59747bd2"
jjohnson
parents:
diff changeset
180 the 3-mers make up more than the given fraction of the sequence, then
5ebf2354cc9b "planemo upload for repository https://github.com/jj-umn/tools-iuc/tree/arriba/tools/arriba commit 52c9f9825debe783339c13bd1da9a42b59747bd2"
jjohnson
parents:
diff changeset
181 the read is discarded. Default: 0.600000
5ebf2354cc9b "planemo upload for repository https://github.com/jj-umn/tools-iuc/tree/arriba/tools/arriba commit 52c9f9825debe783339c13bd1da9a42b59747bd2"
jjohnson
parents:
diff changeset
182
5ebf2354cc9b "planemo upload for repository https://github.com/jj-umn/tools-iuc/tree/arriba/tools/arriba commit 52c9f9825debe783339c13bd1da9a42b59747bd2"
jjohnson
parents:
diff changeset
183 -V MAX_MISMATCH_PVALUE The 'mismatches' filter uses a binomial model to calculate a
5ebf2354cc9b "planemo upload for repository https://github.com/jj-umn/tools-iuc/tree/arriba/tools/arriba commit 52c9f9825debe783339c13bd1da9a42b59747bd2"
jjohnson
parents:
diff changeset
184 p-value for observing a given number of mismatches in a read. If
5ebf2354cc9b "planemo upload for repository https://github.com/jj-umn/tools-iuc/tree/arriba/tools/arriba commit 52c9f9825debe783339c13bd1da9a42b59747bd2"
jjohnson
parents:
diff changeset
185 the number of mismatches is too high, the read is discarded.
5ebf2354cc9b "planemo upload for repository https://github.com/jj-umn/tools-iuc/tree/arriba/tools/arriba commit 52c9f9825debe783339c13bd1da9a42b59747bd2"
jjohnson
parents:
diff changeset
186 Default: 0.010000
5ebf2354cc9b "planemo upload for repository https://github.com/jj-umn/tools-iuc/tree/arriba/tools/arriba commit 52c9f9825debe783339c13bd1da9a42b59747bd2"
jjohnson
parents:
diff changeset
187
5ebf2354cc9b "planemo upload for repository https://github.com/jj-umn/tools-iuc/tree/arriba/tools/arriba commit 52c9f9825debe783339c13bd1da9a42b59747bd2"
jjohnson
parents:
diff changeset
188 -F FRAGMENT_LENGTH When paired-end data is given, the fragment length is estimated
5ebf2354cc9b "planemo upload for repository https://github.com/jj-umn/tools-iuc/tree/arriba/tools/arriba commit 52c9f9825debe783339c13bd1da9a42b59747bd2"
jjohnson
parents:
diff changeset
189 automatically and this parameter has no effect. But when single-end
5ebf2354cc9b "planemo upload for repository https://github.com/jj-umn/tools-iuc/tree/arriba/tools/arriba commit 52c9f9825debe783339c13bd1da9a42b59747bd2"
jjohnson
parents:
diff changeset
190 data is given, the mean fragment length should be specified to
5ebf2354cc9b "planemo upload for repository https://github.com/jj-umn/tools-iuc/tree/arriba/tools/arriba commit 52c9f9825debe783339c13bd1da9a42b59747bd2"
jjohnson
parents:
diff changeset
191 effectively filter fusions that arise from hairpin structures.
5ebf2354cc9b "planemo upload for repository https://github.com/jj-umn/tools-iuc/tree/arriba/tools/arriba commit 52c9f9825debe783339c13bd1da9a42b59747bd2"
jjohnson
parents:
diff changeset
192 Default: 200
5ebf2354cc9b "planemo upload for repository https://github.com/jj-umn/tools-iuc/tree/arriba/tools/arriba commit 52c9f9825debe783339c13bd1da9a42b59747bd2"
jjohnson
parents:
diff changeset
193
5ebf2354cc9b "planemo upload for repository https://github.com/jj-umn/tools-iuc/tree/arriba/tools/arriba commit 52c9f9825debe783339c13bd1da9a42b59747bd2"
jjohnson
parents:
diff changeset
194 -U MAX_READS Subsample fusions with more than the given number of supporting reads. This
5ebf2354cc9b "planemo upload for repository https://github.com/jj-umn/tools-iuc/tree/arriba/tools/arriba commit 52c9f9825debe783339c13bd1da9a42b59747bd2"
jjohnson
parents:
diff changeset
195 improves performance without compromising sensitivity, as long as the
5ebf2354cc9b "planemo upload for repository https://github.com/jj-umn/tools-iuc/tree/arriba/tools/arriba commit 52c9f9825debe783339c13bd1da9a42b59747bd2"
jjohnson
parents:
diff changeset
196 threshold is high. Counting of supporting reads beyond the threshold is
5ebf2354cc9b "planemo upload for repository https://github.com/jj-umn/tools-iuc/tree/arriba/tools/arriba commit 52c9f9825debe783339c13bd1da9a42b59747bd2"
jjohnson
parents:
diff changeset
197 inaccurate. Default: 300
5ebf2354cc9b "planemo upload for repository https://github.com/jj-umn/tools-iuc/tree/arriba/tools/arriba commit 52c9f9825debe783339c13bd1da9a42b59747bd2"
jjohnson
parents:
diff changeset
198
5ebf2354cc9b "planemo upload for repository https://github.com/jj-umn/tools-iuc/tree/arriba/tools/arriba commit 52c9f9825debe783339c13bd1da9a42b59747bd2"
jjohnson
parents:
diff changeset
199 -Q QUANTILE Highly expressed genes are prone to produce artifacts during library
5ebf2354cc9b "planemo upload for repository https://github.com/jj-umn/tools-iuc/tree/arriba/tools/arriba commit 52c9f9825debe783339c13bd1da9a42b59747bd2"
jjohnson
parents:
diff changeset
200 preparation. Genes with an expression above the given quantile are eligible
5ebf2354cc9b "planemo upload for repository https://github.com/jj-umn/tools-iuc/tree/arriba/tools/arriba commit 52c9f9825debe783339c13bd1da9a42b59747bd2"
jjohnson
parents:
diff changeset
201 for filtering by the 'in_vitro' filter. Default: 0.998000
5ebf2354cc9b "planemo upload for repository https://github.com/jj-umn/tools-iuc/tree/arriba/tools/arriba commit 52c9f9825debe783339c13bd1da9a42b59747bd2"
jjohnson
parents:
diff changeset
202
5ebf2354cc9b "planemo upload for repository https://github.com/jj-umn/tools-iuc/tree/arriba/tools/arriba commit 52c9f9825debe783339c13bd1da9a42b59747bd2"
jjohnson
parents:
diff changeset
203 -e EXONIC_FRACTION The breakpoints of false-positive predictions of intragenic events
5ebf2354cc9b "planemo upload for repository https://github.com/jj-umn/tools-iuc/tree/arriba/tools/arriba commit 52c9f9825debe783339c13bd1da9a42b59747bd2"
jjohnson
parents:
diff changeset
204 are often both in exons. True predictions are more likely to have at
5ebf2354cc9b "planemo upload for repository https://github.com/jj-umn/tools-iuc/tree/arriba/tools/arriba commit 52c9f9825debe783339c13bd1da9a42b59747bd2"
jjohnson
parents:
diff changeset
205 least one breakpoint in an intron, because introns are larger. If the
5ebf2354cc9b "planemo upload for repository https://github.com/jj-umn/tools-iuc/tree/arriba/tools/arriba commit 52c9f9825debe783339c13bd1da9a42b59747bd2"
jjohnson
parents:
diff changeset
206 fraction of exonic sequence between two breakpoints is smaller than
5ebf2354cc9b "planemo upload for repository https://github.com/jj-umn/tools-iuc/tree/arriba/tools/arriba commit 52c9f9825debe783339c13bd1da9a42b59747bd2"
jjohnson
parents:
diff changeset
207 the given fraction, the 'intragenic_exonic' filter discards the
5ebf2354cc9b "planemo upload for repository https://github.com/jj-umn/tools-iuc/tree/arriba/tools/arriba commit 52c9f9825debe783339c13bd1da9a42b59747bd2"
jjohnson
parents:
diff changeset
208 event. Default: 0.330000
5ebf2354cc9b "planemo upload for repository https://github.com/jj-umn/tools-iuc/tree/arriba/tools/arriba commit 52c9f9825debe783339c13bd1da9a42b59747bd2"
jjohnson
parents:
diff changeset
209
5ebf2354cc9b "planemo upload for repository https://github.com/jj-umn/tools-iuc/tree/arriba/tools/arriba commit 52c9f9825debe783339c13bd1da9a42b59747bd2"
jjohnson
parents:
diff changeset
210 -T TOP_N Only report viral integration sites of the top N most highly expressed viral
5ebf2354cc9b "planemo upload for repository https://github.com/jj-umn/tools-iuc/tree/arriba/tools/arriba commit 52c9f9825debe783339c13bd1da9a42b59747bd2"
jjohnson
parents:
diff changeset
211 contigs. Default: 5
5ebf2354cc9b "planemo upload for repository https://github.com/jj-umn/tools-iuc/tree/arriba/tools/arriba commit 52c9f9825debe783339c13bd1da9a42b59747bd2"
jjohnson
parents:
diff changeset
212
5ebf2354cc9b "planemo upload for repository https://github.com/jj-umn/tools-iuc/tree/arriba/tools/arriba commit 52c9f9825debe783339c13bd1da9a42b59747bd2"
jjohnson
parents:
diff changeset
213 -C COVERED_FRACTION Ignore virally associated events if the virus is not fully
5ebf2354cc9b "planemo upload for repository https://github.com/jj-umn/tools-iuc/tree/arriba/tools/arriba commit 52c9f9825debe783339c13bd1da9a42b59747bd2"
jjohnson
parents:
diff changeset
214 expressed, i.e., less than the given fraction of the viral contig is
5ebf2354cc9b "planemo upload for repository https://github.com/jj-umn/tools-iuc/tree/arriba/tools/arriba commit 52c9f9825debe783339c13bd1da9a42b59747bd2"
jjohnson
parents:
diff changeset
215 transcribed. Default: 0.150000
5ebf2354cc9b "planemo upload for repository https://github.com/jj-umn/tools-iuc/tree/arriba/tools/arriba commit 52c9f9825debe783339c13bd1da9a42b59747bd2"
jjohnson
parents:
diff changeset
216
5ebf2354cc9b "planemo upload for repository https://github.com/jj-umn/tools-iuc/tree/arriba/tools/arriba commit 52c9f9825debe783339c13bd1da9a42b59747bd2"
jjohnson
parents:
diff changeset
217 -l MAX_ITD_LENGTH Maximum length of internal tandem duplications. Note: Increasing
5ebf2354cc9b "planemo upload for repository https://github.com/jj-umn/tools-iuc/tree/arriba/tools/arriba commit 52c9f9825debe783339c13bd1da9a42b59747bd2"
jjohnson
parents:
diff changeset
218 this value beyond the default can impair performance and lead to many
5ebf2354cc9b "planemo upload for repository https://github.com/jj-umn/tools-iuc/tree/arriba/tools/arriba commit 52c9f9825debe783339c13bd1da9a42b59747bd2"
jjohnson
parents:
diff changeset
219 false positives. Default: 100
5ebf2354cc9b "planemo upload for repository https://github.com/jj-umn/tools-iuc/tree/arriba/tools/arriba commit 52c9f9825debe783339c13bd1da9a42b59747bd2"
jjohnson
parents:
diff changeset
220
5ebf2354cc9b "planemo upload for repository https://github.com/jj-umn/tools-iuc/tree/arriba/tools/arriba commit 52c9f9825debe783339c13bd1da9a42b59747bd2"
jjohnson
parents:
diff changeset
221 -u Instead of performing duplicate marking itself, Arriba relies on duplicate marking by a
5ebf2354cc9b "planemo upload for repository https://github.com/jj-umn/tools-iuc/tree/arriba/tools/arriba commit 52c9f9825debe783339c13bd1da9a42b59747bd2"
jjohnson
parents:
diff changeset
222 preceding program using the BAM_FDUP flag. This makes sense when unique molecular
5ebf2354cc9b "planemo upload for repository https://github.com/jj-umn/tools-iuc/tree/arriba/tools/arriba commit 52c9f9825debe783339c13bd1da9a42b59747bd2"
jjohnson
parents:
diff changeset
223 identifiers (UMI) are used.
5ebf2354cc9b "planemo upload for repository https://github.com/jj-umn/tools-iuc/tree/arriba/tools/arriba commit 52c9f9825debe783339c13bd1da9a42b59747bd2"
jjohnson
parents:
diff changeset
224
5ebf2354cc9b "planemo upload for repository https://github.com/jj-umn/tools-iuc/tree/arriba/tools/arriba commit 52c9f9825debe783339c13bd1da9a42b59747bd2"
jjohnson
parents:
diff changeset
225 -X To reduce the runtime and file size, by default, the columns 'fusion_transcript',
5ebf2354cc9b "planemo upload for repository https://github.com/jj-umn/tools-iuc/tree/arriba/tools/arriba commit 52c9f9825debe783339c13bd1da9a42b59747bd2"
jjohnson
parents:
diff changeset
226 'peptide_sequence', and 'read_identifiers' are left empty in the file containing
5ebf2354cc9b "planemo upload for repository https://github.com/jj-umn/tools-iuc/tree/arriba/tools/arriba commit 52c9f9825debe783339c13bd1da9a42b59747bd2"
jjohnson
parents:
diff changeset
227 discarded fusion candidates (see parameter -O). When this flag is set, this extra
5ebf2354cc9b "planemo upload for repository https://github.com/jj-umn/tools-iuc/tree/arriba/tools/arriba commit 52c9f9825debe783339c13bd1da9a42b59747bd2"
jjohnson
parents:
diff changeset
228 information is reported in the discarded fusions file.
5ebf2354cc9b "planemo upload for repository https://github.com/jj-umn/tools-iuc/tree/arriba/tools/arriba commit 52c9f9825debe783339c13bd1da9a42b59747bd2"
jjohnson
parents:
diff changeset
229
5ebf2354cc9b "planemo upload for repository https://github.com/jj-umn/tools-iuc/tree/arriba/tools/arriba commit 52c9f9825debe783339c13bd1da9a42b59747bd2"
jjohnson
parents:
diff changeset
230 -I If assembly of the fusion transcript sequence from the supporting reads is incomplete
5ebf2354cc9b "planemo upload for repository https://github.com/jj-umn/tools-iuc/tree/arriba/tools/arriba commit 52c9f9825debe783339c13bd1da9a42b59747bd2"
jjohnson
parents:
diff changeset
231 (denoted as '...'), fill the gaps using the reference genome assembly sequence wherever possible.
5ebf2354cc9b "planemo upload for repository https://github.com/jj-umn/tools-iuc/tree/arriba/tools/arriba commit 52c9f9825debe783339c13bd1da9a42b59747bd2"
jjohnson
parents:
diff changeset
232
5ebf2354cc9b "planemo upload for repository https://github.com/jj-umn/tools-iuc/tree/arriba/tools/arriba commit 52c9f9825debe783339c13bd1da9a42b59747bd2"
jjohnson
parents:
diff changeset
233 -h Print help and exit.
5ebf2354cc9b "planemo upload for repository https://github.com/jj-umn/tools-iuc/tree/arriba/tools/arriba commit 52c9f9825debe783339c13bd1da9a42b59747bd2"
jjohnson
parents:
diff changeset
234
5ebf2354cc9b "planemo upload for repository https://github.com/jj-umn/tools-iuc/tree/arriba/tools/arriba commit 52c9f9825debe783339c13bd1da9a42b59747bd2"
jjohnson
parents:
diff changeset
235 Code repository: https://github.com/suhrig/arriba
5ebf2354cc9b "planemo upload for repository https://github.com/jj-umn/tools-iuc/tree/arriba/tools/arriba commit 52c9f9825debe783339c13bd1da9a42b59747bd2"
jjohnson
parents:
diff changeset
236 Get help/report bugs: https://github.com/suhrig/arriba/issues
5ebf2354cc9b "planemo upload for repository https://github.com/jj-umn/tools-iuc/tree/arriba/tools/arriba commit 52c9f9825debe783339c13bd1da9a42b59747bd2"
jjohnson
parents:
diff changeset
237 User manual: https://arriba.readthedocs.io/
5ebf2354cc9b "planemo upload for repository https://github.com/jj-umn/tools-iuc/tree/arriba/tools/arriba commit 52c9f9825debe783339c13bd1da9a42b59747bd2"
jjohnson
parents:
diff changeset
238 Please cite: https://doi.org/10.1101/gr.257246.119
5ebf2354cc9b "planemo upload for repository https://github.com/jj-umn/tools-iuc/tree/arriba/tools/arriba commit 52c9f9825debe783339c13bd1da9a42b59747bd2"
jjohnson
parents:
diff changeset
239
5ebf2354cc9b "planemo upload for repository https://github.com/jj-umn/tools-iuc/tree/arriba/tools/arriba commit 52c9f9825debe783339c13bd1da9a42b59747bd2"
jjohnson
parents:
diff changeset
240 ]]></help>
5ebf2354cc9b "planemo upload for repository https://github.com/jj-umn/tools-iuc/tree/arriba/tools/arriba commit 52c9f9825debe783339c13bd1da9a42b59747bd2"
jjohnson
parents:
diff changeset
241 <expand macro="citations" />
5ebf2354cc9b "planemo upload for repository https://github.com/jj-umn/tools-iuc/tree/arriba/tools/arriba commit 52c9f9825debe783339c13bd1da9a42b59747bd2"
jjohnson
parents:
diff changeset
242 </tool>