comparison hyphy_gard.xml @ 5:6283babe736e draft

"planemo upload for repository https://github.com/galaxyproject/tools-iuc/tree/master/tools/hyphy/ commit 8d5ae1d04c43988fdcc458f4f08376a15e72db8e"
author iuc
date Thu, 20 Feb 2020 18:14:24 -0500
parents bff9a82d630d
children aa8cc71438cf
comparison
equal deleted inserted replaced
4:c454b670f35f 5:6283babe736e
8 <command detect_errors="exit_code"><![CDATA[ 8 <command detect_errors="exit_code"><![CDATA[
9 ln -s '$input_file' gard_input.fa && 9 ln -s '$input_file' gard_input.fa &&
10 @HYPHYMPI@ gard 10 @HYPHYMPI@ gard
11 --alignment ./gard_input.fa 11 --alignment ./gard_input.fa
12 --type '$datatype.value' 12 --type '$datatype.value'
13 #if str($datatype.value) == 'Codon': 13 #if str($datatype.value) == 'codon':
14 --code '$datatype.gencodeid' 14 --code '$datatype.gencodeid'
15 #elif str($datatype.value) == 'Protein': 15 #elif str($datatype.value) == 'amino-acid':
16 --model '$datatype.model' 16 --model '$datatype.model'
17 #end if 17 #end if
18 --rv '$rate_cond.rate' 18 #if str($rate_cond.rate):
19 #if str($rate_cond.rate) != 'None': 19 --rv '$rate_cond.rate'
20 --rate-classes '$rate_classes' 20 --rate-classes '$rate_classes'
21 #end if 21 #end if
22 --output '$translated' 22 --output '$translated'
23 --output-lf '$gard_output' 23 --output-lf '$gard_output'
24 > '$gard_log' 24 > '$gard_log'
25 ]]></command> 25 ]]></command>
26 <inputs> 26 <inputs>
27 <param name="input_file" type="data" format="fasta" label="Input FASTA file"/> 27 <param name="input_file" type="data" format="fasta" label="Input FASTA file"/>
28 <conditional name="datatype"> 28 <conditional name="datatype">
29 <param name="value" type="select" label="Type of data"> 29 <param argument="--type" name="value" type="select" label="Alignment kind">
30 <option value="nucleotide">Nucleotide</option> 30 <option value="nucleotide">Nucleotide</option>
31 <option value="protein">Amino acid</option> 31 <option value="amino-acid">Amino acid</option>
32 <option value="codon">Codon</option> 32 <option value="codon">Codon</option>
33 </param> 33 </param>
34 <when value="Nucleotide"/> 34 <when value="nucleotide"/>
35 <when value="Protein"> 35 <when value="amino-acid">
36 <expand macro="substitution" /> 36 <expand macro="substitution" />
37 </when> 37 </when>
38 <when value="Codon"> 38 <when value="codon">
39 <expand macro="gencode" /> 39 <expand macro="gencode" />
40 </when> 40 </when>
41 </conditional> 41 </conditional>
42 <conditional name="rate_cond"> 42 <conditional name="rate_cond">
43 <param name="rate" type="select" label="Rate variation"> 43 <param argument="--rv" name="rate" type="select" label="Rate variation">
44 <option value="None">None</option> 44 <option value="">None</option>
45 <option value="GDD">General Discrete</option> 45 <option value="GDD">General Discrete</option>
46 <option value="Gamma">Beta-Gamma</option> 46 <option value="Gamma">Beta-Gamma</option>
47 </param> 47 </param>
48 <when value="None"/> 48 <when value=""/>
49 <when value="GDD"> 49 <when value="GDD">
50 <param name="rate_classes" type="integer" value="2" min="2" max="6" label="Rate classes"/> 50 <param argument="--rate-classes" name="rate_classes" type="integer" value="2" min="2" max="6" label="Rate classes" />
51 </when> 51 </when>
52 <when value="Gamma"> 52 <when value="Gamma">
53 <param name="rate_classes" type="integer" value="2" min="2" max="6" label="Rate classes"/> 53 <param argument="--rate-classes" name="rate_classes" type="integer" value="2" min="2" max="6" label="Rate classes" />
54 </when> 54 </when>
55 </conditional> 55 </conditional>
56 </inputs> 56 </inputs>
57 <outputs> 57 <outputs>
58 <data name="gard_log" format="txt"/> 58 <data name="gard_log" format="txt"/>
64 <param name="input_file" ftype="fasta" value="gard-in1.fa"/> 64 <param name="input_file" ftype="fasta" value="gard-in1.fa"/>
65 <output name="gard_output" file="gard-out1.nex" compare="sim_size" delta="160000"/> 65 <output name="gard_output" file="gard-out1.nex" compare="sim_size" delta="160000"/>
66 </test> 66 </test>
67 </tests> 67 </tests>
68 <help><![CDATA[ 68 <help><![CDATA[
69 GARD (Genetic Algorithm for Recombination Detection) is a method to screen a multiple sequence analysis for the presence of recombination and is extremely useful as a pre-processing step for selection inference. Because recombinant sequences cannot be adequately described with a single phylogenetic history, selection inference on recombinant data often leads to a significant increase in false positives. GARD alleviates this concern by comprehensively screening an alignment for recombination breakpoints and inferring a unique phylogenetic history for each detected recombination block.
70 69
71 See the online documentation_ for more information. 70 GARD : Genetic Algorithms for Recombination Detection.
71 ======================================================
72 72
73 .. _documentation: http://hyphy.org/methods/selection-methods/#gard 73 What does this do?
74 ------------------
75
76 This tools screens an alignment of sequences for evidence of recombination in one or more sequences.
77 The main idea is that if sufficient recombination has occurred, then no single phylogenetic tree will
78 properly fit the entire length of the alignment and instead a separate tree will be preferred for each *nonrecombinant* segment.
79
80 Brief description
81 -----------------
82
83 This analysis implements a heuristic approach to screening alignments of sequences for
84 recombination, by using the CHC genetic algorithm (GA) to search for
85 phylogenetic incongruence among different partitions of the data. The
86 number of partitions is determined using a step-up procedure, while the
87 placement of breakpoints is searched for with the GA. The best fitting
88 model (based on c-AIC) is returned; and additional post-hoc tests run to
89 distinguish topological incongruence from rate-variation.
90
91 For each identified breakpoint, the support for its placement is calculated, and for each
92 non-recombinant fragment, a phylogenetic tree is inferred (using neighbor joining) and returned.
93
94 Input
95 -----
96
97 A *FASTA* sequence alignment
98
99 Output
100 ------
101
102 A JSON file with analysis results (http://hyphy.org/resources/json-fields.pdf).
103
104 A custom visualization module for viewing these results is available (see http://vision.hyphy.org/GARD for an example)
105
106
107 Tool options
108 ------------
109 ::
110
111
112 --type type of alignment to screen
113 Nucleotide [default].
114 Assumes aligned nucleotide data and screens the alignment using
115 the general time reversible model of sequence evolution.
116 This is the fastest option
117 Protein
118 Assumes aligned aminoacid sequences. One of several protein
119 substitution models may be used to screen the alignment.
120 Codon
121 Assumes an in-frame coding sequence alignment.
122 The Muse-Gaut 94 (GTR) model will be used to screen the alignment.
123 Selecting this option will dramatically increase run times.
124
125
126 --code Genetic code/translation table to use (for codon alignments).
127 Default value: Universal
128
129 --model The substitution model to use (for protein alignments).
130 default value: JTT
131
132 --rv The discrete distribution to use for modeling site to site rate variation.
133
134 None [default]
135 No rate variation. This is the fastest option in terms of run time, but
136 using it can result in false positives if there is significant site-to-site
137 rate variation
138 GDD
139 Use the general discrete distribution on N bins
140 Beta-Gamma
141 Use a discretized gamma with weights partitioned by a discretized beta
142 (see doi.org/10.1093/molbev/msi009)
143
144 --rate-classes How many site rate classes to use (if GDD or Beta-Gamma are selected)
145 default value: 4
146
147
74 ]]></help> 148 ]]></help>
75 <expand macro="citations"> 149 <expand macro="citations">
76 <citation type="doi">10.1093/molbev/msl051</citation> 150 <citation type="doi">10.1093/molbev/msl051</citation>
77 </expand> 151 </expand>
78 </tool> 152 </tool>