annotate astral.xml @ 0:66ebc4b19d6c draft default tip

"planemo upload for repository https://github.com/smirarab/ASTRAL commit 0f93f327c49e93d6af057973d68ba772ba5715dc-dirty"
author padge
date Wed, 13 Apr 2022 15:03:31 +0000
parents
children
Ignore whitespace changes - Everywhere: Within whitespace: At end of lines:
rev   line source
0
66ebc4b19d6c "planemo upload for repository https://github.com/smirarab/ASTRAL commit 0f93f327c49e93d6af057973d68ba772ba5715dc-dirty"
padge
parents:
diff changeset
1 <tool id="astral" name="ASTRAL-III. Tool for estimating an unrooted species tree given a set of unrooted gene trees." version="0.1.0" python_template_version="3.5">
66ebc4b19d6c "planemo upload for repository https://github.com/smirarab/ASTRAL commit 0f93f327c49e93d6af057973d68ba772ba5715dc-dirty"
padge
parents:
diff changeset
2 <requirements>
66ebc4b19d6c "planemo upload for repository https://github.com/smirarab/ASTRAL commit 0f93f327c49e93d6af057973d68ba772ba5715dc-dirty"
padge
parents:
diff changeset
3 <requirement type="package" version="5.7.8">astral-tree</requirement>
66ebc4b19d6c "planemo upload for repository https://github.com/smirarab/ASTRAL commit 0f93f327c49e93d6af057973d68ba772ba5715dc-dirty"
padge
parents:
diff changeset
4 </requirements>
66ebc4b19d6c "planemo upload for repository https://github.com/smirarab/ASTRAL commit 0f93f327c49e93d6af057973d68ba772ba5715dc-dirty"
padge
parents:
diff changeset
<!-- Runs astral on the input gene trees with stderr captured in the log dataset, then moves the tree (and, for annotation levels 16 and 32, freqQuad.csv) to the Galaxy outputs. Dataset paths are quoted, and -c is only passed when lambda has a value because the parameter is optional. -->
5 <command detect_errors="exit_code"><![CDATA[
66ebc4b19d6c "planemo upload for repository https://github.com/smirarab/ASTRAL commit 0f93f327c49e93d6af057973d68ba772ba5715dc-dirty"
padge
parents:
diff changeset
6 astral -i '$input1' -t ${branch_annotation_level_selector} -o ./output.tre #if str($lambda) != ''# -c $lambda #end if# 2> '$log_output'
66ebc4b19d6c "planemo upload for repository https://github.com/smirarab/ASTRAL commit 0f93f327c49e93d6af057973d68ba772ba5715dc-dirty"
padge
parents:
diff changeset
7 &&
66ebc4b19d6c "planemo upload for repository https://github.com/smirarab/ASTRAL commit 0f93f327c49e93d6af057973d68ba772ba5715dc-dirty"
padge
parents:
diff changeset
8 mv ./output.tre '$output'
66ebc4b19d6c "planemo upload for repository https://github.com/smirarab/ASTRAL commit 0f93f327c49e93d6af057973d68ba772ba5715dc-dirty"
padge
parents:
diff changeset
9 #if str($branch_annotation_level_selector) == "16" or str($branch_annotation_level_selector) == "32"
66ebc4b19d6c "planemo upload for repository https://github.com/smirarab/ASTRAL commit 0f93f327c49e93d6af057973d68ba772ba5715dc-dirty"
padge
parents:
diff changeset
10 &&
66ebc4b19d6c "planemo upload for repository https://github.com/smirarab/ASTRAL commit 0f93f327c49e93d6af057973d68ba772ba5715dc-dirty"
padge
parents:
diff changeset
11 mv freqQuad.csv '$branch_annotations'
66ebc4b19d6c "planemo upload for repository https://github.com/smirarab/ASTRAL commit 0f93f327c49e93d6af057973d68ba772ba5715dc-dirty"
padge
parents:
diff changeset
12 #end if
66ebc4b19d6c "planemo upload for repository https://github.com/smirarab/ASTRAL commit 0f93f327c49e93d6af057973d68ba772ba5715dc-dirty"
padge
parents:
diff changeset
13 ]]></command>
66ebc4b19d6c "planemo upload for repository https://github.com/smirarab/ASTRAL commit 0f93f327c49e93d6af057973d68ba772ba5715dc-dirty"
padge
parents:
diff changeset
<!-- Tool inputs: the gene tree file (astral -i), the branch annotation level (astral -t) and the optional lambda value (astral -c). Option values are unchanged; only the label and option descriptions were corrected. -->
14 <inputs>
66ebc4b19d6c "planemo upload for repository https://github.com/smirarab/ASTRAL commit 0f93f327c49e93d6af057973d68ba772ba5715dc-dirty"
padge
parents:
diff changeset
15 <param name="input1" type="data" format="newick" multiple="false" label="Tree file" optional="false" />
66ebc4b19d6c "planemo upload for repository https://github.com/smirarab/ASTRAL commit 0f93f327c49e93d6af057973d68ba772ba5715dc-dirty"
padge
parents:
diff changeset
16 <param name="branch_annotation_level_selector" type="select" label="Branch annotation level (-t): how much annotation should be added to each branch.">
66ebc4b19d6c "planemo upload for repository https://github.com/smirarab/ASTRAL commit 0f93f327c49e93d6af057973d68ba772ba5715dc-dirty"
padge
parents:
diff changeset
17 <option value="3" selected="true">3 (default): only the posterior probability for the main resolution.</option>
66ebc4b19d6c "planemo upload for repository https://github.com/smirarab/ASTRAL commit 0f93f327c49e93d6af057973d68ba772ba5715dc-dirty"
padge
parents:
diff changeset
18 <option value="0">0: no annotations.</option>
66ebc4b19d6c "planemo upload for repository https://github.com/smirarab/ASTRAL commit 0f93f327c49e93d6af057973d68ba772ba5715dc-dirty"
padge
parents:
diff changeset
19 <option value="1">1: only the quartet support for the main resolution.</option>
66ebc4b19d6c "planemo upload for repository https://github.com/smirarab/ASTRAL commit 0f93f327c49e93d6af057973d68ba772ba5715dc-dirty"
padge
parents:
diff changeset
20 <option value="2">2: full annotation.</option>
66ebc4b19d6c "planemo upload for repository https://github.com/smirarab/ASTRAL commit 0f93f327c49e93d6af057973d68ba772ba5715dc-dirty"
padge
parents:
diff changeset
21 <option value="4">4: three alternative posterior probabilities.</option>
66ebc4b19d6c "planemo upload for repository https://github.com/smirarab/ASTRAL commit 0f93f327c49e93d6af057973d68ba772ba5715dc-dirty"
padge
parents:
diff changeset
22 <option value="8">8: three alternative quartet scores.</option>
66ebc4b19d6c "planemo upload for repository https://github.com/smirarab/ASTRAL commit 0f93f327c49e93d6af057973d68ba772ba5715dc-dirty"
padge
parents:
diff changeset
23 <option value="16">16: export branch annotations to freqQuad.csv with the local posterior probability in the 4th column (see below).</option>
66ebc4b19d6c "planemo upload for repository https://github.com/smirarab/ASTRAL commit 0f93f327c49e93d6af057973d68ba772ba5715dc-dirty"
padge
parents:
diff changeset
24 <option value="32">32: export branch annotations to freqQuad.csv with the normalized quartet score in the 4th column (see below).</option>
66ebc4b19d6c "planemo upload for repository https://github.com/smirarab/ASTRAL commit 0f93f327c49e93d6af057973d68ba772ba5715dc-dirty"
padge
parents:
diff changeset
25 <option value="10">10: p-values of a polytomy null hypothesis test.</option>
66ebc4b19d6c "planemo upload for repository https://github.com/smirarab/ASTRAL commit 0f93f327c49e93d6af057973d68ba772ba5715dc-dirty"
padge
parents:
diff changeset
26 </param>
66ebc4b19d6c "planemo upload for repository https://github.com/smirarab/ASTRAL commit 0f93f327c49e93d6af057973d68ba772ba5715dc-dirty"
padge
parents:
diff changeset
27 <param name="lambda" type="float" optional="true" value="0.5" min="0.0" max="10.0" label="lambda" help="lambda parameter for the Yule prior used in the calculations of
66ebc4b19d6c "planemo upload for repository https://github.com/smirarab/ASTRAL commit 0f93f327c49e93d6af057973d68ba772ba5715dc-dirty"
padge
parents:
diff changeset
28 branch lengths and posterior probabilities. Default: 0.5" multiple="false"/>
66ebc4b19d6c "planemo upload for repository https://github.com/smirarab/ASTRAL commit 0f93f327c49e93d6af057973d68ba772ba5715dc-dirty"
padge
parents:
diff changeset
29 </inputs>
66ebc4b19d6c "planemo upload for repository https://github.com/smirarab/ASTRAL commit 0f93f327c49e93d6af057973d68ba772ba5715dc-dirty"
padge
parents:
diff changeset
<!-- Outputs: "output" receives the tree that the command moves from ./output.tre; "log_output" receives the stderr of the astral call; "branch_annotations" receives freqQuad.csv and is only created for annotation levels 16 and 32, mirroring the conditional mv in the command. -->
30 <outputs>
66ebc4b19d6c "planemo upload for repository https://github.com/smirarab/ASTRAL commit 0f93f327c49e93d6af057973d68ba772ba5715dc-dirty"
padge
parents:
diff changeset
31 <data name="output" format="newick" label="Output tree file"/>
66ebc4b19d6c "planemo upload for repository https://github.com/smirarab/ASTRAL commit 0f93f327c49e93d6af057973d68ba772ba5715dc-dirty"
padge
parents:
diff changeset
32 <data name="log_output" format="txt" label="Astral log."/>
66ebc4b19d6c "planemo upload for repository https://github.com/smirarab/ASTRAL commit 0f93f327c49e93d6af057973d68ba772ba5715dc-dirty"
padge
parents:
diff changeset
33 <data name="branch_annotations" format="tabular" label="Branch annotations file.">
66ebc4b19d6c "planemo upload for repository https://github.com/smirarab/ASTRAL commit 0f93f327c49e93d6af057973d68ba772ba5715dc-dirty"
padge
parents:
diff changeset
34 <filter>branch_annotation_level_selector == '16' or branch_annotation_level_selector == '32'</filter>
66ebc4b19d6c "planemo upload for repository https://github.com/smirarab/ASTRAL commit 0f93f327c49e93d6af057973d68ba772ba5715dc-dirty"
padge
parents:
diff changeset
35 </data>
66ebc4b19d6c "planemo upload for repository https://github.com/smirarab/ASTRAL commit 0f93f327c49e93d6af057973d68ba772ba5715dc-dirty"
padge
parents:
diff changeset
36 </outputs>
66ebc4b19d6c "planemo upload for repository https://github.com/smirarab/ASTRAL commit 0f93f327c49e93d6af057973d68ba772ba5715dc-dirty"
padge
parents:
diff changeset
37 <tests>
66ebc4b19d6c "planemo upload for repository https://github.com/smirarab/ASTRAL commit 0f93f327c49e93d6af057973d68ba772ba5715dc-dirty"
padge
parents:
diff changeset
<!-- Test 1: annotation level 16 with lambda 2 on song_mammals.424.gene.tre. Compares the tree and the exported freqQuad.csv against expected files and checks selected lines of the log. -->
38 <test>
66ebc4b19d6c "planemo upload for repository https://github.com/smirarab/ASTRAL commit 0f93f327c49e93d6af057973d68ba772ba5715dc-dirty"
padge
parents:
diff changeset
39 <param name="input1" value="song_mammals.424.gene.tre"/>
66ebc4b19d6c "planemo upload for repository https://github.com/smirarab/ASTRAL commit 0f93f327c49e93d6af057973d68ba772ba5715dc-dirty"
padge
parents:
diff changeset
40 <param name="branch_annotation_level_selector" value="16" />
66ebc4b19d6c "planemo upload for repository https://github.com/smirarab/ASTRAL commit 0f93f327c49e93d6af057973d68ba772ba5715dc-dirty"
padge
parents:
diff changeset
41 <param name="lambda" value="2" />
66ebc4b19d6c "planemo upload for repository https://github.com/smirarab/ASTRAL commit 0f93f327c49e93d6af057973d68ba772ba5715dc-dirty"
padge
parents:
diff changeset
42 <output name="output" file="song_mammals.tre" ftype="newick"/>
66ebc4b19d6c "planemo upload for repository https://github.com/smirarab/ASTRAL commit 0f93f327c49e93d6af057973d68ba772ba5715dc-dirty"
padge
parents:
diff changeset
43 <output name="log_output">
66ebc4b19d6c "planemo upload for repository https://github.com/smirarab/ASTRAL commit 0f93f327c49e93d6af057973d68ba772ba5715dc-dirty"
padge
parents:
diff changeset
44 <assert_contents>
66ebc4b19d6c "planemo upload for repository https://github.com/smirarab/ASTRAL commit 0f93f327c49e93d6af057973d68ba772ba5715dc-dirty"
padge
parents:
diff changeset
45 <has_line line="Number of taxa: 37 (37 species)" />
66ebc4b19d6c "planemo upload for repository https://github.com/smirarab/ASTRAL commit 0f93f327c49e93d6af057973d68ba772ba5715dc-dirty"
padge
parents:
diff changeset
46 <has_line line="gradient0: 1933" />
66ebc4b19d6c "planemo upload for repository https://github.com/smirarab/ASTRAL commit 0f93f327c49e93d6af057973d68ba772ba5715dc-dirty"
padge
parents:
diff changeset
47 <has_line line="Number of Clusters after addition by distance: 1933" />
66ebc4b19d6c "planemo upload for repository https://github.com/smirarab/ASTRAL commit 0f93f327c49e93d6af057973d68ba772ba5715dc-dirty"
padge
parents:
diff changeset
48 <has_line line="Final quartet score is: 25526915" />
66ebc4b19d6c "planemo upload for repository https://github.com/smirarab/ASTRAL commit 0f93f327c49e93d6af057973d68ba772ba5715dc-dirty"
padge
parents:
diff changeset
49 </assert_contents>
66ebc4b19d6c "planemo upload for repository https://github.com/smirarab/ASTRAL commit 0f93f327c49e93d6af057973d68ba772ba5715dc-dirty"
padge
parents:
diff changeset
50 </output>
66ebc4b19d6c "planemo upload for repository https://github.com/smirarab/ASTRAL commit 0f93f327c49e93d6af057973d68ba772ba5715dc-dirty"
padge
parents:
diff changeset
51 <output name="branch_annotations" file="freqQuad.csv" ftype="tabular"/>
66ebc4b19d6c "planemo upload for repository https://github.com/smirarab/ASTRAL commit 0f93f327c49e93d6af057973d68ba772ba5715dc-dirty"
padge
parents:
diff changeset
52 </test>
66ebc4b19d6c "planemo upload for repository https://github.com/smirarab/ASTRAL commit 0f93f327c49e93d6af057973d68ba772ba5715dc-dirty"
padge
parents:
diff changeset
<!-- Test 2: annotation level 0 with lambda 2 on song_primates.424.gene.tre. Compares the tree against the expected file and checks selected lines of the log; no branch_annotations output is checked at this level. -->
53 <test>
66ebc4b19d6c "planemo upload for repository https://github.com/smirarab/ASTRAL commit 0f93f327c49e93d6af057973d68ba772ba5715dc-dirty"
padge
parents:
diff changeset
54 <param name="input1" value="song_primates.424.gene.tre"/>
66ebc4b19d6c "planemo upload for repository https://github.com/smirarab/ASTRAL commit 0f93f327c49e93d6af057973d68ba772ba5715dc-dirty"
padge
parents:
diff changeset
55 <param name="branch_annotation_level_selector" value="0" />
66ebc4b19d6c "planemo upload for repository https://github.com/smirarab/ASTRAL commit 0f93f327c49e93d6af057973d68ba772ba5715dc-dirty"
padge
parents:
diff changeset
56 <param name="lambda" value="2" />
66ebc4b19d6c "planemo upload for repository https://github.com/smirarab/ASTRAL commit 0f93f327c49e93d6af057973d68ba772ba5715dc-dirty"
padge
parents:
diff changeset
57 <output name="output" file="song_primates.tre" ftype="newick"/>
66ebc4b19d6c "planemo upload for repository https://github.com/smirarab/ASTRAL commit 0f93f327c49e93d6af057973d68ba772ba5715dc-dirty"
padge
parents:
diff changeset
58 <output name="log_output">
66ebc4b19d6c "planemo upload for repository https://github.com/smirarab/ASTRAL commit 0f93f327c49e93d6af057973d68ba772ba5715dc-dirty"
padge
parents:
diff changeset
59 <assert_contents>
66ebc4b19d6c "planemo upload for repository https://github.com/smirarab/ASTRAL commit 0f93f327c49e93d6af057973d68ba772ba5715dc-dirty"
padge
parents:
diff changeset
60 <has_line line="Number of taxa: 14 (14 species)" />
66ebc4b19d6c "planemo upload for repository https://github.com/smirarab/ASTRAL commit 0f93f327c49e93d6af057973d68ba772ba5715dc-dirty"
padge
parents:
diff changeset
61 <has_line line="gradient0: 339" />
66ebc4b19d6c "planemo upload for repository https://github.com/smirarab/ASTRAL commit 0f93f327c49e93d6af057973d68ba772ba5715dc-dirty"
padge
parents:
diff changeset
62 <has_line line="Number of Clusters after addition by distance: 339" />
66ebc4b19d6c "planemo upload for repository https://github.com/smirarab/ASTRAL commit 0f93f327c49e93d6af057973d68ba772ba5715dc-dirty"
padge
parents:
diff changeset
63 <has_line line="Final quartet score is: 389734" />
66ebc4b19d6c "planemo upload for repository https://github.com/smirarab/ASTRAL commit 0f93f327c49e93d6af057973d68ba772ba5715dc-dirty"
padge
parents:
diff changeset
64 </assert_contents>
66ebc4b19d6c "planemo upload for repository https://github.com/smirarab/ASTRAL commit 0f93f327c49e93d6af057973d68ba772ba5715dc-dirty"
padge
parents:
diff changeset
65 </output>
66ebc4b19d6c "planemo upload for repository https://github.com/smirarab/ASTRAL commit 0f93f327c49e93d6af057973d68ba772ba5715dc-dirty"
padge
parents:
diff changeset
66 </test>
66ebc4b19d6c "planemo upload for repository https://github.com/smirarab/ASTRAL commit 0f93f327c49e93d6af057973d68ba772ba5715dc-dirty"
padge
parents:
diff changeset
67 </tests>
66ebc4b19d6c "planemo upload for repository https://github.com/smirarab/ASTRAL commit 0f93f327c49e93d6af057973d68ba772ba5715dc-dirty"
padge
parents:
diff changeset
68 <help><![CDATA[
66ebc4b19d6c "planemo upload for repository https://github.com/smirarab/ASTRAL commit 0f93f327c49e93d6af057973d68ba772ba5715dc-dirty"
padge
parents:
diff changeset
69 Newick annotations
66ebc4b19d6c "planemo upload for repository https://github.com/smirarab/ASTRAL commit 0f93f327c49e93d6af057973d68ba772ba5715dc-dirty"
padge
parents:
diff changeset
70 no annotations (-t 0): This turns off calculation and reporting of posterior probabilities and branch lengths.
66ebc4b19d6c "planemo upload for repository https://github.com/smirarab/ASTRAL commit 0f93f327c49e93d6af057973d68ba772ba5715dc-dirty"
padge
parents:
diff changeset
71 Quartet support (-t 1): The percentage of quartets in your gene trees that agree with a branch (normalized quartet support) gives us a nice way of measuring the amount of gene tree conflict around a branch. Note that the local posterior probabilities are computed based on a transformation of normalized quartet scores (see Figure 2 of Sayyari and Mirarab 2016, doi:10.1093/molbev/msw079).
66ebc4b19d6c "planemo upload for repository https://github.com/smirarab/ASTRAL commit 0f93f327c49e93d6af057973d68ba772ba5715dc-dirty"
padge
parents:
diff changeset
72 Alternative quartet topologies (-t 8): Outputs q1, q2, q3; these three values show quartet support (as defined above) for the main topology (LR|SO), first alternative (RS|LO) and second alternative (RO|LS), respectively.
66ebc4b19d6c "planemo upload for repository https://github.com/smirarab/ASTRAL commit 0f93f327c49e93d6af057973d68ba772ba5715dc-dirty"
padge
parents:
diff changeset
73 Local posterior (-t 3): is the default where we show local posterior probability for the main topology.
66ebc4b19d6c "planemo upload for repository https://github.com/smirarab/ASTRAL commit 0f93f327c49e93d6af057973d68ba772ba5715dc-dirty"
padge
parents:
diff changeset
74 Alternative posteriors (-t 4): The output includes three local posterior probabilities: one for the main topology, and one for each of the two alternatives (RS|LO and RO|LS, in that order). The posterior of the three topologies adds up to 1. This is because of our locality assumption, which basically asserts that we assume the four groups around the branch (L, R, S, and O) are each correct and therefore, there are only three possible alternatives.
66ebc4b19d6c "planemo upload for repository https://github.com/smirarab/ASTRAL commit 0f93f327c49e93d6af057973d68ba772ba5715dc-dirty"
padge
parents:
diff changeset
75 Full annotation (-t 2): When you use this option, for each branch you get a lot of different measurements:
66ebc4b19d6c "planemo upload for repository https://github.com/smirarab/ASTRAL commit 0f93f327c49e93d6af057973d68ba772ba5715dc-dirty"
padge
parents:
diff changeset
76 q1,q2,q3: these three values show quartet support (as defined in the description of -t 1) for the main topology, the first alternative, and the second alternative, respectively.
66ebc4b19d6c "planemo upload for repository https://github.com/smirarab/ASTRAL commit 0f93f327c49e93d6af057973d68ba772ba5715dc-dirty"
padge
parents:
diff changeset
77 f1, f2, f3: these three values show the total number of quartet trees in all the gene trees that support the main topology, the first alternative, and the second alternative, respectively.
66ebc4b19d6c "planemo upload for repository https://github.com/smirarab/ASTRAL commit 0f93f327c49e93d6af057973d68ba772ba5715dc-dirty"
padge
parents:
diff changeset
78 pp1, pp2, pp3: these three show the local posterior probabilities (as defined in the description of -t 4) for the main topology, the first alternative, and the second alternative, respectively.
66ebc4b19d6c "planemo upload for repository https://github.com/smirarab/ASTRAL commit 0f93f327c49e93d6af057973d68ba772ba5715dc-dirty"
padge
parents:
diff changeset
79 QC: this shows the total number of quartets defined around each branch (this is what our paper calls m).
66ebc4b19d6c "planemo upload for repository https://github.com/smirarab/ASTRAL commit 0f93f327c49e93d6af057973d68ba772ba5715dc-dirty"
padge
parents:
diff changeset
80 EN: this is the effective number of genes for the branch. If you don't have any missing data, this would be the number of gene trees in your input. When there are missing data, some gene trees might have nothing to say about a branch. Thus, the effective number of genes might be smaller than the total number of genes.
66ebc4b19d6c "planemo upload for repository https://github.com/smirarab/ASTRAL commit 0f93f327c49e93d6af057973d68ba772ba5715dc-dirty"
padge
parents:
diff changeset
81 Polytomy test (-t 10): runs an experimental test to see if a null hypothesis that the branch is a polytomy could be rejected. See this paper: doi:10.3390/genes9030132.
66ebc4b19d6c "planemo upload for repository https://github.com/smirarab/ASTRAL commit 0f93f327c49e93d6af057973d68ba772ba5715dc-dirty"
padge
parents:
diff changeset
82
66ebc4b19d6c "planemo upload for repository https://github.com/smirarab/ASTRAL commit 0f93f327c49e93d6af057973d68ba772ba5715dc-dirty"
padge
parents:
diff changeset
83 File export of branch annotations
66ebc4b19d6c "planemo upload for repository https://github.com/smirarab/ASTRAL commit 0f93f327c49e93d6af057973d68ba772ba5715dc-dirty"
padge
parents:
diff changeset
84 Since it is often hard to know which branch is L and which branch is R, understanding branch annotations is a bit hard for most users.
66ebc4b19d6c "planemo upload for repository https://github.com/smirarab/ASTRAL commit 0f93f327c49e93d6af057973d68ba772ba5715dc-dirty"
padge
parents:
diff changeset
85 To help, we have added a feature for outputting some of the branch annotations into a .csv file.
66ebc4b19d6c "planemo upload for repository https://github.com/smirarab/ASTRAL commit 0f93f327c49e93d6af057973d68ba772ba5715dc-dirty"
padge
parents:
diff changeset
86 Note that we strongly suggest using DiscoVista to visualize the quartet frequencies. If you find DiscoVista hard to install and use, you can instead use these .csv files.
66ebc4b19d6c "planemo upload for repository https://github.com/smirarab/ASTRAL commit 0f93f327c49e93d6af057973d68ba772ba5715dc-dirty"
padge
parents:
diff changeset
87
66ebc4b19d6c "planemo upload for repository https://github.com/smirarab/ASTRAL commit 0f93f327c49e93d6af057973d68ba772ba5715dc-dirty"
padge
parents:
diff changeset
88 To get the .csv outputs, you can use -t 16 and -t 32.
66ebc4b19d6c "planemo upload for repository https://github.com/smirarab/ASTRAL commit 0f93f327c49e93d6af057973d68ba772ba5715dc-dirty"
padge
parents:
diff changeset
89 .csv output has the following format.
66ebc4b19d6c "planemo upload for repository https://github.com/smirarab/ASTRAL commit 0f93f327c49e93d6af057973d68ba772ba5715dc-dirty"
padge
parents:
diff changeset
90 The output file is always called freqQuad.csv and is written to the same directory as the input file (sorry for the ugliness!)
66ebc4b19d6c "planemo upload for repository https://github.com/smirarab/ASTRAL commit 0f93f327c49e93d6af057973d68ba772ba5715dc-dirty"
padge
parents:
diff changeset
91 The file is tab-delimited.
66ebc4b19d6c "planemo upload for repository https://github.com/smirarab/ASTRAL commit 0f93f327c49e93d6af057973d68ba772ba5715dc-dirty"
padge
parents:
diff changeset
92 1st column: a dummy name for the node. Note that each three lines in a row have the same node number. Around each node, we have three possible unrooted topologies (NNI rearrangements). We show stats for these three rearrangements.
66ebc4b19d6c "planemo upload for repository https://github.com/smirarab/ASTRAL commit 0f93f327c49e93d6af057973d68ba772ba5715dc-dirty"
padge
parents:
diff changeset
93 2nd column: the topology name for which we are giving the scores. Here, t1 is always the main topology (observed in your species tree) and t2 and t3 are the two alternatives.
66ebc4b19d6c "planemo upload for repository https://github.com/smirarab/ASTRAL commit 0f93f327c49e93d6af057973d68ba772ba5715dc-dirty"
padge
parents:
diff changeset
94 3rd column: Gives the actual topology with the format: {A}|{B}#{C}|{D}. This means that the quartet topology being scored is putting groups A and B together on one side, and groups C and D on the other side. Please remember that quartets are unrooted trees. Each of the groups is a comma-separated list of species.
66ebc4b19d6c "planemo upload for repository https://github.com/smirarab/ASTRAL commit 0f93f327c49e93d6af057973d68ba772ba5715dc-dirty"
padge
parents:
diff changeset
95 5th column: number of gene trees that match the topology in this line.
66ebc4b19d6c "planemo upload for repository https://github.com/smirarab/ASTRAL commit 0f93f327c49e93d6af057973d68ba772ba5715dc-dirty"
padge
parents:
diff changeset
96 You will note that this number is not always an integer number. The reason is that in each gene tree, groups A, B, C, and D may not be together. Those gene trees still count as 1 unit, but they can contribute a fraction of that total of 1 to each of the tree topologies. So a gene tree may count as 0.7 for one topology, 0.2 for another, and 0.1 for the third.
66ebc4b19d6c "planemo upload for repository https://github.com/smirarab/ASTRAL commit 0f93f327c49e93d6af057973d68ba772ba5715dc-dirty"
padge
parents:
diff changeset
97 6th column: This is the total number of gene trees that had any useful information about this branch.
66ebc4b19d6c "planemo upload for repository https://github.com/smirarab/ASTRAL commit 0f93f327c49e93d6af057973d68ba772ba5715dc-dirty"
padge
parents:
diff changeset
98 If you have no missing data, this should equal the total number of gene trees.
66ebc4b19d6c "planemo upload for repository https://github.com/smirarab/ASTRAL commit 0f93f327c49e93d6af057973d68ba772ba5715dc-dirty"
padge
parents:
diff changeset
99 If you have missing data, some genes may be missing one of groups A, B, C, or D entirely. Those genes will be agnostic about this branch. This column gives the number of genes that have at least one species from each of A, B, C, and D.
66ebc4b19d6c "planemo upload for repository https://github.com/smirarab/ASTRAL commit 0f93f327c49e93d6af057973d68ba772ba5715dc-dirty"
padge
parents:
diff changeset
100 The 4th column is likely the one you are interested in, and its meaning depends on whether you used -t 16 or -t 32.
66ebc4b19d6c "planemo upload for repository https://github.com/smirarab/ASTRAL commit 0f93f327c49e93d6af057973d68ba772ba5715dc-dirty"
padge
parents:
diff changeset
101 -t 16: This column is the local posterior for the topology given in this line. Note that the local posterior probability is different from the normalized quartet score. See Figure 2 of Sayyari and Mirarab 2016 (doi:10.1093/molbev/msw079).
66ebc4b19d6c "planemo upload for repository https://github.com/smirarab/ASTRAL commit 0f93f327c49e93d6af057973d68ba772ba5715dc-dirty"
padge
parents:
diff changeset
102 -t 32: This column is simply the 5th column divided by the 6th column. Thus, it gives the normalized quartet score for that topology. Note that the three lines with the same node name (1st column) will add up to one in their 4th column.
66ebc4b19d6c "planemo upload for repository https://github.com/smirarab/ASTRAL commit 0f93f327c49e93d6af057973d68ba772ba5715dc-dirty"
padge
parents:
diff changeset
103
66ebc4b19d6c "planemo upload for repository https://github.com/smirarab/ASTRAL commit 0f93f327c49e93d6af057973d68ba772ba5715dc-dirty"
padge
parents:
diff changeset
104 Prior hyper-parameter
66ebc4b19d6c "planemo upload for repository https://github.com/smirarab/ASTRAL commit 0f93f327c49e93d6af057973d68ba772ba5715dc-dirty"
padge
parents:
diff changeset
105 Our calculations of the local posterior probabilities and branch lengths use a Yule prior model for the branch lengths of the species tree.
66ebc4b19d6c "planemo upload for repository https://github.com/smirarab/ASTRAL commit 0f93f327c49e93d6af057973d68ba772ba5715dc-dirty"
padge
parents:
diff changeset
106 The speciation rate (in coalescent units) of the Yule process (lambda) is by default set to 0.5, which results in a flat prior for the quartet frequencies in the [1/3,1] range.
66ebc4b19d6c "planemo upload for repository https://github.com/smirarab/ASTRAL commit 0f93f327c49e93d6af057973d68ba772ba5715dc-dirty"
padge
parents:
diff changeset
107 Using -c option one can adjust the hyper-parameter for the prior.
66ebc4b19d6c "planemo upload for repository https://github.com/smirarab/ASTRAL commit 0f93f327c49e93d6af057973d68ba772ba5715dc-dirty"
padge
parents:
diff changeset
108 For example, you might want to estimate lambda from the data after one run and plug the estimated value in as the prior in a subsequent run.
66ebc4b19d6c "planemo upload for repository https://github.com/smirarab/ASTRAL commit 0f93f327c49e93d6af057973d68ba772ba5715dc-dirty"
padge
parents:
diff changeset
109 We have not yet fully explored the impact of lambda on the posterior.
66ebc4b19d6c "planemo upload for repository https://github.com/smirarab/ASTRAL commit 0f93f327c49e93d6af057973d68ba772ba5715dc-dirty"
padge
parents:
diff changeset
110 For branch lengths, lambda acts as a pseudocount and can have a substantial impact on the estimated branch length for very long branches.
66ebc4b19d6c "planemo upload for repository https://github.com/smirarab/ASTRAL commit 0f93f327c49e93d6af057973d68ba772ba5715dc-dirty"
padge
parents:
diff changeset
111 More specifically, if there is no, or very little discordance around a branch,
66ebc4b19d6c "planemo upload for repository https://github.com/smirarab/ASTRAL commit 0f93f327c49e93d6af057973d68ba772ba5715dc-dirty"
padge
parents:
diff changeset
112 the MAP length of the branch (which is what we report) is almost fully determined by the prior.
66ebc4b19d6c "planemo upload for repository https://github.com/smirarab/ASTRAL commit 0f93f327c49e93d6af057973d68ba772ba5715dc-dirty"
padge
parents:
diff changeset
113
66ebc4b19d6c "planemo upload for repository https://github.com/smirarab/ASTRAL commit 0f93f327c49e93d6af057973d68ba772ba5715dc-dirty"
padge
parents:
diff changeset
114 Note that setting lambda to 0 results in reporting ML estimates of the branch lengths instead of MAP.
66ebc4b19d6c "planemo upload for repository https://github.com/smirarab/ASTRAL commit 0f93f327c49e93d6af057973d68ba772ba5715dc-dirty"
padge
parents:
diff changeset
115 However, for branches with no discordance, we cannot compute a branch length.
66ebc4b19d6c "planemo upload for repository https://github.com/smirarab/ASTRAL commit 0f93f327c49e93d6af057973d68ba772ba5715dc-dirty"
padge
parents:
diff changeset
116 For these, we currently arbitrarily set ML to 10 coalescent units (we might change this in future versions).
66ebc4b19d6c "planemo upload for repository https://github.com/smirarab/ASTRAL commit 0f93f327c49e93d6af057973d68ba772ba5715dc-dirty"
padge
parents:
diff changeset
117
66ebc4b19d6c "planemo upload for repository https://github.com/smirarab/ASTRAL commit 0f93f327c49e93d6af057973d68ba772ba5715dc-dirty"
padge
parents:
diff changeset
118 ]]></help>
66ebc4b19d6c "planemo upload for repository https://github.com/smirarab/ASTRAL commit 0f93f327c49e93d6af057973d68ba772ba5715dc-dirty"
padge
parents:
diff changeset
<!-- Cites the ASTRAL-III publication in place of the unfilled planemo placeholder entry; the repository URL is kept. -->
119 <citations>
66ebc4b19d6c "planemo upload for repository https://github.com/smirarab/ASTRAL commit 0f93f327c49e93d6af057973d68ba772ba5715dc-dirty"
padge
parents:
diff changeset
120 <citation type="bibtex">
66ebc4b19d6c "planemo upload for repository https://github.com/smirarab/ASTRAL commit 0f93f327c49e93d6af057973d68ba772ba5715dc-dirty"
padge
parents:
diff changeset
121 @article{zhang2018astral3,
66ebc4b19d6c "planemo upload for repository https://github.com/smirarab/ASTRAL commit 0f93f327c49e93d6af057973d68ba772ba5715dc-dirty"
padge
parents:
diff changeset
122 author = {Zhang, Chao and Rabiee, Maryam and Sayyari, Erfan and Mirarab, Siavash},
66ebc4b19d6c "planemo upload for repository https://github.com/smirarab/ASTRAL commit 0f93f327c49e93d6af057973d68ba772ba5715dc-dirty"
padge
parents:
diff changeset
123 year = {2018},
66ebc4b19d6c "planemo upload for repository https://github.com/smirarab/ASTRAL commit 0f93f327c49e93d6af057973d68ba772ba5715dc-dirty"
padge
parents:
diff changeset
124 title = {ASTRAL-III: polynomial time species tree reconstruction from partially resolved gene trees},
66ebc4b19d6c "planemo upload for repository https://github.com/smirarab/ASTRAL commit 0f93f327c49e93d6af057973d68ba772ba5715dc-dirty"
padge
parents:
diff changeset
125 doi = {10.1186/s12859-018-2129-y},
66ebc4b19d6c "planemo upload for repository https://github.com/smirarab/ASTRAL commit 0f93f327c49e93d6af057973d68ba772ba5715dc-dirty"
padge
parents:
diff changeset
126 journal = {BMC Bioinformatics},
66ebc4b19d6c "planemo upload for repository https://github.com/smirarab/ASTRAL commit 0f93f327c49e93d6af057973d68ba772ba5715dc-dirty"
padge
parents:
diff changeset
127 url = {https://github.com/smirarab/ASTRAL},
66ebc4b19d6c "planemo upload for repository https://github.com/smirarab/ASTRAL commit 0f93f327c49e93d6af057973d68ba772ba5715dc-dirty"
padge
parents:
diff changeset
128 }</citation>
66ebc4b19d6c "planemo upload for repository https://github.com/smirarab/ASTRAL commit 0f93f327c49e93d6af057973d68ba772ba5715dc-dirty"
padge
parents:
diff changeset
129 </citations>
66ebc4b19d6c "planemo upload for repository https://github.com/smirarab/ASTRAL commit 0f93f327c49e93d6af057973d68ba772ba5715dc-dirty"
padge
parents:
diff changeset
130 </tool>