Mercurial > repos > padge > astral
annotate astral.xml @ 0:66ebc4b19d6c draft default tip
"planemo upload for repository https://github.com/smirarab/ASTRAL commit 0f93f327c49e93d6af057973d68ba772ba5715dc-dirty"
author | padge |
---|---|
date | Wed, 13 Apr 2022 15:03:31 +0000 |
parents | |
children |
rev | line source |
---|---|
0
66ebc4b19d6c
"planemo upload for repository https://github.com/smirarab/ASTRAL commit 0f93f327c49e93d6af057973d68ba772ba5715dc-dirty"
padge
parents:
diff
changeset
|
1 <tool id="astral" name="ASTRAL-III" version="0.1.0" python_template_version="3.5"><description>estimates an unrooted species tree from a set of unrooted gene trees</description> |
66ebc4b19d6c
"planemo upload for repository https://github.com/smirarab/ASTRAL commit 0f93f327c49e93d6af057973d68ba772ba5715dc-dirty"
padge
parents:
diff
changeset
|
2 <requirements> |
66ebc4b19d6c
"planemo upload for repository https://github.com/smirarab/ASTRAL commit 0f93f327c49e93d6af057973d68ba772ba5715dc-dirty"
padge
parents:
diff
changeset
|
3 <requirement type="package" version="5.7.8">astral-tree</requirement> |
66ebc4b19d6c
"planemo upload for repository https://github.com/smirarab/ASTRAL commit 0f93f327c49e93d6af057973d68ba772ba5715dc-dirty"
padge
parents:
diff
changeset
|
4 </requirements> |
66ebc4b19d6c
"planemo upload for repository https://github.com/smirarab/ASTRAL commit 0f93f327c49e93d6af057973d68ba772ba5715dc-dirty"
padge
parents:
diff
changeset
|
5 <command detect_errors="exit_code"><![CDATA[ |
66ebc4b19d6c
"planemo upload for repository https://github.com/smirarab/ASTRAL commit 0f93f327c49e93d6af057973d68ba772ba5715dc-dirty"
padge
parents:
diff
changeset
|
6 astral -i '$input1' -t ${branch_annotation_level_selector} -o ./output.tre #if str($lambda) != ''# -c $lambda #end if# 2> '$log_output' |
66ebc4b19d6c
"planemo upload for repository https://github.com/smirarab/ASTRAL commit 0f93f327c49e93d6af057973d68ba772ba5715dc-dirty"
padge
parents:
diff
changeset
|
7 && |
66ebc4b19d6c
"planemo upload for repository https://github.com/smirarab/ASTRAL commit 0f93f327c49e93d6af057973d68ba772ba5715dc-dirty"
padge
parents:
diff
changeset
|
8 mv ./output.tre '$output' |
66ebc4b19d6c
"planemo upload for repository https://github.com/smirarab/ASTRAL commit 0f93f327c49e93d6af057973d68ba772ba5715dc-dirty"
padge
parents:
diff
changeset
|
9 #if $branch_annotation_level_selector == "16" or $branch_annotation_level_selector == "32" |
66ebc4b19d6c
"planemo upload for repository https://github.com/smirarab/ASTRAL commit 0f93f327c49e93d6af057973d68ba772ba5715dc-dirty"
padge
parents:
diff
changeset
|
10 && |
66ebc4b19d6c
"planemo upload for repository https://github.com/smirarab/ASTRAL commit 0f93f327c49e93d6af057973d68ba772ba5715dc-dirty"
padge
parents:
diff
changeset
|
11 mv freqQuad.csv '$branch_annotations' |
66ebc4b19d6c
"planemo upload for repository https://github.com/smirarab/ASTRAL commit 0f93f327c49e93d6af057973d68ba772ba5715dc-dirty"
padge
parents:
diff
changeset
|
12 #end if |
66ebc4b19d6c
"planemo upload for repository https://github.com/smirarab/ASTRAL commit 0f93f327c49e93d6af057973d68ba772ba5715dc-dirty"
padge
parents:
diff
changeset
|
13 ]]></command> |
66ebc4b19d6c
"planemo upload for repository https://github.com/smirarab/ASTRAL commit 0f93f327c49e93d6af057973d68ba772ba5715dc-dirty"
padge
parents:
diff
changeset
|
14 <inputs> |
66ebc4b19d6c
"planemo upload for repository https://github.com/smirarab/ASTRAL commit 0f93f327c49e93d6af057973d68ba772ba5715dc-dirty"
padge
parents:
diff
changeset
|
15 <param name="input1" type="data" format="newick" multiple="false" label="Tree file" optional="false" /> |
66ebc4b19d6c
"planemo upload for repository https://github.com/smirarab/ASTRAL commit 0f93f327c49e93d6af057973d68ba772ba5715dc-dirty"
padge
parents:
diff
changeset
|
16 <param name="branch_annotation_level_selector" type="select" label="Branch annotation level (-t)" help="Controls how much annotation is added to each branch of the output tree; see the help section below for what each level reports."> |
66ebc4b19d6c
"planemo upload for repository https://github.com/smirarab/ASTRAL commit 0f93f327c49e93d6af057973d68ba772ba5715dc-dirty"
padge
parents:
diff
changeset
|
17 <option value="3">3 (default): only the posterior probability for the main resolution.</option> |
66ebc4b19d6c
"planemo upload for repository https://github.com/smirarab/ASTRAL commit 0f93f327c49e93d6af057973d68ba772ba5715dc-dirty"
padge
parents:
diff
changeset
|
18 <option value="0">0: no annotations.</option> |
66ebc4b19d6c
"planemo upload for repository https://github.com/smirarab/ASTRAL commit 0f93f327c49e93d6af057973d68ba772ba5715dc-dirty"
padge
parents:
diff
changeset
|
19 <option value="1">1: only the quartet support for the main resolution.</option> |
66ebc4b19d6c
"planemo upload for repository https://github.com/smirarab/ASTRAL commit 0f93f327c49e93d6af057973d68ba772ba5715dc-dirty"
padge
parents:
diff
changeset
|
20 <option value="2">2: full annotation.</option> |
66ebc4b19d6c
"planemo upload for repository https://github.com/smirarab/ASTRAL commit 0f93f327c49e93d6af057973d68ba772ba5715dc-dirty"
padge
parents:
diff
changeset
|
21 <option value="4">4: three alternative posterior probabilities.</option> |
66ebc4b19d6c
"planemo upload for repository https://github.com/smirarab/ASTRAL commit 0f93f327c49e93d6af057973d68ba772ba5715dc-dirty"
padge
parents:
diff
changeset
|
22 <option value="8">8: three alternative quartet scores.</option> |
66ebc4b19d6c
"planemo upload for repository https://github.com/smirarab/ASTRAL commit 0f93f327c49e93d6af057973d68ba772ba5715dc-dirty"
padge
parents:
diff
changeset
|
23 <option value="16">16: export branch annotations to freqQuad.csv, with local posterior probabilities in the 4th column (see below).</option> |
66ebc4b19d6c
"planemo upload for repository https://github.com/smirarab/ASTRAL commit 0f93f327c49e93d6af057973d68ba772ba5715dc-dirty"
padge
parents:
diff
changeset
|
24 <option value="32">32: export branch annotations to freqQuad.csv, with normalized quartet scores in the 4th column (see below).</option> |
66ebc4b19d6c
"planemo upload for repository https://github.com/smirarab/ASTRAL commit 0f93f327c49e93d6af057973d68ba772ba5715dc-dirty"
padge
parents:
diff
changeset
|
25 <option value="10">10: p-values of a polytomy null hypothesis test.</option> |
66ebc4b19d6c
"planemo upload for repository https://github.com/smirarab/ASTRAL commit 0f93f327c49e93d6af057973d68ba772ba5715dc-dirty"
padge
parents:
diff
changeset
|
26 </param> |
66ebc4b19d6c
"planemo upload for repository https://github.com/smirarab/ASTRAL commit 0f93f327c49e93d6af057973d68ba772ba5715dc-dirty"
padge
parents:
diff
changeset
|
27 <param name="lambda" type="float" optional="true" value="0.5" min="0.0" max="10.0" label="lambda" help="lambda parameter for the Yule prior used in the calculations of |
66ebc4b19d6c
"planemo upload for repository https://github.com/smirarab/ASTRAL commit 0f93f327c49e93d6af057973d68ba772ba5715dc-dirty"
padge
parents:
diff
changeset
|
28 branch lengths and posterior probabilities. Default: 0.5" multiple="false"/> |
66ebc4b19d6c
"planemo upload for repository https://github.com/smirarab/ASTRAL commit 0f93f327c49e93d6af057973d68ba772ba5715dc-dirty"
padge
parents:
diff
changeset
|
29 </inputs> |
66ebc4b19d6c
"planemo upload for repository https://github.com/smirarab/ASTRAL commit 0f93f327c49e93d6af057973d68ba772ba5715dc-dirty"
padge
parents:
diff
changeset
|
30 <outputs> |
66ebc4b19d6c
"planemo upload for repository https://github.com/smirarab/ASTRAL commit 0f93f327c49e93d6af057973d68ba772ba5715dc-dirty"
padge
parents:
diff
changeset
|
31 <data name="output" format="newick" label="Output tree file"/> |
66ebc4b19d6c
"planemo upload for repository https://github.com/smirarab/ASTRAL commit 0f93f327c49e93d6af057973d68ba772ba5715dc-dirty"
padge
parents:
diff
changeset
|
32 <data name="log_output" format="txt" label="Astral log."/> |
66ebc4b19d6c
"planemo upload for repository https://github.com/smirarab/ASTRAL commit 0f93f327c49e93d6af057973d68ba772ba5715dc-dirty"
padge
parents:
diff
changeset
|
33 <data name="branch_annotations" format="tabular" label="Branch annotations file."> |
66ebc4b19d6c
"planemo upload for repository https://github.com/smirarab/ASTRAL commit 0f93f327c49e93d6af057973d68ba772ba5715dc-dirty"
padge
parents:
diff
changeset
|
34 <filter>branch_annotation_level_selector == '16' or branch_annotation_level_selector == '32'</filter> |
66ebc4b19d6c
"planemo upload for repository https://github.com/smirarab/ASTRAL commit 0f93f327c49e93d6af057973d68ba772ba5715dc-dirty"
padge
parents:
diff
changeset
|
35 </data> |
66ebc4b19d6c
"planemo upload for repository https://github.com/smirarab/ASTRAL commit 0f93f327c49e93d6af057973d68ba772ba5715dc-dirty"
padge
parents:
diff
changeset
|
36 </outputs> |
66ebc4b19d6c
"planemo upload for repository https://github.com/smirarab/ASTRAL commit 0f93f327c49e93d6af057973d68ba772ba5715dc-dirty"
padge
parents:
diff
changeset
|
37 <tests> |
66ebc4b19d6c
"planemo upload for repository https://github.com/smirarab/ASTRAL commit 0f93f327c49e93d6af057973d68ba772ba5715dc-dirty"
padge
parents:
diff
changeset
|
38 <test> |
66ebc4b19d6c
"planemo upload for repository https://github.com/smirarab/ASTRAL commit 0f93f327c49e93d6af057973d68ba772ba5715dc-dirty"
padge
parents:
diff
changeset
|
39 <param name="input1" value="song_mammals.424.gene.tre"/> |
66ebc4b19d6c
"planemo upload for repository https://github.com/smirarab/ASTRAL commit 0f93f327c49e93d6af057973d68ba772ba5715dc-dirty"
padge
parents:
diff
changeset
|
40 <param name="branch_annotation_level_selector" value="16" /> |
66ebc4b19d6c
"planemo upload for repository https://github.com/smirarab/ASTRAL commit 0f93f327c49e93d6af057973d68ba772ba5715dc-dirty"
padge
parents:
diff
changeset
|
41 <param name="lambda" value="2" /> |
66ebc4b19d6c
"planemo upload for repository https://github.com/smirarab/ASTRAL commit 0f93f327c49e93d6af057973d68ba772ba5715dc-dirty"
padge
parents:
diff
changeset
|
42 <output name="output" file="song_mammals.tre" ftype="newick"/> |
66ebc4b19d6c
"planemo upload for repository https://github.com/smirarab/ASTRAL commit 0f93f327c49e93d6af057973d68ba772ba5715dc-dirty"
padge
parents:
diff
changeset
|
43 <output name="log_output"> |
66ebc4b19d6c
"planemo upload for repository https://github.com/smirarab/ASTRAL commit 0f93f327c49e93d6af057973d68ba772ba5715dc-dirty"
padge
parents:
diff
changeset
|
44 <assert_contents> |
66ebc4b19d6c
"planemo upload for repository https://github.com/smirarab/ASTRAL commit 0f93f327c49e93d6af057973d68ba772ba5715dc-dirty"
padge
parents:
diff
changeset
|
45 <has_line line="Number of taxa: 37 (37 species)" /> |
66ebc4b19d6c
"planemo upload for repository https://github.com/smirarab/ASTRAL commit 0f93f327c49e93d6af057973d68ba772ba5715dc-dirty"
padge
parents:
diff
changeset
|
46 <has_line line="gradient0: 1933" /> |
66ebc4b19d6c
"planemo upload for repository https://github.com/smirarab/ASTRAL commit 0f93f327c49e93d6af057973d68ba772ba5715dc-dirty"
padge
parents:
diff
changeset
|
47 <has_line line="Number of Clusters after addition by distance: 1933" /> |
66ebc4b19d6c
"planemo upload for repository https://github.com/smirarab/ASTRAL commit 0f93f327c49e93d6af057973d68ba772ba5715dc-dirty"
padge
parents:
diff
changeset
|
48 <has_line line="Final quartet score is: 25526915" /> |
66ebc4b19d6c
"planemo upload for repository https://github.com/smirarab/ASTRAL commit 0f93f327c49e93d6af057973d68ba772ba5715dc-dirty"
padge
parents:
diff
changeset
|
49 </assert_contents> |
66ebc4b19d6c
"planemo upload for repository https://github.com/smirarab/ASTRAL commit 0f93f327c49e93d6af057973d68ba772ba5715dc-dirty"
padge
parents:
diff
changeset
|
50 </output> |
66ebc4b19d6c
"planemo upload for repository https://github.com/smirarab/ASTRAL commit 0f93f327c49e93d6af057973d68ba772ba5715dc-dirty"
padge
parents:
diff
changeset
|
51 <output name="branch_annotations" file="freqQuad.csv" ftype="tabular"/> |
66ebc4b19d6c
"planemo upload for repository https://github.com/smirarab/ASTRAL commit 0f93f327c49e93d6af057973d68ba772ba5715dc-dirty"
padge
parents:
diff
changeset
|
52 </test> |
66ebc4b19d6c
"planemo upload for repository https://github.com/smirarab/ASTRAL commit 0f93f327c49e93d6af057973d68ba772ba5715dc-dirty"
padge
parents:
diff
changeset
|
53 <test> |
66ebc4b19d6c
"planemo upload for repository https://github.com/smirarab/ASTRAL commit 0f93f327c49e93d6af057973d68ba772ba5715dc-dirty"
padge
parents:
diff
changeset
|
54 <param name="input1" value="song_primates.424.gene.tre"/> |
66ebc4b19d6c
"planemo upload for repository https://github.com/smirarab/ASTRAL commit 0f93f327c49e93d6af057973d68ba772ba5715dc-dirty"
padge
parents:
diff
changeset
|
55 <param name="branch_annotation_level_selector" value="0" /> |
66ebc4b19d6c
"planemo upload for repository https://github.com/smirarab/ASTRAL commit 0f93f327c49e93d6af057973d68ba772ba5715dc-dirty"
padge
parents:
diff
changeset
|
56 <param name="lambda" value="2" /> |
66ebc4b19d6c
"planemo upload for repository https://github.com/smirarab/ASTRAL commit 0f93f327c49e93d6af057973d68ba772ba5715dc-dirty"
padge
parents:
diff
changeset
|
57 <output name="output" file="song_primates.tre" ftype="newick"/> |
66ebc4b19d6c
"planemo upload for repository https://github.com/smirarab/ASTRAL commit 0f93f327c49e93d6af057973d68ba772ba5715dc-dirty"
padge
parents:
diff
changeset
|
58 <output name="log_output"> |
66ebc4b19d6c
"planemo upload for repository https://github.com/smirarab/ASTRAL commit 0f93f327c49e93d6af057973d68ba772ba5715dc-dirty"
padge
parents:
diff
changeset
|
59 <assert_contents> |
66ebc4b19d6c
"planemo upload for repository https://github.com/smirarab/ASTRAL commit 0f93f327c49e93d6af057973d68ba772ba5715dc-dirty"
padge
parents:
diff
changeset
|
60 <has_line line="Number of taxa: 14 (14 species)" /> |
66ebc4b19d6c
"planemo upload for repository https://github.com/smirarab/ASTRAL commit 0f93f327c49e93d6af057973d68ba772ba5715dc-dirty"
padge
parents:
diff
changeset
|
61 <has_line line="gradient0: 339" /> |
66ebc4b19d6c
"planemo upload for repository https://github.com/smirarab/ASTRAL commit 0f93f327c49e93d6af057973d68ba772ba5715dc-dirty"
padge
parents:
diff
changeset
|
62 <has_line line="Number of Clusters after addition by distance: 339" /> |
66ebc4b19d6c
"planemo upload for repository https://github.com/smirarab/ASTRAL commit 0f93f327c49e93d6af057973d68ba772ba5715dc-dirty"
padge
parents:
diff
changeset
|
63 <has_line line="Final quartet score is: 389734" /> |
66ebc4b19d6c
"planemo upload for repository https://github.com/smirarab/ASTRAL commit 0f93f327c49e93d6af057973d68ba772ba5715dc-dirty"
padge
parents:
diff
changeset
|
64 </assert_contents> |
66ebc4b19d6c
"planemo upload for repository https://github.com/smirarab/ASTRAL commit 0f93f327c49e93d6af057973d68ba772ba5715dc-dirty"
padge
parents:
diff
changeset
|
65 </output> |
66ebc4b19d6c
"planemo upload for repository https://github.com/smirarab/ASTRAL commit 0f93f327c49e93d6af057973d68ba772ba5715dc-dirty"
padge
parents:
diff
changeset
|
66 </test> |
66ebc4b19d6c
"planemo upload for repository https://github.com/smirarab/ASTRAL commit 0f93f327c49e93d6af057973d68ba772ba5715dc-dirty"
padge
parents:
diff
changeset
|
67 </tests> |
66ebc4b19d6c
"planemo upload for repository https://github.com/smirarab/ASTRAL commit 0f93f327c49e93d6af057973d68ba772ba5715dc-dirty"
padge
parents:
diff
changeset
|
68 <help><![CDATA[ |
66ebc4b19d6c
"planemo upload for repository https://github.com/smirarab/ASTRAL commit 0f93f327c49e93d6af057973d68ba772ba5715dc-dirty"
padge
parents:
diff
changeset
|
69 Newick annotations |
66ebc4b19d6c
"planemo upload for repository https://github.com/smirarab/ASTRAL commit 0f93f327c49e93d6af057973d68ba772ba5715dc-dirty"
padge
parents:
diff
changeset
|
70 no annotations (-t 0): This turns off calculation and reporting of posterior probabilities and branch lengths. |
66ebc4b19d6c
"planemo upload for repository https://github.com/smirarab/ASTRAL commit 0f93f327c49e93d6af057973d68ba772ba5715dc-dirty"
padge
parents:
diff
changeset
|
71 Quartet support (-t 1): The percentage of quartets in your gene trees that agree with a branch (normalized quartet support) gives us a nice way of measuring the amount of gene tree conflict around a branch. Note that the local posterior probabilities are computed based on a transformation of normalized quartet scores (see Figure 2 of this paper). |
66ebc4b19d6c
"planemo upload for repository https://github.com/smirarab/ASTRAL commit 0f93f327c49e93d6af057973d68ba772ba5715dc-dirty"
padge
parents:
diff
changeset
|
72 Alternative quartet topologies (-t 8): Outputs q1, q2, q3; these three values show quartet support (as defined above) for the main topology (LR|SO), first alternative (RS|LO) and second alternative (RO|LS), respectively. |
66ebc4b19d6c
"planemo upload for repository https://github.com/smirarab/ASTRAL commit 0f93f327c49e93d6af057973d68ba772ba5715dc-dirty"
padge
parents:
diff
changeset
|
73 Local posterior (-t 3): is the default where we show local posterior probability for the main topology. |
66ebc4b19d6c
"planemo upload for repository https://github.com/smirarab/ASTRAL commit 0f93f327c49e93d6af057973d68ba772ba5715dc-dirty"
padge
parents:
diff
changeset
|
74 Alternative posteriors (-t 4): The output includes three local posterior probabilities: one for the main topology, and one for each of the two alternatives (RS|LO and RO|LS, in that order). The posterior of the three topologies adds up to 1. This is because of our locality assumption, which basically asserts that we assume the four groups around the branch (L, R, S, and O) are each correct and therefore, there are only three possible alternatives. |
66ebc4b19d6c
"planemo upload for repository https://github.com/smirarab/ASTRAL commit 0f93f327c49e93d6af057973d68ba772ba5715dc-dirty"
padge
parents:
diff
changeset
|
75 Full annotation (-t 2): When you use this option, for each branch you get a lot of different measurements: |
66ebc4b19d6c
"planemo upload for repository https://github.com/smirarab/ASTRAL commit 0f93f327c49e93d6af057973d68ba772ba5715dc-dirty"
padge
parents:
diff
changeset
|
76 q1,q2,q3: these three values show quartet support (as defined in the description of -t 1) for the main topology, the first alternative, and the second alternative, respectively. |
66ebc4b19d6c
"planemo upload for repository https://github.com/smirarab/ASTRAL commit 0f93f327c49e93d6af057973d68ba772ba5715dc-dirty"
padge
parents:
diff
changeset
|
77 f1, f2, f3: these three values show the total number of quartet trees in all the gene trees that support the main topology, the first alternative, and the second alternative, respectively. |
66ebc4b19d6c
"planemo upload for repository https://github.com/smirarab/ASTRAL commit 0f93f327c49e93d6af057973d68ba772ba5715dc-dirty"
padge
parents:
diff
changeset
|
78 pp1, pp2, pp3: these three show the local posterior probabilities (as defined in the description of -t 4) for the main topology, the first alternative, and the second alternative, respectively. |
66ebc4b19d6c
"planemo upload for repository https://github.com/smirarab/ASTRAL commit 0f93f327c49e93d6af057973d68ba772ba5715dc-dirty"
padge
parents:
diff
changeset
|
79 QC: this shows the total number of quartets defined around each branch (this is what our paper calls m). |
66ebc4b19d6c
"planemo upload for repository https://github.com/smirarab/ASTRAL commit 0f93f327c49e93d6af057973d68ba772ba5715dc-dirty"
padge
parents:
diff
changeset
|
80 EN: this is the effective number of genes for the branch. If you don't have any missing data, this would be the number of gene trees in your input. When there are missing data, some gene trees might have nothing to say about a branch. Thus, the effective number of genes might be smaller than the total number of genes. |
66ebc4b19d6c
"planemo upload for repository https://github.com/smirarab/ASTRAL commit 0f93f327c49e93d6af057973d68ba772ba5715dc-dirty"
padge
parents:
diff
changeset
|
81 Polytomy test (-t 10): runs an experimental test to see if a null hypothesis that the branch is a polytomy could be rejected. See this paper: doi:10.3390/genes9030132. |
66ebc4b19d6c
"planemo upload for repository https://github.com/smirarab/ASTRAL commit 0f93f327c49e93d6af057973d68ba772ba5715dc-dirty"
padge
parents:
diff
changeset
|
82 |
66ebc4b19d6c
"planemo upload for repository https://github.com/smirarab/ASTRAL commit 0f93f327c49e93d6af057973d68ba772ba5715dc-dirty"
padge
parents:
diff
changeset
|
83 File export of branch annotations |
66ebc4b19d6c
"planemo upload for repository https://github.com/smirarab/ASTRAL commit 0f93f327c49e93d6af057973d68ba772ba5715dc-dirty"
padge
parents:
diff
changeset
|
84 Since it is often hard to know which branch is L and which branch is R, understanding branch annotations is a bit hard for most users. |
66ebc4b19d6c
"planemo upload for repository https://github.com/smirarab/ASTRAL commit 0f93f327c49e93d6af057973d68ba772ba5715dc-dirty"
padge
parents:
diff
changeset
|
85 To help, we have added a feature for outputting some of the branch annotations into a .csv file. |
66ebc4b19d6c
"planemo upload for repository https://github.com/smirarab/ASTRAL commit 0f93f327c49e93d6af057973d68ba772ba5715dc-dirty"
padge
parents:
diff
changeset
|
86 Note that we strongly suggest using DiscoVista to visualize the quartet frequencies. If you find DiscoVista hard to install and use, you can instead use these .csv files. |
66ebc4b19d6c
"planemo upload for repository https://github.com/smirarab/ASTRAL commit 0f93f327c49e93d6af057973d68ba772ba5715dc-dirty"
padge
parents:
diff
changeset
|
87 |
66ebc4b19d6c
"planemo upload for repository https://github.com/smirarab/ASTRAL commit 0f93f327c49e93d6af057973d68ba772ba5715dc-dirty"
padge
parents:
diff
changeset
|
88 To get the .csv outputs, you can use -t 16 and -t 32. |
66ebc4b19d6c
"planemo upload for repository https://github.com/smirarab/ASTRAL commit 0f93f327c49e93d6af057973d68ba772ba5715dc-dirty"
padge
parents:
diff
changeset
|
89 .csv output has the following format. |
66ebc4b19d6c
"planemo upload for repository https://github.com/smirarab/ASTRAL commit 0f93f327c49e93d6af057973d68ba772ba5715dc-dirty"
padge
parents:
diff
changeset
|
90 The output file is always called freqQuad.csv and is written to the same directory as the input file (sorry for the ugliness!) |
66ebc4b19d6c
"planemo upload for repository https://github.com/smirarab/ASTRAL commit 0f93f327c49e93d6af057973d68ba772ba5715dc-dirty"
padge
parents:
diff
changeset
|
91 The file is tab-delimited. |
66ebc4b19d6c
"planemo upload for repository https://github.com/smirarab/ASTRAL commit 0f93f327c49e93d6af057973d68ba772ba5715dc-dirty"
padge
parents:
diff
changeset
|
92 1st column: a dummy name for the node. Note that each three lines in a row have the same node number. Around each node, we have three possible unrooted topologies (NNI rearrangements). We show stats for these three rearrangements. |
66ebc4b19d6c
"planemo upload for repository https://github.com/smirarab/ASTRAL commit 0f93f327c49e93d6af057973d68ba772ba5715dc-dirty"
padge
parents:
diff
changeset
|
93 2nd column: the topology name for which we are giving the scores. Here, t1 is always the main topology (observed in your species tree) and t2 and t3 are the two alternatives. |
66ebc4b19d6c
"planemo upload for repository https://github.com/smirarab/ASTRAL commit 0f93f327c49e93d6af057973d68ba772ba5715dc-dirty"
padge
parents:
diff
changeset
|
94 3rd column: Gives the actual topology with the format: {A}|{B}#{C}|{D}. This means that the quartet topology being scored is putting groups A and B together on one side, and groups C and D on the other side. Please remember that quartets are unrooted trees. Each of the groups is a comma-separated list of species. |
66ebc4b19d6c
"planemo upload for repository https://github.com/smirarab/ASTRAL commit 0f93f327c49e93d6af057973d68ba772ba5715dc-dirty"
padge
parents:
diff
changeset
|
95 5th column: number of gene trees that match the topology in this line. |
66ebc4b19d6c
"planemo upload for repository https://github.com/smirarab/ASTRAL commit 0f93f327c49e93d6af057973d68ba772ba5715dc-dirty"
padge
parents:
diff
changeset
|
96 You will note that this number is not always an integer number. The reason is that in each gene tree, groups A, B, C, and D may not be together. Those gene trees still count as 1 unit, but they can contribute a fraction of that total of 1 to each of the tree topologies. So a gene tree may count as 0.7 for one topology, 0.2 for another, and 0.1 for the third. |
66ebc4b19d6c
"planemo upload for repository https://github.com/smirarab/ASTRAL commit 0f93f327c49e93d6af057973d68ba772ba5715dc-dirty"
padge
parents:
diff
changeset
|
97 6th column: This is the total number of gene trees that had any useful information about this branch. |
66ebc4b19d6c
"planemo upload for repository https://github.com/smirarab/ASTRAL commit 0f93f327c49e93d6af057973d68ba772ba5715dc-dirty"
padge
parents:
diff
changeset
|
98 If you have no missing data, this should equal the total number of gene trees. |
66ebc4b19d6c
"planemo upload for repository https://github.com/smirarab/ASTRAL commit 0f93f327c49e93d6af057973d68ba772ba5715dc-dirty"
padge
parents:
diff
changeset
|
99 If you have missing data, some genes may be missing one of groups A, B, C, or D entirely. Those genes will be agnostic about this branch. This column gives the number of genes that have at least one species from each of A, B, C, and D. |
66ebc4b19d6c
"planemo upload for repository https://github.com/smirarab/ASTRAL commit 0f93f327c49e93d6af057973d68ba772ba5715dc-dirty"
padge
parents:
diff
changeset
|
100 The 4th column is likely the one you are interested in, and its content depends on whether you used -t 16 or -t 32. |
66ebc4b19d6c
"planemo upload for repository https://github.com/smirarab/ASTRAL commit 0f93f327c49e93d6af057973d68ba772ba5715dc-dirty"
padge
parents:
diff
changeset
|
101 -t 16: This column is the local posterior for the topology given in this line. Note that the local posterior probability is different from normalized quartet score. See Figure 2 of this paper. |
66ebc4b19d6c
"planemo upload for repository https://github.com/smirarab/ASTRAL commit 0f93f327c49e93d6af057973d68ba772ba5715dc-dirty"
padge
parents:
diff
changeset
|
102 -t 32: This column is simply the 5th column divided by the 6th column. Thus, it gives the normalized quartet score for that topology. Note that the three lines with the same node name (1st column) will add up to one in their 4th column. |
66ebc4b19d6c
"planemo upload for repository https://github.com/smirarab/ASTRAL commit 0f93f327c49e93d6af057973d68ba772ba5715dc-dirty"
padge
parents:
diff
changeset
|
103 |
66ebc4b19d6c
"planemo upload for repository https://github.com/smirarab/ASTRAL commit 0f93f327c49e93d6af057973d68ba772ba5715dc-dirty"
padge
parents:
diff
changeset
|
104 Prior hyper-parameter |
66ebc4b19d6c
"planemo upload for repository https://github.com/smirarab/ASTRAL commit 0f93f327c49e93d6af057973d68ba772ba5715dc-dirty"
padge
parents:
diff
changeset
|
105 Our calculations of the local posterior probabilities and branch lengths use a Yule prior model for the branch lengths of the species tree. |
66ebc4b19d6c
"planemo upload for repository https://github.com/smirarab/ASTRAL commit 0f93f327c49e93d6af057973d68ba772ba5715dc-dirty"
padge
parents:
diff
changeset
|
106 The speciation rate (in coalescent units) of the Yule process (lambda) is by default set to 0.5, which results in a flat prior for the quartet frequencies in the [1/3,1] range. |
66ebc4b19d6c
"planemo upload for repository https://github.com/smirarab/ASTRAL commit 0f93f327c49e93d6af057973d68ba772ba5715dc-dirty"
padge
parents:
diff
changeset
|
107 Using -c option one can adjust the hyper-parameter for the prior. |
66ebc4b19d6c
"planemo upload for repository https://github.com/smirarab/ASTRAL commit 0f93f327c49e93d6af057973d68ba772ba5715dc-dirty"
padge
parents:
diff
changeset
|
108 For example, you might want to estimate lambda from the data after one run and plug the estimated prior into a subsequent run. |
66ebc4b19d6c
"planemo upload for repository https://github.com/smirarab/ASTRAL commit 0f93f327c49e93d6af057973d68ba772ba5715dc-dirty"
padge
parents:
diff
changeset
|
109 We have not yet fully explored the impact of lambda on the posterior. |
66ebc4b19d6c
"planemo upload for repository https://github.com/smirarab/ASTRAL commit 0f93f327c49e93d6af057973d68ba772ba5715dc-dirty"
padge
parents:
diff
changeset
|
110 For branch lengths, lambda acts as a pseudocount and can have a substantial impact on the estimated branch length for very long branches. |
66ebc4b19d6c
"planemo upload for repository https://github.com/smirarab/ASTRAL commit 0f93f327c49e93d6af057973d68ba772ba5715dc-dirty"
padge
parents:
diff
changeset
|
111 More specifically, if there is no, or very little discordance around a branch, |
66ebc4b19d6c
"planemo upload for repository https://github.com/smirarab/ASTRAL commit 0f93f327c49e93d6af057973d68ba772ba5715dc-dirty"
padge
parents:
diff
changeset
|
112 the MAP length of the branch (which is what we report) is almost fully determined by the prior. |
66ebc4b19d6c
"planemo upload for repository https://github.com/smirarab/ASTRAL commit 0f93f327c49e93d6af057973d68ba772ba5715dc-dirty"
padge
parents:
diff
changeset
|
113 |
66ebc4b19d6c
"planemo upload for repository https://github.com/smirarab/ASTRAL commit 0f93f327c49e93d6af057973d68ba772ba5715dc-dirty"
padge
parents:
diff
changeset
|
114 Note that setting lambda to 0 results in reporting ML estimates of the branch lengths instead of MAP. |
66ebc4b19d6c
"planemo upload for repository https://github.com/smirarab/ASTRAL commit 0f93f327c49e93d6af057973d68ba772ba5715dc-dirty"
padge
parents:
diff
changeset
|
115 However, for branches with no discordance, we cannot compute a branch length. |
66ebc4b19d6c
"planemo upload for repository https://github.com/smirarab/ASTRAL commit 0f93f327c49e93d6af057973d68ba772ba5715dc-dirty"
padge
parents:
diff
changeset
|
116 For these, we currently arbitrarily set ML to 10 coalescent units (we might change this in future versions). |
66ebc4b19d6c
"planemo upload for repository https://github.com/smirarab/ASTRAL commit 0f93f327c49e93d6af057973d68ba772ba5715dc-dirty"
padge
parents:
diff
changeset
|
117 |
66ebc4b19d6c
"planemo upload for repository https://github.com/smirarab/ASTRAL commit 0f93f327c49e93d6af057973d68ba772ba5715dc-dirty"
padge
parents:
diff
changeset
|
118 ]]></help> |
66ebc4b19d6c
"planemo upload for repository https://github.com/smirarab/ASTRAL commit 0f93f327c49e93d6af057973d68ba772ba5715dc-dirty"
padge
parents:
diff
changeset
|
119 <citations> |
66ebc4b19d6c
"planemo upload for repository https://github.com/smirarab/ASTRAL commit 0f93f327c49e93d6af057973d68ba772ba5715dc-dirty"
padge
parents:
diff
changeset
|
120 <citation type="bibtex"> |
66ebc4b19d6c
"planemo upload for repository https://github.com/smirarab/ASTRAL commit 0f93f327c49e93d6af057973d68ba772ba5715dc-dirty"
padge
parents:
diff
changeset
|
121 @misc{githubASTRAL, |
66ebc4b19d6c
"planemo upload for repository https://github.com/smirarab/ASTRAL commit 0f93f327c49e93d6af057973d68ba772ba5715dc-dirty"
padge
parents:
diff
changeset
|
122 author = {Zhang, Chao and Rabiee, Maryam and Sayyari, Erfan and Mirarab, Siavash}, |
66ebc4b19d6c
"planemo upload for repository https://github.com/smirarab/ASTRAL commit 0f93f327c49e93d6af057973d68ba772ba5715dc-dirty"
padge
parents:
diff
changeset
|
123 year = {2018}, |
66ebc4b19d6c
"planemo upload for repository https://github.com/smirarab/ASTRAL commit 0f93f327c49e93d6af057973d68ba772ba5715dc-dirty"
padge
parents:
diff
changeset
|
124 title = {ASTRAL}, |
66ebc4b19d6c
"planemo upload for repository https://github.com/smirarab/ASTRAL commit 0f93f327c49e93d6af057973d68ba772ba5715dc-dirty"
padge
parents:
diff
changeset
|
125 publisher = {GitHub}, |
66ebc4b19d6c
"planemo upload for repository https://github.com/smirarab/ASTRAL commit 0f93f327c49e93d6af057973d68ba772ba5715dc-dirty"
padge
parents:
diff
changeset
|
126 journal = {GitHub repository}, |
66ebc4b19d6c
"planemo upload for repository https://github.com/smirarab/ASTRAL commit 0f93f327c49e93d6af057973d68ba772ba5715dc-dirty"
padge
parents:
diff
changeset
|
127 url = {https://github.com/smirarab/ASTRAL}, |
66ebc4b19d6c
"planemo upload for repository https://github.com/smirarab/ASTRAL commit 0f93f327c49e93d6af057973d68ba772ba5715dc-dirty"
padge
parents:
diff
changeset
|
128 }</citation> |
66ebc4b19d6c
"planemo upload for repository https://github.com/smirarab/ASTRAL commit 0f93f327c49e93d6af057973d68ba772ba5715dc-dirty"
padge
parents:
diff
changeset
|
129 </citations> |
66ebc4b19d6c
"planemo upload for repository https://github.com/smirarab/ASTRAL commit 0f93f327c49e93d6af057973d68ba772ba5715dc-dirty"
padge
parents:
diff
changeset
|
130 </tool> |