Repository 'augustus'
hg clone https://toolshed.g2.bx.psu.edu/repos/bgruening/augustus

Changeset 4:4de31938431b (2017-10-20)
Previous changeset 3:f5075dee9d6b (2015-05-22) Next changeset 5:b3f5d0879dab (2019-05-23)
Commit message:
planemo upload for repository https://github.com/galaxyproject/tools-iuc/tree/master/tools/augustus commit 2896dcfd180800d00ea413a59264ef8b11788b8e
modified:
augustus.xml
extract_features.py
test-data/human_augustus_protein_codingseq_introns_cds_codingseq.fasta
test-data/human_augustus_protein_codingseq_introns_cds_main.gtf
test-data/human_augustus_protein_codingseq_introns_cds_protein.fasta
test-data/human_augustus_utr-on.gff
test-data/human_augustus_utr-on.gtf
added:
macros.xml
test-data/annot.gff3
removed:
readme.rst
tool_dependencies.xml
b
diff -r f5075dee9d6b -r 4de31938431b augustus.xml
--- a/augustus.xml Fri May 22 04:55:25 2015 -0400
+++ b/augustus.xml Fri Oct 20 03:48:57 2017 -0400
[
b'@@ -1,17 +1,24 @@\n-<tool id="augustus" name="Augustus" version="3.1.0">\n-    <description>gene prediction for eukaryotic genomes</description>\n-    <parallelism method="multi" split_inputs="input_genome" split_mode="to_size" split_size="10" merge_outputs="output,protein_output,codingseq_output"></parallelism>\n-    <requirements>\n-        <requirement type="package" version="3.1">augustus</requirement>\n-    </requirements>\n-    <stdio>\n-        <exit_code range="1:" />\n-        <exit_code range=":-1" />\n-        <regex match="Error:" />\n-        <regex match="Exception:" />\n-    </stdio>\n-    <command>\n+<tool id="augustus" name="Augustus" profile="16.04" version="@VERSION@">\n+    <description>gene prediction for prokaryotic and eukaryotic genomes</description>\n+    <macros>\n+        <import>macros.xml</import>\n+    </macros>\n+    <expand macro="requirements"/>\n+    <command detect_errors="aggressive">\n <![CDATA[\n+        #if $model.augustus_mode == \'history\'\n+\n+            ## Using an augustus model from history, we need to unzip it and let augustus find it\n+\n+            cp -r "\\$AUGUSTUS_CONFIG_PATH/" augustus_dir/ &&\n+\n+            mkdir -p \'augustus_dir/species/\' &&\n+\n+            tar -C \'augustus_dir/species/\' -xzvf \'${model.custom_model}\' > /dev/null &&\n+\n+            export AUGUSTUS_CONFIG_PATH=`pwd`/augustus_dir/ &&\n+        #end if\n+\n         ## Augustus writes the protein and coding sequences as comment into the gff/gtf file an external\n         ## script is used to extract the sequences into additional files\n \n@@ -61,9 +68,15 @@\n             $input_genome\n             $utr\n             --genemodel=$genemodel\n-            --species=$organism\n+\n \n-        | tee $output\n+            #if $model.augustus_mode == \'history\'\n+                --species=local\n+            #else\n+                --species=$model.organism\n+            #end if\n+\n+        | tee \'$output\'\n         #if \'protein\' in str($outputs).split(\',\') or \'codingseq\' in str($outputs).split(\',\'):\n             | python $__tool_directory__/extract_features.py\n                 #if \'protein\' in str($outputs).split(\',\'):\n@@ -78,126 +91,139 @@\n     <inputs>\n         <param name="input_genome" type="data" format="fasta" label="Genome Sequence"/>\n         <param name="noInFrameStop" argument="--noInFrameStop" type="boolean"\n-            label="Don\'t report transcripts with in-frame stop codons (--noInFrameStop)"\n+            label="Don\'t report transcripts with in-frame stop codons"\n             truevalue="--noInFrameStop=true" falsevalue="--noInFrameStop=false" checked="false"\n-            help="Otherwise, intron-spanning stop codons could occur. (--noInFrameStop)" />\n+            help="Otherwise, intron-spanning stop codons could occur." />\n         <param name="singlestrand" type="boolean" argument="--singlestrand"\n             label="Predict genes independently on each strand"\n-            help="This allows overlapping genes on opposite strands. (--singlestrand)"\n+            help="This allows overlapping genes on opposite strands."\n             truevalue="--singlestrand=true" falsevalue="--singlestrand=false" checked="false" />\n \n         <param name="utr" type="boolean" argument="--UTR"\n             label="Predict the untranslated regions in addition to the coding sequence"\n             truevalue="--UTR=on" falsevalue="--UTR=off" checked="false"\n-            help="This currently works only for human, galdieria, toxoplasma and caenorhabditis. (--UTR)" />\n+            help="This currently works only for human, galdieria, toxoplasma and caenorhabditis." />\n+\n \n-        <param name="organism" label="Model Organism" type="select" multiple="false" format="text" help="Choose a specialised trainingset.">\n-            <option value="human">Homo sapiens</option>\n-            <option value="fly">Drosophila melanogaster</option>\n-            <option value="arabidopsis">Arabidopsis thaliana</option>\n-            <option value="brugia ">Brugia malayi</option>\n-            <opti'..b' name="genemodel" label="Gene Model" type="select"\n-            help="Gene Model to predict, for more information please refere to the help. (--genemodel)">\n+            help="Gene Model to predict, for more information please refere to the help.">\n             <option value="complete">complete</option>\n             <option value="partial">partial</option>\n             <option value="intronless">intronless</option>\n@@ -206,7 +232,7 @@\n         </param>\n \n         <param name="gff" type="boolean" label="GFF formated output"\n-            help="Standard output is GTF. (--gff3)"\n+            help="Standard output is GTF."\n             truevalue="--gff3=on" falsevalue="--gff3=off" checked="false" />\n \n         <param name="outputs" type="select" display="checkboxes" multiple="True" label="Output options">\n@@ -216,10 +242,7 @@\n             <option value="start">predicted start codons (--start)</option>\n             <option value="stop">predicted stop codons (--stop)</option>\n             <option value="cds" selected="true">CDS region (--cds)</option>\n-\n-            <validator type="no_options" message="Please select at least one output file." />\n         </param>\n-\n     </inputs>\n     <outputs>\n         <data format="gtf" name="output" label="${tool.name} on ${on_string}: GTF/GFF">\n@@ -262,37 +285,47 @@\n \n **What it does**\n \n-AUGUSTUS is a gene prediction program for eukaryotes written by Mario Stanke and Oliver Keller.\n+AUGUSTUS is a gene prediction program for prokaryotes and eukaryotes written by Mario Stanke and Oliver Keller.\n It can be used as an ab initio program, which means it bases its prediction purely on the\n sequence. AUGUSTUS may also incorporate hints on the gene structure coming from extrinsic sources\n such as EST, MS/MS, protein alignments and synthenic genomic alignments.\n \n------\n+\n+**Input**\n+\n+Input data for the gene prediction tool Augustus is a FASTA file with a genomic nucleotide sequence.\n+\n+\n+**Output**\n+\n+Augustus produces three output files: a FASTA file with predicted coding sequences, a FASTA file with predicted protein sequences and a gtf/GFF output file if selected.\n+\n \n **Parameters**\n \n-Gene Model::\n+Gene Model:\n \n-    partial      : allow prediction of incomplete genes at the sequence boundaries (default)\n-    intronless   : only predict single-exon genes like in prokaryotes and some eukaryotes\n-    complete     : only predict complete genes\n-    atleastone   : predict at least one complete gene\n-    exactlyone   : predict exactly one complete gene\n+partial:    allow prediction of incomplete genes at the sequence boundaries (default)\n+intronless: only predict single-exon genes like in prokaryotes and some eukaryotes\n+complete:   only predict complete genes\n+atleastone: predict at least one complete gene\n+exactlyone: predict exactly one complete gene\n \n \n \n **Example**\n \n-Suppose you have the following DNA formatted sequences::\n+Suppose you have the following DNA FASTA sequence:\n \n-    >Seq1\n-    cccgcggagcgggtaccacatcgctgcgcgatgtgcgagcgaacacccgggctgcgcccg\n-    ggtgttgcgctcccgctccgcgggagcgctggcgggacgctgcgcgtcccgctcaccaag\n-    cccgcttcgcgggcttggtgacgctccgtccgctgcgcttccggagttgcggggcttcgc\n-    cccgctaaccctgggcctcgcttcgctccgccttgggcctgcggcgggtccgctgcgctc\n-    ccccgcctcaagggcccttccggctgcgcctccaggacccaaccgcttgcgcgggcctgg\n+>Seq1\n+cccgcggagcgggtaccacatcgctgcgcgatgtgcgagcgaacacccgggctgcgcccg\n+ggtgttgcgctcccgctccgcgggagcgctggcgggacgctgcgcgtcccgctcaccaag\n+cccgcttcgcgggcttggtgacgctccgtccgctgcgcttccggagttgcggggcttcgc\n+cccgctaaccctgggcctcgcttcgctccgccttgggcctgcggcgggtccgctgcgctc\n+ccccgcctcaagggcccttccggctgcgcctccaggacccaaccgcttgcgcgggcctgg\n \n-Running this tool will produce this::\n+\n+Running this tool will produce this:\n \n     # ----- prediction on sequence number 1 (length = 1992969, name = scaffold1|size1992969) -----\n     #\n@@ -319,7 +352,5 @@\n \n ]]>\n     </help>\n-    <citations>\n-        <citation type="doi">10.1093/bioinformatics/btg1080</citation>\n-    </citations>\n+    <expand macro="citations"/>\n </tool>\n'
b
diff -r f5075dee9d6b -r 4de31938431b extract_features.py
--- a/extract_features.py Fri May 22 04:55:25 2015 -0400
+++ b/extract_features.py Fri Oct 20 03:48:57 2017 -0400
[
@@ -1,10 +1,10 @@
 #!/usr/bin/env python
 
-import os
+import argparse
 import sys
-import argparse
 import textwrap
 
+
 def main( args ):
     """
     Extract the protein and coding section from an augustus gff, gtf file
@@ -45,6 +45,22 @@
             if line.startswith('start gene'):
                 gene_name = line[11:].strip()
 
+            if protein_seq:
+                if line.endswith(']'):
+                    protein_seq += line[:-1]
+                    po.write( '>%s\n%s\n' % (gene_name, '\n'.join( textwrap.wrap( protein_seq, 80 ) ) ) )
+                    protein_seq = ''
+                else:
+                    protein_seq += line
+
+            if coding_seq:
+                if line.endswith(']'):
+                    coding_seq += line[:-1]
+                    co.write( '>%s\n%s\n' % (gene_name, '\n'.join( textwrap.wrap( coding_seq, 80 ) ) ) )
+                    coding_seq = ''
+                else:
+                    coding_seq += line
+
             if args.protein and line.startswith('protein sequence = ['):
                 if line.endswith(']'):
                     protein_seq = line[20:-1]
@@ -63,26 +79,12 @@
                     line = line[19:]
                     coding_seq = line
 
-            if protein_seq:
-                if line.endswith(']'):
-                    protein_seq += line[:-1]
-                    po.write( '>%s\n%s\n' % (gene_name, '\n'.join( textwrap.wrap( protein_seq, 80 ) ) ) )
-                    protein_seq = ''
-                else:
-                    protein_seq += line
-
-            if coding_seq:
-                if line.endswith(']'):
-                    coding_seq += line[:-1]
-                    co.write( '>%s\n%s\n' % (gene_name, '\n'.join( textwrap.wrap( coding_seq, 80 ) ) ) )
-                    coding_seq = ''
-                else:
-                    coding_seq += line
     if args.codingseq:
         co.close()
     if args.protein:
         po.close()
 
+
 if __name__ == '__main__':
     parser = argparse.ArgumentParser()
     parser.add_argument('-p', '--protein', help='Path to the protein file.')
@@ -90,4 +92,3 @@
 
     args = parser.parse_args()
     main( args )
-
b
diff -r f5075dee9d6b -r 4de31938431b macros.xml
--- /dev/null Thu Jan 01 00:00:00 1970 +0000
+++ b/macros.xml Fri Oct 20 03:48:57 2017 -0400
b
@@ -0,0 +1,20 @@
+<?xml version="1.0"?>
+<macros>
+    <xml name="requirements">
+        <requirements>
+            <requirement type="package" version="@VERSION@">augustus</requirement>
+            <yield />
+        </requirements>
+    </xml>
+
+    <token name="@VERSION@">3.2.3</token>
+
+    <xml name="citations">
+        <citations>
+            <citation type="doi">10.1093/bioinformatics/btg1080</citation>
+            <citation type="doi">10.1093/bioinformatics/btr010</citation>
+            <citation type="doi">10.1093/bioinformatics/btn013</citation>
+        </citations>
+    </xml>
+
+</macros>
b
diff -r f5075dee9d6b -r 4de31938431b readme.rst
--- a/readme.rst Fri May 22 04:55:25 2015 -0400
+++ /dev/null Thu Jan 01 00:00:00 1970 +0000
b
@@ -1,84 +0,0 @@
-Galaxy wrapper for Augustus
-===========================
-
-This wrapper is copyright 2012-2013 by Björn Grüning.
-
-This is a wrapper for the command line tool of Augustus_.
-
-.. _augustus: http://bioinf.uni-greifswald.de/augustus/
-
-AUGUSTUS is a program that predicts genes in eukaryotic genomic sequences.
-
-Oliver Keller, Martin Kollmar, Mario Stanke, Stephan Waack (2011)
-A novel hybrid gene prediction method employing protein multiple sequence alignments
-Bioinformatics, doi: 10.1093/bioinformatics/btr010
-
-Mario Stanke, Mark Diekhans, Robert Baertsch, David Haussler (2008)
-Using native and syntenically mapped cDNA alignments to improve de novo gene finding
-Bioinformatics, doi: 10.1093/bioinformatics/btn013
-
-Mario Stanke and Stephan Waack (2003)
-Gene Prediction with a Hidden-Markov Model and a new Intron Submodel. 
-Bioinformatics, Vol. 19, Suppl. 2, pages ii215-ii225
-
-
-Installation
-============
-
-The recommended installation is by means of the toolshed_.
-If you need to install it manually here is a short introduction.
-
-.. _toolshed:  http://toolshed.g2.bx.psu.edu/view/bgruening/augustus
-
-
-Install or downlaod augustus from::
-
-    http://bioinf.uni-greifswald.de/augustus/binaries/
-
-and follow the installation instructions or copy the binaries into your $PATH. To install the wrapper copy the augustus folder in the galaxy tools folder and modify the tools_conf.xml file to make the tool available to Galaxy.
-
-For example::
-
-  <section name="Gene Prediction" id="gene_prediction">
-    <tool file="gene_prediction/tools/augustus/augustus.xml" />
-  </section>
-
-
-Set the *AUGUSTUS_CONFIG_PATH* to /path_to_augustus/augustus/config with::
-
-  export AUGUSTUS_CONFIG_PATH=/path_to_augustus/augustus/config
-
-or modify the wrapper and use the following additional commandline switch::
-
-  --AUGUSTUS_CONFIG_PATH=/path_to_augustus/augustus/config
-
-
-History
-=======
-
-- v0.1: Initial public release
-- v0.2: Added tool_dependencies.xml file and update the augustus version (thanks to James Johnson)
-- v0.3: upgrade to augustus 2.7, added new organisms and new parameters, output additional sequence files
-- v0.3.1: added parallelism and changed the output parameters from boolean to a select box
-
-Licence (MIT)
-=============
-
-Permission is hereby granted, free of charge, to any person obtaining a copy
-of this software and associated documentation files (the "Software"), to deal
-in the Software without restriction, including without limitation the rights
-to use, copy, modify, merge, publish, distribute, sublicense, and/or sell
-copies of the Software, and to permit persons to whom the Software is
-furnished to do so, subject to the following conditions:
-
-The above copyright notice and this permission notice shall be included in
-all copies or substantial portions of the Software.
-
-THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
-IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
-FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL THE
-AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
-LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM,
-OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN
-THE SOFTWARE.
-
b
diff -r f5075dee9d6b -r 4de31938431b test-data/annot.gff3
--- /dev/null Thu Jan 01 00:00:00 1970 +0000
+++ b/test-data/annot.gff3 Fri Oct 20 03:48:57 2017 -0400
b
@@ -0,0 +1,41 @@
+##gff-version 3
+HS08198 maker gene 352 1848 . + . ID=maker-HS08198-exonerate_est2genome-gene-0.0;Name=maker-HS08198-exonerate_est2genome-gene-0.0
+HS08198 maker mRNA 352 1848 2869 + . ID=maker-HS08198-exonerate_est2genome-gene-0.0-mRNA-1;Parent=maker-HS08198-exonerate_est2genome-gene-0.0;Name=maker-HS08198-exonerate_est2genome-gene-0.0-mRNA-1;_AED=0.00;_eAED=0.00;_QI=70|1|1|1|0|0|7|0|192
+HS08198 maker exon 352 397 . + . ID=maker-HS08198-exonerate_est2genome-gene-0.0-mRNA-1:exon:9;Parent=maker-HS08198-exonerate_est2genome-gene-0.0-mRNA-1
+HS08198 maker exon 421 582 . + . ID=maker-HS08198-exonerate_est2genome-gene-0.0-mRNA-1:exon:10;Parent=maker-HS08198-exonerate_est2genome-gene-0.0-mRNA-1
+HS08198 maker exon 812 894 . + . ID=maker-HS08198-exonerate_est2genome-gene-0.0-mRNA-1:exon:11;Parent=maker-HS08198-exonerate_est2genome-gene-0.0-mRNA-1
+HS08198 maker exon 1053 1123 . + . ID=maker-HS08198-exonerate_est2genome-gene-0.0-mRNA-1:exon:12;Parent=maker-HS08198-exonerate_est2genome-gene-0.0-mRNA-1
+HS08198 maker exon 1208 1315 . + . ID=maker-HS08198-exonerate_est2genome-gene-0.0-mRNA-1:exon:13;Parent=maker-HS08198-exonerate_est2genome-gene-0.0-mRNA-1
+HS08198 maker exon 1587 1688 . + . ID=maker-HS08198-exonerate_est2genome-gene-0.0-mRNA-1:exon:14;Parent=maker-HS08198-exonerate_est2genome-gene-0.0-mRNA-1
+HS08198 maker exon 1772 1848 . + . ID=maker-HS08198-exonerate_est2genome-gene-0.0-mRNA-1:exon:15;Parent=maker-HS08198-exonerate_est2genome-gene-0.0-mRNA-1
+HS08198 maker five_prime_UTR 352 397 . + . ID=maker-HS08198-exonerate_est2genome-gene-0.0-mRNA-1:five_prime_utr;Parent=maker-HS08198-exonerate_est2genome-gene-0.0-mRNA-1
+HS08198 maker five_prime_UTR 421 444 . + . ID=maker-HS08198-exonerate_est2genome-gene-0.0-mRNA-1:five_prime_utr;Parent=maker-HS08198-exonerate_est2genome-gene-0.0-mRNA-1
+HS08198 maker CDS 445 582 . + 0 ID=maker-HS08198-exonerate_est2genome-gene-0.0-mRNA-1:cds;Parent=maker-HS08198-exonerate_est2genome-gene-0.0-mRNA-1
+HS08198 maker CDS 812 894 . + 0 ID=maker-HS08198-exonerate_est2genome-gene-0.0-mRNA-1:cds;Parent=maker-HS08198-exonerate_est2genome-gene-0.0-mRNA-1
+HS08198 maker CDS 1053 1123 . + 1 ID=maker-HS08198-exonerate_est2genome-gene-0.0-mRNA-1:cds;Parent=maker-HS08198-exonerate_est2genome-gene-0.0-mRNA-1
+HS08198 maker CDS 1208 1315 . + 2 ID=maker-HS08198-exonerate_est2genome-gene-0.0-mRNA-1:cds;Parent=maker-HS08198-exonerate_est2genome-gene-0.0-mRNA-1
+HS08198 maker CDS 1587 1688 . + 2 ID=maker-HS08198-exonerate_est2genome-gene-0.0-mRNA-1:cds;Parent=maker-HS08198-exonerate_est2genome-gene-0.0-mRNA-1
+HS08198 maker CDS 1772 1848 . + 2 ID=maker-HS08198-exonerate_est2genome-gene-0.0-mRNA-1:cds;Parent=maker-HS08198-exonerate_est2genome-gene-0.0-mRNA-1
+###
+HS04636 maker gene 1813 6903 . + . ID=maker-HS04636-exonerate_est2genome-gene-0.0;Name=maker-HS04636-exonerate_est2genome-gene-0.0
+HS04636 maker mRNA 1813 6903 8728 + . ID=maker-HS04636-exonerate_est2genome-gene-0.0-mRNA-1;Parent=maker-HS04636-exonerate_est2genome-gene-0.0;Name=maker-HS04636-exonerate_est2genome-gene-0.0-mRNA-1;_AED=0.00;_eAED=0.00;_QI=49|1|1|1|0|0|9|0|572
+HS04636 maker exon 1813 1934 . + . ID=maker-HS04636-exonerate_est2genome-gene-0.0-mRNA-1:exon:0;Parent=maker-HS04636-exonerate_est2genome-gene-0.0-mRNA-1
+HS04636 maker exon 2055 2198 . + . ID=maker-HS04636-exonerate_est2genome-gene-0.0-mRNA-1:exon:1;Parent=maker-HS04636-exonerate_est2genome-gene-0.0-mRNA-1
+HS04636 maker exon 2852 2995 . + . ID=maker-HS04636-exonerate_est2genome-gene-0.0-mRNA-1:exon:2;Parent=maker-HS04636-exonerate_est2genome-gene-0.0-mRNA-1
+HS04636 maker exon 3426 3607 . + . ID=maker-HS04636-exonerate_est2genome-gene-0.0-mRNA-1:exon:3;Parent=maker-HS04636-exonerate_est2genome-gene-0.0-mRNA-1
+HS04636 maker exon 4340 4423 . + . ID=maker-HS04636-exonerate_est2genome-gene-0.0-mRNA-1:exon:4;Parent=maker-HS04636-exonerate_est2genome-gene-0.0-mRNA-1
+HS04636 maker exon 4543 4789 . + . ID=maker-HS04636-exonerate_est2genome-gene-0.0-mRNA-1:exon:5;Parent=maker-HS04636-exonerate_est2genome-gene-0.0-mRNA-1
+HS04636 maker exon 5072 5358 . + . ID=maker-HS04636-exonerate_est2genome-gene-0.0-mRNA-1:exon:6;Parent=maker-HS04636-exonerate_est2genome-gene-0.0-mRNA-1
+HS04636 maker exon 5860 6007 . + . ID=maker-HS04636-exonerate_est2genome-gene-0.0-mRNA-1:exon:7;Parent=maker-HS04636-exonerate_est2genome-gene-0.0-mRNA-1
+HS04636 maker exon 6494 6903 . + . ID=maker-HS04636-exonerate_est2genome-gene-0.0-mRNA-1:exon:8;Parent=maker-HS04636-exonerate_est2genome-gene-0.0-mRNA-1
+HS04636 maker five_prime_UTR 1813 1861 . + . ID=maker-HS04636-exonerate_est2genome-gene-0.0-mRNA-1:five_prime_utr;Parent=maker-HS04636-exonerate_est2genome-gene-0.0-mRNA-1
+HS04636 maker CDS 1862 1934 . + 0 ID=maker-HS04636-exonerate_est2genome-gene-0.0-mRNA-1:cds;Parent=maker-HS04636-exonerate_est2genome-gene-0.0-mRNA-1
+HS04636 maker CDS 2055 2198 . + 2 ID=maker-HS04636-exonerate_est2genome-gene-0.0-mRNA-1:cds;Parent=maker-HS04636-exonerate_est2genome-gene-0.0-mRNA-1
+HS04636 maker CDS 2852 2995 . + 2 ID=maker-HS04636-exonerate_est2genome-gene-0.0-mRNA-1:cds;Parent=maker-HS04636-exonerate_est2genome-gene-0.0-mRNA-1
+HS04636 maker CDS 3426 3607 . + 2 ID=maker-HS04636-exonerate_est2genome-gene-0.0-mRNA-1:cds;Parent=maker-HS04636-exonerate_est2genome-gene-0.0-mRNA-1
+HS04636 maker CDS 4340 4423 . + 0 ID=maker-HS04636-exonerate_est2genome-gene-0.0-mRNA-1:cds;Parent=maker-HS04636-exonerate_est2genome-gene-0.0-mRNA-1
+HS04636 maker CDS 4543 4789 . + 0 ID=maker-HS04636-exonerate_est2genome-gene-0.0-mRNA-1:cds;Parent=maker-HS04636-exonerate_est2genome-gene-0.0-mRNA-1
+HS04636 maker CDS 5072 5358 . + 2 ID=maker-HS04636-exonerate_est2genome-gene-0.0-mRNA-1:cds;Parent=maker-HS04636-exonerate_est2genome-gene-0.0-mRNA-1
+HS04636 maker CDS 5860 6007 . + 0 ID=maker-HS04636-exonerate_est2genome-gene-0.0-mRNA-1:cds;Parent=maker-HS04636-exonerate_est2genome-gene-0.0-mRNA-1
+HS04636 maker CDS 6494 6903 . + 2 ID=maker-HS04636-exonerate_est2genome-gene-0.0-mRNA-1:cds;Parent=maker-HS04636-exonerate_est2genome-gene-0.0-mRNA-1
+###
b
diff -r f5075dee9d6b -r 4de31938431b test-data/human_augustus_protein_codingseq_introns_cds_codingseq.fasta
--- a/test-data/human_augustus_protein_codingseq_introns_cds_codingseq.fasta Fri May 22 04:55:25 2015 -0400
+++ b/test-data/human_augustus_protein_codingseq_introns_cds_codingseq.fasta Fri Oct 20 03:48:57 2017 -0400
b
@@ -1,35 +1,33 @@
 >HS04636.g1
 atgctcgcccgcgccctgctgctgtgcgcggtcctggcgctcagccatacagcaaatccttgctgttcccacccatgtca
-tgctcgcccgcgccctgctgctgtgcgcggtcctggcgctcagccatacagcaaatccttgctgttcccacccatgtcaa
-aaccgaggtgtatgtatgagtgtgggatttgaccagtataagtgcgattgtacccggacaggattctatggagaaaactg
-ctcaacaccggaatttttgacaagaataaaattatttctgaaacccactccaaacacagtgcactacatacttacccact
-tcaagggattttggaacgttgtgaataacattcccttccttcgaaatgcaattatgagttatgtcttgacatccagatca
-catttgattgacagtccaccaacttacaatgctgactatggctacaaaagctgggaagccttctctaacctctcctatta
-tactagagcccttcctcctgtgcctgatgattgcccgactcccttgggtgtcaaaggtaaaaagcagcttcctgattcaa
-atgagattgtggaaaaattgcttctaagaagaaagttcatccctgatccccagggctcaaacatgatgtttgcattcttt
-gcccagcacttcacgcatcagtttttcaagacagatcataagcgagggccagctttcaccaacgggctgggccatggggt
-ggacttaaatcatatttacggtgaaactctggctagacagcgtaaactgcgccttttcaaggatggaaaaatgaaatatc
-agataattgatggagagatgtatcctcccacagtcaaagatactcaggcagagatgatctaccctcctcaagtccctgag
-catctacggtttgctgtggggcaggaggtctttggtctggtgcctggtctgatgatgtatgccacaatctggctgcggga
-acacaacagagtatgcgatgtgcttaaacaggagcatcctgaatggggtgatgagcagttgttccagacaagcaggctaa
-tactgataggagagactattaagattgtgattgaagattatgtgcaacacttgagtggctatcacttcaaactgaaattt
-gacccagaactacttttcaacaaacaattccagtaccaaaatcgtattgctgctgaatttaacaccctctatcactggca
-tccccttctgcctgacacctttcaaattcatgaccagaaatacaactatcaacagtttatctacaacaactctatattgc
-tggaacatggaattacccagtttgttgaatcattcaccaggcaaattgctggcagggttgctggtggtaggaatgttcca
-cccgcagtacagaaagtatcacaggcttccattgaccagagcaggcagatgaaataccagtcttttaatgagtaccgcaa
-acgctttatgctgaagccctatgaatcatttgaagaacttacaggagaaaaggaaatgtctgcagagttggaagcactct
-atggtgacatcgatgctgtggagctgtatcctgcccttctggtagaaaagcctcggccagatgccatctttggtgaaacc
-atggtagaagttggagcaccattctccttgaaaggacttatgggtaatgttatatgttctcctgcctactggaagccaag
-cacttttggtggagaagtgggttttcaaatcatcaacactgcctcaattcagtctctcatctgcaataacgtgaagggct
-gtccctttacttcattcagtgttccagatccagagctcattaaaacagtcaccatcaatgcaagttcttcccgctccgga
-ctagatgatatcaatcccacagtactactaaaagaacgttcgactgaactgtag
+aaaccgaggtgtatgtatgagtgtgggatttgaccagtataagtgcgattgtacccggacaggattctatggagaaaact
+gctcaacaccggaatttttgacaagaataaaattatttctgaaacccactccaaacacagtgcactacatacttacccac
+ttcaagggattttggaacgttgtgaataacattcccttccttcgaaatgcaattatgagttatgtcttgacatccagatc
+acatttgattgacagtccaccaacttacaatgctgactatggctacaaaagctgggaagccttctctaacctctcctatt
+atactagagcccttcctcctgtgcctgatgattgcccgactcccttgggtgtcaaaggtaaaaagcagcttcctgattca
+aatgagattgtggaaaaattgcttctaagaagaaagttcatccctgatccccagggctcaaacatgatgtttgcattctt
+tgcccagcacttcacgcatcagtttttcaagacagatcataagcgagggccagctttcaccaacgggctgggccatgggg
+tggacttaaatcatatttacggtgaaactctggctagacagcgtaaactgcgccttttcaaggatggaaaaatgaaatat
+cagataattgatggagagatgtatcctcccacagtcaaagatactcaggcagagatgatctaccctcctcaagtccctga
+gcatctacggtttgctgtggggcaggaggtctttggtctggtgcctggtctgatgatgtatgccacaatctggctgcggg
+aacacaacagagtatgcgatgtgcttaaacaggagcatcctgaatggggtgatgagcagttgttccagacaagcaggcta
+atactgataggagagactattaagattgtgattgaagattatgtgcaacacttgagtggctatcacttcaaactgaaatt
+tgacccagaactacttttcaacaaacaattccagtaccaaaatcgtattgctgctgaatttaacaccctctatcactggc
+atccccttctgcctgacacctttcaaattcatgaccagaaatacaactatcaacagtttatctacaacaactctatattg
+ctggaacatggaattacccagtttgttgaatcattcaccaggcaaattgctggcagggttgctggtggtaggaatgttcc
+acccgcagtacagaaagtatcacaggcttccattgaccagagcaggcagatgaaataccagtcttttaatgagtaccgca
+aacgctttatgctgaagccctatgaatcatttgaagaacttacaggagaaaaggaaatgtctgcagagttggaagcactc
+tatggtgacatcgatgctgtggagctgtatcctgcccttctggtagaaaagcctcggccagatgccatctttggtgaaac
+catggtagaagttggagcaccattctccttgaaaggacttatgggtaatgttatatgttctcctgcctactggaagccaa
+gcacttttggtggagaagtgggttttcaaatcatcaacactgcctcaattcagtctctcatctgcaataacgtgaagggc
+tgtccctttacttcattcagtgttccagatccagagctcattaaaacagtcaccatcaatgcaagttcttcccgctccgg
+actagatgatatcaatcccacagtactactaaaagaacgttcgactgaactgtag
 >HS08198.g2
-atgctgccccctgggactgcgaccctcttgactctgctcctggcagctggctcgctgggccagaagcctcagaggccaca
-tgctgccccctgggactgcgaccctcttgactctgctcctggcagctggctcgctgggccagaagcctcagaggccacgc
-cggcccgcatcccccatcagcaccatccagcccaaggccaattttgatgcgcagcaggagcagggccaccgggccgaggc
-caccacactgcatgtggctccccagggcacagccatggctgtcagtaccttccgaaagctggatgggatctgctggcagg
-tgcgccagctctatggagacacaggggtcctcggccgcttcctgcttcaagcccgaggcgcccgaggggctgtgcacgtg
-gttgtcgctgagaccgactaccagagtttcgctgtcctgtacctggagcgggcggggcagctgtcagtgaagctctacgc
-ccgctcgctccctgtgagcgactcggtcctgagtgggtttgagcagcgggtccaggaggcccacctgactgaggaccaga
-tcttctacttccccaagtacggcttctgcgaggctgcagaccagttccacgtcctggacggtgagtgcacagcgggggca
-agcatggcggcgtggtga
+atgctgccccctgggactgcgaccctcttgactctgctcctggcagctggctcgctgggccagaagcctcagaggccacg
+ccggcccgcatcccccatcagcaccatccagcccaaggccaattttgatgcgcagcaggagcagggccaccgggccgagg
+ccaccacactgcatgtggctccccagggcacagccatggctgtcagtaccttccgaaagctggatgggatctgctggcag
+gtgcgccagctctatggagacacaggggtcctcggccgcttcctgcttcaagcccgaggcgcccgaggggctgtgcacgt
+ggttgtcgctgagaccgactaccagagtttcgctgtcctgtacctggagcgggcggggcagctgtcagtgaagctctacg
+cccgctcgctccctgtgagcgactcggtcctgagtgggtttgagcagcgggtccaggaggcccacctgactgaggaccag
+atcttctacttccccaagtacggcttctgcgaggctgcagaccagttccacgtcctggacggtgagtgcacagcgggggc
+aagcatggcggcgtggtga
b
diff -r f5075dee9d6b -r 4de31938431b test-data/human_augustus_protein_codingseq_introns_cds_main.gtf
--- a/test-data/human_augustus_protein_codingseq_introns_cds_main.gtf Fri May 22 04:55:25 2015 -0400
+++ b/test-data/human_augustus_protein_codingseq_introns_cds_main.gtf Fri Oct 20 03:48:57 2017 -0400
b
@@ -1,6 +1,6 @@
-# This output was generated with AUGUSTUS (version 3.1.0).
-# AUGUSTUS is a gene prediction tool written by Mario Stanke (mario.stanke@uni-greifswald.de),
-# Oliver Keller, Stefanie König and Lizzy Gerischer.
+# This output was generated with AUGUSTUS (version 3.2.3).
+# AUGUSTUS is a gene prediction tool written by M. Stanke (mario.stanke@uni-greifswald.de),
+# O. Keller, S. König, L. Gerischer and L. Romoth.
 # Please cite: Mario Stanke, Mark Diekhans, Robert Baertsch, David Haussler (2008),
 # Using native and syntenically mapped cDNA alignments to improve de novo gene finding
 # Bioinformatics 24: 637-644, doi 10.1093/bioinformatics/btn013
b
diff -r f5075dee9d6b -r 4de31938431b test-data/human_augustus_protein_codingseq_introns_cds_protein.fasta
--- a/test-data/human_augustus_protein_codingseq_introns_cds_protein.fasta Fri May 22 04:55:25 2015 -0400
+++ b/test-data/human_augustus_protein_codingseq_introns_cds_protein.fasta Fri Oct 20 03:48:57 2017 -0400
b
@@ -1,15 +1,13 @@
 >HS04636.g1
-MLARALLLCAVLALSHTANPCCSHPCQNRGVCMSVGFDQYKCDCTRTGFYGENCSTPEFLTRIKLFLKPTPNTVHYILML
-ARALLLCAVLALSHTANPCCSHPCQNRGVCMSVGFDQYKCDCTRTGFYGENCSTPEFLTRIKLFLKPTPNTVHYILTHFK
-GFWNVVNNIPFLRNAIMSYVLTSRSHLIDSPPTYNADYGYKSWEAFSNLSYYTRALPPVPDDCPTPLGVKGKKQLPDSNE
-IVEKLLLRRKFIPDPQGSNMMFAFFAQHFTHQFFKTDHKRGPAFTNGLGHGVDLNHIYGETLARQRKLRLFKDGKMKYQI
-IDGEMYPPTVKDTQAEMIYPPQVPEHLRFAVGQEVFGLVPGLMMYATIWLREHNRVCDVLKQEHPEWGDEQLFQTSRLIL
-IGETIKIVIEDYVQHLSGYHFKLKFDPELLFNKQFQYQNRIAAEFNTLYHWHPLLPDTFQIHDQKYNYQQFIYNNSILLE
-HGITQFVESFTRQIAGRVAGGRNVPPAVQKVSQASIDQSRQMKYQSFNEYRKRFMLKPYESFEELTGEKEMSAELEALYG
-DIDAVELYPALLVEKPRPDAIFGETMVEVGAPFSLKGLMGNVICSPAYWKPSTFGGEVGFQIINTASIQSLICNNVKGCP
-FTSFSVPDPELIKTVTINASSSRSGLDDINPTVLLKERSTEL
+MLARALLLCAVLALSHTANPCCSHPCQNRGVCMSVGFDQYKCDCTRTGFYGENCSTPEFLTRIKLFLKPTPNTVHYILTH
+FKGFWNVVNNIPFLRNAIMSYVLTSRSHLIDSPPTYNADYGYKSWEAFSNLSYYTRALPPVPDDCPTPLGVKGKKQLPDS
+NEIVEKLLLRRKFIPDPQGSNMMFAFFAQHFTHQFFKTDHKRGPAFTNGLGHGVDLNHIYGETLARQRKLRLFKDGKMKY
+QIIDGEMYPPTVKDTQAEMIYPPQVPEHLRFAVGQEVFGLVPGLMMYATIWLREHNRVCDVLKQEHPEWGDEQLFQTSRL
+ILIGETIKIVIEDYVQHLSGYHFKLKFDPELLFNKQFQYQNRIAAEFNTLYHWHPLLPDTFQIHDQKYNYQQFIYNNSIL
+LEHGITQFVESFTRQIAGRVAGGRNVPPAVQKVSQASIDQSRQMKYQSFNEYRKRFMLKPYESFEELTGEKEMSAELEAL
+YGDIDAVELYPALLVEKPRPDAIFGETMVEVGAPFSLKGLMGNVICSPAYWKPSTFGGEVGFQIINTASIQSLICNNVKG
+CPFTSFSVPDPELIKTVTINASSSRSGLDDINPTVLLKERSTEL
 >HS08198.g2
-MLPPGTATLLTLLLAAGSLGQKPQRPRRPASPISTIQPKANFDAQQEQGHRAEATTLHVAPQGTAMAVSTFRKLDGICML
-PPGTATLLTLLLAAGSLGQKPQRPRRPASPISTIQPKANFDAQQEQGHRAEATTLHVAPQGTAMAVSTFRKLDGICWQVR
-QLYGDTGVLGRFLLQARGARGAVHVVVAETDYQSFAVLYLERAGQLSVKLYARSLPVSDSVLSGFEQRVQEAHLTEDQIF
-YFPKYGFCEAADQFHVLDGECTAGASMAAW
+MLPPGTATLLTLLLAAGSLGQKPQRPRRPASPISTIQPKANFDAQQEQGHRAEATTLHVAPQGTAMAVSTFRKLDGICWQ
+VRQLYGDTGVLGRFLLQARGARGAVHVVVAETDYQSFAVLYLERAGQLSVKLYARSLPVSDSVLSGFEQRVQEAHLTEDQ
+IFYFPKYGFCEAADQFHVLDGECTAGASMAAW
b
diff -r f5075dee9d6b -r 4de31938431b test-data/human_augustus_utr-on.gff
--- a/test-data/human_augustus_utr-on.gff Fri May 22 04:55:25 2015 -0400
+++ b/test-data/human_augustus_utr-on.gff Fri Oct 20 03:48:57 2017 -0400
b
@@ -1,7 +1,7 @@
 ##gff-version 3
-# This output was generated with AUGUSTUS (version 3.1.0).
-# AUGUSTUS is a gene prediction tool written by Mario Stanke (mario.stanke@uni-greifswald.de),
-# Oliver Keller, Stefanie König and Lizzy Gerischer.
+# This output was generated with AUGUSTUS (version 3.2.3).
+# AUGUSTUS is a gene prediction tool written by M. Stanke (mario.stanke@uni-greifswald.de),
+# O. Keller, S. König, L. Gerischer and L. Romoth.
 # Please cite: Mario Stanke, Mark Diekhans, Robert Baertsch, David Haussler (2008),
 # Using native and syntenically mapped cDNA alignments to improve de novo gene finding
 # Bioinformatics 24: 637-644, doi 10.1093/bioinformatics/btn013
b
diff -r f5075dee9d6b -r 4de31938431b test-data/human_augustus_utr-on.gtf
--- a/test-data/human_augustus_utr-on.gtf Fri May 22 04:55:25 2015 -0400
+++ b/test-data/human_augustus_utr-on.gtf Fri Oct 20 03:48:57 2017 -0400
b
@@ -1,6 +1,6 @@
-# This output was generated with AUGUSTUS (version 3.1.0).
-# AUGUSTUS is a gene prediction tool written by Mario Stanke (mario.stanke@uni-greifswald.de),
-# Oliver Keller, Stefanie König and Lizzy Gerischer.
+# This output was generated with AUGUSTUS (version 3.2.3).
+# AUGUSTUS is a gene prediction tool written by M. Stanke (mario.stanke@uni-greifswald.de),
+# O. Keller, S. König, L. Gerischer and L. Romoth.
 # Please cite: Mario Stanke, Mark Diekhans, Robert Baertsch, David Haussler (2008),
 # Using native and syntenically mapped cDNA alignments to improve de novo gene finding
 # Bioinformatics 24: 637-644, doi 10.1093/bioinformatics/btn013
b
diff -r f5075dee9d6b -r 4de31938431b tool_dependencies.xml
--- a/tool_dependencies.xml Fri May 22 04:55:25 2015 -0400
+++ /dev/null Thu Jan 01 00:00:00 1970 +0000
b
@@ -1,6 +0,0 @@
-<?xml version="1.0"?>
-<tool_dependency>
-    <package name="augustus" version="3.1">
-        <repository changeset_revision="cc0bd4986b48" name="package_augustus_3_1" owner="iuc" toolshed="https://toolshed.g2.bx.psu.edu" />
-    </package>
-</tool_dependency>