Next changeset 1:37b5e1f0b544 (2020-07-16) |
Commit message:
planemo upload for repository https://github.com/ogotoh/spaln commit af52c6b4c904f6291953881111d415d5b86ee4d6 |
added:
spaln.xml test-data/genome.fasta test-data/output1.bed12 test-data/output1.tabular test-data/output1_gff_genes.gff3 test-data/output1_gff_matches.gff3 test-data/query.fasta |
b |
diff -r 000000000000 -r 95ea8d97abb4 spaln.xml --- /dev/null Thu Jan 01 00:00:00 1970 +0000 +++ b/spaln.xml Fri Jan 11 18:15:21 2019 -0500 |
[ |
@@ -0,0 +1,84 @@ +<tool id="spaln" name="Spaln: align cDNA or Protein to genome" version="@TOOL_VERSION@+galaxy0"> + <description>Maps and aligns a set of cDNA or protein sequences onto a whole genomic sequence.</description> + <macros> + <token name="@TOOL_VERSION@">2.3.2</token> + </macros> + <edam_topics> + <edam_topic>topic_3512</edam_topic> + </edam_topics> + <requirements> + <requirement type="package" version="@TOOL_VERSION@">spaln</requirement> + </requirements> + <command detect_errors="aggressive"><![CDATA[ + spaln -t\${GALAXY_SLOTS:-1} -O$format -o '$output1' '$genome' '$query' + ]]></command> + <inputs> + <param type="data" name="genome" format="fasta" label="Genome sequence to search (FASTA format)" /> + <param type="data" name="query" format="fasta" label="Query sequence(s) (protein or cDNA)" /> + <param argument="-O" type="select" name="format" label="Output format"> + <option value="0">GFF3 format genes</option> + <option value="2">GFF3 format matches</option> + <option value="3">BED format</option> + <option value="4">Tabular format exon information</option> + </param> + </inputs> + <outputs> + <data name="output1" format="tabular"> + <change_format> + <!-- these values correspond with the format options of the spaln command, not all of which are currently supported --> + <when input="format" value="0" format="gff3" /> + <when input="format" value="2" format="gff3" /> + <when input="format" value="3" format="bed12" /> + <when input="format" value="4" format="tabular" /> + </change_format> + <!-- <actions> .. <conditional> .. <when> .. 
<action> currently does not work in Galaxy, + something that https://github.com/galaxyproject/galaxy/pull/7197 is addressing, so this is + commented out till that is merged + <actions> + <conditional name="format"> + <when value="4"> + <action type="metadata" name="column_names" default="rID,gID,%id,ExonL,MisMch,Unpair,ref_l,ref_r,tgt_l,tgt_r,eScore,IntrnL,iScore,Sig3/I,Sig5/T # - X P DiNuc" /> + </when> + </conditional> + </actions> + --> + </data> + </outputs> + <tests> + <test> + <param name="genome" ftype="fasta" value="genome.fasta" /> + <param name="query" ftype="fasta" value="query.fasta" /> + <param name="format" value="0"/> + <output name="output1" value="output1_gff_genes.gff3" /> + </test> + <test> + <param name="genome" ftype="fasta" value="genome.fasta" /> + <param name="query" ftype="fasta" value="query.fasta" /> + <param name="format" value="2"/> + <output name="output1" value="output1_gff_matches.gff3" /> + </test> + <test> + <param name="genome" ftype="fasta" value="genome.fasta" /> + <param name="query" ftype="fasta" value="query.fasta" /> + <param name="format" value="3"/> + <output name="output1" value="output1.bed12" /> + </test> + <test> + <param name="genome" ftype="fasta" value="genome.fasta" /> + <param name="query" ftype="fasta" value="query.fasta" /> + <param name="format" value="4"/> + <output name="output1" value="output1.tabular" /> + </test> + </tests> + <help><![CDATA[ + Spaln_ (space-efficient spliced alignment) is a stand-alone program that maps and aligns a set of cDNA or + protein sequences onto a whole genomic sequence in a single job. + + This Galaxy wrapper currently only supports the default (i.e. *-O3*) algorithm for Spaln with default parameters. + + .. _Spaln: http://www.genome.ist.i.kyoto-u.ac.jp/~aln_user/spaln/ + ]]></help> + <citations> + <citation type="doi">10.1093/nar/gkn105</citation> + </citations> +</tool> |
b |
diff -r 000000000000 -r 95ea8d97abb4 test-data/genome.fasta --- /dev/null Thu Jan 01 00:00:00 1970 +0000 +++ b/test-data/genome.fasta Fri Jan 11 18:15:21 2019 -0500 |
b |
b'@@ -0,0 +1,1000 @@\n+>scaffold_1\n+TGCTTTTCTGAGATTTATGTCAGCTCCCCATTGGGAGATACAGGAGAATCCAATATATTC\n+CTGTCTCGCTTCTTTTATATTTATCCTTTCTACACCTGACATCCTCAGTGATTGAAGTGA\n+CAAAAAGTGGAGCGCACGCAGTGGTCATTACCCTCCAATGGTACTTCTAATTAAGGAAAG\n+ATTTTTTGCATTCACTGAGCAAAACACTTATTTGCATGAATGGAAAATCATAAATGAGGG\n+GTCCATTAAACAAATTTCCTAATTGTTTGCTTTTTTTTCTTCCTACTTCACCATCCCTCT\n+AAAGCTATTACTCTCTATTCTACCCCATTATCGAGTGCACAAACACCAGCCCCAAATTGT\n+CTTATCTCTGCTTTGATAAATGATATTTTTTTCTCTTATAATTGTGTTTCTCTCTAGATG\n+TGCGGTGTCCATCAAGACACTGGATGTCACGTGGTCACTCCTGTGAAGAGCGAACTGTGT\n+GGAACCCGAAGTACTGTGTGGTTGCTGACTGTCAGATGCTGCTTCTGAATGAGGAGGAGG\n+TGGTGAGAGCAGACAGCACAATCTCTTGTCTGGCATGTTCCTCTGTGTCACCATTGTCTC\n+TCTCATCTGCTCGTGTGTGTGTGTGTGTGTGTCCTTGTCAATGTCATTACACAATTTATG\n+TTGGTGCACTGCATGTCAGAGTCTGAACTTTGTTGGACATCTACTTTCTGTCACCTGATA\n+CCTCATACTTTACACTCTAATCCCTTTTTCCTTTCTAACTGCTGCTGTGTTAAGCTGTCA\n+TATTAATATACTAAATAATGATAATATTAATTCTAATAATGATAGTGAATGGAGATTCAC\n+AATGAAGAAACACAAGGTCCAGACTGAACCCCTGTGCTGTGTGAAGAGTTCACTCTACAT\n+TTACATTCATCCCACATCAGAGACCAGCAATAGCCAGGTTAAGCAGAGCAAGGCTGAGTC\n+TGGCTCTTTGCCTCTGTTGTTTTGATTAGTGTCACACTGGATTATGCTAGTTTGTGTGAG\n+ATTAGAGGTCCTGTTGTTACGAGCAAATCAGCAGTCAGCAGGGTAATCTAAATTACATTG\n+TTCTGTCGGCAATATCCTCTCCTCGCTCAACAGCTTTGTGTGAGCTCATATTTAAAGCCC\n+CCACAGTAGTGCAGTGCATAAAATCATGCAGATACAGATCAGAAGCTTCAGGTAATGTTT\n+ACATCAAACATCAGGGGGAAAATGTGATCTCAGTGCCTCTGACCGTGGTGTGATTGTTGG\n+TGCCGGACAGGCTGGTTTGAGTATTTCTAAAACTGCTGATCTCCTGGGATTTTCACACAC\n+GGCATTCTCTAGAGTTTACTCAGAACGGTGTGGAAAGCAAAAAAACATCCCGCGAGCTGC\n+AATCCTGCGGATGGAAACACCTTGTTGATGGGATATGTCAGAGGAATGGCCAGGCTGGAT\n+CAATCTGACAGAAAGGCGGTAACTCAGATAAGCACTCTCTACAACTGTGGTGAGCAGAAA\n+AGCGTTCTCAGAATGCACAACACGTTCAACCTTGAGGAAGATGTTGCTACAGCAGCAGAT\n+GAAGACCACGTCTGGTTCCACTCCTGTCAGCCAAGAACATCTCAGACTGCACAGGACACC\n+AAAACAAAAACACATCCTGTTTTCTACTGGTGGTAGAGTCACAATTTGGCAATAAGATAA\n+ATCCATGGACCCAACTTGCCTTGTGTCAATAGACCAAGCTGCTGGTGGTCTTGGGGAATG\n+TTTTCTTTACACTTTCACACTATCGGCCTATATAAAATCCTATTATAAACTGCTGTACAG\n+TGCATTGGGTTTGATAAGCCCTCTAAGTCTGTATATCATGATCTCATTGATACCTGCGGC\n+AATACACCCC
CACAAACGCAGCTCCCTGCATTTTAAGTATTATAGAGAGTAATTTCACTG\n+TCCATGTCTTTTTTGATCATAAAGCAGGTCTAGGTGCTGTATACAACACTGTATTGAAAT\n+GCTGAAGCAGGTCTAGGTGCTGTATACAACACTGTATTGAAATGCTGAAGCCAATATATC\n+AATCTATCTGTCTATATTTTATGAAATATCAGAGCATTTTAGTCCAAATTTGTCTGTTTT\n+GTTCATTGCAATGCTGACTGCTTAACATTTTCCTCAGTGGTGGCCATCACCACAGCATTT\n+ACTGGTGAGTTTTACCAAGCTACAGTGGGCCACAATGAGTTACCTGTTATTGGCCTGGCT\n+CTATGGCATGCAGAAAACAGTCAGCCAATCAGAGGACAGACTCAGAGACAGACACAAAGT\n+GCCCTGTTCTTGTTAGAGCAGAGATAAATGAGACAGAGGAGATGTAAAACTATACTGAGA\n+TGGTTTTTTGGTTCTTAAAACCACAAATATATTGTATTACGGATATCAAAACTTCAAATA\n+AAACCAGTAAAGTGTAAAACATGGGACCTCTAAATGAAGGGCTGTTTTGTTTCGTAGTTC\n+TAGATTATGTCACTATGTGGCCTCGGTCTCTGTCTGCGTAAAGCGGCTACATGTAGAATT\n+TGACCCACTTTGGTGCCCACATATGGTAACTAAAACACTACAGACAGTATGCACTCCAAC\n+CCTATATAATTTATGTCCTTCAGTGAAGCCTACAAAATGTGCAGCATGATTTGCTATGAT\n+TAATACCTAGAATTATATTAAATTTTAGAAGTTTAGAGAGATGGCTTATACCTTTTTCTG\n+AGCATGGAGTCATCTCATGTAATTTGTCACATACCTTTGGCCAGCTTAAACCTGGTCATT\n+CCAGTGAGAGCTGCTCACCCAAATGTTTCTGTATGCACCTCCTGCTGTGGGTGCCAATAG\n+CTCATGCAAGTTGGTGTCTTTCAACTAAGGCCACTATGTGAGGACCATCAGCAGCAAATT\n+AAATTAGAAGTGCCTTGGAGTTTCTCAGGCCCTCTTCTATGATCATTAAGGTCTCAGTGA\n+CAGAACAGTGCCCCTTTGAGGGACTATGGCATCTTGAGCACTTAAGTTGGCCGAATGTTT\n+GATCTCAAATATGAGTGCACTGTTTCAAAGTCACAAAAGCCTCTGGACAAGGCATAGTTA\n+CTGGGCTTGGTTAACCTTTTTTTCATACCGGCGTGACTGCTGGAACTTGGAACATGTAGC\n+CTAAGTTTCCCTTTGTCTGCAATTACTGAGGTATGCCATGTTGAAATAGAACAATAATTG\n+CAGGGAGGAATTATTCCAATCGACCCATCGGCAGGCTTTCCAATACAGTGCTTTTTGTTT\n+CACAGCAACAAAGAACAAGAGCTTTTAAATGCATCCATCTGGACCCTGACTATGAAAGGT\n+CATTGGTAACGCTGCTGGATTTCTGTTATGTCAGCAAACTGCAGGTCAAAGCGATGATAC\n+AGTCTTATAATGGCTTTCTCCAAGTGAAGGTGGGATAACATGGTTTAAACAAGCTCAGTT\n+AAATGGATCAGAGCATCAACTGCTGTGAACAAGCAATCACACGGTCAAGGTCAAACATTT\n+ACACTTCTGAGAGATCTGGAGAGTATGTCATGGCAGTATTGCTTTTCAGTTATTTCAGTA\n+ACTGATTACGCCTTGTACTTAGTCTCAGAATTAGTGATTTGATTCAAAGTGTTTTATATA\n+TGTATATTTCAAAGCAAAAATACAGCTTAGGTAAAGCTCCTTAGACTCATGCAGCCTAAT\n+TTACTGTAGACATTCCTCCATGTACAGTACTGTGCAAATGTTTTAGGCAGTTTTAGGCAC\n+TAAAGGTGAACTGAGGATGCAGTCCCACGATTAATTTTTATTCATCAGTTAACCTCA
TGT\n+GAAGTGTAGTAAACAGAAAAAACCTAAATCAGATCAGTATTTCTTATGACCCCCCTCCCC'..b'AACATACATTATATACTACAGTGTAGTGTG\n+TGTGAGTGTGAGAAGGATTTACTTTATAATGCAGTTTCATCTTGATGAGTCACACTGCCA\n+CACATGATTAACACTAATTTCATTAGTTTCCAATGTTGCACACAGTCAGAGATCTCATTT\n+AAATAATCTAACATTGCCTCAGTGATGCAATGACCGCATATGTTTTACAAAGGCTGATGA\n+TTATATCACCGTATCTGACCTAGTTAGACACATTTTTTACATTTTTATTCATGTTGTTAG\n+AATGCCTTGTACTCAAAGCTATAATACATGTACAGATCATAGCAGCCTACACAACTTTCC\n+ATTTATCACACAGGGTTACATAAGTCCACCAGCTGCCTCCAATATAACATACTGATAATT\n+TGCTCTGTACCTATGAGTTAGCAGTTAGCAGTGATGGCTATCTGAAATCTGTGGGGACTT\n+GCACGCTCAACAACACTTGCATTCCACTTGGACATGTCCAGATTTGCTGCTTCCACACAT\n+ATGCTCTGGAGCTCTTTCACATCTCTTTCATGCTGACCTGATACTGTGCTGTACTGTGTC\n+TCCAGGTTAAAAAAAGAAATTATATAGAAACACACAGGTTAAAAAGATAACAGATACAGA\n+CAAGTTCAGACAAGTTCAGTTAACACGGAAAGGAATGTGAAAAATAAGGAACTGAAAGCT\n+ACAGGCTTTTTACATATTTATGGAGGAATAGGTAATAGTACGCAATCCTGTGTTAACGTC\n+TTTGAATCAAATCAAATATAAAGTCAAGAAATAAATTGAAGATATGACCAACAAACACTT\n+TTTTTTTCAATTTCATGAAACTTTTGCCTTTGATCAATACGAACAGATGTTGAAAGCTTT\n+GAACATCTTAAGCTAAGGTTTGGGTTTATTACGTTTGAATAAAAAAGTTGAACCTTTATC\n+AGAACTGTCACTTACAAAGCATAAATTTCTTGAGTTTGAAATTGAGCCAGGTCAGACTAG\n+TTTGAGTGCAGGCCTGTTTGGCACCTCAGACTCCACACCCTTATTTCCAACACAGTTTGT\n+GCCAAAGCTCTACCTTTGGTTCAGTGGTGTAGCTCAGTTTGAAGCTCTGTCTGTGTTGTT\n+TCTGCTTGGAGTTTGTATATTCTCCTGTGGGTTTGAGTGAGTTTCTTCAGACAGTGTGGA\n+GGCAGGCAGGTCAAGTGAATTGGGAATTTTAAGAGGGATACACACAGTCTCTATTGCAAT\n+ACACAATAATGTCAACTAGGAATAATTTGAAATTTTGGGAATTACACCTTATTGTTTTCA\n+TGTGGAGAGTTAAATGAGAAGGTTGATATAATTTGTATGTTGGATAGCTTTGTTTATTAT\n+CCTTTTTTCCTTTAAATAAAAAGCTAGAGCCAGTGTCCAATTAGCTTGTCTTAGCATTAA\n+GACTGAAAACAGGTGGAACAAACTAGCCTGGTTTTGTCCAAAGCTTAAAAATACACCTTT\n+GGGATTAAACAAATGACAAACAACATGCTAATTAATGAGCTTAGAGATGCTGATAGGATT\n+CTATTTTATTTACTTTTCTACTTTATAGTGAGCCAAGCTAGCTGTTTCCTTTTGCTTCCA\n+GTCTTTAGTCTGAGCCAGTTGTCTCCTGGCACCATAGTTAACAGATAGAAATAGAACCAA\n+TTTCGATCTTCTCATCTAACTGTTGGCAAGAAAGCAAATAATTGCATTTCCCAAAACGTT\n+GAGCTACTCTTTAAACATGTACTTTTCAAAAGACCAATTCCACTATGTAAAGATCTCTCT\n+GTTTGCAGAGTCTCCTCCAGAGAGGACAGGACGCCGACGCAGTATGCCAGGCAGCTCCTC\n+TGACAA
GACCACACCCGCCATGGAGGCCACGTCCACTGCTGCCACACCTTTTAGAGTCAC\n+CGTGAGTACTGTGAGTGTGTTCTTCTGTACTGCCTCTGTCTTCTCTATTTGTTTTACCCT\n+CTGGCTTTCTCTTTGTATCCACCTTAGTTTGCCTGAGCAGGCTGTTAGTTATATATCAGT\n+GTCGACAGAATCCTGGTCTGGTGTCCAGATGGACCCATGCCAATCTGAAACTCGTTTACT\n+TCAAATATTGGAATGGGACCTTTGATGTTTGGCGTCTGCACATCATGCATCTTGGGCTTA\n+TGTTCAGCACAGTATCCTCCATTGACTTTTCACATCCGGTGTGATTTCACATTGCATTTC\n+ACGCTGAATTATGTTCACGTGCTTCAAGCAAGCTAACACACACACACACACACTTCCACA\n+CCTGTGCACACACACAACGTCGTCACTCACTAACTTCTAAGCACACTGTCTCTCCTCGTC\n+TCTGTCAAACATGCACGCACATGCAGCAGGCCTTTGTCTGTCATCTTGCTCTAATTCAAA\n+ACCAGTATGCTTTCTGCCATGTTTAATTCAACAGATAAACAGCCAGTTAATGAAGCAAAA\n+AATTCTGTTATGAGTCATCAATTTAAAGCTAATTAGCAGTGCATATTCCCATTAATAAAT\n+AATGAGTGGGGAGATGACGACCCAGAGGTGAACTGTAAACAGTAGATGTTAAGCCAGCAG\n+GGCCAGGGACATGCAGCACTCAGTCTCTCATAAACAATCCTCCAACTTCATGTAAACTTT\n+CTGCTTTTTGAAATTACACTAATGGGCCAAGTTAAGTGCTAAAACACATTATATTACTAT\n+AATACTAAACTATACTCTGAAAATAGAAAAGATATTCTTATTTCTTTCAGTTCCTCCTTT\n+TTGATTCCTTTTTTTAATCACTTCAGCACTCGGTTTCGCTAAAAGATCGTGTTCAGTCTC\n+AAAAACCCCAAAAAACCCAAAGTGGGATGCCTCCAAGGCTTAGTAAAAGCTCACAGTAAG\n+TAAAAAAAACAAAAGTAGGCTAGACCCACTGTTATTGGACCACCAGCTGAGTGAGAATAG\n+AGTCTTTCACTGAACTGAAACAGTTGTAACTTTATTTTTGGAGTAACACATATAAATTAC\n+CACAGCTTGATGATGCCAAACTCTCATCTGTTCATATAAAAAAGTGTAAATGATGTTTCC\n+GGGGGAATGGTTACCCGCTGTGTGTGTGTGACTGCATGCATTTTTGTGTCTCTCTCTGAC\n+TGATTTATTCCAATTTAAATTTGTTTTTCATAGGGATGTGAATTTAGTCACCGAGCAGTG\n+TTTTTTTTTACATGACTAGGAATGAATGAGTAGATATATAGAGAGAGATGTAAAAAAGAA\n+AAGAAGAACGGAAAGCTAGTAGGAGGCACATAGGGTCAGATGGAAGGGCTAAATATTGAT\n+TAAGTGTCTCTTAAGCAGCTCCTCGTACTCTCCGGGGAAGAGAGAGCGAAGAGGAACACT\n+GCAGCAAAGTCATCCTGTCTCAATCACATGACCACTTCACTTACTTCTGTGGGCTTATTG\n+CTAAGCAGCACTTCTTGCACAAAGATTCCTCAGACAGTGTTTGACCCTCTCCTGCACTTT\n+TCCTCATACTGCCCCCTTCTGGCCTCTGATTGTAGCACAGCTAACTTTTTGATCTGTTGG\n+GTTCCGTTGAATACAAACAAATAAACTAATAAGATTTGACTTAAATAGAGTTGATTTTCA\n+GCTTAAATTGTTTAATTTTAAGGACAACAAGTAAAAAATGTGTAAGGACACCAGTATGAT\n+TTTGCAGATCTATCAAATTCTGAGTATAGATAGTACTGTAGAAAGACACAATACAGTATA\n+TGGATGGATGGACAGAGGAAAAGGATGCAGGCATGGTGGCACACACAAATGTT
GGAATGA\n+AAACAGGAAGACAAGTAGGCAGGCACTCGTTTTCTCCTCCTTCTCTCCTGCATCTCCCAC\n+TTTTAGCAATGACAAACCACCCCTCACTTTTCTCCCTCCAGTGAAAAGAGTTGTGGTGAC\n' |
b |
diff -r 000000000000 -r 95ea8d97abb4 test-data/output1.bed12 --- /dev/null Thu Jan 01 00:00:00 1970 +0000 +++ b/test-data/output1.bed12 Fri Jan 11 18:15:21 2019 -0500 |
b |
@@ -0,0 +1,2 @@ +track name=Spaln description="NP_001121846.1" useScore=1 +scaffold_1 233 29800 NP_001121846.1 1000 + 233 29800 255,0,0 43 31,30,125,9,9,106,4,9,5,37,8,18,12,18,9,4,30,18,8,3,2,3,15,6,10,7,5,7,14,2,11,20,12,12,2,19,23,26,5,7,9,23,5, 0,71,184,1922,2587,6911,7425,7504,7626,8016,8114,8185,8347,8632,8746,9149,9725,15480,15549,15615,16511,16714,16848,17115,17191,18118,18504,19271,19365,19443,20377,22213,22440,25892,25951,26121,26227,26308,26406,28178,28715,28868,29562 |
b |
diff -r 000000000000 -r 95ea8d97abb4 test-data/output1.tabular --- /dev/null Thu Jan 01 00:00:00 1970 +0000 +++ b/test-data/output1.tabular Fri Jan 11 18:15:21 2019 -0500 |
b |
@@ -0,0 +1,45 @@ +# rID gID %id ExonL MisMch Unpair ref_l ref_r tgt_l tgt_r eScore IntrnL iScore Sig3/I Sig5/T # - X P DiNuc +NP_001121846.1 scaffold_1 30.00 31 7 0 1 10 234 264 71.9 0 0.0 67.90 -1.80 0 0 0 0 . +NP_001121846.1 scaffold_1 16.67 30 6 9 11 27 305 334 -9.0 40 -8.2 9.90 -2.20 0 0 0 1 GT.AG +NP_001121846.1 scaffold_1 64.29 125 15 0 28 69 418 542 226.4 83 8.4 22.20 16.00 0 0 0 1 GT.AG +NP_001121846.1 scaffold_1 66.67 9 1 0 70 72 2156 2164 37.9 1613 -6.6 4.40 21.90 0 0 0 0 GT.AG +NP_001121846.1 scaffold_1 66.67 9 1 0 73 75 2821 2829 32.3 656 7.5 7.20 12.10 0 0 0 0 GT.AG +NP_001121846.1 scaffold_1 62.86 106 13 0 76 110 7145 7250 176.6 4315 4.0 25.10 25.30 0 0 0 0 GT.AG +NP_001121846.1 scaffold_1 0.00 4 2 0 111 112 7659 7662 22.9 408 11.8 5.70 17.50 0 0 0 1 GT.AG +NP_001121846.1 scaffold_1 0.00 9 2 1 113 114 7738 7746 4.9 75 20.0 13.50 2.90 0 0 0 2 GT.AG +NP_001121846.1 scaffold_1 0.00 5 1 0 115 115 7860 7864 24.0 113 -3.9 7.30 16.20 0 0 0 2 GT.AG +NP_001121846.1 scaffold_1 30.00 37 7 0 116 125 8250 8286 15.8 385 9.7 12.50 11.50 0 0 0 1 GT.AG +NP_001121846.1 scaffold_1 100.00 8 0 0 126 127 8348 8355 28.3 61 18.0 16.20 -0.80 0 0 0 2 GT.AG +NP_001121846.1 scaffold_1 33.33 18 4 0 128 133 8419 8436 26.2 63 1.5 12.10 6.70 0 0 0 1 GT.AG +NP_001121846.1 scaffold_1 0.00 12 4 0 134 137 8581 8592 29.2 144 9.9 18.20 9.20 0 0 0 1 GT.AG +NP_001121846.1 scaffold_1 0.00 18 6 0 138 143 8866 8883 29.1 273 5.7 14.00 24.90 0 0 0 1 GT.AG +NP_001121846.1 scaffold_1 0.00 9 3 0 144 146 8980 8988 28.2 96 33.9 21.70 10.20 0 0 0 1 GT.AG +NP_001121846.1 scaffold_1 50.00 4 1 0 147 148 9383 9386 33.7 394 -5.5 3.40 14.10 0 0 0 1 GT.AG +NP_001121846.1 scaffold_1 10.00 30 5 4 149 154 9959 9988 21.1 572 3.1 10.30 20.60 0 0 0 2 GT.AG +NP_001121846.1 scaffold_1 16.67 18 5 0 155 160 15714 15731 43.6 5725 3.9 18.20 22.40 0 0 0 2 GT.AG +NP_001121846.1 scaffold_1 50.00 8 1 0 161 162 15783 15790 19.0 51 8.8 -3.20 17.10 0 0 0 2 GT.AG +NP_001121846.1 scaffold_1 0.00 3 1 0 163 163 15849 15851 17.0 58 
20.8 13.40 3.40 0 0 0 1 GC.AG +NP_001121846.1 scaffold_1 0.00 2 1 0 164 164 16745 16746 20.9 893 -5.3 14.60 8.20 0 0 0 1 GT.AG +NP_001121846.1 scaffold_1 0.00 3 1 0 165 165 16948 16950 27.2 201 14.2 22.30 9.10 0 0 0 0 GT.AG +NP_001121846.1 scaffold_1 100.00 15 0 0 166 166 17082 17096 13.3 131 17.9 23.40 2.50 0 0 0 0 GT.AG +NP_001121846.1 scaffold_1 0.00 6 1 1 167 167 17349 17354 28.3 252 -9.3 5.30 22.50 0 0 0 0 GT.AG +NP_001121846.1 scaffold_1 33.33 10 2 0 168 170 17425 17434 15.0 70 22.3 10.10 2.30 0 0 0 0 GT.AG +NP_001121846.1 scaffold_1 33.33 7 2 0 171 173 18352 18358 24.7 917 -18.2 2.90 16.40 0 0 0 1 GT.AG +NP_001121846.1 scaffold_1 100.00 5 0 0 174 174 18738 18742 17.0 379 19.5 12.40 0.60 0 0 0 2 GT.AG +NP_001121846.1 scaffold_1 66.67 7 1 0 175 177 19505 19511 32.6 762 -14.2 7.60 16.10 0 0 0 1 GT.AG +NP_001121846.1 scaffold_1 0.00 14 4 0 178 181 19599 19612 16.1 87 15.0 1.90 18.00 0 0 0 2 GT.AG +NP_001121846.1 scaffold_1 0.00 2 1 0 182 182 19677 19678 17.1 64 18.2 10.00 3.60 0 0 0 1 GT.AG +NP_001121846.1 scaffold_1 50.00 11 1 0 183 184 20611 20621 30.0 932 -2.8 17.10 15.00 0 0 0 0 GT.AG +NP_001121846.1 scaffold_1 33.33 20 2 2 185 188 22447 22466 27.3 1825 -5.3 7.50 15.80 0 0 0 2 GT.AG +NP_001121846.1 scaffold_1 50.00 12 2 0 189 192 22674 22685 31.9 207 4.4 5.00 7.70 0 0 0 1 GT.AG +NP_001121846.1 scaffold_1 20.00 12 3 1 193 197 26126 26137 31.8 3440 -1.3 22.70 14.00 0 0 0 1 GT.AG +NP_001121846.1 scaffold_1 0.00 2 1 0 198 198 26185 26186 22.5 47 14.8 12.40 8.30 0 0 0 1 GT.AG +NP_001121846.1 scaffold_1 33.33 19 4 0 199 204 26355 26373 33.1 168 7.8 15.10 7.10 0 0 0 0 GT.AG +NP_001121846.1 scaffold_1 0.00 23 3 0 205 207 26461 26483 8.0 87 11.9 16.80 8.10 0 0 0 1 GT.AG +NP_001121846.1 scaffold_1 33.33 26 2 4 208 212 26542 26567 22.6 58 18.9 20.50 -0.50 0 0 0 0 GT.AG +NP_001121846.1 scaffold_1 0.00 5 1 0 213 213 26640 26644 24.6 72 3.9 14.90 11.30 0 0 0 2 GT.AG +NP_001121846.1 scaffold_1 33.33 7 2 0 214 216 28412 28418 28.0 1767 -4.5 11.80 12.30 0 0 0 1 GT.AG 
+NP_001121846.1 scaffold_1 100.00 9 0 0 217 217 28949 28957 26.9 530 17.1 25.30 10.30 0 0 0 2 GT.AG +NP_001121846.1 scaffold_1 28.57 23 2 3 218 221 29102 29124 36.1 144 16.5 21.20 10.60 0 0 0 2 GT.AG +NP_001121846.1 scaffold_1 0.00 5 1 1 222 222 29796 29800 24.4 671 8.0 19.10 10.60 0 0 0 1 GT.AG +@ scaffold_1 + ( 234 29800 ) NP_001121846.1 222 ( 1 222 ) S: 1357.3 =: 38.1 C: 110.8 T#: 122 T-: 26 B#: 0 B-: 0 X: 0 Pam: 0 |
b |
diff -r 000000000000 -r 95ea8d97abb4 test-data/output1_gff_genes.gff3 --- /dev/null Thu Jan 01 00:00:00 1970 +0000 +++ b/test-data/output1_gff_genes.gff3 Fri Jan 11 18:15:21 2019 -0500 |
b |
@@ -0,0 +1,47 @@ +##gff-version 3 +##sequence-region scaffold_1 1 59940 +scaffold_1 ALN gene 234 29800 1357 + . ID=gene00001;Name=scaffold_1_15 +scaffold_1 ALN mRNA 234 29800 1357 + . ID=mRNA00001;Parent=gene00001;Name=scaffold_1_15 +scaffold_1 ALN cds 234 264 71 + 0 ID=cds00001;Parent=mRNA00001;Name=scaffold_1_15;Target=NP_001121846.1 1 10 + +scaffold_1 ALN cds 305 334 -9 + 2 ID=cds00002;Parent=mRNA00001;Name=scaffold_1_15;Target=NP_001121846.1 11 27 + +scaffold_1 ALN cds 418 542 226 + 2 ID=cds00003;Parent=mRNA00001;Name=scaffold_1_15;Target=NP_001121846.1 28 69 + +scaffold_1 ALN cds 2156 2164 37 + 0 ID=cds00004;Parent=mRNA00001;Name=scaffold_1_15;Target=NP_001121846.1 70 72 + +scaffold_1 ALN cds 2821 2829 32 + 0 ID=cds00005;Parent=mRNA00001;Name=scaffold_1_15;Target=NP_001121846.1 73 75 + +scaffold_1 ALN cds 7145 7250 176 + 0 ID=cds00006;Parent=mRNA00001;Name=scaffold_1_15;Target=NP_001121846.1 76 110 + +scaffold_1 ALN cds 7659 7662 22 + 2 ID=cds00007;Parent=mRNA00001;Name=scaffold_1_15;Target=NP_001121846.1 111 112 + +scaffold_1 ALN cds 7738 7746 4 + 1 ID=cds00008;Parent=mRNA00001;Name=scaffold_1_15;Target=NP_001121846.1 113 114 + +scaffold_1 ALN cds 7860 7864 24 + 1 ID=cds00009;Parent=mRNA00001;Name=scaffold_1_15;Target=NP_001121846.1 115 115 + +scaffold_1 ALN cds 8250 8286 15 + 2 ID=cds00010;Parent=mRNA00001;Name=scaffold_1_15;Target=NP_001121846.1 116 125 + +scaffold_1 ALN cds 8348 8355 28 + 1 ID=cds00011;Parent=mRNA00001;Name=scaffold_1_15;Target=NP_001121846.1 126 127 + +scaffold_1 ALN cds 8419 8436 26 + 2 ID=cds00012;Parent=mRNA00001;Name=scaffold_1_15;Target=NP_001121846.1 128 133 + +scaffold_1 ALN cds 8581 8592 29 + 2 ID=cds00013;Parent=mRNA00001;Name=scaffold_1_15;Target=NP_001121846.1 134 137 + +scaffold_1 ALN cds 8866 8883 29 + 2 ID=cds00014;Parent=mRNA00001;Name=scaffold_1_15;Target=NP_001121846.1 138 143 + +scaffold_1 ALN cds 8980 8988 28 + 2 ID=cds00015;Parent=mRNA00001;Name=scaffold_1_15;Target=NP_001121846.1 144 146 + +scaffold_1 ALN cds 9383 
9386 33 + 2 ID=cds00016;Parent=mRNA00001;Name=scaffold_1_15;Target=NP_001121846.1 147 148 + +scaffold_1 ALN cds 9959 9988 21 + 1 ID=cds00017;Parent=mRNA00001;Name=scaffold_1_15;Target=NP_001121846.1 149 154 + +scaffold_1 ALN cds 15714 15731 43 + 1 ID=cds00018;Parent=mRNA00001;Name=scaffold_1_15;Target=NP_001121846.1 155 160 + +scaffold_1 ALN cds 15783 15790 19 + 1 ID=cds00019;Parent=mRNA00001;Name=scaffold_1_15;Target=NP_001121846.1 161 162 + +scaffold_1 ALN cds 15849 15851 17 + 2 ID=cds00020;Parent=mRNA00001;Name=scaffold_1_15;Target=NP_001121846.1 163 163 + +scaffold_1 ALN cds 16745 16746 20 + 2 ID=cds00021;Parent=mRNA00001;Name=scaffold_1_15;Target=NP_001121846.1 164 164 + +scaffold_1 ALN cds 16948 16950 27 + 0 ID=cds00022;Parent=mRNA00001;Name=scaffold_1_15;Target=NP_001121846.1 165 165 + +scaffold_1 ALN cds 17082 17096 13 + 0 ID=cds00023;Parent=mRNA00001;Name=scaffold_1_15;Target=NP_001121846.1 166 166 + +scaffold_1 ALN cds 17349 17354 28 + 0 ID=cds00024;Parent=mRNA00001;Name=scaffold_1_15;Target=NP_001121846.1 167 167 + +scaffold_1 ALN cds 17425 17434 15 + 0 ID=cds00025;Parent=mRNA00001;Name=scaffold_1_15;Target=NP_001121846.1 168 170 + +scaffold_1 ALN cds 18352 18358 24 + 2 ID=cds00026;Parent=mRNA00001;Name=scaffold_1_15;Target=NP_001121846.1 171 173 + +scaffold_1 ALN cds 18738 18742 17 + 1 ID=cds00027;Parent=mRNA00001;Name=scaffold_1_15;Target=NP_001121846.1 174 174 + +scaffold_1 ALN cds 19505 19511 32 + 2 ID=cds00028;Parent=mRNA00001;Name=scaffold_1_15;Target=NP_001121846.1 175 177 + +scaffold_1 ALN cds 19599 19612 16 + 1 ID=cds00029;Parent=mRNA00001;Name=scaffold_1_15;Target=NP_001121846.1 178 181 + +scaffold_1 ALN cds 19677 19678 17 + 2 ID=cds00030;Parent=mRNA00001;Name=scaffold_1_15;Target=NP_001121846.1 182 182 + +scaffold_1 ALN cds 20611 20621 30 + 0 ID=cds00031;Parent=mRNA00001;Name=scaffold_1_15;Target=NP_001121846.1 183 184 + +scaffold_1 ALN cds 22447 22466 27 + 1 ID=cds00032;Parent=mRNA00001;Name=scaffold_1_15;Target=NP_001121846.1 185 188 + 
+scaffold_1 ALN cds 22674 22685 31 + 2 ID=cds00033;Parent=mRNA00001;Name=scaffold_1_15;Target=NP_001121846.1 189 192 + +scaffold_1 ALN cds 26126 26137 31 + 2 ID=cds00034;Parent=mRNA00001;Name=scaffold_1_15;Target=NP_001121846.1 193 197 + +scaffold_1 ALN cds 26185 26186 22 + 2 ID=cds00035;Parent=mRNA00001;Name=scaffold_1_15;Target=NP_001121846.1 198 198 + +scaffold_1 ALN cds 26355 26373 33 + 0 ID=cds00036;Parent=mRNA00001;Name=scaffold_1_15;Target=NP_001121846.1 199 204 + +scaffold_1 ALN cds 26461 26483 8 + 2 ID=cds00037;Parent=mRNA00001;Name=scaffold_1_15;Target=NP_001121846.1 205 207 + +scaffold_1 ALN cds 26542 26567 22 + 0 ID=cds00038;Parent=mRNA00001;Name=scaffold_1_15;Target=NP_001121846.1 208 212 + +scaffold_1 ALN cds 26640 26644 24 + 1 ID=cds00039;Parent=mRNA00001;Name=scaffold_1_15;Target=NP_001121846.1 213 213 + +scaffold_1 ALN cds 28412 28418 28 + 2 ID=cds00040;Parent=mRNA00001;Name=scaffold_1_15;Target=NP_001121846.1 214 216 + +scaffold_1 ALN cds 28949 28957 26 + 1 ID=cds00041;Parent=mRNA00001;Name=scaffold_1_15;Target=NP_001121846.1 217 217 + +scaffold_1 ALN cds 29102 29124 36 + 1 ID=cds00042;Parent=mRNA00001;Name=scaffold_1_15;Target=NP_001121846.1 218 221 + +scaffold_1 ALN cds 29796 29800 24 + 2 ID=cds00043;Parent=mRNA00001;Name=scaffold_1_15;Target=NP_001121846.1 222 222 + |
b |
diff -r 000000000000 -r 95ea8d97abb4 test-data/output1_gff_matches.gff3 --- /dev/null Thu Jan 01 00:00:00 1970 +0000 +++ b/test-data/output1_gff_matches.gff3 Fri Jan 11 18:15:21 2019 -0500 |
b |
@@ -0,0 +1,45 @@ +##gff-version 3 +##sequence-region scaffold_1 1 59940 +scaffold_1 ALN nucleotide_to_protein_match 234 264 71 + . ID=match00001;Name=scaffold_1_15;Target=NP_001121846.1 1 10 +;Gap=M10 +scaffold_1 ALN nucleotide_to_protein_match 305 334 -9 + . ID=match00001;Name=scaffold_1_15;Target=NP_001121846.1 11 27 +;Gap=M2 D1 M5 I8 M2 +scaffold_1 ALN nucleotide_to_protein_match 418 542 226 + . ID=match00001;Name=scaffold_1_15;Target=NP_001121846.1 28 69 +;Gap=M42 +scaffold_1 ALN nucleotide_to_protein_match 2156 2164 37 + . ID=match00001;Name=scaffold_1_15;Target=NP_001121846.1 70 72 +;Gap=M3 +scaffold_1 ALN nucleotide_to_protein_match 2821 2829 32 + . ID=match00001;Name=scaffold_1_15;Target=NP_001121846.1 73 75 +;Gap=M3 +scaffold_1 ALN nucleotide_to_protein_match 7145 7250 176 + . ID=match00001;Name=scaffold_1_15;Target=NP_001121846.1 76 110 +;Gap=M35 +scaffold_1 ALN nucleotide_to_protein_match 7659 7662 22 + . ID=match00001;Name=scaffold_1_15;Target=NP_001121846.1 111 112 +;Gap=M2 +scaffold_1 ALN nucleotide_to_protein_match 7738 7746 4 + . ID=match00001;Name=scaffold_1_15;Target=NP_001121846.1 113 114 +;Gap=D1 M2 +scaffold_1 ALN nucleotide_to_protein_match 7860 7864 24 + . ID=match00001;Name=scaffold_1_15;Target=NP_001121846.1 115 115 +;Gap=M1 +scaffold_1 ALN nucleotide_to_protein_match 8250 8286 15 + . ID=match00001;Name=scaffold_1_15;Target=NP_001121846.1 116 125 +;Gap=M10 D3 +scaffold_1 ALN nucleotide_to_protein_match 8348 8355 28 + . ID=match00001;Name=scaffold_1_15;Target=NP_001121846.1 126 127 +;Gap=M2 +scaffold_1 ALN nucleotide_to_protein_match 8419 8436 26 + . ID=match00001;Name=scaffold_1_15;Target=NP_001121846.1 128 133 +;Gap=M6 +scaffold_1 ALN nucleotide_to_protein_match 8581 8592 29 + . ID=match00001;Name=scaffold_1_15;Target=NP_001121846.1 134 137 +;Gap=M4 +scaffold_1 ALN nucleotide_to_protein_match 8866 8883 29 + . ID=match00001;Name=scaffold_1_15;Target=NP_001121846.1 138 143 +;Gap=M6 +scaffold_1 ALN nucleotide_to_protein_match 8980 8988 28 + . 
ID=match00001;Name=scaffold_1_15;Target=NP_001121846.1 144 146 +;Gap=M3 +scaffold_1 ALN nucleotide_to_protein_match 9383 9386 33 + . ID=match00001;Name=scaffold_1_15;Target=NP_001121846.1 147 148 +;Gap=M2 +scaffold_1 ALN nucleotide_to_protein_match 9959 9988 21 + . ID=match00001;Name=scaffold_1_15;Target=NP_001121846.1 149 154 +;Gap=D4 M6 +scaffold_1 ALN nucleotide_to_protein_match 15714 15731 43 + . ID=match00001;Name=scaffold_1_15;Target=NP_001121846.1 155 160 +;Gap=M6 +scaffold_1 ALN nucleotide_to_protein_match 15783 15790 19 + . ID=match00001;Name=scaffold_1_15;Target=NP_001121846.1 161 162 +;Gap=M2 +scaffold_1 ALN nucleotide_to_protein_match 15849 15851 17 + . ID=match00001;Name=scaffold_1_15;Target=NP_001121846.1 163 163 +;Gap=M1 +scaffold_1 ALN nucleotide_to_protein_match 16745 16746 20 + . ID=match00001;Name=scaffold_1_15;Target=NP_001121846.1 164 164 +;Gap=M1 +scaffold_1 ALN nucleotide_to_protein_match 16948 16950 27 + . ID=match00001;Name=scaffold_1_15;Target=NP_001121846.1 165 165 +;Gap=M1 +scaffold_1 ALN nucleotide_to_protein_match 17082 17096 13 + . ID=match00001;Name=scaffold_1_15;Target=NP_001121846.1 166 166 +;Gap=M1 D4 +scaffold_1 ALN nucleotide_to_protein_match 17349 17354 28 + . ID=match00001;Name=scaffold_1_15;Target=NP_001121846.1 167 167 +;Gap=D1 M1 +scaffold_1 ALN nucleotide_to_protein_match 17425 17434 15 + . ID=match00001;Name=scaffold_1_15;Target=NP_001121846.1 168 170 +;Gap=M3 +scaffold_1 ALN nucleotide_to_protein_match 18352 18358 24 + . ID=match00001;Name=scaffold_1_15;Target=NP_001121846.1 171 173 +;Gap=M3 +scaffold_1 ALN nucleotide_to_protein_match 18738 18742 17 + . ID=match00001;Name=scaffold_1_15;Target=NP_001121846.1 174 174 +;Gap=M1 +scaffold_1 ALN nucleotide_to_protein_match 19505 19511 32 + . ID=match00001;Name=scaffold_1_15;Target=NP_001121846.1 175 177 +;Gap=M3 +scaffold_1 ALN nucleotide_to_protein_match 19599 19612 16 + . 
ID=match00001;Name=scaffold_1_15;Target=NP_001121846.1 178 181 +;Gap=M4 +scaffold_1 ALN nucleotide_to_protein_match 19677 19678 17 + . ID=match00001;Name=scaffold_1_15;Target=NP_001121846.1 182 182 +;Gap=M1 +scaffold_1 ALN nucleotide_to_protein_match 20611 20621 30 + . ID=match00001;Name=scaffold_1_15;Target=NP_001121846.1 183 184 +;Gap=M2 D2 +scaffold_1 ALN nucleotide_to_protein_match 22447 22466 27 + . ID=match00001;Name=scaffold_1_15;Target=NP_001121846.1 185 188 +;Gap=D2 M4 +scaffold_1 ALN nucleotide_to_protein_match 22674 22685 31 + . ID=match00001;Name=scaffold_1_15;Target=NP_001121846.1 189 192 +;Gap=M4 +scaffold_1 ALN nucleotide_to_protein_match 26126 26137 31 + . ID=match00001;Name=scaffold_1_15;Target=NP_001121846.1 193 197 +;Gap=I1 M4 +scaffold_1 ALN nucleotide_to_protein_match 26185 26186 22 + . ID=match00001;Name=scaffold_1_15;Target=NP_001121846.1 198 198 +;Gap=M1 +scaffold_1 ALN nucleotide_to_protein_match 26355 26373 33 + . ID=match00001;Name=scaffold_1_15;Target=NP_001121846.1 199 204 +;Gap=M6 +scaffold_1 ALN nucleotide_to_protein_match 26461 26483 8 + . ID=match00001;Name=scaffold_1_15;Target=NP_001121846.1 205 207 +;Gap=M3 D5 +scaffold_1 ALN nucleotide_to_protein_match 26542 26567 22 + . ID=match00001;Name=scaffold_1_15;Target=NP_001121846.1 208 212 +;Gap=D4 M5 +scaffold_1 ALN nucleotide_to_protein_match 26640 26644 24 + . ID=match00001;Name=scaffold_1_15;Target=NP_001121846.1 213 213 +;Gap=M1 +scaffold_1 ALN nucleotide_to_protein_match 28412 28418 28 + . ID=match00001;Name=scaffold_1_15;Target=NP_001121846.1 214 216 +;Gap=M3 +scaffold_1 ALN nucleotide_to_protein_match 28949 28957 26 + . ID=match00001;Name=scaffold_1_15;Target=NP_001121846.1 217 217 +;Gap=M1 D2 +scaffold_1 ALN nucleotide_to_protein_match 29102 29124 36 + . ID=match00001;Name=scaffold_1_15;Target=NP_001121846.1 218 221 +;Gap=D3 M4 +scaffold_1 ALN nucleotide_to_protein_match 29796 29800 24 + . ID=match00001;Name=scaffold_1_15;Target=NP_001121846.1 222 222 +;Gap=M1 D1 |
b |
diff -r 000000000000 -r 95ea8d97abb4 test-data/query.fasta --- /dev/null Thu Jan 01 00:00:00 1970 +0000 +++ b/test-data/query.fasta Fri Jan 11 18:15:21 2019 -0500 |
[ |
@@ -0,0 +1,6 @@ +>NP_001121846.1 uncharacterized protein LOC100148058 [Danio rerio] +MQRRRNTMENPLFCSSPNQHHGWIQVSDMRSPPGHWMSCGHSCAEHAVWNPKFCVVTDYQMLLLDKEEIH +PLLLQEKRTDSSKSRLLRRTISVPVETHFPGFQSHLSVDNNERASGAGEGRREDEGFLQFFTVINKRIFQ +SFSLSHFWPMGTACMSALTEGDSLIIRPKTKDCVFACSHLTECLVARISLYYLSSFRVFACKKLSRLVSR +VTLSLQKPMRTV + |