# HG changeset patch # User caleb-easterly # Date 1498229929 14400 # Node ID d61a95fe20e4dfb10a1487d00240947f76856bbb # Parent 0f08a4a0dd159b30d6e0da1126c1768454b5cd03 planemo upload commit 833e8a1d5ef37cbd4cadad6c90a51b268871627b-dirty diff -r 0f08a4a0dd15 -r d61a95fe20e4 validateFASTA.xml --- a/validateFASTA.xml Fri Jun 23 10:49:25 2017 -0400 +++ b/validateFASTA.xml Fri Jun 23 10:58:49 2017 -0400 @@ -1,4 +1,4 @@ - + diff -r 0f08a4a0dd15 -r d61a95fe20e4 validate_fasta_headers.xml --- /dev/null Thu Jan 01 00:00:00 1970 +0000 +++ b/validate_fasta_headers.xml Fri Jun 23 10:58:49 2017 -0400 @@ -0,0 +1,64 @@ + + + + + + + + + + + + + + + + + + + + + + + +sw|" or ">SW|") + * NCBI (starts with ">gi|" or ">GI|") + * Halobacterium from Max Planck (starts with "OE") + * H Influenza, from Novartis (starts with ">hflu_") + * C Trachomatis (starts with ">C.tr\_" or "C\_trachomatis\_") + * M Tuberculosis (starts with ">M. tub") + * Saccharomyces Genome Database (contains "SGDID") + * Genome translation (ex. ">dm345\_3L-sense [2343534-234353938]") + * Genome Annotation Framework for Flexible Analysis (GAFFA) (starts with ">GAFFA") + * UPS (contains "\_HUMAN\_UPS") + +Many sequences are reported as Generic, which may or may not allow for extraction of the accession number. +]]> + + + + @misc{fastaValidation, + author = {The GalaxyP Team}, + date = {22 June 2017}, + title = {FASTA Database Validation Tool} + } + + +