# HG changeset patch # User greg # Date 1588777109 14400 # Node ID df67ba6db5ded479e6fa636b052529ae4f832354 # Parent f136bf6d2f4c585a45c2a53311627e1a18db32cc Uploaded diff -r f136bf6d2f4c -r df67ba6db5de data_manager/vsnp_genbank_fetcher.xml --- a/data_manager/vsnp_genbank_fetcher.xml Mon Feb 10 10:27:08 2020 -0500 +++ b/data_manager/vsnp_genbank_fetcher.xml Wed May 06 10:58:29 2020 -0400 @@ -23,6 +23,9 @@ + + + NC_002945.4 Mycobacterium bovis AF2122/97 genome assembly, chromosome: Mycobacterium_bovis_AF2122/97 +TTGACCGATGACCCCGGTTCAGGCTTCACCACAGTGTGGAACGCGGTCGTCTCCGAACTTAACGGCGACC +CTAAGGTTGACGACGGACCCAGCAGTGATGCTAATCTCAGCGCTCCGCTGACCCCTCAGCAAAGGGCTTG +GCTCAATCTCGTCCAGCCATTGACCATCGTCGAGGGGTTTGCTCTGTTATCCGTGCCGAGCAGCTTTGTC +CAAAACGAAATCGAGCGCCATCTGCGGGCCCCGATTACCGACGCTCTCAGCCGCCGACTCGGACATCAGA +TCCAACTCGGGGTCCGCATCGCTCCGCCGGCGACCGACGAAGCCGACGACACTACCGTGCCGCCTTCCGA +AAATCCTGCTACCACATCGCCAGACACCACAACCGACAACGACGAGATTGATGACAGCGCTGCGGCACGG +GGCGATAACCAGCACAGTTGGCCAAGTTACTTCACCGAGCGCCCGCGCAATACCGATTCCGCTACCGCTG +GCGTAACCAGCCTTAACCGTCGCTACACCTTTGATACGTTCGTTATCGGCGCCTCCAACCGGTTCGCGCA +CGCCGCCGCCTTGGCGATCGCAGAAGCACCCGCCCGCGCTTACAACCCCCTGTTCATCTGGGGCGAGTCC +GGTCTCGGCAAGACACACCTGCTACACGCGGCAGGCAACTATGCCCAACGGTTGTTCCCGGGAATGCGGG diff -r f136bf6d2f4c -r df67ba6db5de test-data/all_fasta.loc --- /dev/null Thu Jan 01 00:00:00 1970 +0000 +++ b/test-data/all_fasta.loc Wed May 06 10:58:29 2020 -0400 @@ -0,0 +1,19 @@ +#This file lists the locations and dbkeys of all the fasta files +#under the "genome" directory (a directory that contains a directory +#for each build). The script extract_fasta.py will generate the file +#all_fasta.loc. This file has the format (white space characters are +#TAB characters): +# +# +# +#So, all_fasta.loc could look something like this: +# +#apiMel3 apiMel3 Honeybee (Apis mellifera): apiMel3 /path/to/genome/apiMel3/apiMel3.fa +#hg19canon hg19 Human (Homo sapiens): hg19 Canonical /path/to/genome/hg19/hg19canon.fa +#hg19full hg19 Human (Homo sapiens): hg19 Full /path/to/genome/hg19/hg19full.fa +# +#Your all_fasta.loc file should contain an entry for each individual +#fasta file. So there will be multiple fasta files for each build, +#such as with hg19 above. +# +AF2122 AF2122 AF2122 ${__HERE__}/AF2122.fa diff -r f136bf6d2f4c -r df67ba6db5de test-data/vsnp_genbank.json --- /dev/null Thu Jan 01 00:00:00 1970 +0000 +++ b/test-data/vsnp_genbank.json Wed May 06 10:58:29 2020 -0400 @@ -0,0 +1,1 @@ +{"data_tables": {"vsnp_genbank": {"description": "Genbank file for AF2122", "name": "NC_002945v4.gbk", "path": diff -r f136bf6d2f4c -r df67ba6db5de test-data/vsnp_genbank.loc --- /dev/null Thu Jan 01 00:00:00 1970 +0000 +++ b/test-data/vsnp_genbank.loc Wed May 06 10:58:29 2020 -0400 @@ -0,0 +1,1 @@ +AF2122 NC_002945v4.gbk /private/var/folders/zf/cf4s7k3530j87w9fkhh475800000gn/T/tmpFxGvOE/tmp3MdYaQ/tmp5lwt8e/database/data_manager_tool-datanmleBG/vsnp/AF2122/genbank/NC_002945v4.gbk Genbank file for AF2122 diff -r f136bf6d2f4c -r df67ba6db5de tool-data/all_fasta.loc.sample --- /dev/null Thu Jan 01 00:00:00 1970 +0000 +++ b/tool-data/all_fasta.loc.sample Wed May 06 10:58:29 2020 -0400 @@ -0,0 +1,18 @@ +#This file lists the locations and dbkeys of all the fasta files +#under the "genome" directory (a directory that contains a directory +#for each build). The script extract_fasta.py will generate the file +#all_fasta.loc. This file has the format (white space characters are +#TAB characters): +# +# +# +#So, all_fasta.loc could look something like this: +# +#apiMel3 apiMel3 Honeybee (Apis mellifera): apiMel3 /path/to/genome/apiMel3/apiMel3.fa +#hg19canon hg19 Human (Homo sapiens): hg19 Canonical /path/to/genome/hg19/hg19canon.fa +#hg19full hg19 Human (Homo sapiens): hg19 Full /path/to/genome/hg19/hg19full.fa +# +#Your all_fasta.loc file should contain an entry for each individual +#fasta file. So there will be multiple fasta files for each build, +#such as with hg19 above. +# diff -r f136bf6d2f4c -r df67ba6db5de tool-data/vsnp_genbank.loc.sample --- a/tool-data/vsnp_genbank.loc.sample Mon Feb 10 10:27:08 2020 -0500 +++ b/tool-data/vsnp_genbank.loc.sample Wed May 06 10:58:29 2020 -0400 @@ -1,4 +1,4 @@ ## vSNP Genbank files #Value Name Path Description #AF2122 Mycobacterium_AF2122/NC_002945v4.gbk vsnp/AF2122/Mycobacterium_AF2122/NC_002945v4.gbk Genbank file for Mycobacterium bovis AF2122/97 -#NC_006932 Brucella_abortus1/NC_006932-NC_006933.gbk /vsnp/NC_006932/Brucella_abortus1/NC_006932-NC_006933.gbk Genbank file for Brucella abortus bv. 1 str. 9-941 +#NC_006932 Brucella_abortus1/NC_006932-NC_006933.gbk vsnp/NC_006932/Brucella_abortus1/NC_006932-NC_006933.gbk Genbank file for Brucella abortus bv. 1 str. 9-941 diff -r f136bf6d2f4c -r df67ba6db5de tool_data_table_conf.xml.sample --- a/tool_data_table_conf.xml.sample Mon Feb 10 10:27:08 2020 -0500 +++ b/tool_data_table_conf.xml.sample Wed May 06 10:58:29 2020 -0400 @@ -1,4 +1,10 @@ + + + value, dbkey, name, path + +
+ value, name, path, description diff -r f136bf6d2f4c -r df67ba6db5de tool_data_table_conf.xml.test --- /dev/null Thu Jan 01 00:00:00 1970 +0000 +++ b/tool_data_table_conf.xml.test Wed May 06 10:58:29 2020 -0400 @@ -0,0 +1,12 @@ + + +
+ value, dbkey, name, path + +
+ + + value, name, path, description + +
+