# HG changeset patch # User iuc # Date 1600854585 0 # Node ID cd5a82a16bbfc5c4d57b4544a88d213e2858bbc5 # Parent f6007bce569df3557635bb03a41b43cd3abcc624 "planemo upload for repository https://github.com/galaxyproject/tools-iuc/tree/master/tools/ncbi_entrez_eutils commit dae34e5e182b4cceb808d7353080f14aa9a78ca9" diff -r f6007bce569d -r cd5a82a16bbf __efetch_build_options.py --- a/__efetch_build_options.py Wed Mar 11 04:02:55 2020 -0400 +++ b/__efetch_build_options.py Wed Sep 23 09:49:45 2020 +0000 @@ -53,7 +53,7 @@ sra structure taxonomy -unigene'''.replace( "", "").replace( "", "").split("\n") +unigene'''.replace("", "").replace("", "").split("\n") help = ''' (all) diff -r f6007bce569d -r cd5a82a16bbf ecitmatch.py --- a/ecitmatch.py Wed Mar 11 04:02:55 2020 -0400 +++ b/ecitmatch.py Wed Sep 23 09:49:45 2020 +0000 @@ -1,5 +1,4 @@ #!/usr/bin/env python -from __future__ import print_function import argparse @@ -17,6 +16,8 @@ parser.add_argument('--first_page', nargs='*', help='First Page') parser.add_argument('--author_name', nargs='*', help='Author name') + parser.add_argument('--version', action='version', version=eutils.Client.getVersion(), help='Version (reports Biopython version)') + # Emails parser.add_argument('--user_email', help="User email") parser.add_argument('--admin_email', help="Admin email") diff -r f6007bce569d -r cd5a82a16bbf efetch.py --- a/efetch.py Wed Mar 11 04:02:55 2020 -0400 +++ b/efetch.py Wed Sep 23 09:49:45 2020 +0000 @@ -1,36 +1,111 @@ #!/usr/bin/env python + import argparse +import glob +import json +import logging +import os + import eutils +logging.basicConfig(level=logging.INFO) + + +def handleEfetchException(e, db, payload): + logging.error('No results returned. This could either be due to no records matching the supplied IDs for the query database or it could be an error due to invalid parameters. The reported exception was "%s".\n\nPayload used for the efetch query to database "%s"\n\n%s', e, db, json.dumps(payload, indent=4)) + + # Create a file in the downloads folder so that the user can access run information + current_directory = os.getcwd() + final_directory = os.path.join(current_directory, r'downloads') + if not os.path.exists(final_directory): + os.makedirs(final_directory) + + print('The following files were downloaded:') + print(os.listdir(final_directory)) + + file_path = os.path.join('downloads', 'no_results.txt') + with open(file_path, 'w') as handle: + handle.write('No results') + + +def localFetch(db, gformat, newname, **payload): + problem = None + try: + c.fetch(db, **payload) + + for chunk, file in enumerate(glob.glob('downloads/EFetch *')): + os.rename(file, '%s%s.%s' % (newname, chunk + 1, gformat)) + + except Exception as e: + problem = e + handleEfetchException(e, db, payload) + else: + print('The following files were downloaded:') + print(os.listdir('downloads')) + + return problem + + if __name__ == '__main__': parser = argparse.ArgumentParser(description='EFetch', epilog='') parser.add_argument('db', help='Database to use') parser.add_argument('--user_email', help="User email") parser.add_argument('--admin_email', help="Admin email") + parser.add_argument('--version', action='version', version=eutils.Client.getVersion(), help='Version (reports Biopython version)') + # ID source + parser.add_argument('--id_json', help='list of ids in a json file as returned by esearch or elink') + parser.add_argument('--id_xml', help='list of ids in an xml file as returned by esearch or elink') parser.add_argument('--id_list', help='list of ids') parser.add_argument('--id', help='Comma separated individual IDs') - parser.add_argument('--history_file', help='Fetch results from previous query') + parser.add_argument('--history_file', help='Fetch results from previous query (JSON)') + parser.add_argument('--history_xml', help='Fetch results from previous query (XML)') # Output parser.add_argument('--retmode', help='Retmode') parser.add_argument('--rettype', help='Rettype') + parser.add_argument('--galaxy_format', help='Galaxy format') args = parser.parse_args() c = eutils.Client(history_file=args.history_file, user_email=args.user_email, admin_email=args.admin_email) - merged_ids = c.parse_ids(args.id_list, args.id, args.history_file) payload = {} - if args.history_file is not None: - payload.update(c.get_history()) - else: - payload['id'] = ','.join(merged_ids) - for attr in ('retmode', 'rettype'): if getattr(args, attr, None) is not None: payload[attr] = getattr(args, attr) - c.fetch(args.db, ftype=args.retmode, **payload) + if args.history_file is not None or args.history_xml is not None: + if args.history_file is not None: + input_histories = c.get_histories() + else: + input_histories = c.extract_histories_from_xml_file(args.history_xml) + + problem = None + for hist in input_histories: + qkey = hist['query_key'] + tmp_payload = payload + tmp_payload.update(hist) + newname = 'downloads/EFetch-%s-%s-querykey%s-chunk' % (args.rettype, args.retmode, qkey) + problem = localFetch(args.db, args.galaxy_format, newname, **tmp_payload) + + if os.path.exists('downloads'): + os.rename('downloads', 'downloads-qkey%s' % (qkey)) + + if not os.path.exists('downloads'): + os.makedirs('downloads') + + for relpath in glob.glob('downloads-qkey*/*'): + file = os.path.basename(relpath) + os.rename(relpath, 'downloads/%s' % (file)) + + if problem is not None: + raise(problem) + + else: + merged_ids = c.parse_ids(args.id_list, args.id, args.history_file, args.id_xml, args.id_json) + payload['id'] = ','.join(merged_ids) + newname = 'downloads/EFetch-%s-%s-chunk' % (args.rettype, args.retmode) + localFetch(args.db, args.galaxy_format, newname, **payload) diff -r f6007bce569d -r cd5a82a16bbf egquery.py --- a/egquery.py Wed Mar 11 04:02:55 2020 -0400 +++ b/egquery.py Wed Sep 23 09:49:45 2020 +0000 @@ -1,5 +1,4 @@ #!/usr/bin/env python -from __future__ import print_function import argparse @@ -9,9 +8,12 @@ if __name__ == '__main__': parser = argparse.ArgumentParser(description='EGQuery', epilog='') parser.add_argument('term', help='Query') - # + parser.add_argument('--user_email', help="User email") parser.add_argument('--admin_email', help="Admin email") + + parser.add_argument('--version', action='version', version=eutils.Client.getVersion(), help='Version (reports Biopython version)') + args = parser.parse_args() c = eutils.Client(user_email=args.user_email, admin_email=args.admin_email) diff -r f6007bce569d -r cd5a82a16bbf einfo.py --- a/einfo.py Wed Mar 11 04:02:55 2020 -0400 +++ b/einfo.py Wed Sep 23 09:49:45 2020 +0000 @@ -1,5 +1,4 @@ #!/usr/bin/env python -from __future__ import print_function import argparse @@ -11,6 +10,7 @@ parser.add_argument('--db', help='Database to use') parser.add_argument('--user_email', help="User email") parser.add_argument('--admin_email', help="Admin email") + parser.add_argument('--version', action='version', version=eutils.Client.getVersion(), help='Version (reports Biopython version)') args = parser.parse_args() c = eutils.Client(user_email=args.user_email, admin_email=args.admin_email) diff -r f6007bce569d -r cd5a82a16bbf einfo.xml --- a/einfo.xml Wed Mar 11 04:02:55 2020 -0400 +++ b/einfo.xml Wed Sep 23 09:49:45 2020 +0000 @@ -7,22 +7,46 @@ python einfo.py --version $default -@EMAIL_ARGUMENTS@ -> $default]]> + ]]> - + + + + + + + + + + + + - + + + + + + + macros.xml + +#Note, this script uses einfo.py to get database info. It also uses manually compiled data stored at the bottom of this script that is based on: https://www.ncbi.nlm.nih.gov/books/NBK25499/table/chapter4.T._valid_values_of__retmode_and/?report=objectonly +#The data in the table on that page was manipulated to replace nulls with 'none', remove duplicates, and add missing formats based on correspondence with MLN. + +## +## use einfo to retrieve all the valid databases +## + +print STDERR "Retrieving database list\n"; + +my $dbxml = `python einfo.py --user_email "planemo@galaxyproject.org" --admin_email "planemo@galaxyproject.org;test@bx.psu.edu"`; + +my(@dblist); +my $dbs = {}; +my $dbfroms = {}; +my $dbnames = {}; +foreach(split(/\n/,$dbxml)) + { + if(/(.+)<\/DbName>/) + { + my $db = $1; + push(@dblist,$db); + $dbs->{$db} = 0; + $dbfroms->{$db} = 0; + $dbnames->{$db} = $_; + } + } + +## +## Use einfo to retrieve all the valid links for each database (Note: some databases are not linked) +## + +my $h = {}; +foreach my $db (sort {$dbnames->{$a} cmp $dbnames->{$b}} @dblist) + { + sleep(2); + + print STDERR "Retrieving info for $db\n"; + + my $response = `python einfo.py --db $db --user_email "planemo\@galaxyproject.org" --admin_email "planemo\@galaxyproject.org;test\@bx.psu.edu"`; + + my $dolinks = 0; + my $link = ""; + my $name = ""; + + foreach(split(/\n/,$response)) + { + if(//) + { + $dolinks = 1; + #Save whether there exist links from this database + $dbfroms->{$db} = 1; + } + elsif(!$dolinks) + { + if(/(.+)<\/MenuName>/) + {$dbnames->{$db} = "$1 ($db)"} + } + elsif($dolinks) + { + if(/(.+)<\/Name>/) + {$link=$1} + elsif(/(.*)<\/Menu>/) + {$name=$1} + elsif(/(.+)<\/DbTo>/) + { + $dbto=$1; + push(@{$h->{$db}->{$dbto}},[$link,$name]); + $link=""; + $name=""; + } + } + } + } + +my @sorted_dblist = sort {$dbnames->{$a} cmp $dbnames->{$b}} @dblist; + +## +## Generate XML to govern the valid databases to use with efetch +## + +my $efetch_dbhash = {}; #->{efetch-compatible-db}->{rettype-retmode-galaxy_format} = format_name (galaxy_format) +while() + { + chomp; + my($db,$galaxy_format,$retmode,$rettype,$format_name) = split(/\t/,$_); + $efetch_dbhash->{$db}->{"$rettype-$retmode-$galaxy_format"} = + "$format_name ($galaxy_format)"; + } + +#EFetch database select list + +print << 'EOXML'; + + +EOXML + +foreach my $db (grep {exists($dbs->{$_})} + sort {$dbnames->{$a} cmp $dbnames->{$b}} + keys(%$efetch_dbhash)) + { + my $selected = ''; + if($db eq 'pubmed') + {$selected = ' selected="True"'} + print << " EOXML"; + + EOXML + } + +print << 'EOXML'; + + +EOXML + +#EFetch output formats + +print << 'EOXML'; + + + +EOXML + +foreach my $db (grep {exists($dbs->{$_})} + sort {$dbnames->{$a} cmp $dbnames->{$b}} + keys(%$efetch_dbhash)) + { + print << " EOXML"; + + + EOXML + + foreach my $eutils_format (sort {$efetch_dbhash->{$db}->{$a} cmp + $efetch_dbhash->{$db}->{$b}} + keys(%{$efetch_dbhash->{$db}})) + { + print << " EOXML"; + + EOXML + } + + print << " EOXML"; + + + EOXML + } + +print << 'EOXML'; + + +EOXML + +## +## Create a select list for the databases linked *from* +## + +print << 'EOXML'; + + +EOXML + +foreach my $from (@sorted_dblist) + { + print << " EOXML"; + + EOXML + } + +print << 'EOXML'; + + +EOXML + +## +## Create a select list for the databases linked *to* +## + +print << 'EOXML'; + + +EOXML + +foreach my $from (grep {$dbfroms->{$_}} @sorted_dblist) + { + print << " EOXML"; + + EOXML + } + +print << 'EOXML'; + + +EOXML + +## +## Create empty entries for commands that take no *to* database or link +## + +print << 'EOXML'; + + + + + + + + + + + + + + + +EOXML + +foreach(grep {$dbfroms->{$_}} @sorted_dblist) + { + print << " EOXML"; + + + + EOXML + } + +print << 'EOXML'; + + +EOXML + +## +## This is the master macro for the command selection +## + +print << 'EOXML'; + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + +EOXML + +## +## Create selections for valid links for command types neighbor, neighbor_history, and neighbor_score +## + +print << 'EOXML'; + + + +EOXML + +foreach my $from (grep {$dbfroms->{$_}} @sorted_dblist) + { + print STDERR ("Creating Links From: $from\n"); + + print << " EOXML"; + + + + EOXML + + my @dbtos = (grep {exists($h->{$from}) && exists($h->{$from}->{$_})} + @sorted_dblist); + foreach(@dbtos) + { + print << " EOXML"; + + EOXML + } + if(scalar(@dbtos) == 0) + { + #Provide an option for a self-link: from->from + print << " EOXML"; + + EOXML + } + + print << ' EOXML'; + + EOXML + + if(exists($h->{$from})) + { + #There do exist links to invalid(/outdated/non-existant) databases that + #would result in an error if they are selected, so we use the original + #@dblist instead of the keys present in the sub hash of $h->{$from}, and + #then check for existence in the sub-hash + foreach my $to (grep {exists($h->{$from}->{$_})} @sorted_dblist) + { + print STDERR ("\tTo: $to Links: ", + join(',',map {$_->[0]} @{$h->{$from}->{$to}}), + "\n"); + + print << " EOXML"; + + + + EOXML + + foreach(sort {"$a->[1] ($a->[0])" cmp "$b->[1] ($b->[0])"} + @{$h->{$from}->{$to}}) + { + print << " EOXML"; + + EOXML + } + + print << " EOXML"; + + + EOXML + + } + } + else + { + ## + ## Add-on selections for self-links for command types neighbor, + ## neighbor_history, and neighbor_score + ## Note, I'm not sure this would yield a valid result from elink + ## + + #This shows $from, but this is the 'when' for db_to conditional + print << " EOXML"; + + + + + + EOXML + } + + print << ' EOXML'; + + + EOXML + } + +## +## Add-on selections for self-links for command types neighbor, +## neighbor_history, and neighbor_score +## Note, I'm not sure this would yield a valid result from elink +## + +foreach my $from (grep {!exists($h->{$_})} @sorted_dblist) + { + print << "EOXML"; + + + + + + + + + + + + +EOXML + } + +## +## This is the corresponding code for using the selections to add the respective command line options +## + +print << 'EOXML'; + + +EOXML + +print << 'EOXML'; + + + +EOXML + +sub startXML + { + print << ' EOXML'; + + + 18.01 + 1.70 + +--user_email "$__user_email__" +#set admin_emails = ';'.join(str($__admin_users__).split(',')) +--admin_email "$admin_emails" + + + + `__ + +The `full disclaimer `__ is available on +their website + +Liability +~~~~~~~~~ + +For documents and software available from this server, the +U.S. Government does not warrant or assume any legal liability or +responsibility for the accuracy, completeness, or usefulness of any +information, apparatus, product, or process disclosed. + +Endorsement +~~~~~~~~~~~ + +NCBI does not endorse or recommend any commercial +products, processes, or services. The views and opinions of authors +expressed on NCBI's Web sites do not necessarily state or reflect those +of the U.S. Government, and they may not be used for advertising or +product endorsement purposes. + +External Links +~~~~~~~~~~~~~~ + +Some NCBI Web pages may provide links to other Internet +sites for the convenience of users. NCBI is not responsible for the +availability or content of these external sites, nor does NCBI endorse, +warrant, or guarantee the products, services, or information described +or offered at these other Internet sites. Users cannot assume that the +external sites will abide by the same Privacy Policy to which NCBI +adheres. It is the responsibility of the user to examine the copyright +and licensing restrictions of linked pages and to secure all necessary +permissions. + ]]> + +#if $query_source.qss == "history_json": + --history_file $query_source.history_file +#else if $query_source.qss == "history_xml": + --history_xml $query_source.history_xml +#else if $query_source.qss == "id_file": + --id_list $query_source.id_file +#else if $query_source.qss == "id_list": + --id $query_source.id_list +#else if $query_source.qss == "id_xml": + --id_xml $query_source.id_xml +#else if $query_source.qss == "id_json": + --id_json $query_source.id_json +#end if + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + @Book{ncbiEutils, + author = {Eric Sayers}, + title = {Entrez Programming Utilities Help}, + year = {2010}, + publisher = {National Center for Biotechnology Information, Bethesda, Maryland}, + note = {https://www.ncbi.nlm.nih.gov/books/NBK25500/} + } + + + + + biopython + + + + + + EOXML + } + +sub endXML + { + print << ' EOXML'; + + EOXML + } + +BEGIN {startXML()} +END {endXML()} + + +## +## Output formats for efetch mapped to galaxy formats +## + +#Based on: +#https://www.ncbi.nlm.nih.gov/books/NBK25499/table/chapter4.T._valid_values_of__retmode_and/?report=objectonly + +#Note: While json works for esearch and elink, the only database that supports +#json (according to an NLM support ticket I have about this) is snp + +#The output_format param value for these will be "rettype-retmode-format" + +#db galaxy retmode rettype format_name +__DATA__ +bioproject tabular text uilist List of UIDs +bioproject xml xml docsum Document summary +bioproject xml xml uilist List of UIDs +bioproject xml xml xml Full record +biosample tabular text uilist List of UIDs +biosample txt text full Full record +biosample xml xml docsum Document summary +biosample xml xml full Full record +biosample xml xml uilist List of UIDs +biosystems tabular text uilist List of UIDs +biosystems xml xml docsum Document summary +biosystems xml xml uilist List of UIDs +biosystems xml xml xml Full record +clinvar tabular text uilist List of UIDs +clinvar xml xml clinvarset ClinVar Set +clinvar xml xml docsum Document summary +clinvar xml xml uilist List of UIDs +clinvar xml none none Full +gds tabular text uilist List of UIDs +gds txt text summary Summary +gds xml xml docsum Document summary +gds xml xml uilist List of UIDs +gds xml none none Full +gene txt text gene_table Gene table +gene tabular text uilist List of UIDs +gene txt asn.1 none text ASN.1 +gene xml xml docsum Document summary +gene xml xml none Full +gene xml xml uilist List of UIDs +gtr tabular text uilist List of UIDs +gtr xml xml docsum Document summary +gtr xml xml gtracc GTR Test Report +gtr xml xml uilist List of UIDs +gtr xml none none Full +homologene fasta text fasta FASTA +homologene tabular text alignmentscores Alignment scores +homologene tabular text uilist List of UIDs +homologene txt asn.1 none text ASN.1 +homologene txt text homologene HomoloGene +homologene xml xml docsum Document summary +homologene xml xml none Full +homologene xml xml uilist List of UIDs +mesh tabular text uilist List of UIDs +mesh txt text full Full record +mesh xml xml docsum Document summary +mesh xml xml uilist List of UIDs +nlmcatalog tabular text uilist List of UIDs +nlmcatalog txt text none Full record +nlmcatalog xml xml docsum Document summary +nlmcatalog xml xml none Full +nlmcatalog xml xml uilist List of UIDs +nuccore binary asn.1 none binary ASN.1 +nuccore fasta text fasta FASTA +nuccore fasta text fasta_cds_aa CDS protein FASTA +nuccore fasta text fasta_cds_na CDS nucleotide FASTA +nuccore genbank text gb GenBank flat file +nuccore genbank text gbwithparts GenBank flat file with full sequence (contigs) +nuccore tabular text acc Accession number(s) +nuccore txt text ft Feature table +nuccore tabular text seqid SeqID string +nuccore tabular text uilist List of UIDs +nuccore txt text none text ASN.1 +nuccore xml xml docsum Document summary +nuccore xml xml fasta TinySeq +nuccore xml xml gb GBSeq +nuccore xml xml gbc INSDSeq +nuccore xml xml native Full record +nuccore xml xml uilist List of UIDs +nucest binary asn.1 none binary ASN.1 +nucest fasta text fasta FASTA +nucest genbank text gb GenBank flat file +nucest tabular text acc Accession number(s) +nucest tabular text seqid SeqID string +nucest tabular text uilist List of UIDs +nucest txt text est EST report +nucest txt text none text ASN.1 +nucest xml xml docsum Document summary +nucest xml xml fasta TinySeq +nucest xml xml gb GBSeq +nucest xml xml gbc INSDSeq +nucest xml xml native Full record +nucest xml xml uilist List of UIDs +nucgss binary asn.1 none binary ASN.1 +nucgss fasta text fasta FASTA +nucgss genbank text gb GenBank flat file +nucgss tabular text acc Accession number(s) +nucgss tabular text seqid SeqID string +nucgss tabular text uilist List of UIDs +nucgss txt text gss GSS report +nucgss txt text none text ASN.1 +nucgss xml xml docsum Document summary +nucgss xml xml fasta TinySeq +nucgss xml xml gb GBSeq +nucgss xml xml gbc INSDSeq +nucgss xml xml native Full record +nucgss xml xml uilist List of UIDs +pmc tabular text uilist List of UIDs +pmc txt text medline MEDLINE +pmc xml xml docsum Document summary +pmc xml xml none FULL +pmc xml xml uilist List of UIDs +popset binary asn.1 none binary ASN.1 +popset fasta text fasta FASTA +popset genbank text gb GenBank flat file +popset tabular text acc Accession number(s) +popset tabular text seqid SeqID string +popset tabular text uilist List of UIDs +popset txt text none text ASN.1 +popset xml xml docsum Document summary +popset xml xml fasta TinySeq +popset xml xml gb GBSeq +popset xml xml gbc INSDSeq +popset xml xml native Full record +popset xml xml uilist List of UIDs +protein binary asn.1 none binary ASN.1 +protein fasta text fasta FASTA +protein tabular text acc Accession number(s) +protein txt text ft Feature table +protein tabular text seqid SeqID string +protein tabular text uilist List of UIDs +protein txt text gp GenPept flat file +protein txt text none text ASN.1 +protein xml xml docsum Document summary +protein xml xml fasta TinySeq +protein xml xml gp GBSeq +protein xml xml gpc INSDSeq +protein xml xml ipg Identical Protein +protein xml xml native Full record +protein xml xml uilist List of UIDs +pubmed tabular text uilist List of UIDs +pubmed txt asn.1 none text ASN.1 +pubmed txt text abstract Abstract +pubmed txt text medline MEDLINE +pubmed xml xml docsum Document summary +pubmed xml xml none Full +pubmed xml xml uilist List of UIDs +sequences fasta text fasta FASTA +sequences tabular text acc Accession number(s) +sequences tabular text seqid SeqID string +sequences tabular text uilist List of UIDs +sequences txt text none text ASN.1 +sequences xml xml docsum Document summary +sequences xml xml uilist List of UIDs +sequences xml none none Full +snp fasta text fasta FASTA +snp json json docsum Document summary +snp json json uilist List of UIDs +snp tabular text ssexemplar SS Exemplar list +snp tabular text uilist List of UIDs +snp txt asn.1 none text ASN.1 +snp txt text chr Chromosome report +snp txt text docset Summary +snp txt text flt Flat file +snp txt text rsr RS Cluster report +snp xml xml docsum Document summary +snp xml xml none XML +snp xml xml uilist List of UIDs +sra tabular text uilist List of UIDs +sra xml xml docsum Document summary +sra xml xml full Full +taxonomy tabular text uilist List of UIDs +taxonomy xml xml none Full +taxonomy xml xml docsum Document summary +taxonomy xml xml uilist List of UIDs diff -r f6007bce569d -r cd5a82a16bbf macros.xml --- a/macros.xml Wed Mar 11 04:02:55 2020 -0400 +++ b/macros.xml Wed Sep 23 09:49:45 2020 +0000 @@ -1,7 +1,7 @@ 18.01 - 1.3 + 1.70 --user_email "$__user_email__" #set admin_emails = ';'.join(str($__admin_users__).split(',')) @@ -86,743 +86,51 @@ and licensing restrictions of linked pages and to secure all necessary permissions. ]]> - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - -#if $query_source.qss == "history": +#if $query_source.qss == "history_json": --history_file $query_source.history_file +#else if $query_source.qss == "history_xml": + --history_xml $query_source.history_xml #else if $query_source.qss == "id_file": --id_list $query_source.id_file #else if $query_source.qss == "id_list": --id $query_source.id_list +#else if $query_source.qss == "id_xml": + --id_xml $query_source.id_xml +#else if $query_source.qss == "id_json": + --id_json $query_source.id_json #end if - + - - - - + + + + + + + - - + + + + + - + + + + + + + - + - - - - - @Book{ncbiEutils, @@ -836,12 +144,4400 @@ + python biopython - - - + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + diff -r f6007bce569d -r cd5a82a16bbf test-data/efetchin.tabular --- /dev/null Thu Jan 01 00:00:00 1970 +0000 +++ b/test-data/efetchin.tabular Wed Sep 23 09:49:45 2020 +0000 @@ -0,0 +1,2 @@ +1899688395 +1896832511 diff -r f6007bce569d -r cd5a82a16bbf test-data/einfo.dblist.xml --- /dev/null Thu Jan 01 00:00:00 1970 +0000 +++ b/test-data/einfo.dblist.xml Wed Sep 23 09:49:45 2020 +0000 @@ -0,0 +1,52 @@ + + + + + + pubmed + protein + nuccore + ipg + nucleotide + structure + sparcle + genome + annotinfo + assembly + bioproject + biosample + blastdbinfo + books + cdd + clinvar + gap + gapplus + grasp + dbvar + gene + gds + geoprofiles + homologene + medgen + mesh + ncbisearch + nlmcatalog + omim + orgtrack + pmc + popset + proteinclusters + pcassay + biosystems + pccompound + pcsubstance + seqannot + snp + sra + taxonomy + biocollections + gtr + + + + diff -r f6007bce569d -r cd5a82a16bbf test-data/elink.elinkin_1link.json --- /dev/null Thu Jan 01 00:00:00 1970 +0000 +++ b/test-data/elink.elinkin_1link.json Wed Sep 23 09:49:45 2020 +0000 @@ -0,0 +1,23 @@ +{ + "header": { + "type": "elink", + "version": "0.3" + }, + "linksets": [ + { + "dbfrom": "gene", + "ids": [ + "118502329" + ], + "linksetdbs": [ + { + "dbto": "nuccore", + "linkname": "gene_nuccore_refseqrna", + "links": [ + "1899688395" + ] + } + ] + } + ] +} diff -r f6007bce569d -r cd5a82a16bbf test-data/elink.elinkin_1link_hist.json --- /dev/null Thu Jan 01 00:00:00 1970 +0000 +++ b/test-data/elink.elinkin_1link_hist.json Wed Sep 23 09:49:45 2020 +0000 @@ -0,0 +1,22 @@ +{ + "header": { + "type": "elink", + "version": "0.3" + }, + "linksets": [ + { + "dbfrom": "nuccore", + "ids": [ + "1899688395" + ], + "linksetdbhistories": [ + { + "dbto": "gene", + "linkname": "nuccore_gene", + "querykey": "1" + } + ], + "webenv": "MCID_5f60d98126049170ce66fe2e" + } + ] +} diff -r f6007bce569d -r cd5a82a16bbf test-data/elink.elinkin_1link_id.tabular --- /dev/null Thu Jan 01 00:00:00 1970 +0000 +++ b/test-data/elink.elinkin_1link_id.tabular Wed Sep 23 09:49:45 2020 +0000 @@ -0,0 +1,1 @@ +118502329 diff -r f6007bce569d -r cd5a82a16bbf test-data/elink.elinkin_allalllinks_id.xml --- /dev/null Thu Jan 01 00:00:00 1970 +0000 +++ b/test-data/elink.elinkin_allalllinks_id.xml Wed Sep 23 09:49:45 2020 +0000 @@ -0,0 +1,18 @@ + + + + + nuccore + + 1899688395 + 1896832511 + + + gene + nuccore_gene + 1 + + MCID_5f60e00e98743c5c3572195e + + + diff -r f6007bce569d -r cd5a82a16bbf test-data/elink.elinkin_alllinks_id.xml --- /dev/null Thu Jan 01 00:00:00 1970 +0000 +++ b/test-data/elink.elinkin_alllinks_id.xml Wed Sep 23 09:49:45 2020 +0000 @@ -0,0 +1,44 @@ + + + + + + gene + + 118502329 + + + nuccore + gene_nuccore + + + 1899688395 + + + 1896832511 + + + + + + nuccore + gene_nuccore_pos + + + 1896832511 + + + + + + nuccore + gene_nuccore_refseqrna + + + 1899688395 + + + + + + diff -r f6007bce569d -r cd5a82a16bbf test-data/elink.esearch_in_xmlid.xml --- /dev/null Thu Jan 01 00:00:00 1970 +0000 +++ b/test-data/elink.esearch_in_xmlid.xml Wed Sep 23 09:49:45 2020 +0000 @@ -0,0 +1,6 @@ + + +110 +118502329 + 118502329[UID] UID -1 N GROUP 118502329[UID] + diff -r f6007bce569d -r cd5a82a16bbf test-data/elink.esearch_in_xmlid_1link.tabular --- /dev/null Thu Jan 01 00:00:00 1970 +0000 +++ b/test-data/elink.esearch_in_xmlid_1link.tabular Wed Sep 23 09:49:45 2020 +0000 @@ -0,0 +1,2 @@ +1899688395 +1896832511 diff -r f6007bce569d -r cd5a82a16bbf test-data/elink.esearchin_id.json --- /dev/null Thu Jan 01 00:00:00 1970 +0000 +++ b/test-data/elink.esearchin_id.json Wed Sep 23 09:49:45 2020 +0000 @@ -0,0 +1,25 @@ +{ + "header": { + "type": "esearch", + "version": "0.3" + }, + "esearchresult": { + "count": "1", + "retmax": "1", + "retstart": "0", + "idlist": [ + "118502329" + ], + "translationset": [], + "translationstack": [ + { + "term": "118502329[UID]", + "field": "UID", + "count": "-1", + "explode": "N" + }, + "GROUP" + ], + "querytranslation": "118502329[UID]" + } +} diff -r f6007bce569d -r cd5a82a16bbf test-data/elink.esearchin_id.tabular --- /dev/null Thu Jan 01 00:00:00 1970 +0000 +++ b/test-data/elink.esearchin_id.tabular Wed Sep 23 09:49:45 2020 +0000 @@ -0,0 +1,1 @@ +118502329 diff -r f6007bce569d -r cd5a82a16bbf test-data/elink.esearchin_id_1link.xml --- /dev/null Thu Jan 01 00:00:00 1970 +0000 +++ b/test-data/elink.esearchin_id_1link.xml Wed Sep 23 09:49:45 2020 +0000 @@ -0,0 +1,21 @@ + + + + + + gene + + 118502329 + + + nuccore + gene_nuccore_refseqrna + + + 1899688395 + + + + + + diff -r f6007bce569d -r cd5a82a16bbf test-data/elink.esearchin_id_alllinks.json --- /dev/null Thu Jan 01 00:00:00 1970 +0000 +++ b/test-data/elink.esearchin_id_alllinks.json Wed Sep 23 09:49:45 2020 +0000 @@ -0,0 +1,38 @@ +{ + "header": { + "type": "elink", + "version": "0.3" + }, + "linksets": [ + { + "dbfrom": "gene", + "ids": [ + "118502329" + ], + "linksetdbs": [ + { + "dbto": "nuccore", + "linkname": "gene_nuccore", + "links": [ + "1899688395", + "1896832511" + ] + }, + { + "dbto": "nuccore", + "linkname": "gene_nuccore_pos", + "links": [ + "1896832511" + ] + }, + { + "dbto": "nuccore", + "linkname": "gene_nuccore_refseqrna", + "links": [ + "1899688395" + ] + } + ] + } + ] +} diff -r f6007bce569d -r cd5a82a16bbf test-data/esearch.gene.hist.json --- /dev/null Thu Jan 01 00:00:00 1970 +0000 +++ b/test-data/esearch.gene.hist.json Wed Sep 23 09:49:45 2020 +0000 @@ -0,0 +1,27 @@ +{ + "header": { + "type": "esearch", + "version": "0.3" + }, + "esearchresult": { + "count": "1", + "retmax": "1", + "retstart": "0", + "querykey": "1", + "webenv": "MCID_5f5fd696d2dc7951442b7849", + "idlist": [ + "118502329" + ], + "translationset": [], + "translationstack": [ + { + "term": "118502329[UID]", + "field": "UID", + "count": "-1", + "explode": "N" + }, + "GROUP" + ], + "querytranslation": "118502329[UID]" + } +} diff -r f6007bce569d -r cd5a82a16bbf test-data/esearch.gene.hist.xml --- /dev/null Thu Jan 01 00:00:00 1970 +0000 +++ b/test-data/esearch.gene.hist.xml Wed Sep 23 09:49:45 2020 +0000 @@ -0,0 +1,6 @@ + + +1101MCID_5f5fd690407bc55fc76bad4e +118502329 + 118502329[UID] UID -1 N GROUP 118502329[UID] + diff -r f6007bce569d -r cd5a82a16bbf test-data/esearch.gene.json --- /dev/null Thu Jan 01 00:00:00 1970 +0000 +++ b/test-data/esearch.gene.json Wed Sep 23 09:49:45 2020 +0000 @@ -0,0 +1,25 @@ +{ + "header": { + "type": "esearch", + "version": "0.3" + }, + "esearchresult": { + "count": "1", + "retmax": "1", + "retstart": "0", + "idlist": [ + "118502329" + ], + "translationset": [], + "translationstack": [ + { + "term": "118502329[UID]", + "field": "UID", + "count": "-1", + "explode": "N" + }, + "GROUP" + ], + "querytranslation": "118502329[UID]" + } +} diff -r f6007bce569d -r cd5a82a16bbf test-data/esearch.gene.tabular --- /dev/null Thu Jan 01 00:00:00 1970 +0000 +++ b/test-data/esearch.gene.tabular Wed Sep 23 09:49:45 2020 +0000 @@ -0,0 +1,22 @@ +106632260 +100008587 +106632264 +106631781 +109910382 +109910381 +109910380 +109910379 +109864282 +109864281 +109864280 +109864279 +109864274 +109864273 +109864272 +109864271 +106631777 +100861532 +100169758 +100169768 +100169767 +100169766 diff -r f6007bce569d -r cd5a82a16bbf test-data/esearch.gene.xml --- /dev/null Thu Jan 01 00:00:00 1970 +0000 +++ b/test-data/esearch.gene.xml Wed Sep 23 09:49:45 2020 +0000 @@ -0,0 +1,6 @@ + + +110 +118502329 + 118502329[UID] UID -1 N GROUP 118502329[UID] +