Mercurial > repos > iss > eurl_vtec_wgs_pt
annotate scripts/ReMatCh/modules/seqFromWebTaxon.py @ 1:444b0421bbdc draft
"planemo upload commit c8533b93fb2816db37887244489cbd6e919fc155"
| author | iss | 
|---|---|
| date | Tue, 22 Mar 2022 08:39:10 +0000 | 
| parents | c6bab5103a14 | 
| children | 
| rev | line source | 
|---|---|
| 0 
c6bab5103a14
"planemo upload commit 6abf3e299d82d07e6c3cf8642bdea80e96df64c3-dirty"
 iss parents: diff
changeset | 1 #!/usr/bin/env python3 | 
| 
c6bab5103a14
"planemo upload commit 6abf3e299d82d07e6c3cf8642bdea80e96df64c3-dirty"
 iss parents: diff
changeset | 2 | 
| 
c6bab5103a14
"planemo upload commit 6abf3e299d82d07e6c3cf8642bdea80e96df64c3-dirty"
 iss parents: diff
changeset | 3 # -*- coding: utf-8 -*- | 
| 
c6bab5103a14
"planemo upload commit 6abf3e299d82d07e6c3cf8642bdea80e96df64c3-dirty"
 iss parents: diff
changeset | 4 | 
| 
c6bab5103a14
"planemo upload commit 6abf3e299d82d07e6c3cf8642bdea80e96df64c3-dirty"
 iss parents: diff
changeset | 5 ''' | 
| 
c6bab5103a14
"planemo upload commit 6abf3e299d82d07e6c3cf8642bdea80e96df64c3-dirty"
 iss parents: diff
changeset | 6 Adapted from: | 
| 
c6bab5103a14
"planemo upload commit 6abf3e299d82d07e6c3cf8642bdea80e96df64c3-dirty"
 iss parents: diff
changeset | 7 https://github.com/mickaelsilva/pythonscripts/blob/master/SeqOfWeb/SeqFromWebTaxon.py | 
| 
c6bab5103a14
"planemo upload commit 6abf3e299d82d07e6c3cf8642bdea80e96df64c3-dirty"
 iss parents: diff
changeset | 8 mickaelsilva | 
| 
c6bab5103a14
"planemo upload commit 6abf3e299d82d07e6c3cf8642bdea80e96df64c3-dirty"
 iss parents: diff
changeset | 9 ''' | 
| 
c6bab5103a14
"planemo upload commit 6abf3e299d82d07e6c3cf8642bdea80e96df64c3-dirty"
 iss parents: diff
changeset | 10 | 
| 
c6bab5103a14
"planemo upload commit 6abf3e299d82d07e6c3cf8642bdea80e96df64c3-dirty"
 iss parents: diff
changeset | 11 import sys | 
| 
c6bab5103a14
"planemo upload commit 6abf3e299d82d07e6c3cf8642bdea80e96df64c3-dirty"
 iss parents: diff
changeset | 12 import urllib.request | 
| 
c6bab5103a14
"planemo upload commit 6abf3e299d82d07e6c3cf8642bdea80e96df64c3-dirty"
 iss parents: diff
changeset | 13 import urllib.parse | 
| 
c6bab5103a14
"planemo upload commit 6abf3e299d82d07e6c3cf8642bdea80e96df64c3-dirty"
 iss parents: diff
changeset | 14 import xml.etree.ElementTree as ET | 
| 
c6bab5103a14
"planemo upload commit 6abf3e299d82d07e6c3cf8642bdea80e96df64c3-dirty"
 iss parents: diff
changeset | 15 import time | 
| 
c6bab5103a14
"planemo upload commit 6abf3e299d82d07e6c3cf8642bdea80e96df64c3-dirty"
 iss parents: diff
changeset | 16 import argparse | 
| 
c6bab5103a14
"planemo upload commit 6abf3e299d82d07e6c3cf8642bdea80e96df64c3-dirty"
 iss parents: diff
changeset | 17 import os | 
| 
c6bab5103a14
"planemo upload commit 6abf3e299d82d07e6c3cf8642bdea80e96df64c3-dirty"
 iss parents: diff
changeset | 18 | 
| 
c6bab5103a14
"planemo upload commit 6abf3e299d82d07e6c3cf8642bdea80e96df64c3-dirty"
 iss parents: diff
changeset | 19 | 
| 
c6bab5103a14
"planemo upload commit 6abf3e299d82d07e6c3cf8642bdea80e96df64c3-dirty"
 iss parents: diff
changeset | 20 def run_seq_from_web_taxon(taxonname, outputfile, getmachine, getOmicsDataType, getLibraryType, print_True): | 
| 
c6bab5103a14
"planemo upload commit 6abf3e299d82d07e6c3cf8642bdea80e96df64c3-dirty"
 iss parents: diff
changeset | 21 print('\n' + 'Searching RunIDs for ' + taxonname) | 
| 
c6bab5103a14
"planemo upload commit 6abf3e299d82d07e6c3cf8642bdea80e96df64c3-dirty"
 iss parents: diff
changeset | 22 | 
| 
c6bab5103a14
"planemo upload commit 6abf3e299d82d07e6c3cf8642bdea80e96df64c3-dirty"
 iss parents: diff
changeset | 23 taxonname = urllib.parse.quote(taxonname) | 
| 
c6bab5103a14
"planemo upload commit 6abf3e299d82d07e6c3cf8642bdea80e96df64c3-dirty"
 iss parents: diff
changeset | 24 url = "http://www.ebi.ac.uk/ena/data/view/Taxon%3A" + taxonname + "&display=xml" | 
| 
c6bab5103a14
"planemo upload commit 6abf3e299d82d07e6c3cf8642bdea80e96df64c3-dirty"
 iss parents: diff
changeset | 25 try: | 
| 
c6bab5103a14
"planemo upload commit 6abf3e299d82d07e6c3cf8642bdea80e96df64c3-dirty"
 iss parents: diff
changeset | 26 content = urllib.request.urlopen(url) | 
| 
c6bab5103a14
"planemo upload commit 6abf3e299d82d07e6c3cf8642bdea80e96df64c3-dirty"
 iss parents: diff
changeset | 27 xml = content.read() | 
| 
c6bab5103a14
"planemo upload commit 6abf3e299d82d07e6c3cf8642bdea80e96df64c3-dirty"
 iss parents: diff
changeset | 28 tree = ET.fromstring(xml) | 
| 
c6bab5103a14
"planemo upload commit 6abf3e299d82d07e6c3cf8642bdea80e96df64c3-dirty"
 iss parents: diff
changeset | 29 taxonid = '' | 
| 
c6bab5103a14
"planemo upload commit 6abf3e299d82d07e6c3cf8642bdea80e96df64c3-dirty"
 iss parents: diff
changeset | 30 except: | 
| 
c6bab5103a14
"planemo upload commit 6abf3e299d82d07e6c3cf8642bdea80e96df64c3-dirty"
 iss parents: diff
changeset | 31 print("Ooops!There might be a problem with the ena service, try later or check if the xml is well formated" | 
| 
c6bab5103a14
"planemo upload commit 6abf3e299d82d07e6c3cf8642bdea80e96df64c3-dirty"
 iss parents: diff
changeset | 32 " at " + url) | 
| 
c6bab5103a14
"planemo upload commit 6abf3e299d82d07e6c3cf8642bdea80e96df64c3-dirty"
 iss parents: diff
changeset | 33 raise | 
| 
c6bab5103a14
"planemo upload commit 6abf3e299d82d07e6c3cf8642bdea80e96df64c3-dirty"
 iss parents: diff
changeset | 34 for child in tree: | 
| 
c6bab5103a14
"planemo upload commit 6abf3e299d82d07e6c3cf8642bdea80e96df64c3-dirty"
 iss parents: diff
changeset | 35 taxonid = child.get('taxId') | 
| 
c6bab5103a14
"planemo upload commit 6abf3e299d82d07e6c3cf8642bdea80e96df64c3-dirty"
 iss parents: diff
changeset | 36 if (taxonid): | 
| 
c6bab5103a14
"planemo upload commit 6abf3e299d82d07e6c3cf8642bdea80e96df64c3-dirty"
 iss parents: diff
changeset | 37 print("\n" + "Taxon ID found: " + taxonid) | 
| 
c6bab5103a14
"planemo upload commit 6abf3e299d82d07e6c3cf8642bdea80e96df64c3-dirty"
 iss parents: diff
changeset | 38 url = "http://www.ebi.ac.uk/ena/data/warehouse/search?query=%22tax_tree%28" + \ | 
| 
c6bab5103a14
"planemo upload commit 6abf3e299d82d07e6c3cf8642bdea80e96df64c3-dirty"
 iss parents: diff
changeset | 39 taxonid + \ | 
| 
c6bab5103a14
"planemo upload commit 6abf3e299d82d07e6c3cf8642bdea80e96df64c3-dirty"
 iss parents: diff
changeset | 40 "%29%22&result=read_run&display=xml" | 
| 
c6bab5103a14
"planemo upload commit 6abf3e299d82d07e6c3cf8642bdea80e96df64c3-dirty"
 iss parents: diff
changeset | 41 | 
| 
c6bab5103a14
"planemo upload commit 6abf3e299d82d07e6c3cf8642bdea80e96df64c3-dirty"
 iss parents: diff
changeset | 42 content = urllib.request.urlopen(url) | 
| 
c6bab5103a14
"planemo upload commit 6abf3e299d82d07e6c3cf8642bdea80e96df64c3-dirty"
 iss parents: diff
changeset | 43 xml = content.read() | 
| 
c6bab5103a14
"planemo upload commit 6abf3e299d82d07e6c3cf8642bdea80e96df64c3-dirty"
 iss parents: diff
changeset | 44 tree = ET.fromstring(xml) | 
| 
c6bab5103a14
"planemo upload commit 6abf3e299d82d07e6c3cf8642bdea80e96df64c3-dirty"
 iss parents: diff
changeset | 45 | 
| 
c6bab5103a14
"planemo upload commit 6abf3e299d82d07e6c3cf8642bdea80e96df64c3-dirty"
 iss parents: diff
changeset | 46 runid = '' | 
| 
c6bab5103a14
"planemo upload commit 6abf3e299d82d07e6c3cf8642bdea80e96df64c3-dirty"
 iss parents: diff
changeset | 47 n = 0 | 
| 
c6bab5103a14
"planemo upload commit 6abf3e299d82d07e6c3cf8642bdea80e96df64c3-dirty"
 iss parents: diff
changeset | 48 with open(outputfile, "wt") as f: | 
| 
c6bab5103a14
"planemo upload commit 6abf3e299d82d07e6c3cf8642bdea80e96df64c3-dirty"
 iss parents: diff
changeset | 49 f.write('#' + str(time.strftime("%d/%m/%Y")) + "\n") | 
| 
c6bab5103a14
"planemo upload commit 6abf3e299d82d07e6c3cf8642bdea80e96df64c3-dirty"
 iss parents: diff
changeset | 50 model = '' | 
| 
c6bab5103a14
"planemo upload commit 6abf3e299d82d07e6c3cf8642bdea80e96df64c3-dirty"
 iss parents: diff
changeset | 51 prjid = '' | 
| 
c6bab5103a14
"planemo upload commit 6abf3e299d82d07e6c3cf8642bdea80e96df64c3-dirty"
 iss parents: diff
changeset | 52 length_line = 0 | 
| 
c6bab5103a14
"planemo upload commit 6abf3e299d82d07e6c3cf8642bdea80e96df64c3-dirty"
 iss parents: diff
changeset | 53 omics = '' | 
| 
c6bab5103a14
"planemo upload commit 6abf3e299d82d07e6c3cf8642bdea80e96df64c3-dirty"
 iss parents: diff
changeset | 54 libraryType = '' | 
| 
c6bab5103a14
"planemo upload commit 6abf3e299d82d07e6c3cf8642bdea80e96df64c3-dirty"
 iss parents: diff
changeset | 55 for child in tree: | 
| 
c6bab5103a14
"planemo upload commit 6abf3e299d82d07e6c3cf8642bdea80e96df64c3-dirty"
 iss parents: diff
changeset | 56 runid = child.get('accession') | 
| 
c6bab5103a14
"planemo upload commit 6abf3e299d82d07e6c3cf8642bdea80e96df64c3-dirty"
 iss parents: diff
changeset | 57 | 
| 
c6bab5103a14
"planemo upload commit 6abf3e299d82d07e6c3cf8642bdea80e96df64c3-dirty"
 iss parents: diff
changeset | 58 n += 1 | 
| 
c6bab5103a14
"planemo upload commit 6abf3e299d82d07e6c3cf8642bdea80e96df64c3-dirty"
 iss parents: diff
changeset | 59 | 
| 
c6bab5103a14
"planemo upload commit 6abf3e299d82d07e6c3cf8642bdea80e96df64c3-dirty"
 iss parents: diff
changeset | 60 if getmachine is True or getOmicsDataType is True or getLibraryType is True: | 
| 
c6bab5103a14
"planemo upload commit 6abf3e299d82d07e6c3cf8642bdea80e96df64c3-dirty"
 iss parents: diff
changeset | 61 for child2 in child: | 
| 
c6bab5103a14
"planemo upload commit 6abf3e299d82d07e6c3cf8642bdea80e96df64c3-dirty"
 iss parents: diff
changeset | 62 if child2.tag == 'EXPERIMENT_REF': | 
| 
c6bab5103a14
"planemo upload commit 6abf3e299d82d07e6c3cf8642bdea80e96df64c3-dirty"
 iss parents: diff
changeset | 63 expid = child2.get('accession') | 
| 
c6bab5103a14
"planemo upload commit 6abf3e299d82d07e6c3cf8642bdea80e96df64c3-dirty"
 iss parents: diff
changeset | 64 url2 = "http://www.ebi.ac.uk/ena/data/view/" + expid + "&display=xml" | 
| 
c6bab5103a14
"planemo upload commit 6abf3e299d82d07e6c3cf8642bdea80e96df64c3-dirty"
 iss parents: diff
changeset | 65 content = urllib.request.urlopen(url2) | 
| 
c6bab5103a14
"planemo upload commit 6abf3e299d82d07e6c3cf8642bdea80e96df64c3-dirty"
 iss parents: diff
changeset | 66 xml = content.read() | 
| 
c6bab5103a14
"planemo upload commit 6abf3e299d82d07e6c3cf8642bdea80e96df64c3-dirty"
 iss parents: diff
changeset | 67 tree2 = ET.fromstring(xml) | 
| 
c6bab5103a14
"planemo upload commit 6abf3e299d82d07e6c3cf8642bdea80e96df64c3-dirty"
 iss parents: diff
changeset | 68 try: | 
| 
c6bab5103a14
"planemo upload commit 6abf3e299d82d07e6c3cf8642bdea80e96df64c3-dirty"
 iss parents: diff
changeset | 69 for child3 in tree2: | 
| 
c6bab5103a14
"planemo upload commit 6abf3e299d82d07e6c3cf8642bdea80e96df64c3-dirty"
 iss parents: diff
changeset | 70 for child4 in child3: | 
| 
c6bab5103a14
"planemo upload commit 6abf3e299d82d07e6c3cf8642bdea80e96df64c3-dirty"
 iss parents: diff
changeset | 71 if child4.tag == 'PLATFORM': | 
| 
c6bab5103a14
"planemo upload commit 6abf3e299d82d07e6c3cf8642bdea80e96df64c3-dirty"
 iss parents: diff
changeset | 72 for child5 in child4: | 
| 
c6bab5103a14
"planemo upload commit 6abf3e299d82d07e6c3cf8642bdea80e96df64c3-dirty"
 iss parents: diff
changeset | 73 for child6 in child5: | 
| 
c6bab5103a14
"planemo upload commit 6abf3e299d82d07e6c3cf8642bdea80e96df64c3-dirty"
 iss parents: diff
changeset | 74 if child6.tag == 'INSTRUMENT_MODEL': | 
| 
c6bab5103a14
"planemo upload commit 6abf3e299d82d07e6c3cf8642bdea80e96df64c3-dirty"
 iss parents: diff
changeset | 75 model = child6.text | 
| 
c6bab5103a14
"planemo upload commit 6abf3e299d82d07e6c3cf8642bdea80e96df64c3-dirty"
 iss parents: diff
changeset | 76 elif child4.tag == 'STUDY_REF': | 
| 
c6bab5103a14
"planemo upload commit 6abf3e299d82d07e6c3cf8642bdea80e96df64c3-dirty"
 iss parents: diff
changeset | 77 prjid = child4.get('accession') | 
| 
c6bab5103a14
"planemo upload commit 6abf3e299d82d07e6c3cf8642bdea80e96df64c3-dirty"
 iss parents: diff
changeset | 78 elif child4.tag == 'DESIGN': | 
| 
c6bab5103a14
"planemo upload commit 6abf3e299d82d07e6c3cf8642bdea80e96df64c3-dirty"
 iss parents: diff
changeset | 79 if getOmicsDataType is True or getLibraryType is True: | 
| 
c6bab5103a14
"planemo upload commit 6abf3e299d82d07e6c3cf8642bdea80e96df64c3-dirty"
 iss parents: diff
changeset | 80 for child5 in child4: | 
| 
c6bab5103a14
"planemo upload commit 6abf3e299d82d07e6c3cf8642bdea80e96df64c3-dirty"
 iss parents: diff
changeset | 81 if child5.tag == 'LIBRARY_DESCRIPTOR': | 
| 
c6bab5103a14
"planemo upload commit 6abf3e299d82d07e6c3cf8642bdea80e96df64c3-dirty"
 iss parents: diff
changeset | 82 for child6 in child5: | 
| 
c6bab5103a14
"planemo upload commit 6abf3e299d82d07e6c3cf8642bdea80e96df64c3-dirty"
 iss parents: diff
changeset | 83 if child6.tag == 'LIBRARY_SOURCE' and getOmicsDataType is True: | 
| 
c6bab5103a14
"planemo upload commit 6abf3e299d82d07e6c3cf8642bdea80e96df64c3-dirty"
 iss parents: diff
changeset | 84 omics = child6.text | 
| 
c6bab5103a14
"planemo upload commit 6abf3e299d82d07e6c3cf8642bdea80e96df64c3-dirty"
 iss parents: diff
changeset | 85 elif child6.tag == 'LIBRARY_LAYOUT' and getLibraryType is True: | 
| 
c6bab5103a14
"planemo upload commit 6abf3e299d82d07e6c3cf8642bdea80e96df64c3-dirty"
 iss parents: diff
changeset | 86 libraryType = child6[0].tag | 
| 
c6bab5103a14
"planemo upload commit 6abf3e299d82d07e6c3cf8642bdea80e96df64c3-dirty"
 iss parents: diff
changeset | 87 except: | 
| 
c6bab5103a14
"planemo upload commit 6abf3e299d82d07e6c3cf8642bdea80e96df64c3-dirty"
 iss parents: diff
changeset | 88 model = 'not found' | 
| 
c6bab5103a14
"planemo upload commit 6abf3e299d82d07e6c3cf8642bdea80e96df64c3-dirty"
 iss parents: diff
changeset | 89 omics = 'not found' | 
| 
c6bab5103a14
"planemo upload commit 6abf3e299d82d07e6c3cf8642bdea80e96df64c3-dirty"
 iss parents: diff
changeset | 90 libraryType = 'not found' | 
| 
c6bab5103a14
"planemo upload commit 6abf3e299d82d07e6c3cf8642bdea80e96df64c3-dirty"
 iss parents: diff
changeset | 91 f.write(str(runid) + "\t" + model + "\t" + prjid + "\t" + omics + "\t" + libraryType + "\n") | 
| 
c6bab5103a14
"planemo upload commit 6abf3e299d82d07e6c3cf8642bdea80e96df64c3-dirty"
 iss parents: diff
changeset | 92 if print_True: | 
| 
c6bab5103a14
"planemo upload commit 6abf3e299d82d07e6c3cf8642bdea80e96df64c3-dirty"
 iss parents: diff
changeset | 93 line = "run acession %s sequenced on %s from project %s for %s %s end" \ | 
| 
c6bab5103a14
"planemo upload commit 6abf3e299d82d07e6c3cf8642bdea80e96df64c3-dirty"
 iss parents: diff
changeset | 94 " data" % (runid, model, prjid, omics, libraryType) | 
| 
c6bab5103a14
"planemo upload commit 6abf3e299d82d07e6c3cf8642bdea80e96df64c3-dirty"
 iss parents: diff
changeset | 95 if length_line < len(line): | 
| 
c6bab5103a14
"planemo upload commit 6abf3e299d82d07e6c3cf8642bdea80e96df64c3-dirty"
 iss parents: diff
changeset | 96 length_line = len(line) | 
| 
c6bab5103a14
"planemo upload commit 6abf3e299d82d07e6c3cf8642bdea80e96df64c3-dirty"
 iss parents: diff
changeset | 97 sys.stderr.write("\r" + line + str(' ' * (length_line - len(line)))) | 
| 
c6bab5103a14
"planemo upload commit 6abf3e299d82d07e6c3cf8642bdea80e96df64c3-dirty"
 iss parents: diff
changeset | 98 sys.stderr.flush() | 
| 
c6bab5103a14
"planemo upload commit 6abf3e299d82d07e6c3cf8642bdea80e96df64c3-dirty"
 iss parents: diff
changeset | 99 else: | 
| 
c6bab5103a14
"planemo upload commit 6abf3e299d82d07e6c3cf8642bdea80e96df64c3-dirty"
 iss parents: diff
changeset | 100 f.write(str(runid) + '\t' * 4 + "\n") | 
| 
c6bab5103a14
"planemo upload commit 6abf3e299d82d07e6c3cf8642bdea80e96df64c3-dirty"
 iss parents: diff
changeset | 101 if print_True: | 
| 
c6bab5103a14
"planemo upload commit 6abf3e299d82d07e6c3cf8642bdea80e96df64c3-dirty"
 iss parents: diff
changeset | 102 line = "run acession %s" % (runid, prjid) | 
| 
c6bab5103a14
"planemo upload commit 6abf3e299d82d07e6c3cf8642bdea80e96df64c3-dirty"
 iss parents: diff
changeset | 103 if length_line < len(line): | 
| 
c6bab5103a14
"planemo upload commit 6abf3e299d82d07e6c3cf8642bdea80e96df64c3-dirty"
 iss parents: diff
changeset | 104 length_line = len(line) | 
| 
c6bab5103a14
"planemo upload commit 6abf3e299d82d07e6c3cf8642bdea80e96df64c3-dirty"
 iss parents: diff
changeset | 105 sys.stderr.write("\r" + line + str(' ' * (length_line - len(line)))) | 
| 
c6bab5103a14
"planemo upload commit 6abf3e299d82d07e6c3cf8642bdea80e96df64c3-dirty"
 iss parents: diff
changeset | 106 sys.stderr.flush() | 
| 
c6bab5103a14
"planemo upload commit 6abf3e299d82d07e6c3cf8642bdea80e96df64c3-dirty"
 iss parents: diff
changeset | 107 print("\n") | 
| 
c6bab5103a14
"planemo upload commit 6abf3e299d82d07e6c3cf8642bdea80e96df64c3-dirty"
 iss parents: diff
changeset | 108 print("\n" | 
| 
c6bab5103a14
"planemo upload commit 6abf3e299d82d07e6c3cf8642bdea80e96df64c3-dirty"
 iss parents: diff
changeset | 109 "found %s run id's" % n) | 
| 
c6bab5103a14
"planemo upload commit 6abf3e299d82d07e6c3cf8642bdea80e96df64c3-dirty"
 iss parents: diff
changeset | 110 | 
| 
c6bab5103a14
"planemo upload commit 6abf3e299d82d07e6c3cf8642bdea80e96df64c3-dirty"
 iss parents: diff
changeset | 111 else: | 
| 
c6bab5103a14
"planemo upload commit 6abf3e299d82d07e6c3cf8642bdea80e96df64c3-dirty"
 iss parents: diff
changeset | 112 print("taxon name does not exist") | 
| 
c6bab5103a14
"planemo upload commit 6abf3e299d82d07e6c3cf8642bdea80e96df64c3-dirty"
 iss parents: diff
changeset | 113 | 
| 
c6bab5103a14
"planemo upload commit 6abf3e299d82d07e6c3cf8642bdea80e96df64c3-dirty"
 iss parents: diff
changeset | 114 | 
| 
c6bab5103a14
"planemo upload commit 6abf3e299d82d07e6c3cf8642bdea80e96df64c3-dirty"
 iss parents: diff
changeset | 115 def main(): | 
| 
c6bab5103a14
"planemo upload commit 6abf3e299d82d07e6c3cf8642bdea80e96df64c3-dirty"
 iss parents: diff
changeset | 116 parser = argparse.ArgumentParser(description="This program gets a list of sequencing runs and machine were the" | 
| 
c6bab5103a14
"planemo upload commit 6abf3e299d82d07e6c3cf8642bdea80e96df64c3-dirty"
 iss parents: diff
changeset | 117 " sequencing was performed, given a taxon name accepted by the" | 
| 
c6bab5103a14
"planemo upload commit 6abf3e299d82d07e6c3cf8642bdea80e96df64c3-dirty"
 iss parents: diff
changeset | 118 " European nucleotide Archive") | 
| 
c6bab5103a14
"planemo upload commit 6abf3e299d82d07e6c3cf8642bdea80e96df64c3-dirty"
 iss parents: diff
changeset | 119 parser.add_argument('-i', nargs=1, type=str, help='taxon name', metavar='"Streptococcus agalactiae"', required=True) | 
| 
c6bab5103a14
"planemo upload commit 6abf3e299d82d07e6c3cf8642bdea80e96df64c3-dirty"
 iss parents: diff
changeset | 120 parser.add_argument('-o', nargs=1, type=str, help='output file name', required=True) | 
| 
c6bab5103a14
"planemo upload commit 6abf3e299d82d07e6c3cf8642bdea80e96df64c3-dirty"
 iss parents: diff
changeset | 121 parser.add_argument('-g', help='True to include sequencing machine in the output', action='store_true', | 
| 
c6bab5103a14
"planemo upload commit 6abf3e299d82d07e6c3cf8642bdea80e96df64c3-dirty"
 iss parents: diff
changeset | 122 required=False) | 
| 
c6bab5103a14
"planemo upload commit 6abf3e299d82d07e6c3cf8642bdea80e96df64c3-dirty"
 iss parents: diff
changeset | 123 parser.add_argument('--getOmicsDataType', help='Informs the programme to include OMICS data type' | 
| 
c6bab5103a14
"planemo upload commit 6abf3e299d82d07e6c3cf8642bdea80e96df64c3-dirty"
 iss parents: diff
changeset | 124 ' (examples: GENOMIC / TRANSCRIPTOMIC / SYNTHETIC) in the output', | 
| 
c6bab5103a14
"planemo upload commit 6abf3e299d82d07e6c3cf8642bdea80e96df64c3-dirty"
 iss parents: diff
changeset | 125 action='store_true') | 
| 
c6bab5103a14
"planemo upload commit 6abf3e299d82d07e6c3cf8642bdea80e96df64c3-dirty"
 iss parents: diff
changeset | 126 parser.add_argument('--getLibraryType', help='Informs the programme to include library type' | 
| 
c6bab5103a14
"planemo upload commit 6abf3e299d82d07e6c3cf8642bdea80e96df64c3-dirty"
 iss parents: diff
changeset | 127 ' (examples: PAIRED / SINGLE) in the output', action='store_true') | 
| 
c6bab5103a14
"planemo upload commit 6abf3e299d82d07e6c3cf8642bdea80e96df64c3-dirty"
 iss parents: diff
changeset | 128 | 
| 
c6bab5103a14
"planemo upload commit 6abf3e299d82d07e6c3cf8642bdea80e96df64c3-dirty"
 iss parents: diff
changeset | 129 args = parser.parse_args() | 
| 
c6bab5103a14
"planemo upload commit 6abf3e299d82d07e6c3cf8642bdea80e96df64c3-dirty"
 iss parents: diff
changeset | 130 | 
| 
c6bab5103a14
"planemo upload commit 6abf3e299d82d07e6c3cf8642bdea80e96df64c3-dirty"
 iss parents: diff
changeset | 131 getmachine = args.g | 
| 
c6bab5103a14
"planemo upload commit 6abf3e299d82d07e6c3cf8642bdea80e96df64c3-dirty"
 iss parents: diff
changeset | 132 taxonname = args.i[0] | 
| 
c6bab5103a14
"planemo upload commit 6abf3e299d82d07e6c3cf8642bdea80e96df64c3-dirty"
 iss parents: diff
changeset | 133 | 
| 
c6bab5103a14
"planemo upload commit 6abf3e299d82d07e6c3cf8642bdea80e96df64c3-dirty"
 iss parents: diff
changeset | 134 outdir = os.path.dirname(os.path.abspath(args.o[0])) | 
| 
c6bab5103a14
"planemo upload commit 6abf3e299d82d07e6c3cf8642bdea80e96df64c3-dirty"
 iss parents: diff
changeset | 135 if not os.path.isdir(outdir): | 
| 
c6bab5103a14
"planemo upload commit 6abf3e299d82d07e6c3cf8642bdea80e96df64c3-dirty"
 iss parents: diff
changeset | 136 os.makedirs(outdir) | 
| 
c6bab5103a14
"planemo upload commit 6abf3e299d82d07e6c3cf8642bdea80e96df64c3-dirty"
 iss parents: diff
changeset | 137 outputfile = os.path.abspath(args.o[0]) | 
| 
c6bab5103a14
"planemo upload commit 6abf3e299d82d07e6c3cf8642bdea80e96df64c3-dirty"
 iss parents: diff
changeset | 138 | 
| 
c6bab5103a14
"planemo upload commit 6abf3e299d82d07e6c3cf8642bdea80e96df64c3-dirty"
 iss parents: diff
changeset | 139 getOmicsDataType = args.getOmicsDataType | 
| 
c6bab5103a14
"planemo upload commit 6abf3e299d82d07e6c3cf8642bdea80e96df64c3-dirty"
 iss parents: diff
changeset | 140 getLibraryType = args.getLibraryType | 
| 
c6bab5103a14
"planemo upload commit 6abf3e299d82d07e6c3cf8642bdea80e96df64c3-dirty"
 iss parents: diff
changeset | 141 | 
| 
c6bab5103a14
"planemo upload commit 6abf3e299d82d07e6c3cf8642bdea80e96df64c3-dirty"
 iss parents: diff
changeset | 142 run_seq_from_web_taxon(taxonname, outputfile, getmachine, getOmicsDataType, getLibraryType, True) | 
| 
c6bab5103a14
"planemo upload commit 6abf3e299d82d07e6c3cf8642bdea80e96df64c3-dirty"
 iss parents: diff
changeset | 143 | 
| 
c6bab5103a14
"planemo upload commit 6abf3e299d82d07e6c3cf8642bdea80e96df64c3-dirty"
 iss parents: diff
changeset | 144 | 
| 
c6bab5103a14
"planemo upload commit 6abf3e299d82d07e6c3cf8642bdea80e96df64c3-dirty"
 iss parents: diff
changeset | 145 if __name__ == "__main__": | 
| 
c6bab5103a14
"planemo upload commit 6abf3e299d82d07e6c3cf8642bdea80e96df64c3-dirty"
 iss parents: diff
changeset | 146 main() | 
