annotate TEiso/GFFToBed_Wrapper.py @ 4:e59fb2fcb65e draft

Uploaded
author urgi-team
date Tue, 19 Jul 2016 10:58:14 -0400
parents 15d6811e6bf5
children
Ignore whitespace changes - Everywhere: Within whitespace: At end of lines:
rev   line source
0
3d22562b4489 Uploaded
urgi-team
parents:
diff changeset
1 #!/usr/bin/env python
3d22562b4489 Uploaded
urgi-team
parents:
diff changeset
2
3d22562b4489 Uploaded
urgi-team
parents:
diff changeset
3
3d22562b4489 Uploaded
urgi-team
parents:
diff changeset
4 import subprocess, tempfile, sys, os, glob, shutil, time
3d22562b4489 Uploaded
urgi-team
parents:
diff changeset
5 from optparse import OptionParser
1
15d6811e6bf5 Uploaded
urgi-team
parents: 0
diff changeset
6 #from commons.core.utils.RepetOptionParser import RepetOptionParser
0
3d22562b4489 Uploaded
urgi-team
parents:
diff changeset
7
3d22562b4489 Uploaded
urgi-team
parents:
diff changeset
8
3d22562b4489 Uploaded
urgi-team
parents:
diff changeset
class GFFToBedWrapper(object):
    """Command-line wrapper that runs ``GFFToBed.py`` and sorts its output.

    The wrapper converts the input GFF3 file to an intermediate BED file
    named ``<output basename>_tmp`` and then runs ``bedtools sort`` on that
    file, writing the sorted result to the requested output file.
    """

    def __init__(self):
        # Parsed command-line options; populated by setAttributesFromCmdLine()
        # or _setAttributesFromOptions().
        self._options = None

    def stop_err(self, msg):
        """Write *msg* to stderr and terminate with a non-zero exit status.

        Raises:
            SystemExit: always, with exit code 1 so callers of the script can
                detect the failure.
        """
        sys.stderr.write("%s\n" % msg)
        sys.exit(1)

    def setAttributesFromCmdLine(self, argv=None):
        """Parse the command line and store the resulting options.

        Args:
            argv: optional list of argument strings. When ``None`` (the
                default) ``optparse`` reads ``sys.argv[1:]``.

        Raises:
            SystemExit: via ``parser.error`` (exit code 2) when the input or
                output file name is missing.
        """
        description = "GFFToBed version"
        epilog = "\n parses a GFF3 file and create a bed file. \n"
        epilog += "example: GFFToBed.py -i <inputFile> -o <outputFile>\n"
        parser = OptionParser(description=description, epilog=epilog, version="1.0")
        parser.add_option("-i", "--inputFile", dest="inputFile", action="store", type="string", help="Input GFF3 File name.", default="")
        parser.add_option("-o", "--outputFile", dest="outputFile", action="store", type="string", help="output Bed File name", default="")
        parser.add_option("-v", "--verbosity", dest="verbosity", action="store", type="int", help="Verbosity [optional] [default: 3]", default=3)
        options = parser.parse_args(argv)[0]
        # Without both file names the external commands cannot be built.
        if not options.inputFile:
            parser.error("an input GFF3 file is required (-i)")
        if not options.outputFile:
            parser.error("an output Bed file is required (-o)")
        self._setAttributesFromOptions(options)

    def _setAttributesFromOptions(self, options):
        """Store an already-parsed options object on the instance."""
        self._options = options

    def _run_command(self, args):
        """Run *args* without a shell and return ``(returncode, stderr_text)``.

        stderr is spooled to an anonymous temporary file rather than a pipe
        so that a very large stderr stream cannot block the child process;
        the file is removed automatically when it is closed.
        """
        with tempfile.TemporaryFile() as err_file:
            returncode = subprocess.call(args, stderr=err_file)
            err_file.seek(0)
            raw = err_file.read()
        # On Python 3 the temporary file yields bytes; on Python 2 it is str.
        if not isinstance(raw, str):
            raw = raw.decode("utf-8", "replace")
        return returncode, raw

    def run(self):
        """Convert the input GFF3 file to BED, then sort it with bedtools.

        Any failure in either step is reported through ``stop_err``, which
        terminates the process with exit status 1. The intermediate
        ``<output basename>_tmp`` file is removed whether or not the run
        succeeds.
        """
        tmp = "%s_tmp" % os.path.splitext(self._options.outputFile)[0]
        # Argument lists (no shell) keep paths containing spaces or shell
        # metacharacters intact.
        convert_args = ["GFFToBed.py", "-i", self._options.inputFile, "-o", tmp]
        print(" ".join(convert_args))

        try:
            try:
                returncode, stderr = self._run_command(convert_args)
                # Any stderr output from the converter is treated as a failure.
                if stderr:
                    raise RuntimeError(stderr)
                if returncode != 0:
                    raise RuntimeError("GFFToBed.py exited with status %d" % returncode)
            except Exception as e:
                self.stop_err('Error in GFFToBed:\n' + str(e))

            try:
                with open(self._options.outputFile, "wb") as sorted_out:
                    # bedtools' stderr is left attached to this process's
                    # stderr; only its exit status decides success.
                    returncode = subprocess.call(["bedtools", "sort", "-i", tmp], stdout=sorted_out)
                if returncode != 0:
                    raise RuntimeError("bedtools sort exited with status %d" % returncode)
            except Exception as e:
                self.stop_err('Error in bedtools sort:\n' + str(e))
        finally:
            # Do not leave the unsorted intermediate file behind.
            if os.path.exists(tmp):
                os.remove(tmp)
15d6811e6bf5 Uploaded
urgi-team
parents: 0
diff changeset
75
15d6811e6bf5 Uploaded
urgi-team
parents: 0
diff changeset
76
15d6811e6bf5 Uploaded
urgi-team
parents: 0
diff changeset
77
0
3d22562b4489 Uploaded
urgi-team
parents:
diff changeset
if __name__ == "__main__":
    # Script entry point: read the options from the command line, then run
    # the GFF-to-BED conversion followed by the sort.
    wrapper = GFFToBedWrapper()
    wrapper.setAttributesFromCmdLine()
    wrapper.run()