annotate TEiso/CufflinksGTFToBed_Wrapper.py @ 12:22b0494ec883 draft

Uploaded
author urgi-team
date Wed, 20 Jul 2016 08:18:51 -0400
parents 782306d67e39
children
Ignore whitespace changes - Everywhere: Within whitespace: At end of lines:
rev   line source
11
782306d67e39 Uploaded
urgi-team
parents:
diff changeset
1 #!/usr/bin/env python
782306d67e39 Uploaded
urgi-team
parents:
diff changeset
2 import subprocess, tempfile, sys, os
782306d67e39 Uploaded
urgi-team
parents:
diff changeset
3 from optparse import OptionParser
782306d67e39 Uploaded
urgi-team
parents:
diff changeset
4 #from commons.core.utils.RepetOptionParser import RepetOptionParser
782306d67e39 Uploaded
urgi-team
parents:
diff changeset
5
782306d67e39 Uploaded
urgi-team
parents:
diff changeset
6
782306d67e39 Uploaded
urgi-team
parents:
diff changeset
class CufflinksGTFToBedWrapper(object):
    """Run the external ``CufflinksGTFToBed.py`` converter, then sort its output.

    The converter writes an intermediate BED file named ``<output stem>_tmp``;
    ``bedtools sort`` then writes the sorted result to the requested output
    file. Any failure is reported on stderr and ends the process with exit
    status 1 (see ``stop_err``).
    """

    def __init__(self):
        # optparse ``Values`` object; set by setAttributesFromCmdLine().
        self._options = None

    def stop_err(self, msg):
        """Write ``msg`` to stderr and terminate the process.

        Raises:
            SystemExit: always, with exit status 1 so callers of the script
                can detect the failure from the return code.
        """
        sys.stderr.write("%s\n" % msg)
        sys.exit(1)

    def setAttributesFromCmdLine(self):
        """Parse ``sys.argv`` and store the resulting options on the instance.

        Raises:
            SystemExit: raised by optparse (status 2) when the command line is
                invalid or when ``-i`` / ``-o`` is missing.
        """
        description = "CufflinksGTFToBed "
        epilog = "\n parses a GTF file of Cufflinks and create a bed file. \n"
        epilog += "example: CufflinksGTFToBed.py -i <inputFile> -o <outputFile>\n"
        parser = OptionParser(description=description, epilog=epilog, version="1.0")
        parser.add_option("-i", "--inputFile", dest="inputFile", action="store", type="string",
                          help="Input GTF File name(transcript.gtf of Cufflinks).", default="")
        parser.add_option("-o", "--outputFile", dest="outputFile", action="store", type="string",
                          help="output Bed File name", default="")
        parser.add_option("-v", "--verbosity", dest="verbosity", action="store", type="int",
                          help="Verbosity [optional] [default: 3]", default=3)
        options = parser.parse_args()[0]
        # Both file names are needed to build the commands in run(); fail with
        # a usage message instead of launching the tools with empty arguments.
        if not options.inputFile:
            parser.error("missing input file (-i)")
        if not options.outputFile:
            parser.error("missing output file (-o)")
        self._setAttributesFromOptions(options)

    def _setAttributesFromOptions(self, options):
        """Store an already-parsed options object on the instance."""
        self._options = options

    def _runAndCaptureStderr(self, argv):
        """Run ``argv`` without a shell and return ``(returncode, stderr_text)``.

        stderr is sent to an anonymous temporary file rather than a pipe, so
        arbitrarily large error output cannot block the child process; the
        file is removed automatically when it is closed.
        """
        with tempfile.TemporaryFile() as errFile:
            returncode = subprocess.call(argv, stderr=errFile)
            errFile.seek(0)
            captured = errFile.read()
        # On Python 3 the file yields bytes; normalise to text for messages.
        if not isinstance(captured, str):
            captured = captured.decode("utf-8", "replace")
        return returncode, captured

    def run(self):
        """Convert the input GTF to BED and write the sorted BED file.

        Reads ``inputFile`` and ``outputFile`` from the stored options. The
        conversion step fails if the converter writes anything to stderr or
        exits with a non-zero status; the sort step fails on a non-zero exit
        status. The intermediate ``<output stem>_tmp`` file is removed
        afterwards.

        Raises:
            SystemExit: via ``stop_err`` (status 1) when either step fails.
        """
        outputFile = self._options.outputFile
        tmp = "%s_tmp" % os.path.splitext(outputFile)[0]
        prg = "CufflinksGTFToBed.py"
        # Argument lists (no shell) keep paths with spaces or shell
        # metacharacters intact.
        convertCmd = [prg, "-i", self._options.inputFile, "-o", tmp]
        print(" ".join(convertCmd))

        try:
            try:
                returncode, errText = self._runAndCaptureStderr(convertCmd)
                # Any stderr output from the converter is treated as an error.
                if errText:
                    raise Exception(errText)
                if returncode != 0:
                    raise Exception("%s exited with status %d" % (prg, returncode))
            except Exception as e:
                self.stop_err('Error in TranscriptToBed:\n' + str(e))

            try:
                with open(outputFile, 'wb') as sortedBed:
                    returncode = subprocess.call(["bedtools", "sort", "-i", tmp], stdout=sortedBed)
                if returncode != 0:
                    raise Exception("bedtools sort exited with status %d" % returncode)
            except Exception as e:
                self.stop_err('Error in bedtools sort:\n' + str(e))
        finally:
            # Best-effort cleanup: a failure to delete the intermediate file
            # must not mask the real outcome of the run.
            if os.path.exists(tmp):
                try:
                    os.remove(tmp)
                except OSError:
                    pass
782306d67e39 Uploaded
urgi-team
parents:
diff changeset
71
782306d67e39 Uploaded
urgi-team
parents:
diff changeset
72
782306d67e39 Uploaded
urgi-team
parents:
diff changeset
# Script entry point: parse the command line, then run the conversion and sort.
if __name__ == "__main__":
    wrapper = CufflinksGTFToBedWrapper()
    wrapper.setAttributesFromCmdLine()
    wrapper.run()