annotate commons/tools/srptPhyML.py @ 31:0ab839023fe4

Uploaded
author m-zytnicki
date Tue, 30 Apr 2013 14:33:21 -0400
parents 94ab73e8a190
children
Ignore whitespace changes - Everywhere: Within whitespace: At end of lines:
rev   line source
18
94ab73e8a190 Uploaded
m-zytnicki
parents:
diff changeset
1 #!/usr/bin/env python
94ab73e8a190 Uploaded
m-zytnicki
parents:
diff changeset
2
94ab73e8a190 Uploaded
m-zytnicki
parents:
diff changeset
3 import user, os, sys, getopt, exceptions, logging, ConfigParser
94ab73e8a190 Uploaded
m-zytnicki
parents:
diff changeset
4
94ab73e8a190 Uploaded
m-zytnicki
parents:
diff changeset
# The value of REPET_PATH is appended to the module search path, so it has to
# be defined before the pyRepet modules are imported.
if "REPET_PATH" not in os.environ:
    print( "*** Error: no environment variable REPET_PATH" )
    sys.exit(1)
sys.path.append( os.environ["REPET_PATH"] )
94ab73e8a190 Uploaded
m-zytnicki
parents:
diff changeset
9
94ab73e8a190 Uploaded
m-zytnicki
parents:
diff changeset
10 import pyRepet.sql.RepetJobMySQL
94ab73e8a190 Uploaded
m-zytnicki
parents:
diff changeset
11 import pyRepet.launcher.Launcher
94ab73e8a190 Uploaded
m-zytnicki
parents:
diff changeset
12
94ab73e8a190 Uploaded
m-zytnicki
parents:
diff changeset
13 #-----------------------------------------------------------------------------
94ab73e8a190 Uploaded
m-zytnicki
parents:
diff changeset
14
94ab73e8a190 Uploaded
m-zytnicki
parents:
diff changeset
def help():

    """
    Print the usage line and the description of every command-line option
    on the standard output, framed by one empty line before and after.
    """

    usageLine = " ".join( [ "usage:", sys.argv[0], " [ options ]" ] )
    optionLines = [
        "options:",
        " -h: this help",
        " -g: name of the group identifier (same for all the jobs)",
        " -q: name of the query directory",
        " -S: suffix in the query directory (default='*.fa')",
        " -Q: name of the queue (on the cluster)",
        " -d: absolute path to the temporary directory",
        " -C: configuration file from TEdenovo or TEannot pipeline",
        " -t: job table name (default=jobs)",
        " -p: absolute path to project directory (if jobs management via files)",
        " -c: clean (remove job launch files and job stdout)",
        " -v: verbose (default=0/1/2)",
    ]

    # the empty strings produce the blank lines framing the message
    for textLine in [ "", usageLine ] + optionLines + [ "" ]:
        sys.stdout.write( textLine + "\n" )
94ab73e8a190 Uploaded
m-zytnicki
parents:
diff changeset
36
94ab73e8a190 Uploaded
m-zytnicki
parents:
diff changeset
37 #-----------------------------------------------------------------------------
94ab73e8a190 Uploaded
m-zytnicki
parents:
diff changeset
38
94ab73e8a190 Uploaded
m-zytnicki
parents:
diff changeset
def main():

    """
    Launch PhyML on each file of the query directory matching the suffix pattern.

    The command-line options are read from sys.argv (see help()). Jobs are
    tracked through a pyRepet RepetJob object whose back-end is selected by
    the environment variable REPET_JOBS ('files' or 'MySQL'). A log file named
    '<groupid>_pid<pid>.log' is opened with a relative path, i.e. in the
    current working directory.

    Returns 0 on success. Exits with status 1 when the options or the
    environment are invalid, and with status 0 after printing the help (-h).
    """

    groupid = ""
    queryDir = ""
    patternSuffix = "*.fa"
    queue = ""
    tmpDir = ""
    configFileName = ""
    jobTable = "jobs"
    projectDir = ""
    clean = False
    verbose = 0

    try:
        opts, _ = getopt.getopt( sys.argv[1:], "hg:q:S:Q:d:C:t:p:cv:" )
    except getopt.GetoptError as err:
        print( str(err) )
        help()
        sys.exit(1)
    for o, a in opts:
        if o == "-h":
            help()
            sys.exit(0)
        elif o == "-g":
            groupid = a
        elif o == "-q":
            queryDir = a
        elif o == "-S":
            patternSuffix = a
        elif o == "-Q":
            queue = a
        elif o == "-d":
            tmpDir = a
        elif o == "-C":
            configFileName = a
        elif o == "-t":
            jobTable = a
        elif o == "-p":
            projectDir = a
        elif o == "-c":
            clean = True
        elif o == "-v":
            # report a non-numeric verbosity as a usage error, not a traceback
            try:
                verbose = int(a)
            except ValueError:
                print( "*** Error: option -v expects an integer, got '%s'" % ( a ) )
                sys.exit(1)

    if groupid == "" or queryDir == "":
        print( "*** Error: missing compulsory options" )
        help()
        sys.exit(1)

    # REPET_JOBS selects the job back-end; fail cleanly when it is not set
    jobsMode = os.environ.get( "REPET_JOBS" )
    if jobsMode is None:
        print( "*** Error: no environment variable REPET_JOBS" )
        sys.exit(1)

    if jobsMode == "files" and projectDir == "":
        print( "*** Error: missing compulsory options for jobs management via files" )
        help()
        sys.exit(1)

    programName = os.path.basename( sys.argv[0] )

    if verbose > 0:
        print( "\nbeginning of %s" % ( programName ) )
        sys.stdout.flush()

    #--------------------------------------------------------------------------

    # create the 'log' file

    logFileName = "%s_pid%s.log" % ( groupid, os.getpid() )
    handler = logging.FileHandler( logFileName )
    formatter = logging.Formatter( "%(asctime)s %(levelname)s: %(message)s" )
    handler.setFormatter( formatter )
    logging.getLogger('').addHandler( handler )
    logging.getLogger('').setLevel( logging.DEBUG )
    logging.info( "started" )


    # retrieve the parameters of the connection to the MySQL database,
    # from the configuration file if given, from the environment otherwise

    if configFileName != "":
        if not os.path.exists( configFileName ):
            print( "*** Error: configuration file '%s' doesn't exist" % ( configFileName ) )
            sys.exit(1)
        config = ConfigParser.ConfigParser()
        # the 'with' statement closes the file once it has been parsed
        with open( configFileName ) as configFile:
            config.readfp( configFile )
        host = config.get("repet_env","repet_host")
        dbUser = config.get("repet_env","repet_user")
        passwd = config.get("repet_env","repet_pw")
        dbname = config.get("repet_env","repet_db")
    else:
        host = os.environ["REPET_HOST"]
        dbUser = os.environ["REPET_USER"]
        passwd = os.environ["REPET_PW"]
        dbname = os.environ["REPET_DB"]

    # open the job database

    if jobsMode == "files":
        # NOTE(review): in 'files' mode the database name always comes from
        # REPET_DB, even when a configuration file is given -- confirm intended
        jobdb = pyRepet.sql.RepetJobMySQL.RepetJob( dbname = projectDir + "/" + os.environ["REPET_DB"] )
    elif jobsMode == "MySQL":
        jobdb = pyRepet.sql.RepetJobMySQL.RepetJob( dbUser, host, passwd, dbname )
    else:
        print( "*** Error: REPET_JOBS is '%s'" % ( jobsMode ) )
        sys.exit(1)


    # the temporary directory defaults to the current directory
    currentDir = os.getcwd()
    if tmpDir == "":
        tmpDir = currentDir

    # launch PhyML on each fasta file in queryDir
    cL = pyRepet.launcher.Launcher.PhyMlLauncher( jobdb=jobdb, query=queryDir, cdir=currentDir, tmpdir=tmpDir, job_table=jobTable, queue=queue, groupid=groupid, acro="PhyML" )
    cL.run( patternSuffix )

    # clean
    if clean:
        cL.clean()


    logging.info( "finished" )

    if verbose > 0:
        print( "%s finished successfully\n" % ( programName ) )
        sys.stdout.flush()

    return 0
94ab73e8a190 Uploaded
m-zytnicki
parents:
diff changeset
161
94ab73e8a190 Uploaded
m-zytnicki
parents:
diff changeset
162 #----------------------------------------------------------------------------
94ab73e8a190 Uploaded
m-zytnicki
parents:
diff changeset
163
94ab73e8a190 Uploaded
m-zytnicki
parents:
diff changeset
if __name__ == '__main__':
    # hand the status returned by main() over to the calling shell
    sys.exit( main() )