comparison spp_wrapper.py @ 0:1c5611e52fd0 draft

Uploaded spp_wrapper
author modencode-dcc
date Thu, 17 Jan 2013 14:36:18 -0500
parents
children
comparison
equal deleted inserted replaced
-1:000000000000 0:1c5611e52fd0
1 #purpose: python wrapper to run spp
2 #author: Ziru Zhou
3 #Date: November 2012
4
5 import sys, subprocess, tempfile, shutil, glob, os, os.path, gzip
6 from galaxy import eggs
7 import pkg_resources
8 pkg_resources.require( "simplejson" )
9 import simplejson
10
11 CHUNK_SIZE = 1024
12
13 def main():
14 options = simplejson.load( open( sys.argv[1] ) )
15 output_narrow_peak = sys.argv[2]
16 output_region_peak = sys.argv[3]
17 output_peakshift_file = sys.argv[4]
18 output_rdata_file = sys.argv[5]
19 output_plot_file = sys.argv[6]
20 output_default_file = sys.argv[7]
21
22 #set file extensions and set mandatory options
23 #========================================================================================
24 experiment_name = '_'.join( options['experiment_name'].split() ) #save experiment name
25
26 chip_file = "%s.bam" % (options['chip_file'])
27 subprocess.call(["cp", options['chip_file'], chip_file])
28
29 cmdline = "Rscript /mnt/galaxyTools/galaxy-central/tools/modENCODE_DCC_tools/spp/run_spp.R -c=%s" % ( chip_file )
30 if 'input_file' in options:
31 input_file = "%s.bam" % (options['input_file'])
32 subprocess.call(["cp", options['input_file'], input_file])
33 cmdline = "%s -i=%s" % ( cmdline, input_file )
34
35 #test = "%s_VS_%s.narrowPeak.gz" %(chip_name, input_name)
36 #print test
37 #set additional options
38 #========================================================================================
39 if (options['action'] == "cross_correlation"):
40 cmdline = "%s %s %s %s > default_output.txt" % ( cmdline, options['savp'], options['out'], options['rf'] )
41 elif (options['action'] == "peak_calling"):
42 cmdline = "%s -fdr=%s -npeak=%s %s %s %s %s %s > default_output.txt" % ( cmdline, options['fdr'], options['npeak'], options['savr'], options['savd'], options['savn'], options['savp'], options['rf'] )
43 elif (options['action'] == "idr"):
44 cmdline = "%s -npeak=%s %s %s %s %s > default_output.txt" % ( cmdline, options['npeak'], options['savr'], options['savp'], options['out'], options['rf'] )
45 elif (options['action'] == "custom"):
46 cmdline = "%s -s=%s %s -x=%s -fdr=%s -npeak=%s %s %s" % ( cmdline, options['s'], options['speak'], options['x'], options['fdr'], options['npeak'], options['filtchr'], options['rf'] )
47 cmdline = "%s %s %s %s %s %s > default_output.txt" % ( cmdline, options['out'], options['savn'], options['savr'], options['savp'], options['savd'] )
48
49 #run cmdline
50 #========================================================================================
51 tmp_dir = tempfile.mkdtemp()
52 stderr_name = tempfile.NamedTemporaryFile().name
53 proc = subprocess.Popen( args=cmdline, shell=True, cwd=tmp_dir, stderr=open( stderr_name, 'wb' ) )
54 proc.wait()
55
56 #Do not terminate if error code, allow dataset (e.g. log) creation and cleanup
57 #========================================================================================
58 if proc.returncode:
59 stderr_f = open( stderr_name )
60 while True:
61 chunk = stderr_f.read( CHUNK_SIZE )
62 if not chunk:
63 stderr_f.close()
64 break
65 sys.stderr.write( chunk )
66
67
68 #determine if the outputs are there, copy them to the appropriate dir and filename
69 #========================================================================================
70 created_default_file = os.path.join( tmp_dir, "default_output.txt" )
71 if os.path.exists( created_default_file ):
72 shutil.move( created_default_file, output_default_file )
73
74 chip_name = os.path.basename(options['chip_file'])
75 input_name = os.path.basename(options['input_file'])
76 created_narrow_peak = os.path.join( "/mnt/galaxyData/files/000", "%s_VS_%s.narrowPeak.gz" % (chip_name, input_name) )
77 if os.path.exists( created_narrow_peak ):
78 shutil.move( created_narrow_peak, output_narrow_peak )
79
80 created_region_peak = os.path.join( "/mnt/galaxyData/files/000", "%s_VS_%s.regionPeak.gz" % (chip_name, input_name) )
81 if os.path.exists( created_region_peak ):
82 shutil.move( created_region_peak, output_region_peak )
83
84 created_peakshift_file = os.path.join( tmp_dir, "peakshift.txt" )
85 if os.path.exists( created_peakshift_file ):
86 shutil.move( created_peakshift_file, output_peakshift_file )
87
88 created_rdata_file = os.path.join( tmp_dir, "%s.Rdata" % options['chip_file'] )
89 if os.path.exists( created_rdata_file ):
90 shutil.move( created_rdata_file, output_rdata_file )
91
92 created_plot_file = os.path.join( tmp_dir, "%s.pdf" % options['chip_file'] )
93 if os.path.exists( created_plot_file ):
94 shutil.move( created_plot_file, output_plot_file )
95
96
97 os.unlink( stderr_name )
98 #os.rmdir( tmp_dir )
99
100 if __name__ == "__main__": main()