weightedaverage: WeightedAverage.py comparison

comparison WeightedAverage.py @ 2:efa2b391e887 draft default tip

planemo upload for repository https://github.com/galaxyproject/tools-devteam/tree/master/tools/weightedaverage commit f770c3c58f1e7e1fa5ed22d7f7aca856d36729e8

author	devteam
date	Wed, 05 Oct 2016 13:39:38 -0400
parents	90611e86a998
children

comparison

Legend: equal, deleted, inserted, replaced

-:90611e86a998
+:efa2b391e887
 #!/usr/bin/env python
 """
 usage: %prog bed_file_1 bed_file_2 out_file
 -1, --cols1=N,N,N,N: Columns for chr, start, end, strand in first file
 -2, --cols2=N,N,N,N,N: Columns for chr, start, end, strand, name/value in second file
+-z, --allow_zeros: Include zeros in calculations
 """
 import collections
 import sys
 from galaxy.tools.util.galaxyops import *
 def GetOverlap(a, b):
 return min(a[1], b[1])-max(a[0], b[0])
+def get_float_no_zero( field ):
+rval = float( field )
+assert rval
+return rval
 options, args = doc_optparse.parse( __doc__ )
 try:
 chr_col_1, start_col_1, end_col_1, strand_col1 = parse_cols_arg( options.cols1 )
 input1, input2, input3 = args
 except Exception, eee:
 print eee
 stop_err( "Data issue: click the pencil icon in the history item to correct the metadata attributes." )
-fd2 = open(input2)
+if options.allow_zeros:
-lines2 = fd2.readlines()
+get_value = float
+else:
+get_value = get_float_no_zero
 RecombChrDict = collections.defaultdict(list)
 skipped = 0
-for line in lines2:
+for line in open( input2 ):
 temp = line.strip().split()
 try:
-assert float(temp[int(name_col_2)])
+value = get_value( temp[ name_col_2 ] )
-except:
+except Exception:
 skipped += 1
 continue
-tempIndex = [int(temp[int(start_col_2)]), int(temp[int(end_col_2)]), float(temp[int(name_col_2)])]
+tempIndex = [ int( temp[ start_col_2 ] ), int( temp[ end_col_2 ] ), value ]
-RecombChrDict[temp[int(chr_col_2)]].append(tempIndex)
+RecombChrDict[ temp[ chr_col_2 ] ].append( tempIndex )
 print "Skipped %d features with invalid values" % (skipped)
-fd1 = open(input1)
+fdd = open( input3, 'w' )
-lines = fd1.readlines()
+for line in open( input1 ):
-finalProduct = ''
+line = line.strip()
-for line in lines:
+temp = line.split('\t')
-temp = line.strip().split('\t')
+chromosome = temp[ chr_col_1 ]
-chromosome = temp[int(chr_col_1)]
+start = int( temp[ start_col_1 ] )
-start = int(temp[int(start_col_1)])
+stop = int( temp[ end_col_1 ] )
-stop = int(temp[int(end_col_1)])
 start_stop = [start, stop]
 RecombRate = FindRate( chromosome, start_stop, RecombChrDict )
 try:
 RecombRate = "%.4f" % (float(RecombRate))
 except:
 RecombRate = RecombRate
-finalProduct += line.strip()+'\t'+str(RecombRate)+'\n'
+fdd.write( "%s\t%s\n" % ( line, RecombRate ) )
-fdd = open(input3, 'w')
-fdd.writelines(finalProduct)
 fdd.close()

Mercurial > repos > devteam > weightedaverage

comparison WeightedAverage.py @ 2:efa2b391e887 draft default tip