annotate tools/metag_tools/split_paired_reads.py @ 1:cdcb0ce84a1b

Uploaded
author xuebing
date Fri, 09 Mar 2012 19:45:15 -0500
parents 9071e359b9a3
children
Ignore whitespace changes - Everywhere: Within whitespace: At end of lines:
rev   line source
0
9071e359b9a3 Uploaded
xuebing
parents:
diff changeset
#!/usr/bin/env python

"""
Split fixed length paired end reads.

Usage: split_paired_reads.py <input.fastq> <end1_output> <end2_output>

The input is read as consecutive groups of four non-blank lines.  Within
each group the first and third lines are written to both outputs with
'/1' and '/2' appended respectively, and the second and fourth lines are
cut in half: the first half goes to <end1_output>, the second half to
<end2_output>.  Blank lines in the input are skipped and do not count
towards the four-line grouping.
"""

import os
import sys


def split_line(line, line_index):
    """Return the ``(end1, end2)`` pair for one line of a four-line group.

    line       -- the line with trailing whitespace already removed.
    line_index -- position of the line inside its group (0 to 3).

    Lines at index 0 and 2 are duplicated with '/1' and '/2' appended.
    Lines at index 1 and 3 are split at ``len(line) // 2``; for an odd
    length the extra character ends up in ``end2``.
    """
    if line_index in (0, 2):
        return line + '/1', line + '/2'
    # Floor division keeps the midpoint an int on both Python 2 and 3;
    # a plain '/' yields a float on Python 3 and slicing would fail.
    half = len(line) // 2
    return line[:half], line[half:]


def split_reads(lines):
    """Yield one ``(end1, end2)`` pair per non-blank line of *lines*.

    *lines* is any iterable of strings (for example an open file).
    Trailing whitespace is stripped from every line, and lines that are
    empty after stripping are skipped without advancing the position
    inside the current four-line group.
    """
    record_line = 0
    for raw_line in lines:
        line = raw_line.rstrip()
        if not line:
            continue
        yield split_line(line, record_line % 4)
        record_line += 1


def main(argv):
    """Split the file named by ``argv[1]`` into ``argv[2]`` and ``argv[3]``.

    Returns the process exit status: 0 on success, 1 when fewer than
    three file arguments were supplied.  Arguments after the third are
    ignored.  A warning is written to stderr when the number of
    non-blank input lines is not a multiple of four; the exit status is
    still 0 in that case.
    """
    if len(argv) < 4:
        sys.stderr.write(
            "Usage: %s <input.fastq> <end1_output> <end2_output>\n"
            % os.path.basename(argv[0] if argv else 'split_paired_reads.py'))
        return 1

    infile = argv[1]
    line_count = 0

    # 'with' guarantees all three handles are closed (and the outputs
    # flushed) even if reading or writing fails part-way through.
    with open(infile) as reads:
        with open(argv[2], 'w') as outfile_end1:
            with open(argv[3], 'w') as outfile_end2:
                for end1, end2 in split_reads(reads):
                    outfile_end1.write('%s\n' % end1)
                    outfile_end2.write('%s\n' % end2)
                    line_count += 1

    if line_count % 4 != 0:
        sys.stderr.write("WARNING: Number of lines in the input file was not divisible by 4.\nCheck consistency of the input fastq file.\n")
    return 0


if __name__ == '__main__':
    sys.exit(main(sys.argv))