comparison prepare_amplicon_info.py @ 5:cf65217ad61c draft

"planemo upload for repository https://github.com/galaxyproject/tools-iuc/tree/master/tools/ivar/ commit a5ff06c631a2a5a0d5d44edd6cb58a599d50918b"
author iuc
date Wed, 19 May 2021 16:51:27 +0000
parents
children 5671e1d3d5ee
comparison
equal deleted inserted replaced
4:db536ad45f28 5:cf65217ad61c
1 #!/usr/bin/env python
2
3 # extends ivar trim's amplicon info parsing abilities
4 # to include calculation of amplicon regions from
5 # sets of nested (more than two) primers
6
7 import sys
8
9
# parse primers and their start positions from BED file
def parse_primer_starts(bed_lines):
    """Map every primer name in a primer BED file to its start position.

    Parameters:
        bed_lines: iterable of text lines (e.g. an open file). Each
            non-blank line must be TAB-separated with the columns
            chrom, chromStart, chromEnd, name, score, strand.

    Returns:
        dict mapping primer name (column 4) to an int start position:
        chromStart for "+" strand primers, chromEnd - 1 for "-" strand
        primers. If a name occurs more than once, the last record wins.

    Exits:
        Calls sys.exit() with an explanatory message when a non-blank
        line has fewer than six columns, a non-integer coordinate, or a
        strand other than "+" or "-".
    """
    starts = {}
    for line in bed_lines:
        fields = line.strip().split('\t')
        if fields == ['']:
            # Blank or whitespace-only line (typically a trailing empty
            # line): nothing to parse, and not a formatting error.
            continue
        try:
            name, strand = fields[3], fields[5]
            if strand == '+':
                starts[name] = int(fields[1])
            elif strand == '-':
                starts[name] = int(fields[2]) - 1
            else:
                # Funnel unknown strands into the shared error message.
                raise ValueError()
        except (IndexError, ValueError):
            sys.exit(
                'Primer BED file needs to be TAB-separated with the '
                'following columns: '
                'chrom, chromStart, chromEnd, name, score, strand, '
                'where "chromStart", "chromEnd" need to be integer values '
                'and "strand" needs to be either "+" or "-".'
            )
    return starts


if __name__ == '__main__':
    # First command line argument: path of the primer BED file.
    with open(sys.argv[1]) as i:
        primer_starts = parse_primer_starts(i)
30
# parse amplicon info and record outer primer names
def outer_primer_lines(amplicon_lines, primer_starts):
    """Reduce each amplicon info line to its two outermost primers.

    Parameters:
        amplicon_lines: iterable of text lines (e.g. an open file), each
            holding the TAB-separated names of the primers that belong
            to one amplicon. Blank lines are skipped.
        primer_starts: dict mapping primer name to its int start
            position.

    Returns:
        list of output lines of the form "<first>\\t<last>\\n", where
        <first> is the primer with the smallest start position on the
        input line and <last> the one with the largest. On ties the
        primer listed earliest on the line is used.

    Exits:
        Calls sys.exit() with a message when a primer name is missing
        from primer_starts, or when a line does not yield two distinct
        outer primers (a single primer, or all primers sharing one
        start position).
    """
    ret_lines = []
    for line in amplicon_lines:
        pnames = line.strip().split('\t')
        if pnames == ['']:
            # Blank or whitespace-only line: not an amplicon definition.
            continue
        for pname in pnames:
            if pname not in primer_starts:
                sys.exit(
                    'Amplicon info with primer name not found in '
                    f'primer BED file: "{pname}"'
                )
        # min()/max() return the first extreme element they encounter,
        # so ties resolve to the earliest-listed primer.
        first = min(pnames, key=primer_starts.__getitem__)
        last = max(pnames, key=primer_starts.__getitem__)
        if first == last:
            # Normalise the line ending so the message reads the same
            # whether or not the offending line ended with a newline.
            sys.exit(
                line.rstrip('\r\n')
                + '\nis not a proper amplicon info line.'
            )
        ret_lines.append(f'{first}\t{last}\n')
    return ret_lines


if __name__ == '__main__':
    # Second command line argument: path of the amplicon info file.
    with open(sys.argv[2]) as i:
        ret_lines = outer_primer_lines(i, primer_starts)
54
# write amended amplicon info
# Third command line argument: path of the output file, which receives
# the collected "<first>\t<last>" lines in the order they were recorded.
output_path = sys.argv[3]
with open(output_path, 'w') as out_handle:
    out_handle.write(''.join(ret_lines))