0
|
1 '''Filter VCFs on AD ratio.
|
|
2
|
|
3 Created on 24 Sep 2015
|
|
4
|
|
5 @author: alex
|
|
6 '''
|
|
7
|
|
8 import argparse
|
|
9 import logging
|
|
10
|
|
11 from phe.variant_filters import PHEFilterBase
|
|
12
|
|
13
|
|
14 class ADFilter(PHEFilterBase):
|
|
15 '''Filter sites by AD ratio.'''
|
|
16
|
|
17
|
|
18 name = "ADRatio"
|
|
19 _default_threshold = 0.9
|
|
20 parameter = "ad_ratio"
|
|
21
|
|
22 @classmethod
|
|
23 def customize_parser(self, parser):
|
|
24 arg_name = self.parameter.replace("_", "-")
|
|
25 parser.add_argument("--%s" % arg_name, type=float, default=self._default_threshold,
|
|
26 help="Filter sites below minimum ad ratio (default: %s)" % self._default_threshold)
|
|
27
|
|
28 def __init__(self, args):
|
|
29 """AD Ratio constructor."""
|
|
30 # This needs to happen first, because threshold is initialised here.
|
|
31 super(ADFilter, self).__init__(args)
|
|
32
|
|
33 # Change the threshold to custom dp value.
|
|
34 self.threshold = self._default_threshold
|
|
35 if isinstance(args, argparse.Namespace):
|
|
36 self.threshold = args.ad_ratio
|
|
37 elif isinstance(args, dict):
|
|
38 try:
|
|
39 self.threshold = float(args.get(self.parameter))
|
|
40 except TypeError:
|
|
41 logging.error("Could not retrieve threshold from %s", args.get(self.parameter))
|
|
42 self.threshold = None
|
|
43
|
|
44
|
|
45 def __call__(self, record):
|
|
46 """Filter a :py:class:`vcf.model._Record`."""
|
|
47
|
|
48 if not record.is_snp:
|
|
49 return None
|
|
50
|
|
51 if len(record.samples) > 1:
|
|
52 logging.warn("More than 1 sample detected. Only first is considered.")
|
|
53
|
|
54 try:
|
|
55 record_ad = record.samples[0].data.AD
|
|
56
|
|
57 # FIXME: when record length is > 2, what do you do?
|
|
58 assert len(record_ad) == 2, "AD data is incomplete POS: %i" % record.POS
|
|
59
|
|
60 depth = sum(record.samples[0].data.AD)
|
|
61
|
|
62 ratio = float(record_ad[1]) / depth
|
|
63 except Exception:
|
|
64 logging.error("Could not calculate AD ratio from %s POS: %s", record_ad, record.POS)
|
|
65 ratio = None
|
|
66
|
|
67 if ratio is None or ratio < self.threshold:
|
|
68 # FIXME: When ratio is None, i.e. error, what do you do?
|
|
69 return ratio or False
|
|
70 else:
|
|
71 return None
|
|
72
|
|
73 def short_desc(self):
|
|
74 short_desc = self.__doc__ or ''
|
|
75
|
|
76 if short_desc:
|
|
77 short_desc = "%s (AD ratio > %s )" % (short_desc, self.threshold)
|
|
78
|
|
79 return short_desc
|