comparison cpt.py @ 4:8f6c09b6a43d draft default tip

planemo upload commit 471832a126aa25d903becae9a074a6b7b1ff7092-dirty
author cpt
date Fri, 20 Sep 2024 04:02:40 +0000
parents 05b97a4dce94
children
comparison
equal deleted inserted replaced
3:859e18a9814a 4:8f6c09b6a43d
2 from Bio.Seq import Seq, reverse_complement, translate 2 from Bio.Seq import Seq, reverse_complement, translate
3 from Bio.SeqRecord import SeqRecord 3 from Bio.SeqRecord import SeqRecord
4 from Bio import SeqIO 4 from Bio import SeqIO
5 from Bio.Data import CodonTable 5 from Bio.Data import CodonTable
6 import logging 6 import logging
7 import regex as re
7 8
8 logging.basicConfig() 9 logging.basicConfig()
9 log = logging.getLogger() 10 log = logging.getLogger()
10 11
11 PHAGE_IN_MIDDLE = re.compile("^(?P<host>.*)\s*phage (?P<phage>.*)$") 12 PHAGE_IN_MIDDLE = re.compile("^(?P<host>.*)\s*phage (?P<phage>.*)$")
145 for match in self.re_stops.finditer(s, overlapped=True): 146 for match in self.re_stops.finditer(s, overlapped=True):
146 index = match.start() + 3 147 index = match.start() + 3
147 if index % 3 != 0: 148 if index % 3 != 0:
148 continue 149 continue
149 n = s[start:index] 150 n = s[start:index]
150 for (offset, n, t) in self.start_chop_and_trans(n): 151 for offset, n, t in self.start_chop_and_trans(n):
151 if n and len(t) >= self.min_len: 152 if n and len(t) >= self.min_len:
152 yield start + offset, n, t 153 yield start + offset, n, t
153 start = index 154 start = index
154 155
155 def putative_genes_in_sequence(self, nuc_seq): 156 def putative_genes_in_sequence(self, nuc_seq):
292 for match in self.re_stops.finditer(s, overlapped=True): 293 for match in self.re_stops.finditer(s, overlapped=True):
293 index = match.start() + 3 294 index = match.start() + 3
294 if index % 3 != 0: 295 if index % 3 != 0:
295 continue 296 continue
296 n = s[start:index] 297 n = s[start:index]
297 for (offset, n, t) in self.start_chop_and_trans(n): 298 for offset, n, t in self.start_chop_and_trans(n):
298 if n and len(t) >= self.min_len: 299 if n and len(t) >= self.min_len:
299 yield start + offset, n, t 300 yield start + offset, n, t
300 start = index 301 start = index
301 302
302 def putative_genes_in_sequence(self, nuc_seq): 303 def putative_genes_in_sequence(self, nuc_seq):