annotate PhageTerm.py @ 24:c8f88ae512f3 draft default tip

Uploaded
author mmonot
date Tue, 17 Sep 2024 13:35:16 +0000
parents
children
Ignore whitespace changes - Everywhere: Within whitespace: At end of lines:
rev   line source
24
c8f88ae512f3 Uploaded
mmonot
parents:
diff changeset
1 #! /usr/bin/env python
c8f88ae512f3 Uploaded
mmonot
parents:
diff changeset
2 # -*- coding: utf-8 -*-
c8f88ae512f3 Uploaded
mmonot
parents:
diff changeset
3
c8f88ae512f3 Uploaded
mmonot
parents:
diff changeset
4 # This file is a part of PhageTerm software
c8f88ae512f3 Uploaded
mmonot
parents:
diff changeset
5 # A tool to determine phage termini and packaging strategy
c8f88ae512f3 Uploaded
mmonot
parents:
diff changeset
6 # and other useful information using raw sequencing reads.
c8f88ae512f3 Uploaded
mmonot
parents:
diff changeset
7 # (This program works with sequencing reads from a randomly
c8f88ae512f3 Uploaded
mmonot
parents:
diff changeset
8 # sheared DNA library preparations as Illumina TruSeq paired-end or similar)
c8f88ae512f3 Uploaded
mmonot
parents:
diff changeset
9 #
c8f88ae512f3 Uploaded
mmonot
parents:
diff changeset
10 # ----------------------------------------------------------------------
c8f88ae512f3 Uploaded
mmonot
parents:
diff changeset
11 # Copyright (C) 2017 Julian Garneau
c8f88ae512f3 Uploaded
mmonot
parents:
diff changeset
12 #
c8f88ae512f3 Uploaded
mmonot
parents:
diff changeset
13 # This program is free software; you can redistribute it and/or modify
c8f88ae512f3 Uploaded
mmonot
parents:
diff changeset
14 # it under the terms of the GNU General Public License as published by
c8f88ae512f3 Uploaded
mmonot
parents:
diff changeset
15 # the Free Software Foundation; either version 3 of the License, or
c8f88ae512f3 Uploaded
mmonot
parents:
diff changeset
16 # (at your option) any later version.
c8f88ae512f3 Uploaded
mmonot
parents:
diff changeset
17 # <http://www.gnu.org/licenses/gpl-3.0.html>
c8f88ae512f3 Uploaded
mmonot
parents:
diff changeset
18 #
c8f88ae512f3 Uploaded
mmonot
parents:
diff changeset
19 # This program is distributed in the hope that it will be useful,
c8f88ae512f3 Uploaded
mmonot
parents:
diff changeset
20 # but WITHOUT ANY WARRANTY; without even the implied warranty of
c8f88ae512f3 Uploaded
mmonot
parents:
diff changeset
21 # MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
c8f88ae512f3 Uploaded
mmonot
parents:
diff changeset
22 # GNU General Public License for more details.
c8f88ae512f3 Uploaded
mmonot
parents:
diff changeset
23 # ----------------------------------------------------------------------
c8f88ae512f3 Uploaded
mmonot
parents:
diff changeset
24 #
c8f88ae512f3 Uploaded
mmonot
parents:
diff changeset
25 # @author Julian Garneau <julian.garneau@usherbrooke.ca>
c8f88ae512f3 Uploaded
mmonot
parents:
diff changeset
26 # @author Marc Monot <marc.monot@pasteur.fr>
c8f88ae512f3 Uploaded
mmonot
parents:
diff changeset
27 # @author David Bikard <david.bikard@pasteur.fr>
c8f88ae512f3 Uploaded
mmonot
parents:
diff changeset
28
c8f88ae512f3 Uploaded
mmonot
parents:
diff changeset
29
c8f88ae512f3 Uploaded
mmonot
parents:
diff changeset
30 ### PYTHON Module
c8f88ae512f3 Uploaded
mmonot
parents:
diff changeset
31 # Base
c8f88ae512f3 Uploaded
mmonot
parents:
diff changeset
32 import os
c8f88ae512f3 Uploaded
mmonot
parents:
diff changeset
33 import sys
c8f88ae512f3 Uploaded
mmonot
parents:
diff changeset
34 from optparse import OptionParser, OptionGroup
c8f88ae512f3 Uploaded
mmonot
parents:
diff changeset
35
c8f88ae512f3 Uploaded
mmonot
parents:
diff changeset
36 # Multiprocessing
c8f88ae512f3 Uploaded
mmonot
parents:
diff changeset
37 import multiprocessing
c8f88ae512f3 Uploaded
mmonot
parents:
diff changeset
38 from multiprocessing import Manager
c8f88ae512f3 Uploaded
mmonot
parents:
diff changeset
39 import numpy as np
c8f88ae512f3 Uploaded
mmonot
parents:
diff changeset
40
c8f88ae512f3 Uploaded
mmonot
parents:
diff changeset
41 # Project
c8f88ae512f3 Uploaded
mmonot
parents:
diff changeset
42 from _modules.functions_PhageTerm import *
c8f88ae512f3 Uploaded
mmonot
parents:
diff changeset
43
c8f88ae512f3 Uploaded
mmonot
parents:
diff changeset
44 ### MAIN
c8f88ae512f3 Uploaded
mmonot
parents:
diff changeset
45 # Option
c8f88ae512f3 Uploaded
mmonot
parents:
diff changeset
46 usage = """\n\nUsage: %prog -f reads.fastq -r phage_sequence.fasta [-n phage_name -p reads_paired -s seed_length -d surrounding -t installation_test -c nbr_core -g host.fasta (warning increase process time)]
c8f88ae512f3 Uploaded
mmonot
parents:
diff changeset
47
c8f88ae512f3 Uploaded
mmonot
parents:
diff changeset
48 Program: PhageTerm - Analyze phage termini and packaging mode using reads from high-throughput sequenced phage data
c8f88ae512f3 Uploaded
mmonot
parents:
diff changeset
49 Version: 1.0.11
c8f88ae512f3 Uploaded
mmonot
parents:
diff changeset
50 Contact: Julian Garneau <julian.garneau@usherbrooke.ca>
c8f88ae512f3 Uploaded
mmonot
parents:
diff changeset
51 Contact: David Bikard <david.bikard@pasteur.fr>
c8f88ae512f3 Uploaded
mmonot
parents:
diff changeset
52 Contact: Marc Monot <marc.monot@pasteur.fr>
c8f88ae512f3 Uploaded
mmonot
parents:
diff changeset
53
c8f88ae512f3 Uploaded
mmonot
parents:
diff changeset
54 You can perform a program test run upon installation using the "-t " option.
c8f88ae512f3 Uploaded
mmonot
parents:
diff changeset
55 Arguments for the -t option can be : C5, C3, DS, DL, M or H.
c8f88ae512f3 Uploaded
mmonot
parents:
diff changeset
56
c8f88ae512f3 Uploaded
mmonot
parents:
diff changeset
57 Example of test commands :
c8f88ae512f3 Uploaded
mmonot
parents:
diff changeset
58 PhageTerm.py -t C5 -> Test run for a 5\' cohesive end (e.g. Lambda)
c8f88ae512f3 Uploaded
mmonot
parents:
diff changeset
59 PhageTerm.py -t C3 -> Test run for a 3\' cohesive end (e.g. HK97)
c8f88ae512f3 Uploaded
mmonot
parents:
diff changeset
60 PhageTerm.py -t DS -> Test run for a Direct Terminal Repeats end short (e.g. T7)
c8f88ae512f3 Uploaded
mmonot
parents:
diff changeset
61 PhageTerm.py -t DL -> Test run for a Direct Terminal Repeats end long (e.g. T5)
c8f88ae512f3 Uploaded
mmonot
parents:
diff changeset
62 PhageTerm.py -t H -> Test run for a Headful packaging (e.g. P1)
c8f88ae512f3 Uploaded
mmonot
parents:
diff changeset
63 PhageTerm.py -t M -> Test run for a Mu-like packaging (e.g. Mu)
c8f88ae512f3 Uploaded
mmonot
parents:
diff changeset
64 """
c8f88ae512f3 Uploaded
mmonot
parents:
diff changeset
65
c8f88ae512f3 Uploaded
mmonot
parents:
diff changeset
66 getopt = OptionParser(usage=usage)
c8f88ae512f3 Uploaded
mmonot
parents:
diff changeset
67
c8f88ae512f3 Uploaded
mmonot
parents:
diff changeset
68 optreads = OptionGroup(getopt, 'Raw reads file in fastq format')
c8f88ae512f3 Uploaded
mmonot
parents:
diff changeset
69 optreads.add_option('-f', '--fastq', dest='fastq', metavar='FILE', help='Fastq reads from Illumina TruSeq')
c8f88ae512f3 Uploaded
mmonot
parents:
diff changeset
70 getopt.add_option_group(optreads)
c8f88ae512f3 Uploaded
mmonot
parents:
diff changeset
71
c8f88ae512f3 Uploaded
mmonot
parents:
diff changeset
72 optref = OptionGroup(getopt, 'Phage genome in fasta format')
c8f88ae512f3 Uploaded
mmonot
parents:
diff changeset
73 optref.add_option('-r', '--ref', dest='reference', metavar='FILE', help='Reference phage genome as unique contig in fasta format')
c8f88ae512f3 Uploaded
mmonot
parents:
diff changeset
74 getopt.add_option_group(optref)
c8f88ae512f3 Uploaded
mmonot
parents:
diff changeset
75
c8f88ae512f3 Uploaded
mmonot
parents:
diff changeset
76 optname = OptionGroup(getopt, 'Name of the phage being analyzed by the user')
c8f88ae512f3 Uploaded
mmonot
parents:
diff changeset
77 optname.add_option('-n', '--phagename', dest='phagename', metavar='STRING', help='Manually enter the name of the phage being analyzed. Used as prefix for output files.')
c8f88ae512f3 Uploaded
mmonot
parents:
diff changeset
78 getopt.add_option_group(optname)
c8f88ae512f3 Uploaded
mmonot
parents:
diff changeset
79
c8f88ae512f3 Uploaded
mmonot
parents:
diff changeset
80 optseed = OptionGroup(getopt, 'Length of the seed used for reads in the mapping process')
c8f88ae512f3 Uploaded
mmonot
parents:
diff changeset
81 optseed.add_option('-s', '--seed', dest='seed', metavar='INT', type="int", help='Manually enter the length of the seed used for reads in the mapping process.')
c8f88ae512f3 Uploaded
mmonot
parents:
diff changeset
82 getopt.add_option_group(optseed)
c8f88ae512f3 Uploaded
mmonot
parents:
diff changeset
83
c8f88ae512f3 Uploaded
mmonot
parents:
diff changeset
84 optsurround = OptionGroup(getopt, 'Length of the surrounding region considered for peak value cumulation')
c8f88ae512f3 Uploaded
mmonot
parents:
diff changeset
85 optsurround.add_option('-d', '--surrounding', dest='surround', type="int", metavar='INT', help='Manually enter the length of the surrounding used to merge very close peaks in the analysis process.')
c8f88ae512f3 Uploaded
mmonot
parents:
diff changeset
86 getopt.add_option_group(optsurround)
c8f88ae512f3 Uploaded
mmonot
parents:
diff changeset
87
c8f88ae512f3 Uploaded
mmonot
parents:
diff changeset
88 optcore = OptionGroup(getopt, 'Number of core processors to use (Default: 1)')
c8f88ae512f3 Uploaded
mmonot
parents:
diff changeset
89 optcore.add_option('-c', '--core', dest='core', metavar='INT', type="int", help='Manually enter the number of core you want to use.')
c8f88ae512f3 Uploaded
mmonot
parents:
diff changeset
90 getopt.add_option_group(optcore)
c8f88ae512f3 Uploaded
mmonot
parents:
diff changeset
91
c8f88ae512f3 Uploaded
mmonot
parents:
diff changeset
92 opthost = OptionGroup(getopt, 'Host genome in fasta format')
c8f88ae512f3 Uploaded
mmonot
parents:
diff changeset
93 opthost.add_option('-g', '--host', dest='host', metavar='FILE', help='Reference host genome as unique contig in fasta format')
c8f88ae512f3 Uploaded
mmonot
parents:
diff changeset
94 getopt.add_option_group(opthost)
c8f88ae512f3 Uploaded
mmonot
parents:
diff changeset
95
c8f88ae512f3 Uploaded
mmonot
parents:
diff changeset
96 optpaired = OptionGroup(getopt, 'Use paired-end reads')
c8f88ae512f3 Uploaded
mmonot
parents:
diff changeset
97 optpaired.add_option('-p', '--paired', dest='paired', metavar='FILE', help='Use paired-end reads to calculate real insert coverage')
c8f88ae512f3 Uploaded
mmonot
parents:
diff changeset
98 getopt.add_option_group(optpaired)
c8f88ae512f3 Uploaded
mmonot
parents:
diff changeset
99
c8f88ae512f3 Uploaded
mmonot
parents:
diff changeset
100 optmean = OptionGroup(getopt, 'Defined phage mean coverage')
c8f88ae512f3 Uploaded
mmonot
parents:
diff changeset
101 optmean.add_option('-m', '--mean', dest='mean', metavar='INT', type="int", help='Defined phage mean coverage')
c8f88ae512f3 Uploaded
mmonot
parents:
diff changeset
102 getopt.add_option_group(optmean)
c8f88ae512f3 Uploaded
mmonot
parents:
diff changeset
103
c8f88ae512f3 Uploaded
mmonot
parents:
diff changeset
104 opttest = OptionGroup(getopt, 'Perform a program test run upon installation')
c8f88ae512f3 Uploaded
mmonot
parents:
diff changeset
105 opttest.add_option('-t', '--test', dest='test', metavar='STRING', help='Perform a program test run upon installation. If you want to perform a test run, use the "-t " option. Arguments for the -t option can be : C5, C3, DS, DL, H or M. C5 -> Test run for a 5\' cohesive end (e.g. Lambda); C3 -> Test run for a 3\' cohesive end (e.g. HK97); DS -> Test run for a short Direct Terminal Repeats end (e.g. T7); DL -> Test run for a long Direct Terminal Repeats end (e.g. T5); H -> Test run for a Headful packaging (e.g. P1); M -> Test run for a Mu-like packaging (e.g. Mu)')
c8f88ae512f3 Uploaded
mmonot
parents:
diff changeset
106 getopt.add_option_group(opttest)
c8f88ae512f3 Uploaded
mmonot
parents:
diff changeset
107
c8f88ae512f3 Uploaded
mmonot
parents:
diff changeset
108
c8f88ae512f3 Uploaded
mmonot
parents:
diff changeset
109 ######
c8f88ae512f3 Uploaded
mmonot
parents:
diff changeset
110
c8f88ae512f3 Uploaded
mmonot
parents:
diff changeset
111 options, arguments = getopt.parse_args()
c8f88ae512f3 Uploaded
mmonot
parents:
diff changeset
112 fastq = options.fastq
c8f88ae512f3 Uploaded
mmonot
parents:
diff changeset
113 reference = options.reference
c8f88ae512f3 Uploaded
mmonot
parents:
diff changeset
114 phagename = options.phagename
c8f88ae512f3 Uploaded
mmonot
parents:
diff changeset
115 seed = options.seed
c8f88ae512f3 Uploaded
mmonot
parents:
diff changeset
116 surrounding = options.surround
c8f88ae512f3 Uploaded
mmonot
parents:
diff changeset
117 core = options.core
c8f88ae512f3 Uploaded
mmonot
parents:
diff changeset
118 host = options.host
c8f88ae512f3 Uploaded
mmonot
parents:
diff changeset
119 paired = options.paired
c8f88ae512f3 Uploaded
mmonot
parents:
diff changeset
120 mean = options.mean
c8f88ae512f3 Uploaded
mmonot
parents:
diff changeset
121 test = options.test
c8f88ae512f3 Uploaded
mmonot
parents:
diff changeset
122
c8f88ae512f3 Uploaded
mmonot
parents:
diff changeset
123 ######
c8f88ae512f3 Uploaded
mmonot
parents:
diff changeset
124
c8f88ae512f3 Uploaded
mmonot
parents:
diff changeset
125 if options.fastq == None and options.test == None:
c8f88ae512f3 Uploaded
mmonot
parents:
diff changeset
126 getopt.error('\tNo reads file provided.\n\t\t\tUse -h or --help for more details\n')
c8f88ae512f3 Uploaded
mmonot
parents:
diff changeset
127
c8f88ae512f3 Uploaded
mmonot
parents:
diff changeset
128 if options.reference == None and options.test == None:
c8f88ae512f3 Uploaded
mmonot
parents:
diff changeset
129 getopt.error('\tNo fasta reference file provided.\n\t\t\tUse -h or --help for more details\n')
c8f88ae512f3 Uploaded
mmonot
parents:
diff changeset
130
c8f88ae512f3 Uploaded
mmonot
parents:
diff changeset
131 if options.phagename == None and options.test == None:
c8f88ae512f3 Uploaded
mmonot
parents:
diff changeset
132 phagename = "Phagename"
c8f88ae512f3 Uploaded
mmonot
parents:
diff changeset
133
c8f88ae512f3 Uploaded
mmonot
parents:
diff changeset
134 if options.seed == None:
c8f88ae512f3 Uploaded
mmonot
parents:
diff changeset
135 seed = 20
c8f88ae512f3 Uploaded
mmonot
parents:
diff changeset
136
c8f88ae512f3 Uploaded
mmonot
parents:
diff changeset
137 if options.surround == None:
c8f88ae512f3 Uploaded
mmonot
parents:
diff changeset
138 surrounding = 20
c8f88ae512f3 Uploaded
mmonot
parents:
diff changeset
139
c8f88ae512f3 Uploaded
mmonot
parents:
diff changeset
140 if options.core == None:
c8f88ae512f3 Uploaded
mmonot
parents:
diff changeset
141 core = 1
c8f88ae512f3 Uploaded
mmonot
parents:
diff changeset
142
c8f88ae512f3 Uploaded
mmonot
parents:
diff changeset
143 if options.host == None:
c8f88ae512f3 Uploaded
mmonot
parents:
diff changeset
144 host = ""
c8f88ae512f3 Uploaded
mmonot
parents:
diff changeset
145
c8f88ae512f3 Uploaded
mmonot
parents:
diff changeset
146 if options.paired == None:
c8f88ae512f3 Uploaded
mmonot
parents:
diff changeset
147 paired = ""
c8f88ae512f3 Uploaded
mmonot
parents:
diff changeset
148
c8f88ae512f3 Uploaded
mmonot
parents:
diff changeset
149 if options.mean == None:
c8f88ae512f3 Uploaded
mmonot
parents:
diff changeset
150 mean = 250
c8f88ae512f3 Uploaded
mmonot
parents:
diff changeset
151
c8f88ae512f3 Uploaded
mmonot
parents:
diff changeset
152 ######
c8f88ae512f3 Uploaded
mmonot
parents:
diff changeset
153
c8f88ae512f3 Uploaded
mmonot
parents:
diff changeset
154 if options.test == None:
c8f88ae512f3 Uploaded
mmonot
parents:
diff changeset
155 test_run = 0
c8f88ae512f3 Uploaded
mmonot
parents:
diff changeset
156 else:
c8f88ae512f3 Uploaded
mmonot
parents:
diff changeset
157 test_run = 1
c8f88ae512f3 Uploaded
mmonot
parents:
diff changeset
158
c8f88ae512f3 Uploaded
mmonot
parents:
diff changeset
159
c8f88ae512f3 Uploaded
mmonot
parents:
diff changeset
160 if options.test == "C5":
c8f88ae512f3 Uploaded
mmonot
parents:
diff changeset
161 print "\nPerforming a test run using test phage sequence with 5 prime cohesive overhang :"
c8f88ae512f3 Uploaded
mmonot
parents:
diff changeset
162 print "\npython PhageTerm.py -f test-data/COS-5.fastq -r test-data/COS-5.fasta -n TEST_cohesive_5_prime"
c8f88ae512f3 Uploaded
mmonot
parents:
diff changeset
163 fastq = "test-data/COS-5.fastq"
c8f88ae512f3 Uploaded
mmonot
parents:
diff changeset
164 reference = "test-data/COS-5.fasta"
c8f88ae512f3 Uploaded
mmonot
parents:
diff changeset
165 phagename = "Test-cohesive-5'"
c8f88ae512f3 Uploaded
mmonot
parents:
diff changeset
166
c8f88ae512f3 Uploaded
mmonot
parents:
diff changeset
167
c8f88ae512f3 Uploaded
mmonot
parents:
diff changeset
168 elif options.test == "C3":
c8f88ae512f3 Uploaded
mmonot
parents:
diff changeset
169 print "\nPerforming a test run using test phage sequence with 3 prime cohesive overhang:"
c8f88ae512f3 Uploaded
mmonot
parents:
diff changeset
170 print "\npython PhageTerm.py -f test-data/COS-3.fastq -r test-data/COS-3.fasta -n TEST_cohesive_3_prime"
c8f88ae512f3 Uploaded
mmonot
parents:
diff changeset
171 fastq = "test-data/COS-3.fastq"
c8f88ae512f3 Uploaded
mmonot
parents:
diff changeset
172 reference = "test-data/COS-3.fasta"
c8f88ae512f3 Uploaded
mmonot
parents:
diff changeset
173 phagename = "Test-cohesive-3'"
c8f88ae512f3 Uploaded
mmonot
parents:
diff changeset
174
c8f88ae512f3 Uploaded
mmonot
parents:
diff changeset
175 elif options.test == "DS":
c8f88ae512f3 Uploaded
mmonot
parents:
diff changeset
176 print "\nPerforming a test run using test phage sequence with short direct terminal repeats (DTR-short) :"
c8f88ae512f3 Uploaded
mmonot
parents:
diff changeset
177 print "\npython PhageTerm.py -f test-data/DTR-short.fastq -r test-data/DTR-short.fasta -n TEST_short_direct_terminal_repeats"
c8f88ae512f3 Uploaded
mmonot
parents:
diff changeset
178 fastq = "test-data/DTR-short.fastq"
c8f88ae512f3 Uploaded
mmonot
parents:
diff changeset
179 reference = "test-data/DTR-short.fasta"
c8f88ae512f3 Uploaded
mmonot
parents:
diff changeset
180 phagename = "Test-short-direct-terminal-repeats"
c8f88ae512f3 Uploaded
mmonot
parents:
diff changeset
181
c8f88ae512f3 Uploaded
mmonot
parents:
diff changeset
182 elif options.test == "DL":
c8f88ae512f3 Uploaded
mmonot
parents:
diff changeset
183 print "\nPerforming a test run using test phage sequence with long direct terminal repeats (DTR-long) :"
c8f88ae512f3 Uploaded
mmonot
parents:
diff changeset
184 print "\npython PhageTerm.py -f test-data/DTR-long.fastq -r test-data/DTR-long.fasta -n TEST_long_direct_terminal_repeats"
c8f88ae512f3 Uploaded
mmonot
parents:
diff changeset
185 fastq = "test-data/DTR-long.fastq"
c8f88ae512f3 Uploaded
mmonot
parents:
diff changeset
186 reference = "test-data/DTR-long.fasta"
c8f88ae512f3 Uploaded
mmonot
parents:
diff changeset
187 phagename = "Test-long-direct-terminal-repeats"
c8f88ae512f3 Uploaded
mmonot
parents:
diff changeset
188
c8f88ae512f3 Uploaded
mmonot
parents:
diff changeset
189 elif options.test == "H":
c8f88ae512f3 Uploaded
mmonot
parents:
diff changeset
190 print "\nPerforming a test run using test phage sequence with headful packaging"
c8f88ae512f3 Uploaded
mmonot
parents:
diff changeset
191 print "\npython PhageTerm.py -f test-data/Headful.fastq -r test-data/Headful.fasta -n TEST_headful"
c8f88ae512f3 Uploaded
mmonot
parents:
diff changeset
192 fastq = "test-data/Headful.fastq"
c8f88ae512f3 Uploaded
mmonot
parents:
diff changeset
193 reference = "test-data/Headful.fasta"
c8f88ae512f3 Uploaded
mmonot
parents:
diff changeset
194 phagename = "Test-Headful"
c8f88ae512f3 Uploaded
mmonot
parents:
diff changeset
195 surrounding = 0
c8f88ae512f3 Uploaded
mmonot
parents:
diff changeset
196
c8f88ae512f3 Uploaded
mmonot
parents:
diff changeset
197 elif options.test == "M":
c8f88ae512f3 Uploaded
mmonot
parents:
diff changeset
198 print "\nPerforming a test run using test phage sequence with Mu-like packaging"
c8f88ae512f3 Uploaded
mmonot
parents:
diff changeset
199 print "\npython PhageTerm.py -f test-data/Mu-like_R1.fastq -p test-data/Mu-like_R2.fastq -r test-data/Mu-like.fasta -n TEST_Mu-like -g test-data/Mu-like_host.fasta"
c8f88ae512f3 Uploaded
mmonot
parents:
diff changeset
200 fastq = "test-data/Mu-like_R1.fastq"
c8f88ae512f3 Uploaded
mmonot
parents:
diff changeset
201 paired = "test-data/Mu-like_R2.fastq"
c8f88ae512f3 Uploaded
mmonot
parents:
diff changeset
202 reference = "test-data/Mu-like.fasta"
c8f88ae512f3 Uploaded
mmonot
parents:
diff changeset
203 host = "test-data/Mu-like_host.fasta"
c8f88ae512f3 Uploaded
mmonot
parents:
diff changeset
204 phagename = "Test-Mu-like"
c8f88ae512f3 Uploaded
mmonot
parents:
diff changeset
205 surrounding = 0
c8f88ae512f3 Uploaded
mmonot
parents:
diff changeset
206
c8f88ae512f3 Uploaded
mmonot
parents:
diff changeset
207 ######
c8f88ae512f3 Uploaded
mmonot
parents:
diff changeset
208
c8f88ae512f3 Uploaded
mmonot
parents:
diff changeset
209
c8f88ae512f3 Uploaded
mmonot
parents:
diff changeset
210 # CHECK inputs
c8f88ae512f3 Uploaded
mmonot
parents:
diff changeset
211 phagename = checkPhageName(phagename)
c8f88ae512f3 Uploaded
mmonot
parents:
diff changeset
212
c8f88ae512f3 Uploaded
mmonot
parents:
diff changeset
213 if checkFastaFile(reference):
c8f88ae512f3 Uploaded
mmonot
parents:
diff changeset
214 exit("ERROR in reference file")
c8f88ae512f3 Uploaded
mmonot
parents:
diff changeset
215
c8f88ae512f3 Uploaded
mmonot
parents:
diff changeset
216 if host != "":
c8f88ae512f3 Uploaded
mmonot
parents:
diff changeset
217 if checkFastaFile(host):
c8f88ae512f3 Uploaded
mmonot
parents:
diff changeset
218 exit("ERROR in reference file")
c8f88ae512f3 Uploaded
mmonot
parents:
diff changeset
219
c8f88ae512f3 Uploaded
mmonot
parents:
diff changeset
220 # VARIABLE
c8f88ae512f3 Uploaded
mmonot
parents:
diff changeset
221 edge = 500
c8f88ae512f3 Uploaded
mmonot
parents:
diff changeset
222 insert_max = 1000
c8f88ae512f3 Uploaded
mmonot
parents:
diff changeset
223 limit_fixed = 35
c8f88ae512f3 Uploaded
mmonot
parents:
diff changeset
224 limit_preferred = 11
c8f88ae512f3 Uploaded
mmonot
parents:
diff changeset
225 limit_coverage = max(50,mean*2)/core
c8f88ae512f3 Uploaded
mmonot
parents:
diff changeset
226 Mu_threshold = 0.5
c8f88ae512f3 Uploaded
mmonot
parents:
diff changeset
227 draw = 0
c8f88ae512f3 Uploaded
mmonot
parents:
diff changeset
228 if seed < 15:
c8f88ae512f3 Uploaded
mmonot
parents:
diff changeset
229 seed = 15
c8f88ae512f3 Uploaded
mmonot
parents:
diff changeset
230
c8f88ae512f3 Uploaded
mmonot
parents:
diff changeset
231 # READS Number
c8f88ae512f3 Uploaded
mmonot
parents:
diff changeset
232 tot_reads = totReads(fastq)
c8f88ae512f3 Uploaded
mmonot
parents:
diff changeset
233 if paired != "":
c8f88ae512f3 Uploaded
mmonot
parents:
diff changeset
234 tot_reads_paired = totReads(paired)
c8f88ae512f3 Uploaded
mmonot
parents:
diff changeset
235 if (tot_reads != tot_reads_paired):
c8f88ae512f3 Uploaded
mmonot
parents:
diff changeset
236 print "\nWARNING: Number of reads between the two reads files differ, using single reads only\n"
c8f88ae512f3 Uploaded
mmonot
parents:
diff changeset
237 paired = ""
c8f88ae512f3 Uploaded
mmonot
parents:
diff changeset
238
c8f88ae512f3 Uploaded
mmonot
parents:
diff changeset
239 # REFERENCE sequence recovery and edge adds
c8f88ae512f3 Uploaded
mmonot
parents:
diff changeset
240 refseq = genomeFastaRecovery(reference)
c8f88ae512f3 Uploaded
mmonot
parents:
diff changeset
241 refseq = refseq[-edge:] + refseq + refseq[:edge]
c8f88ae512f3 Uploaded
mmonot
parents:
diff changeset
242
c8f88ae512f3 Uploaded
mmonot
parents:
diff changeset
243 # HOST sequence recovery
c8f88ae512f3 Uploaded
mmonot
parents:
diff changeset
244 hostseq = genomeFastaRecovery(host)
c8f88ae512f3 Uploaded
mmonot
parents:
diff changeset
245 if len(hostseq) != 0 and len(hostseq) < len(refseq):
c8f88ae512f3 Uploaded
mmonot
parents:
diff changeset
246 print "\nHost length < Phage length : removing host sequence."
c8f88ae512f3 Uploaded
mmonot
parents:
diff changeset
247 hostseq = ""
c8f88ae512f3 Uploaded
mmonot
parents:
diff changeset
248 if hostseq != "":
c8f88ae512f3 Uploaded
mmonot
parents:
diff changeset
249 hostseq = hostseq[-edge:] + hostseq + hostseq[:edge]
c8f88ae512f3 Uploaded
mmonot
parents:
diff changeset
250
c8f88ae512f3 Uploaded
mmonot
parents:
diff changeset
251
c8f88ae512f3 Uploaded
mmonot
parents:
diff changeset
252 ### COVERAGE
c8f88ae512f3 Uploaded
mmonot
parents:
diff changeset
253 print "\nCalculating coverage values, please wait (may take a while)...\n"
c8f88ae512f3 Uploaded
mmonot
parents:
diff changeset
254
c8f88ae512f3 Uploaded
mmonot
parents:
diff changeset
255 if not test_run and core == 1:
c8f88ae512f3 Uploaded
mmonot
parents:
diff changeset
256 print "If your computer has more than 1 processor, you can use the -c or --core option to speed up the process.\n\n"
c8f88ae512f3 Uploaded
mmonot
parents:
diff changeset
257
c8f88ae512f3 Uploaded
mmonot
parents:
diff changeset
258 jobs = []
c8f88ae512f3 Uploaded
mmonot
parents:
diff changeset
259 manager = Manager()
c8f88ae512f3 Uploaded
mmonot
parents:
diff changeset
260 return_dict = manager.dict()
c8f88ae512f3 Uploaded
mmonot
parents:
diff changeset
261
c8f88ae512f3 Uploaded
mmonot
parents:
diff changeset
262 # Position in core split
c8f88ae512f3 Uploaded
mmonot
parents:
diff changeset
263 file_split = int(tot_reads/core)
c8f88ae512f3 Uploaded
mmonot
parents:
diff changeset
264 position = []
c8f88ae512f3 Uploaded
mmonot
parents:
diff changeset
265
c8f88ae512f3 Uploaded
mmonot
parents:
diff changeset
266 l = range(int(tot_reads))
c8f88ae512f3 Uploaded
mmonot
parents:
diff changeset
267 part = chunks(l, core)
c8f88ae512f3 Uploaded
mmonot
parents:
diff changeset
268 for i in range(core):
c8f88ae512f3 Uploaded
mmonot
parents:
diff changeset
269 position.append(part.next()[0])
c8f88ae512f3 Uploaded
mmonot
parents:
diff changeset
270
c8f88ae512f3 Uploaded
mmonot
parents:
diff changeset
271 position = position + [int(tot_reads)]
c8f88ae512f3 Uploaded
mmonot
parents:
diff changeset
272
c8f88ae512f3 Uploaded
mmonot
parents:
diff changeset
273 for i in range(0, core):
c8f88ae512f3 Uploaded
mmonot
parents:
diff changeset
274 process = multiprocessing.Process(target=readsCoverage, args=(fastq, refseq, hostseq, tot_reads, seed, edge, paired, insert_max, core, i, return_dict, position[i], position[i+1], limit_coverage))
c8f88ae512f3 Uploaded
mmonot
parents:
diff changeset
275 jobs.append(process)
c8f88ae512f3 Uploaded
mmonot
parents:
diff changeset
276
c8f88ae512f3 Uploaded
mmonot
parents:
diff changeset
277 for j in jobs:
c8f88ae512f3 Uploaded
mmonot
parents:
diff changeset
278 j.start()
c8f88ae512f3 Uploaded
mmonot
parents:
diff changeset
279
c8f88ae512f3 Uploaded
mmonot
parents:
diff changeset
280 for j in jobs:
c8f88ae512f3 Uploaded
mmonot
parents:
diff changeset
281 j.join()
c8f88ae512f3 Uploaded
mmonot
parents:
diff changeset
282
c8f88ae512f3 Uploaded
mmonot
parents:
diff changeset
283 print "\n\nFinished calculating coverage values, the remainder should be completed rapidly\n"
c8f88ae512f3 Uploaded
mmonot
parents:
diff changeset
284
c8f88ae512f3 Uploaded
mmonot
parents:
diff changeset
285 # merging results
c8f88ae512f3 Uploaded
mmonot
parents:
diff changeset
286 for core_id in range(core):
c8f88ae512f3 Uploaded
mmonot
parents:
diff changeset
287 if core_id == 0:
c8f88ae512f3 Uploaded
mmonot
parents:
diff changeset
288 termini_coverage = return_dict[core_id][0]
c8f88ae512f3 Uploaded
mmonot
parents:
diff changeset
289 whole_coverage = return_dict[core_id][1]
c8f88ae512f3 Uploaded
mmonot
parents:
diff changeset
290 paired_whole_coverage = return_dict[core_id][2]
c8f88ae512f3 Uploaded
mmonot
parents:
diff changeset
291 phage_hybrid_coverage = return_dict[core_id][3]
c8f88ae512f3 Uploaded
mmonot
parents:
diff changeset
292 host_hybrid_coverage = return_dict[core_id][4]
c8f88ae512f3 Uploaded
mmonot
parents:
diff changeset
293 host_whole_coverage = return_dict[core_id][5]
c8f88ae512f3 Uploaded
mmonot
parents:
diff changeset
294 list_hybrid = return_dict[core_id][6]
c8f88ae512f3 Uploaded
mmonot
parents:
diff changeset
295 insert = return_dict[core_id][7].tolist()
c8f88ae512f3 Uploaded
mmonot
parents:
diff changeset
296 paired_missmatch = return_dict[core_id][8]
c8f88ae512f3 Uploaded
mmonot
parents:
diff changeset
297 reads_tested = return_dict[core_id][9]
c8f88ae512f3 Uploaded
mmonot
parents:
diff changeset
298 else:
c8f88ae512f3 Uploaded
mmonot
parents:
diff changeset
299 termini_coverage += return_dict[core_id][0]
c8f88ae512f3 Uploaded
mmonot
parents:
diff changeset
300 whole_coverage += return_dict[core_id][1]
c8f88ae512f3 Uploaded
mmonot
parents:
diff changeset
301 paired_whole_coverage += return_dict[core_id][2]
c8f88ae512f3 Uploaded
mmonot
parents:
diff changeset
302 phage_hybrid_coverage += return_dict[core_id][3]
c8f88ae512f3 Uploaded
mmonot
parents:
diff changeset
303 host_hybrid_coverage += return_dict[core_id][4]
c8f88ae512f3 Uploaded
mmonot
parents:
diff changeset
304 host_whole_coverage += return_dict[core_id][5]
c8f88ae512f3 Uploaded
mmonot
parents:
diff changeset
305 list_hybrid += return_dict[core_id][6]
c8f88ae512f3 Uploaded
mmonot
parents:
diff changeset
306 insert += return_dict[core_id][7].tolist()
c8f88ae512f3 Uploaded
mmonot
parents:
diff changeset
307 paired_missmatch += return_dict[core_id][8]
c8f88ae512f3 Uploaded
mmonot
parents:
diff changeset
308 reads_tested += return_dict[core_id][9]
c8f88ae512f3 Uploaded
mmonot
parents:
diff changeset
309
c8f88ae512f3 Uploaded
mmonot
parents:
diff changeset
310 termini_coverage = termini_coverage.tolist()
c8f88ae512f3 Uploaded
mmonot
parents:
diff changeset
311 whole_coverage = whole_coverage.tolist()
c8f88ae512f3 Uploaded
mmonot
parents:
diff changeset
312 paired_whole_coverage = paired_whole_coverage.tolist()
c8f88ae512f3 Uploaded
mmonot
parents:
diff changeset
313 phage_hybrid_coverage = phage_hybrid_coverage.tolist()
c8f88ae512f3 Uploaded
mmonot
parents:
diff changeset
314 host_hybrid_coverage = host_hybrid_coverage.tolist()
c8f88ae512f3 Uploaded
mmonot
parents:
diff changeset
315 host_whole_coverage = host_whole_coverage.tolist()
c8f88ae512f3 Uploaded
mmonot
parents:
diff changeset
316 list_hybrid = list_hybrid.tolist()
c8f88ae512f3 Uploaded
mmonot
parents:
diff changeset
317
c8f88ae512f3 Uploaded
mmonot
parents:
diff changeset
318
c8f88ae512f3 Uploaded
mmonot
parents:
diff changeset
319 # WHOLE Coverage : Average, Maximum and Minimum
c8f88ae512f3 Uploaded
mmonot
parents:
diff changeset
320 added_whole_coverage, ave_whole_cov = wholeCov(whole_coverage, len(refseq))
c8f88ae512f3 Uploaded
mmonot
parents:
diff changeset
321 added_paired_whole_coverage, ave_paired_whole_cov = wholeCov(paired_whole_coverage, len(refseq))
c8f88ae512f3 Uploaded
mmonot
parents:
diff changeset
322 added_host_whole_coverage, ave_host_whole_cov = wholeCov(host_whole_coverage, len(hostseq))
c8f88ae512f3 Uploaded
mmonot
parents:
diff changeset
323
c8f88ae512f3 Uploaded
mmonot
parents:
diff changeset
324 drop_cov = testwholeCov(added_whole_coverage, ave_whole_cov, test_run)
c8f88ae512f3 Uploaded
mmonot
parents:
diff changeset
325
c8f88ae512f3 Uploaded
mmonot
parents:
diff changeset
326 # NORM peak by whole coverage (1 base)
c8f88ae512f3 Uploaded
mmonot
parents:
diff changeset
327 if paired != "":
c8f88ae512f3 Uploaded
mmonot
parents:
diff changeset
328 paired_whole_coverage_test = maxPaired(paired_whole_coverage, whole_coverage)
c8f88ae512f3 Uploaded
mmonot
parents:
diff changeset
329 termini_coverage_norm, mean_nc = normCov(termini_coverage, paired_whole_coverage, ave_whole_cov/1.5, edge)
c8f88ae512f3 Uploaded
mmonot
parents:
diff changeset
330 else:
c8f88ae512f3 Uploaded
mmonot
parents:
diff changeset
331 termini_coverage_norm, mean_nc = normCov(termini_coverage, whole_coverage, ave_whole_cov/1.5, edge)
c8f88ae512f3 Uploaded
mmonot
parents:
diff changeset
332
c8f88ae512f3 Uploaded
mmonot
parents:
diff changeset
333 # REMOVE edge
c8f88ae512f3 Uploaded
mmonot
parents:
diff changeset
334 termini_coverage[0] = RemoveEdge(termini_coverage[0],edge)
c8f88ae512f3 Uploaded
mmonot
parents:
diff changeset
335 termini_coverage[1] = RemoveEdge(termini_coverage[1],edge)
c8f88ae512f3 Uploaded
mmonot
parents:
diff changeset
336 termini_coverage_norm[0] = RemoveEdge(termini_coverage_norm[0],edge)
c8f88ae512f3 Uploaded
mmonot
parents:
diff changeset
337 termini_coverage_norm[1] = RemoveEdge(termini_coverage_norm[1],edge)
c8f88ae512f3 Uploaded
mmonot
parents:
diff changeset
338 whole_coverage[0] = RemoveEdge(whole_coverage[0],edge)
c8f88ae512f3 Uploaded
mmonot
parents:
diff changeset
339 whole_coverage[1] = RemoveEdge(whole_coverage[1],edge)
c8f88ae512f3 Uploaded
mmonot
parents:
diff changeset
340 paired_whole_coverage[0] = RemoveEdge(paired_whole_coverage[0],edge)
c8f88ae512f3 Uploaded
mmonot
parents:
diff changeset
341 paired_whole_coverage[1] = RemoveEdge(paired_whole_coverage[1],edge)
c8f88ae512f3 Uploaded
mmonot
parents:
diff changeset
342 added_whole_coverage = RemoveEdge(added_whole_coverage,edge)
c8f88ae512f3 Uploaded
mmonot
parents:
diff changeset
343 added_paired_whole_coverage = RemoveEdge(added_paired_whole_coverage,edge)
c8f88ae512f3 Uploaded
mmonot
parents:
diff changeset
344 added_host_whole_coverage = RemoveEdge(added_host_whole_coverage,edge)
c8f88ae512f3 Uploaded
mmonot
parents:
diff changeset
345 phage_hybrid_coverage[0] = RemoveEdge(phage_hybrid_coverage[0],edge)
c8f88ae512f3 Uploaded
mmonot
parents:
diff changeset
346 phage_hybrid_coverage[1] = RemoveEdge(phage_hybrid_coverage[1],edge)
c8f88ae512f3 Uploaded
mmonot
parents:
diff changeset
347 host_whole_coverage[0] = RemoveEdge(host_whole_coverage[0],edge)
c8f88ae512f3 Uploaded
mmonot
parents:
diff changeset
348 host_whole_coverage[1] = RemoveEdge(host_whole_coverage[1],edge)
c8f88ae512f3 Uploaded
mmonot
parents:
diff changeset
349 host_hybrid_coverage[0] = RemoveEdge(host_hybrid_coverage[0],edge)
c8f88ae512f3 Uploaded
mmonot
parents:
diff changeset
350 host_hybrid_coverage[1] = RemoveEdge(host_hybrid_coverage[1],edge)
c8f88ae512f3 Uploaded
mmonot
parents:
diff changeset
351 refseq = RemoveEdge(refseq,edge)
c8f88ae512f3 Uploaded
mmonot
parents:
diff changeset
352 if host != "":
c8f88ae512f3 Uploaded
mmonot
parents:
diff changeset
353 hostseq = RemoveEdge(hostseq,edge)
c8f88ae512f3 Uploaded
mmonot
parents:
diff changeset
354 gen_len = len(refseq)
c8f88ae512f3 Uploaded
mmonot
parents:
diff changeset
355 host_len = len(hostseq)
c8f88ae512f3 Uploaded
mmonot
parents:
diff changeset
356 if options.test == "DL":
c8f88ae512f3 Uploaded
mmonot
parents:
diff changeset
357 gen_len = 100000
c8f88ae512f3 Uploaded
mmonot
parents:
diff changeset
358
c8f88ae512f3 Uploaded
mmonot
parents:
diff changeset
359
c8f88ae512f3 Uploaded
mmonot
parents:
diff changeset
360 # READS Total, Used and Lost
c8f88ae512f3 Uploaded
mmonot
parents:
diff changeset
361 used_reads, lost_reads, lost_perc = usedReads(termini_coverage, reads_tested)
c8f88ae512f3 Uploaded
mmonot
parents:
diff changeset
362
c8f88ae512f3 Uploaded
mmonot
parents:
diff changeset
363 # PIC Max
c8f88ae512f3 Uploaded
mmonot
parents:
diff changeset
364 picMaxPlus, picMaxMinus, TopFreqH = picMax(termini_coverage, 5)
c8f88ae512f3 Uploaded
mmonot
parents:
diff changeset
365 picMaxPlus_norm, picMaxMinus_norm, TopFreqH_norm = picMax(termini_coverage_norm, 5)
c8f88ae512f3 Uploaded
mmonot
parents:
diff changeset
366 picMaxPlus_host, picMaxMinus_host, TopFreqH_host = picMax(host_whole_coverage, 5)
c8f88ae512f3 Uploaded
mmonot
parents:
diff changeset
367
c8f88ae512f3 Uploaded
mmonot
parents:
diff changeset
368 ### ANALYSIS
c8f88ae512f3 Uploaded
mmonot
parents:
diff changeset
369
c8f88ae512f3 Uploaded
mmonot
parents:
diff changeset
370 ## Close Peaks
c8f88ae512f3 Uploaded
mmonot
parents:
diff changeset
371 picMaxPlus, picOUT_forw = RemoveClosePicMax(picMaxPlus, gen_len, surrounding)
c8f88ae512f3 Uploaded
mmonot
parents:
diff changeset
372 picMaxMinus, picOUT_rev = RemoveClosePicMax(picMaxMinus, gen_len, surrounding)
c8f88ae512f3 Uploaded
mmonot
parents:
diff changeset
373 picMaxPlus_norm, picOUT_norm_forw = RemoveClosePicMax(picMaxPlus_norm, gen_len, surrounding)
c8f88ae512f3 Uploaded
mmonot
parents:
diff changeset
374 picMaxMinus_norm, picOUT_norm_rev = RemoveClosePicMax(picMaxMinus_norm, gen_len, surrounding)
c8f88ae512f3 Uploaded
mmonot
parents:
diff changeset
375
c8f88ae512f3 Uploaded
mmonot
parents:
diff changeset
376 termini_coverage_close = termini_coverage[:]
c8f88ae512f3 Uploaded
mmonot
parents:
diff changeset
377 termini_coverage_close[0], picOUT_forw = addClosePic(termini_coverage[0], picOUT_forw)
c8f88ae512f3 Uploaded
mmonot
parents:
diff changeset
378 termini_coverage_close[1], picOUT_rev = addClosePic(termini_coverage[1], picOUT_rev)
c8f88ae512f3 Uploaded
mmonot
parents:
diff changeset
379
c8f88ae512f3 Uploaded
mmonot
parents:
diff changeset
380 termini_coverage_norm_close = termini_coverage_norm[:]
c8f88ae512f3 Uploaded
mmonot
parents:
diff changeset
381 termini_coverage_norm_close[0], picOUT_norm_forw = addClosePic(termini_coverage_norm[0], picOUT_norm_forw, 1)
c8f88ae512f3 Uploaded
mmonot
parents:
diff changeset
382 termini_coverage_norm_close[1], picOUT_norm_rev = addClosePic(termini_coverage_norm[1], picOUT_norm_rev, 1)
c8f88ae512f3 Uploaded
mmonot
parents:
diff changeset
383
c8f88ae512f3 Uploaded
mmonot
parents:
diff changeset
384
c8f88ae512f3 Uploaded
mmonot
parents:
diff changeset
385 ## Statistical Analysis
c8f88ae512f3 Uploaded
mmonot
parents:
diff changeset
386 picMaxPlus_norm_close, picMaxMinus_norm_close, TopFreqH_norm = picMax(termini_coverage_norm_close, 5)
c8f88ae512f3 Uploaded
mmonot
parents:
diff changeset
387
c8f88ae512f3 Uploaded
mmonot
parents:
diff changeset
388 if paired != "":
c8f88ae512f3 Uploaded
mmonot
parents:
diff changeset
389 phage_norm, phage_plus_norm, phage_minus_norm = test_pics_decision_tree(paired_whole_coverage, termini_coverage, termini_coverage_norm, termini_coverage_norm_close)
c8f88ae512f3 Uploaded
mmonot
parents:
diff changeset
390 else:
c8f88ae512f3 Uploaded
mmonot
parents:
diff changeset
391 phage_norm, phage_plus_norm, phage_minus_norm = test_pics_decision_tree(whole_coverage, termini_coverage, termini_coverage_norm, termini_coverage_norm_close)
c8f88ae512f3 Uploaded
mmonot
parents:
diff changeset
392
c8f88ae512f3 Uploaded
mmonot
parents:
diff changeset
393
c8f88ae512f3 Uploaded
mmonot
parents:
diff changeset
394 ## LI Analysis
c8f88ae512f3 Uploaded
mmonot
parents:
diff changeset
395 picMaxPlus_close, picMaxMinus_close, TopFreqH = picMax(termini_coverage_close, 5)
c8f88ae512f3 Uploaded
mmonot
parents:
diff changeset
396
c8f88ae512f3 Uploaded
mmonot
parents:
diff changeset
397 R1, AveFreq = ratioR1(TopFreqH, used_reads, gen_len)
c8f88ae512f3 Uploaded
mmonot
parents:
diff changeset
398 R2 = ratioR(picMaxPlus_close)
c8f88ae512f3 Uploaded
mmonot
parents:
diff changeset
399 R3 = ratioR(picMaxMinus_close)
c8f88ae512f3 Uploaded
mmonot
parents:
diff changeset
400
c8f88ae512f3 Uploaded
mmonot
parents:
diff changeset
401 ArtPackmode, termini, forward, reverse = packMode(R1, R2, R3)
c8f88ae512f3 Uploaded
mmonot
parents:
diff changeset
402 ArtOrient = orientation(picMaxPlus_close, picMaxMinus_close)
c8f88ae512f3 Uploaded
mmonot
parents:
diff changeset
403 ArtcohesiveSeq, ArtPackmode = sequenceCohesive(ArtPackmode, refseq, picMaxPlus_close, picMaxMinus_close, gen_len/2)
c8f88ae512f3 Uploaded
mmonot
parents:
diff changeset
404
c8f88ae512f3 Uploaded
mmonot
parents:
diff changeset
405
c8f88ae512f3 Uploaded
mmonot
parents:
diff changeset
406 ### DECISION Process
c8f88ae512f3 Uploaded
mmonot
parents:
diff changeset
407
c8f88ae512f3 Uploaded
mmonot
parents:
diff changeset
408 # PEAKS Significance
c8f88ae512f3 Uploaded
mmonot
parents:
diff changeset
409 plus_significant = selectSignificant(phage_plus_norm, 1.0/gen_len, limit_preferred)
c8f88ae512f3 Uploaded
mmonot
parents:
diff changeset
410 minus_significant = selectSignificant(phage_minus_norm, 1.0/gen_len, limit_preferred)
c8f88ae512f3 Uploaded
mmonot
parents:
diff changeset
411
c8f88ae512f3 Uploaded
mmonot
parents:
diff changeset
412 # DECISION
c8f88ae512f3 Uploaded
mmonot
parents:
diff changeset
413 Redundant, Permuted, P_class, P_type, P_seqcoh, P_concat, P_orient, P_left, P_right, Mu_like = decisionProcess(plus_significant, minus_significant, limit_fixed, gen_len, paired, insert, R1, list_hybrid, used_reads, seed, phage_hybrid_coverage, Mu_threshold, refseq, hostseq)
c8f88ae512f3 Uploaded
mmonot
parents:
diff changeset
414
c8f88ae512f3 Uploaded
mmonot
parents:
diff changeset
415
c8f88ae512f3 Uploaded
mmonot
parents:
diff changeset
416 ### EXPORT Data
c8f88ae512f3 Uploaded
mmonot
parents:
diff changeset
417
c8f88ae512f3 Uploaded
mmonot
parents:
diff changeset
418 ## Statistics
c8f88ae512f3 Uploaded
mmonot
parents:
diff changeset
419 ExportStatistics(phagename, whole_coverage, paired_whole_coverage, termini_coverage, phage_plus_norm, phage_minus_norm, paired, test_run)
c8f88ae512f3 Uploaded
mmonot
parents:
diff changeset
420
c8f88ae512f3 Uploaded
mmonot
parents:
diff changeset
421 # Sequence
c8f88ae512f3 Uploaded
mmonot
parents:
diff changeset
422 ExportCohesiveSeq(phagename, ArtcohesiveSeq, P_seqcoh, test_run)
c8f88ae512f3 Uploaded
mmonot
parents:
diff changeset
423 ExportPhageSequence(phagename, P_left, P_right, refseq, P_orient, Redundant, Mu_like, P_class, P_seqcoh, test_run)
c8f88ae512f3 Uploaded
mmonot
parents:
diff changeset
424
c8f88ae512f3 Uploaded
mmonot
parents:
diff changeset
425 # Report
c8f88ae512f3 Uploaded
mmonot
parents:
diff changeset
426 CreateReport(phagename, seed, added_whole_coverage, draw, Redundant, P_left, P_right, Permuted, P_orient, termini_coverage_norm_close, picMaxPlus_norm_close, picMaxMinus_norm_close, gen_len, tot_reads, P_seqcoh, phage_plus_norm, phage_minus_norm, ArtPackmode, termini, forward, reverse, ArtOrient, ArtcohesiveSeq, termini_coverage_close, picMaxPlus_close, picMaxMinus_close, picOUT_norm_forw, picOUT_norm_rev, picOUT_forw, picOUT_rev, lost_perc, ave_whole_cov, R1, R2, R3, host, host_len, host_whole_coverage, picMaxPlus_host, picMaxMinus_host, surrounding, drop_cov, paired, insert, phage_hybrid_coverage, host_hybrid_coverage, added_paired_whole_coverage, Mu_like, test_run, P_class, P_type, P_concat)
c8f88ae512f3 Uploaded
mmonot
parents:
diff changeset
427