annotate SpliceTrap.pl @ 5:2ebca9da5e42 draft default tip

planemo upload
author bioitcore
date Thu, 07 Sep 2017 17:39:24 -0400
parents adc0f7765d85
children
Ignore whitespace changes - Everywhere: Within whitespace: At end of lines:
rev   line source
1
adc0f7765d85 planemo upload
bioitcore
parents:
diff changeset
1 #!/usr/bin/perl
adc0f7765d85 planemo upload
bioitcore
parents:
diff changeset
2 # Author: wuj@cshl.edu
adc0f7765d85 planemo upload
bioitcore
parents:
diff changeset
3 # Modified: Baekdoo Kim (baegi7942@gmail.com)
adc0f7765d85 planemo upload
bioitcore
parents:
diff changeset
4 use strict;
adc0f7765d85 planemo upload
bioitcore
parents:
diff changeset
5 use Getopt::Long;
adc0f7765d85 planemo upload
bioitcore
parents:
diff changeset
6 use Data::Dumper;
adc0f7765d85 planemo upload
bioitcore
parents:
diff changeset
7 ####################
adc0f7765d85 planemo upload
bioitcore
parents:
diff changeset
8 use Cwd;
adc0f7765d85 planemo upload
bioitcore
parents:
diff changeset
# Invocation context: the script name as called, the absolute directory the
# run was started from, and the resolved absolute path of the script itself.
my $PROG          = $0;
my $CUR_DIR       = Cwd::abs_path(Cwd::cwd());
my $PROG_ABS_PATH = Cwd::abs_path($PROG);

# Earlier ways of locating the install folder, kept for reference only.
#my $SrcFolder=`dirname $PROG_ABS_PATH`;
#chomp($SrcFolder);
#my %config=do "$ENV{HOME}/.SpliceTrap.pl.ini";
#my $SrcFolder=$config{SrcFolder};

# Commands that must be resolvable by the shell before anything else runs
# (presumably used by the helper scripts as well as by this file).
my @programs = qw(
    R echo cat bash perl ln mkdir paste grep sort
    basename awk wc mv cd rm split head
);
for my $tool (@programs) {
    # `hash` exits non-zero when the shell cannot locate the command.
    my $lookup_status = system("hash $tool >/dev/null");
    die("CHECK: $tool not found\n") if ($lookup_status);
}
adc0f7765d85 planemo upload
bioitcore
parents:
diff changeset
23
adc0f7765d85 planemo upload
bioitcore
parents:
diff changeset
24 ####################
adc0f7765d85 planemo upload
bioitcore
parents:
diff changeset
# Option defaults; GetOptions below overwrites whichever ones are supplied.
my $SrcFolder="";           # -l  install location (checked later, required)
my $MapSoftware="bowtie";   # -m  bowtie or rmap
my $DatabasePrefix="hg38";  # -d  database name under $SrcFolder/db
my $ReadFileFormat="";      # filled in later by sniffing the read files
my $ReadFile1Name="";       # -1
my $ReadFile2Name="";       # -2  (empty means single-end)
my $CutoffLevel="M";        # -c  H, M or L
my $Outputfolder=$CUR_DIR;  # --outdir
my $OutputPrefix="Result";  # -o
#my $CutoffOnly=0;
my $ReadSize=36;            # -s
my $JunctionCut=5;          # -j
my $onGalaxy_raw="";        # Galaxy target for the .raw result
my $onGalaxy_txt="";        # Galaxy target for the .txt result
my $BowtieThreads=1;        # -p
my $noIRMstr="";            # set to "noirm" later when --noIRM is given
my $noIRM = 0;              # --noIRM / --noirm

# Index of the last raw command-line token, recorded before option parsing.
my $num_args = $#ARGV;

GetOptions (
    "l:s"=>\$SrcFolder,
    "m:s"=>\$MapSoftware,
    "d:s"=>\$DatabasePrefix,
#   "f:s"=>\$ReadFileFormat,
    "1:s"=>\$ReadFile1Name,
    "2:s"=>\$ReadFile2Name,
    "c:s"=>\$CutoffLevel,
    "outdir:s"=>\$Outputfolder,
    "o:s"=>\$OutputPrefix,
    "j:i"=>\$JunctionCut,
    "s:i"=>\$ReadSize,
    "p:i"=>\$BowtieThreads,
    "noIRM|noirm"=>\$noIRM
#   "local:s"=>\$local,
#   "rerun"=>\$CutoffOnly
);

# The two Galaxy output paths are the trailing positional arguments.
# GetOptions removes every option (and its value) it recognises from @ARGV,
# so whatever is left are genuine positionals. Taking the last two raw tokens
# *before* parsing, as was done previously, mistook option values such as the
# "-2 reads.fq" pair for output paths and let the final copy step overwrite
# an input file when no Galaxy outputs were supplied.
if (@ARGV >= 2) {
    ($onGalaxy_raw, $onGalaxy_txt) = @ARGV[-2, -1];
}
adc0f7765d85 planemo upload
bioitcore
parents:
diff changeset
64 #-O for galaxy output
adc0f7765d85 planemo upload
bioitcore
parents:
diff changeset
65
adc0f7765d85 planemo upload
bioitcore
parents:
diff changeset
66
adc0f7765d85 planemo upload
bioitcore
parents:
diff changeset
# Quick-help text printed when the arguments are rejected. Bracketed values
# are the defaults; the database default shown here must match the initial
# value of $DatabasePrefix (hg38).
my $InputParaDes=" Usage of the script:
-l Base Location (required)
-m Mapping software: [bowtie]/rmap
-d Database prefix: [hg38]/mm9/rn4/userdefined
-1 Read File 1
-2 Read File 2
-c Cutoff Level:H/[M]/L
Means High, Middle or Low
-j Junction reads requirement per junction for each exon-isoform [5]
-o Output prefix {Result}
-s Read Size [36]
--outdir Output folder [./]
-p Bowtie parameter, threads number, only use this when you don't use qsub [1]
--noIRM Skip the IRM correction step

This is a quick help, please refer to the README file for details.
";
adc0f7765d85 planemo upload
bioitcore
parents:
diff changeset
84
adc0f7765d85 planemo upload
bioitcore
parents:
diff changeset
85
adc0f7765d85 planemo upload
bioitcore
parents:
diff changeset
# Argument validation. Each rejection prints its message and exits with
# status 1, so the calling process can tell a refused invocation from a
# successful run (a bare `exit` reports success).

# -l is mandatory: every helper script and database is located beneath it.
if($SrcFolder eq "") {
    print "[CHECK] - Please provide the location of the script (option '-l')\n\n";
    exit 1;
}

# No second read file given: reuse the first one. Identical names are what
# the later steps use to recognise single-end mode.
if($ReadFile2Name eq "")
{
    $ReadFile2Name = $ReadFile1Name;
}

# After the fallback above the second name is empty only if the first is,
# so testing the first name covers both.
if($ReadFile1Name eq "")
{
    print $InputParaDes;
    exit 1;
}

if($BowtieThreads < 1)
{
    print $InputParaDes;
    exit 1;
}

# The chosen database must provide a "parallel" entry under the install folder.
if (! -e "$SrcFolder/db/$DatabasePrefix/parallel")
{
    print "CHECK: Error, the database you specified is not properly installed.\n";
    #print $InputParaDes;
    exit 1;
}

# Only the three documented cutoff levels are accepted.
if($CutoffLevel ne "H" and $CutoffLevel ne "M" and $CutoffLevel ne "L")
{
    print $InputParaDes;
    exit 1;
}
adc0f7765d85 planemo upload
bioitcore
parents:
diff changeset
122
adc0f7765d85 planemo upload
bioitcore
parents:
diff changeset
123
adc0f7765d85 planemo upload
bioitcore
parents:
diff changeset
# Resolve both read files to absolute paths. Cwd::abs_path can return undef
# when a path cannot be resolved; report that using the name the user gave
# instead of continuing with an undefined path.
for my $name_ref (\$ReadFile1Name, \$ReadFile2Name)
{
    my $resolved = Cwd::abs_path($$name_ref);
    die ("CHECK: Error when opening $$name_ref\n") unless defined $resolved;
    $$name_ref = $resolved;
}

#check the files

# Determine the format of a read file from the first character of its first
# line: ">" means fasta, "@" means fastq.
#   $path - file to inspect
# Returns "fasta" or "fastq".
# Dies with a CHECK message when the file cannot be opened, is empty, or
# starts with any other character.
sub detect_read_format
{
    my ($path) = @_;

    # Three-argument open with a lexical handle: the file name can never be
    # interpreted as an open mode or a pipe.
    open(my $reads_fh, '<', $path) or die ("CHECK: Error when opening $path\n");
    my $first_line = <$reads_fh>;
    close($reads_fh);

    my $lead_char = defined($first_line) ? substr($first_line,0,1) : "";
    return "fasta" if ($lead_char eq ">");
    return "fastq" if ($lead_char eq "@");
    die("CHECK: ERROR:Please check $path\n");
}

$ReadFileFormat = detect_read_format($ReadFile1Name);

# The second file must be readable and in the same format as the first.
if(detect_read_format($ReadFile2Name) ne $ReadFileFormat)
{
    die("CHECK: $ReadFile2Name has a different format as $ReadFile1Name\n");
}
adc0f7765d85 planemo upload
bioitcore
parents:
diff changeset
159
adc0f7765d85 planemo upload
bioitcore
parents:
diff changeset
# Work with the absolute form of the output folder from here on.
$Outputfolder = Cwd::abs_path($Outputfolder);

# /tmp itself is not used as the output folder: keep drawing random names
# beneath it until one is found that does not exist yet.
if ($Outputfolder eq "/tmp") {
    $Outputfolder = "/tmp/" . random_sessid() while (-e $Outputfolder);
}

# Create the folder when it is missing, then insist that it is a directory.
unless (-e $Outputfolder) {
    mkdir($Outputfolder) or die "CHECK: cannot mkdir $Outputfolder\n";
}
die "CHECK: $Outputfolder is not a folder\n" unless (-d $Outputfolder);
adc0f7765d85 planemo upload
bioitcore
parents:
diff changeset
179
adc0f7765d85 planemo upload
bioitcore
parents:
diff changeset
# Make sure the selected mapping program can actually be run.
if($MapSoftware eq "bowtie")
{
    print "CHECK: whether bowtie installed and in PATH\n";
    # Any output from `bowtie --version` is taken as proof that it is installed.
    my $bowtiechecker=`bowtie --version`;
    if(defined($bowtiechecker) and $bowtiechecker ne "")
    {
        print "CHECK: bowtie found, information below:\n";
        print $bowtiechecker,"\n";
    }
    else
    {
        die "CHECK: No bowtie found in PATH, EXIT!\n";
    }
}
elsif($MapSoftware eq "rmap")
{
    print "CHECK: checking rmap...\n";
    # system() runs this through /bin/sh, so use the portable redirection.
    # The bash-only "&>" is read by a POSIX sh as "run in background, then
    # redirect nothing", which returns 0 even when rmap is missing.
    if(system("type rmap >/dev/null 2>&1") == 0)
    {
        print "CHECK: rmap found, continue\n";
    }
    else
    {
        die "CHECK: No rmap found in PATH, EXIT!\n";
    }
}
else
{
    die "CHECK: option -m only takes rmap or bowtie as inputs\n";
}
adc0f7765d85 planemo upload
bioitcore
parents:
diff changeset
210
adc0f7765d85 planemo upload
bioitcore
parents:
diff changeset
# -s must be a positive read length. Zero (also what a value-less -s yields)
# and negative numbers are both rejected, mirroring the thread-count check.
if($ReadSize < 1)
{
    die "CHECK: Please check option -s Read size\n";
}

# The helper scripts receive the flag as the literal word "noirm".
if($noIRM)
{
    $noIRMstr= "noirm";
}
adc0f7765d85 planemo upload
bioitcore
parents:
diff changeset
220
adc0f7765d85 planemo upload
bioitcore
parents:
diff changeset
221 #write more checks later
adc0f7765d85 planemo upload
bioitcore
parents:
diff changeset
# Echo the effective settings, one "PARAMETERS:<TAB>label value" line each.
{
    my @settings = (
        "Mapping software: " . $MapSoftware,
        "Database prefix: " . $DatabasePrefix,
        "Read end 1: " . $ReadFile1Name,
    );

    # The second read file is listed only when it differs from the first.
    push(@settings, "Read end 2: " . $ReadFile2Name) if ($ReadFile2Name ne $ReadFile1Name);

    push(@settings,
        "Galaxy_raw: " . $onGalaxy_raw,
        "Galaxy_txt: " . $onGalaxy_txt,
        "Cutoff level: " . $CutoffLevel,
        "Junction reads.min:" . $JunctionCut,
        "Output folder: " . $Outputfolder,
        "Output prefix: " . $OutputPrefix,
        "Read size: " . $ReadSize,
        "Bowtie threads #: " . $BowtieThreads,
    );

    push(@settings, "No IRM.") if ($noIRM);

    foreach my $setting (@settings) {
        print "PARAMETERS:\t" . $setting . "\n";
    }
}
adc0f7765d85 planemo upload
bioitcore
parents:
diff changeset
235
adc0f7765d85 planemo upload
bioitcore
parents:
diff changeset
# Run the three pipeline stages for the selected mapper. Both mappers share
# stages 2 and 3; only the mapping script differs, and only the bowtie one
# receives the thread count.
if($MapSoftware eq "bowtie" or $MapSoftware eq "rmap")
{
    # Run one helper script from $SrcFolder/bin through bash.
    # The list form of system() bypasses the shell, so paths containing spaces
    # or shell metacharacters reach the script as single, literal arguments.
    # Empty values are dropped, which matches how they vanished when the
    # command was a whitespace-split string (e.g. $noIRMstr when unset).
    # NOTE(review): exit statuses are still ignored, as before; whether the
    # helper scripts return meaningful statuses cannot be told from this file.
    my $run_script = sub {
        my ($script, @script_args) = @_;
        return system("bash", "$SrcFolder/bin/$script", grep { defined($_) and length($_) } @script_args);
    };

    my $mapping_script = "mapping_$MapSoftware.sh";
    my @mapping_tail = ($ReadFileFormat, $DatabasePrefix, $Outputfolder, $SrcFolder);
    push(@mapping_tail, $BowtieThreads) if($MapSoftware eq "bowtie");

    print "=================STAGE 1 MAPPING===================\n";
    $run_script->($mapping_script, $ReadFile1Name, @mapping_tail);
    # Identical file names mean single-end mode: map only once.
    $run_script->($mapping_script, $ReadFile2Name, @mapping_tail) if($ReadFile2Name ne $ReadFile1Name);

    print "=================STAGE 2 ESTIMATION================\n";
    # ratio, log, nums
    $run_script->("batch_para_cov10p_fit.sh", $ReadFile1Name, $ReadFile2Name, $OutputPrefix, $ReadSize, $DatabasePrefix, $Outputfolder, $SrcFolder, $noIRMstr);

    print "=================STAGE 3 CUTOFF====================\n";
    # raw
    $run_script->("apply_cutoff.sh", $OutputPrefix, $CutoffLevel, $Outputfolder, $JunctionCut, $SrcFolder, $noIRMstr);
}
adc0f7765d85 planemo upload
bioitcore
parents:
diff changeset
265
adc0f7765d85 planemo upload
bioitcore
parents:
diff changeset
266 #print "============ALL DONE, OUTPUTFILE:$OutputPrefix.txt\n";
adc0f7765d85 planemo upload
bioitcore
parents:
diff changeset
267
adc0f7765d85 planemo upload
bioitcore
parents:
diff changeset
# Copy the results to the Galaxy output files, then remove the intermediates.
{
    # Wrap a value in single quotes for /bin/sh, escaping embedded quotes, so
    # that paths with spaces or metacharacters stay one literal word.
    my $sh_quote = sub {
        my ($text) = @_;
        $text =~ s/'/'\\''/g;
        return "'" . $text . "'";
    };

    # Quoted "<output folder>/<prefix>"; suffixes are appended outside the
    # quotes so the shell can still expand the ".*" glob during cleanup.
    my $result_base = $sh_quote->("$Outputfolder/$OutputPrefix");

    # Export only when both Galaxy targets are known. Lines containing "na"
    # are filtered out of each exported file.
    if($onGalaxy_raw ne "" && $onGalaxy_txt ne "")
    {
        print "OUTPUTFILE:$OutputPrefix.raw\n";
        system("grep -v na $result_base.raw >" . $sh_quote->($onGalaxy_raw));
        print "OUTPUTFILE:$OutputPrefix.txt\n";
        system("grep -v na $result_base.txt >" . $sh_quote->($onGalaxy_txt));
    }

    print "============Clean up\n";
    system("rm -r $result_base.*");
}
adc0f7765d85 planemo upload
bioitcore
parents:
diff changeset
278
adc0f7765d85 planemo upload
bioitcore
parents:
diff changeset
# Return a random 10-character identifier made of ASCII letters only
# (a-z and A-Z); digits are deliberately not part of the alphabet.
sub random_sessid {
    #my @chars = (0..9,a..z,A..Z);
    my @alphabet = ('a'..'z', 'A'..'Z');
    my $wanted   = 10;

    my $sessid = '';
    for my $position (1 .. $wanted) {
        # rand() yields a fraction below the alphabet size; int() turns it
        # into a valid index.
        $sessid .= $alphabet[ int(rand(scalar(@alphabet))) ];
    }
    return $sessid;
}