annotate bin/scanbed2txdb.pl @ 4:cd336e593a92 draft

planemo upload
author bioitcore
date Thu, 07 Sep 2017 16:53:12 -0400
parents adc0f7765d85
children
Ignore whitespace changes - Everywhere: Within whitespace: At end of lines:
rev   line source
1
adc0f7765d85 planemo upload
bioitcore
parents:
diff changeset
#argv0: input transcript bed file
#argv1: output filename, will be in AS format
#
# Overview of what this script does:
#   1. Sorts the input BED file by column 6, column 1, column 2 (numeric) and
#      column 3 (numeric) into <basename(output)>.cache/<basename(input)>.sort
#      (the cache folder is created in the current working directory).
#   2. Walks the sorted transcripts and groups them into "contigs": a new
#      contig starts whenever the transcript begins past the running end
#      coordinate, or the chromosome or strand changes.
#   3. For every transcript, records each run of 1, 2 and 3 consecutive
#      exons as a "connection string" ("start-end,start-end,...").
#   4. At every contig boundary, scanevents() classifies the connection
#      strings, printanno() writes the annotations to the output file, and
#      the supporting transcript names are written to "<output>.evi".
#
# NOTE(review): "use warnings" is intentionally not enabled here; it would be
# file-scoped and also affect the subs below, and warnings on STDERR may change
# how a wrapper interprets the run -- confirm before enabling.

use strict;
use File::Basename qw(basename);

my $AnnoFileName   = $ARGV[0];
my $outputFileName = $ARGV[1];

if (   !defined $AnnoFileName
    or $AnnoFileName eq ""
    or !defined $outputFileName
    or $outputFileName eq "")
{
    print "TXDBGEN: Please specify your input files\n";
    # A usage error must not look like a successful run.
    exit 1;
}

# File::Basename replaces the former `basename ...` backticks, which passed
# the file names through the shell (unsafe with spaces or metacharacters).
my $cachefolder  = basename($outputFileName) . ".cache";
my $AnnoFileBase = basename($AnnoFileName);

if (! -e $cachefolder)
{
    mkdir $cachefolder or die "CHECK: cannot mkdir $cachefolder: $!\n";
    print "TXDBGEN: mkdir $cachefolder\n";
}

my $CacheAnnoFileName = $cachefolder . "/" . $AnnoFileBase . ".sort";

#sort the annotation file
print "TXDBGEN: sort $AnnoFileName \n";

# List-form system() bypasses the shell; "-o" replaces the ">" redirection.
my @sort_cmd = (
    'sort', '-k6,6', '-k1,1', '-k2,2n', '-k3,3n',
    '-o', $CacheAnnoFileName, '--', $AnnoFileName,
);
system(@sort_cmd) == 0
    or die "TXDBGEN: sort failed for $AnnoFileName (status $?)\n";

$AnnoFileName = $CacheAnnoFileName;

#read the annotations into hashes
open(my $anno_fh, '<', $CacheAnnoFileName)
    or die "can not open $CacheAnnoFileName: $!\n";

#split the genes into contigs
my $contigid   = 0;
my $end_tmp    = 0;        # running end coordinate of the current contig
my $chr_tmp    = "chr";    # chromosome of the previous transcript
my $strand_tmp = "NA";     # strand of the previous transcript

my $TXnumtmp = 0;          # transcripts seen in the current contig

my %eventlist = ();        # connection string => number of exons in it (1..3)
my %evidences = ();        # connection string => { transcript name => 1 }

open(my $output, '>', $outputFileName)
    or die "can not open $outputFileName: $!\n";
open(my $output2, '>', "$outputFileName.evi")
    or die "can not open $outputFileName.evi: $!\n";

# Emit everything collected for one contig.
#   $chr, $strand: chromosome and strand the collected events belong to.
# printanno() prints to the currently selected handle, so $output is
# selected only around that call. The evidence lines go to $output2
# explicitly. Keys are sorted so the .evi file is reproducible between
# runs (hash order is arbitrary).
my $flush_contig = sub
{
    my ($chr, $strand) = @_;

    my $annos    = scanevents(\%eventlist, "inner");
    my $eventids = {};
    if (%$annos)
    {
        my $previous_fh = select($output);
        $eventids = printanno($annos, $chr, $strand) || {};
        select($previous_fh);
    }

    #print cross information
    foreach my $connect_str (sort keys %$eventids)
    {
        my $transcripts = $evidences{$connect_str} || {};
        print {$output2} $eventids->{$connect_str}, "\t",
                         (map { $_ . "," } sort keys %$transcripts),
                         "\n";
    }
    return;
};

while (my $line = <$anno_fh>)
{
    chomp($line);
    my @fields = split(/\t/, $line);
    my ($chr, $start, $end, $name, $strand) = @fields[0, 1, 2, 3, 5];

    # Columns 11 and 12 hold comma-separated exon sizes and exon start
    # offsets relative to $start (presumably BED12 blockSizes/blockStarts
    # -- confirm against the input specification).
    my @sizes        = split(",", $fields[10]);
    my @start_shifts = split(",", $fields[11]);

    my @starts = map { $_ + $start } @start_shifts;
    my @ends   = map { $starts[$_] + $sizes[$_] } 0 .. $#starts;

    if ($start > $end_tmp or $chr ne $chr_tmp or $strand_tmp ne $strand)
    {
        # Contig boundary: flush what was collected for the previous contig.
        $contigid++;
        $TXnumtmp = 0;
        $flush_contig->($chr_tmp, $strand_tmp);

        print "TXDBGEN: Contig ID $contigid at $chr $strand...\n" if ($contigid % 1000 == 0);

        %eventlist = ();
        # Evidence is only ever looked up for the contig being flushed, so
        # it is reset together with the events. This keeps memory bounded
        # and stops identical coordinate strings from another chromosome or
        # strand from contributing transcripts.
        %evidences = ();
    }

    $TXnumtmp++;
    $end_tmp = $end if ($end > $end_tmp or $chr ne $chr_tmp or $strand_tmp ne $strand);
    $chr_tmp    = $chr;
    $strand_tmp = $strand;

    #scan connections, 2 and 3 exons for CA/CS/AF
    #(alternative first/last exon scanning is currently disabled)
    #didn't consider direction yet
    #add 1 exon for IR
    for my $n (1 .. 3)
    {
        for my $i (0 .. scalar(@starts) - $n)
        {
            my $connectionstr = join("",
                map { $starts[$_] . "-" . $ends[$_] . "," } $i .. $i + $n - 1);
            $eventlist{$connectionstr} = $n;
            $evidences{$connectionstr}{$name} = 1;
        }
    }
}

# Flush the last contig, which has no following boundary line.
$flush_contig->($chr_tmp, $strand_tmp);

close($anno_fh);
# Buffered write errors only surface at close time, so check them.
close($output)  or die "can not close $outputFileName: $!\n";
close($output2) or die "can not close $outputFileName.evi: $!\n";
adc0f7765d85 planemo upload
bioitcore
parents:
diff changeset
175 #define sub scanevents
adc0f7765d85 planemo upload
bioitcore
parents:
diff changeset
# scanevents(\%eventlist, $mode)
#
# Classifies the connection strings collected for one contig.
#
# Parameters:
#   $eventlist - hash ref keyed by connection string
#                ("start-end,start-end,..." with a trailing comma).
#                In "inner" mode the value is the number of exons in the
#                string (1, 2 or 3). In "af"/"al" mode the values are only
#                compared numerically to order the two halves of a pair.
#   $mode      - "inner", "af" or "al". Any other value yields an empty result.
#
# Returns a hash ref mapping a connection string to a label:
#   "ca" - three-exon string whose first+third exon pair also exists
#   "cs" - three-exon string without such a pair
#   "ir" - two-exon string whose outer span also exists as a single exon
#   "ss" - synthetic three-part string built from two two-exon strings that
#          share the outer coordinates and one inner boundary
#   "af"/"al" - "left|right" pair of strings (see the mode block below)
# NOTE(review): the labels presumably stand for cassette / constitutive /
# intron retention / alternative splice site / alternative first / last
# exon -- confirm with the consumer of the output.
sub scanevents
{
    my ($eventlist, $mode) = @_;
    my %anno = ();

    if ($mode eq "inner")
    {
        # Parse every two-exon connection once and bucket it by its outer
        # coordinates (first start, last end). Only members of the same
        # bucket can form an "ss" pair, so the pairwise search below is
        # limited to real candidates instead of every key in the contig.
        # "+ 0" normalises the coordinates, matching the numeric "=="
        # comparison this bucketing stands in for.
        my %parts_of;
        my %pairs_by_span;
        foreach my $key (keys %$eventlist)
        {
            next if ($eventlist->{$key} != 2);
            my @parts = split(/[,-]/, $key);
            $parts_of{$key} = \@parts;
            push @{ $pairs_by_span{ ($parts[0] + 0) . "," . ($parts[3] + 0) } }, \@parts;
        }

        foreach my $key (keys %$eventlist)
        {
            my $exon_count = $eventlist->{$key};

            if ($exon_count == 3)
            {
                # Middle exon skipped: does first+third exist as a pair?
                my @exons        = split(",", $key);
                my $skipped_form = $exons[0] . "," . $exons[2] . ",";
                $anno{$key} = (exists $eventlist->{$skipped_form}) ? "ca" : "cs";
            }
            elsif ($exon_count == 2)
            {
                my ($s0, $e0, $s1, $e1) = @{ $parts_of{$key} };

                # The whole span also occurs as one single exon.
                my $retained_form = $s0 . "-" . $e1 . ",";
                $anno{$key} = "ir" if (exists $eventlist->{$retained_form});

                foreach my $other (@{ $pairs_by_span{ ($s0 + 0) . "," . ($e1 + 0) } })
                {
                    my (undef, $other_e0, $other_s1, undef) = @$other;

                    if ($e0 == $other_e0)
                    {
                        # Same first exon end; identical pairs are skipped.
                        next if ($other_s1 == $s1);
                        my ($low, $high) = ($other_s1 > $s1)
                            ? ($s1, $other_s1)
                            : ($other_s1, $s1);
                        my $connectstr_ss = $s0 . "-" . $e0 . ","
                            . $low . "-" . $high . ","
                            . $high . "-" . $e1 . ",";
                        $anno{$connectstr_ss} = "ss";
                    }
                    elsif ($s1 == $other_s1)
                    {
                        # Same second exon start, different first exon end.
                        my ($low, $high) = ($other_e0 > $e0)
                            ? ($e0, $other_e0)
                            : ($other_e0, $e0);
                        my $connectstr_ss = $s0 . "-" . $low . ","
                            . $low . "-" . $high . ","
                            . $s1 . "-" . $e1 . ",";
                        $anno{$connectstr_ss} = "ss";
                    }
                }
            }
        }
    }

    if ($mode eq "af" or $mode eq "al")    #alternative first/last exon
    {
        foreach my $key (keys %$eventlist)
        {
            my @key_exons = split(/,/, $key);
            foreach my $search (keys %$eventlist)
            {
                next if $search eq $key;

                # The string with the smaller value goes on the left, so
                # both visiting orders of a pair yield the same label key.
                my $connectstr = ($eventlist->{$search} < $eventlist->{$key})
                    ? $search . "|" . $key
                    : $key . "|" . $search;
                next if exists $anno{$connectstr};

                my @search_exons = split(/,/, $search);
                if ($mode eq "af")
                {
                    # first exon differs, second exon identical
                    if ($key_exons[0] ne $search_exons[0] and $key_exons[1] eq $search_exons[1])
                    {
                        $anno{$connectstr} = $mode;
                    }
                }
                else
                {
                    # first exon identical, second exon differs
                    if ($key_exons[0] eq $search_exons[0] and $key_exons[1] ne $search_exons[1])
                    {
                        $anno{$connectstr} = $mode;
                    }
                }
            }
        }
    }
    return(\%anno);
}
adc0f7765d85 planemo upload
bioitcore
parents:
diff changeset
294
adc0f7765d85 planemo upload
bioitcore
parents:
diff changeset
295
adc0f7765d85 planemo upload
bioitcore
parents:
diff changeset
296 sub printanno
adc0f7765d85 planemo upload
bioitcore
parents:
diff changeset
297 {
adc0f7765d85 planemo upload
bioitcore
parents:
diff changeset
298 # print the annotations
adc0f7765d85 planemo upload
bioitcore
parents:
diff changeset
299 # and return the connectstr and event id to be used to print evidences
adc0f7765d85 planemo upload
bioitcore
parents:
diff changeset
300 my %eventids=();
adc0f7765d85 planemo upload
bioitcore
parents:
diff changeset
301 my ($annos,$chr,$strand)=@_;
adc0f7765d85 planemo upload
bioitcore
parents:
diff changeset
302 my %nums_per_isoform;
adc0f7765d85 planemo upload
bioitcore
parents:
diff changeset
303 foreach my $key (keys %$annos)
adc0f7765d85 planemo upload
bioitcore
parents:
diff changeset
304 {
adc0f7765d85 planemo upload
bioitcore
parents:
diff changeset
305 if($annos->{$key} eq "af")
adc0f7765d85 planemo upload
bioitcore
parents:
diff changeset
306 {
adc0f7765d85 planemo upload
bioitcore
parents:
diff changeset
307 my @a=split(/[\,\-\|]+/,$key);
adc0f7765d85 planemo upload
bioitcore
parents:
diff changeset
308 my $chrid=substr($chr,3,length($chr)-3);
adc0f7765d85 planemo upload
bioitcore
parents:
diff changeset
309 my $id_anno="AF";
adc0f7765d85 planemo upload
bioitcore
parents:
diff changeset
310 #consider direction later
adc0f7765d85 planemo upload
bioitcore
parents:
diff changeset
311 my $id=join("-",$id_anno,$id_anno, $a[2],$a[3]);
adc0f7765d85 planemo upload
bioitcore
parents:
diff changeset
312 my $num=0;
adc0f7765d85 planemo upload
bioitcore
parents:
diff changeset
313 $num = $nums_per_isoform{$id} if exists $nums_per_isoform{$id};
adc0f7765d85 planemo upload
bioitcore
parents:
diff changeset
314 $nums_per_isoform{$id}++;
adc0f7765d85 planemo upload
bioitcore
parents:
diff changeset
315
adc0f7765d85 planemo upload
bioitcore
parents:
diff changeset
316 print $chr,"\t",$a[0],"\t",$a[3],"\t";
adc0f7765d85 planemo upload
bioitcore
parents:
diff changeset
317 print $id.".".$num,"[L]\t";
adc0f7765d85 planemo upload
bioitcore
parents:
diff changeset
318 print "0\t";
adc0f7765d85 planemo upload
bioitcore
parents:
diff changeset
319 print $strand,"\t";
adc0f7765d85 planemo upload
bioitcore
parents:
diff changeset
320 print $a[0],"\t",$a[3],"\t";
adc0f7765d85 planemo upload
bioitcore
parents:
diff changeset
321 print "255,0,0\t";
adc0f7765d85 planemo upload
bioitcore
parents:
diff changeset
322 print "2\t";
adc0f7765d85 planemo upload
bioitcore
parents:
diff changeset
323 print $a[1]-$a[0],",";
adc0f7765d85 planemo upload
bioitcore
parents:
diff changeset
324 print $a[3]-$a[2],"\t";
adc0f7765d85 planemo upload
bioitcore
parents:
diff changeset
325 print "0,";
adc0f7765d85 planemo upload
bioitcore
parents:
diff changeset
326 print $a[2]-$a[0],"\n";
adc0f7765d85 planemo upload
bioitcore
parents:
diff changeset
327
adc0f7765d85 planemo upload
bioitcore
parents:
diff changeset
328 print $chr,"\t",$a[4],"\t",$a[7],"\t";
adc0f7765d85 planemo upload
bioitcore
parents:
diff changeset
329 print $id.".".$num,"[R]\t";
adc0f7765d85 planemo upload
bioitcore
parents:
diff changeset
330 print "0\t";
adc0f7765d85 planemo upload
bioitcore
parents:
diff changeset
331 print $strand,"\t";
adc0f7765d85 planemo upload
bioitcore
parents:
diff changeset
332 print $a[4],"\t",$a[7],"\t";
adc0f7765d85 planemo upload
bioitcore
parents:
diff changeset
333 print "255,0,0\t";
adc0f7765d85 planemo upload
bioitcore
parents:
diff changeset
334 print "2\t";
adc0f7765d85 planemo upload
bioitcore
parents:
diff changeset
335 print $a[5]-$a[4],",";
adc0f7765d85 planemo upload
bioitcore
parents:
diff changeset
336 print $a[7]-$a[6],"\t";
adc0f7765d85 planemo upload
bioitcore
parents:
diff changeset
337 print "0,";
adc0f7765d85 planemo upload
bioitcore
parents:
diff changeset
338 print $a[6]-$a[4],"\n";
adc0f7765d85 planemo upload
bioitcore
parents:
diff changeset
339
adc0f7765d85 planemo upload
bioitcore
parents:
diff changeset
340 #print "$key,af\n";
adc0f7765d85 planemo upload
bioitcore
parents:
diff changeset
341 }
adc0f7765d85 planemo upload
bioitcore
parents:
diff changeset
342 if($annos->{$key} eq "ca" or $annos->{$key} eq "cs")
adc0f7765d85 planemo upload
bioitcore
parents:
diff changeset
343 {
adc0f7765d85 planemo upload
bioitcore
parents:
diff changeset
344 my @a=split(/[,-]/,$key);
adc0f7765d85 planemo upload
bioitcore
parents:
diff changeset
345
adc0f7765d85 planemo upload
bioitcore
parents:
diff changeset
346 my $chrid=substr($chr,3,length($chr)-3);
adc0f7765d85 planemo upload
bioitcore
parents:
diff changeset
347 my $id_anno="CS";
adc0f7765d85 planemo upload
bioitcore
parents:
diff changeset
348 $id_anno="CA" if $annos->{$key} eq "ca";
adc0f7765d85 planemo upload
bioitcore
parents:
diff changeset
349 my $id="CA-$id_anno-$chrid"."-".$a[2]."-".$a[3];
adc0f7765d85 planemo upload
bioitcore
parents:
diff changeset
350 my $num=0;
adc0f7765d85 planemo upload
bioitcore
parents:
diff changeset
351 $num = $nums_per_isoform{$id} if exists $nums_per_isoform{$id};
adc0f7765d85 planemo upload
bioitcore
parents:
diff changeset
352 $nums_per_isoform{$id}++;
adc0f7765d85 planemo upload
bioitcore
parents:
diff changeset
353
adc0f7765d85 planemo upload
bioitcore
parents:
diff changeset
354 print $chr,"\t",$a[0],"\t",$a[5],"\t";
adc0f7765d85 planemo upload
bioitcore
parents:
diff changeset
355 print $id.".".$num,"[L]\t";
adc0f7765d85 planemo upload
bioitcore
parents:
diff changeset
356 $eventids {$key} = $id.".".$num."[L]";
adc0f7765d85 planemo upload
bioitcore
parents:
diff changeset
357 print "0\t";
adc0f7765d85 planemo upload
bioitcore
parents:
diff changeset
358 print $strand,"\t";
adc0f7765d85 planemo upload
bioitcore
parents:
diff changeset
359 print $a[0],"\t",$a[5],"\t";
adc0f7765d85 planemo upload
bioitcore
parents:
diff changeset
360 print "255,0,0\t";
adc0f7765d85 planemo upload
bioitcore
parents:
diff changeset
361 print "3\t";
adc0f7765d85 planemo upload
bioitcore
parents:
diff changeset
362 print $a[1]-$a[0],",";
adc0f7765d85 planemo upload
bioitcore
parents:
diff changeset
363 print $a[3]-$a[2],",";
adc0f7765d85 planemo upload
bioitcore
parents:
diff changeset
364 print $a[5]-$a[4],"\t";
adc0f7765d85 planemo upload
bioitcore
parents:
diff changeset
365 print "0,";
adc0f7765d85 planemo upload
bioitcore
parents:
diff changeset
366 print $a[2]-$a[0],",";
adc0f7765d85 planemo upload
bioitcore
parents:
diff changeset
367 print $a[4]-$a[0],"\n";
adc0f7765d85 planemo upload
bioitcore
parents:
diff changeset
368
adc0f7765d85 planemo upload
bioitcore
parents:
diff changeset
369 print $chr,"\t",$a[0],"\t",$a[5],"\t";
adc0f7765d85 planemo upload
bioitcore
parents:
diff changeset
370 print $id.".".$num,"[S]\t";
adc0f7765d85 planemo upload
bioitcore
parents:
diff changeset
371 my $connectstr_ca= $a[0]."-".$a[1].",".$a[4]."-".$a[5].",";
adc0f7765d85 planemo upload
bioitcore
parents:
diff changeset
372 $eventids{$connectstr_ca} = $id.".".$num."[S]";
adc0f7765d85 planemo upload
bioitcore
parents:
diff changeset
373 print "0\t";
adc0f7765d85 planemo upload
bioitcore
parents:
diff changeset
374 print $strand,"\t";
adc0f7765d85 planemo upload
bioitcore
parents:
diff changeset
375 print $a[0],"\t",$a[5],"\t";
adc0f7765d85 planemo upload
bioitcore
parents:
diff changeset
376 print "255,0,0\t";
adc0f7765d85 planemo upload
bioitcore
parents:
diff changeset
377 print "2\t";
adc0f7765d85 planemo upload
bioitcore
parents:
diff changeset
378 print $a[1]-$a[0],",";
adc0f7765d85 planemo upload
bioitcore
parents:
diff changeset
379 #print $a[3]-$a[2],",";
adc0f7765d85 planemo upload
bioitcore
parents:
diff changeset
380 print $a[5]-$a[4],"\t";
adc0f7765d85 planemo upload
bioitcore
parents:
diff changeset
381 print "0,";
adc0f7765d85 planemo upload
bioitcore
parents:
diff changeset
382 #print $a[2]-$a[0],",";
adc0f7765d85 planemo upload
bioitcore
parents:
diff changeset
383 print $a[4]-$a[0],"\n";
adc0f7765d85 planemo upload
bioitcore
parents:
diff changeset
384
adc0f7765d85 planemo upload
bioitcore
parents:
diff changeset
385 }
adc0f7765d85 planemo upload
bioitcore
parents:
diff changeset
386 if($annos->{$key} eq "ir")
adc0f7765d85 planemo upload
bioitcore
parents:
diff changeset
387 {
adc0f7765d85 planemo upload
bioitcore
parents:
diff changeset
388 my @a=split(/[,-]/,$key);
adc0f7765d85 planemo upload
bioitcore
parents:
diff changeset
389
adc0f7765d85 planemo upload
bioitcore
parents:
diff changeset
390 my $chrid=substr($chr,3,length($chr)-3);
adc0f7765d85 planemo upload
bioitcore
parents:
diff changeset
391 my $id="IR-IR-$chrid"."-".$a[1]."-".$a[2];
adc0f7765d85 planemo upload
bioitcore
parents:
diff changeset
392 my $num=0;
adc0f7765d85 planemo upload
bioitcore
parents:
diff changeset
393 $num = $nums_per_isoform{$id} if exists $nums_per_isoform{$id};
adc0f7765d85 planemo upload
bioitcore
parents:
diff changeset
394 $nums_per_isoform{$id}++;
adc0f7765d85 planemo upload
bioitcore
parents:
diff changeset
395
adc0f7765d85 planemo upload
bioitcore
parents:
diff changeset
396 print $chr,"\t",$a[0],"\t",$a[3],"\t";
adc0f7765d85 planemo upload
bioitcore
parents:
diff changeset
397 print $id.".".$num,"[L]\t";
adc0f7765d85 planemo upload
bioitcore
parents:
diff changeset
398 print "0\t";
adc0f7765d85 planemo upload
bioitcore
parents:
diff changeset
399 print $strand,"\t";
adc0f7765d85 planemo upload
bioitcore
parents:
diff changeset
400 print $a[0],"\t",$a[3],"\t";
adc0f7765d85 planemo upload
bioitcore
parents:
diff changeset
401 $eventids{$a[0]."-".$a[3].","} = $id.".".$num."[L]";
adc0f7765d85 planemo upload
bioitcore
parents:
diff changeset
402 print "255,0,0\t";
adc0f7765d85 planemo upload
bioitcore
parents:
diff changeset
403 print "3\t";
adc0f7765d85 planemo upload
bioitcore
parents:
diff changeset
404 print $a[1]-$a[0],",";
adc0f7765d85 planemo upload
bioitcore
parents:
diff changeset
405 print $a[2]-$a[1],",";
adc0f7765d85 planemo upload
bioitcore
parents:
diff changeset
406 print $a[3]-$a[2],"\t";
adc0f7765d85 planemo upload
bioitcore
parents:
diff changeset
407 print "0,";
adc0f7765d85 planemo upload
bioitcore
parents:
diff changeset
408 print $a[1]-$a[0],",";
adc0f7765d85 planemo upload
bioitcore
parents:
diff changeset
409 print $a[2]-$a[0],"\n";
adc0f7765d85 planemo upload
bioitcore
parents:
diff changeset
410
adc0f7765d85 planemo upload
bioitcore
parents:
diff changeset
411 print $chr,"\t",$a[0],"\t",$a[3],"\t";
adc0f7765d85 planemo upload
bioitcore
parents:
diff changeset
412 print $id.".".$num,"[S]\t";
adc0f7765d85 planemo upload
bioitcore
parents:
diff changeset
413 $eventids{$key} = $id.".".$num."[S]";
adc0f7765d85 planemo upload
bioitcore
parents:
diff changeset
414 print "0\t";
adc0f7765d85 planemo upload
bioitcore
parents:
diff changeset
415 print $strand,"\t";
adc0f7765d85 planemo upload
bioitcore
parents:
diff changeset
416 print $a[0],"\t",$a[3],"\t";
adc0f7765d85 planemo upload
bioitcore
parents:
diff changeset
417 print "255,0,0\t";
adc0f7765d85 planemo upload
bioitcore
parents:
diff changeset
418 print "2\t";
adc0f7765d85 planemo upload
bioitcore
parents:
diff changeset
419 print $a[1]-$a[0],",";
adc0f7765d85 planemo upload
bioitcore
parents:
diff changeset
420 #print $a[3]-$a[2],",";
adc0f7765d85 planemo upload
bioitcore
parents:
diff changeset
421 print $a[3]-$a[2],"\t";
adc0f7765d85 planemo upload
bioitcore
parents:
diff changeset
422 print "0,";
adc0f7765d85 planemo upload
bioitcore
parents:
diff changeset
423 #print $a[2]-$a[0],",";
adc0f7765d85 planemo upload
bioitcore
parents:
diff changeset
424 print $a[2]-$a[0],"\n";
adc0f7765d85 planemo upload
bioitcore
parents:
diff changeset
425
adc0f7765d85 planemo upload
bioitcore
parents:
diff changeset
426 }
adc0f7765d85 planemo upload
bioitcore
parents:
diff changeset
427 if($annos->{$key} eq "ss")
adc0f7765d85 planemo upload
bioitcore
parents:
diff changeset
428 {
adc0f7765d85 planemo upload
bioitcore
parents:
diff changeset
429 my @a=split(/[,-]/,$key);
adc0f7765d85 planemo upload
bioitcore
parents:
diff changeset
430 my $chrid=substr($chr,3,length($chr)-3);
adc0f7765d85 planemo upload
bioitcore
parents:
diff changeset
431 my $type="AA";
adc0f7765d85 planemo upload
bioitcore
parents:
diff changeset
432 if( ($strand eq "+" && $a[1]==$a[2]) or ($strand eq "-" && $a[3]==$a[4]))
adc0f7765d85 planemo upload
bioitcore
parents:
diff changeset
433 {
adc0f7765d85 planemo upload
bioitcore
parents:
diff changeset
434 $type="AD";
adc0f7765d85 planemo upload
bioitcore
parents:
diff changeset
435 }
adc0f7765d85 planemo upload
bioitcore
parents:
diff changeset
436 my $id="$type-$type-$chrid"."-".$a[2]."-".$a[3];
adc0f7765d85 planemo upload
bioitcore
parents:
diff changeset
437 my $connect_str_L = "";
adc0f7765d85 planemo upload
bioitcore
parents:
diff changeset
438 my $connect_str_S = "";
adc0f7765d85 planemo upload
bioitcore
parents:
diff changeset
439 if($a[1]==$a[2])
adc0f7765d85 planemo upload
bioitcore
parents:
diff changeset
440 {
adc0f7765d85 planemo upload
bioitcore
parents:
diff changeset
441 $connect_str_L = $a[0]."-".$a[3].",".$a[4]."-".$a[5].",";
adc0f7765d85 planemo upload
bioitcore
parents:
diff changeset
442 $connect_str_S = $a[0]."-".$a[1].",".$a[4]."-".$a[5].",";
adc0f7765d85 planemo upload
bioitcore
parents:
diff changeset
443 }
adc0f7765d85 planemo upload
bioitcore
parents:
diff changeset
444 else
adc0f7765d85 planemo upload
bioitcore
parents:
diff changeset
445 {
adc0f7765d85 planemo upload
bioitcore
parents:
diff changeset
446 $connect_str_L = $a[0]."-".$a[1].",".$a[2]."-".$a[5].",";
adc0f7765d85 planemo upload
bioitcore
parents:
diff changeset
447 $connect_str_S = $a[0]."-".$a[1].",".$a[3]."-".$a[5].",";
adc0f7765d85 planemo upload
bioitcore
parents:
diff changeset
448
adc0f7765d85 planemo upload
bioitcore
parents:
diff changeset
449 }
adc0f7765d85 planemo upload
bioitcore
parents:
diff changeset
450 my $num=0;
adc0f7765d85 planemo upload
bioitcore
parents:
diff changeset
451 $num = $nums_per_isoform{$id} if exists $nums_per_isoform{$id};
adc0f7765d85 planemo upload
bioitcore
parents:
diff changeset
452 $nums_per_isoform{$id}++;
adc0f7765d85 planemo upload
bioitcore
parents:
diff changeset
453 print $chr,"\t",$a[0],"\t",$a[5],"\t";
adc0f7765d85 planemo upload
bioitcore
parents:
diff changeset
454 print $id.".".$num,"[L]\t";
adc0f7765d85 planemo upload
bioitcore
parents:
diff changeset
455 $eventids {$connect_str_L} = $id.".".$num."[L]";
adc0f7765d85 planemo upload
bioitcore
parents:
diff changeset
456 print "0\t";
adc0f7765d85 planemo upload
bioitcore
parents:
diff changeset
457 print $strand,"\t";
adc0f7765d85 planemo upload
bioitcore
parents:
diff changeset
458 print $a[0],"\t",$a[5],"\t";
adc0f7765d85 planemo upload
bioitcore
parents:
diff changeset
459 print "255,0,0\t";
adc0f7765d85 planemo upload
bioitcore
parents:
diff changeset
460 print "3\t";
adc0f7765d85 planemo upload
bioitcore
parents:
diff changeset
461 print $a[1]-$a[0],",";
adc0f7765d85 planemo upload
bioitcore
parents:
diff changeset
462 print $a[3]-$a[2],",";
adc0f7765d85 planemo upload
bioitcore
parents:
diff changeset
463 print $a[5]-$a[4],"\t";
adc0f7765d85 planemo upload
bioitcore
parents:
diff changeset
464 print "0,";
adc0f7765d85 planemo upload
bioitcore
parents:
diff changeset
465 print $a[2]-$a[0],",";
adc0f7765d85 planemo upload
bioitcore
parents:
diff changeset
466 print $a[4]-$a[0],"\n";
adc0f7765d85 planemo upload
bioitcore
parents:
diff changeset
467
adc0f7765d85 planemo upload
bioitcore
parents:
diff changeset
468 print $chr,"\t",$a[0],"\t",$a[5],"\t";
adc0f7765d85 planemo upload
bioitcore
parents:
diff changeset
469 print $id.".".$num,"[S]\t";
adc0f7765d85 planemo upload
bioitcore
parents:
diff changeset
470 $eventids {$connect_str_S} = $id.".".$num."[S]";
adc0f7765d85 planemo upload
bioitcore
parents:
diff changeset
471 print "0\t";
adc0f7765d85 planemo upload
bioitcore
parents:
diff changeset
472 print $strand,"\t";
adc0f7765d85 planemo upload
bioitcore
parents:
diff changeset
473 print $a[0],"\t",$a[5],"\t";
adc0f7765d85 planemo upload
bioitcore
parents:
diff changeset
474 print "255,0,0\t";
adc0f7765d85 planemo upload
bioitcore
parents:
diff changeset
475 print "2\t";
adc0f7765d85 planemo upload
bioitcore
parents:
diff changeset
476 print $a[1]-$a[0],",";
adc0f7765d85 planemo upload
bioitcore
parents:
diff changeset
477 #print $a[3]-$a[2],",";
adc0f7765d85 planemo upload
bioitcore
parents:
diff changeset
478 print $a[5]-$a[4],"\t";
adc0f7765d85 planemo upload
bioitcore
parents:
diff changeset
479 print "0,";
adc0f7765d85 planemo upload
bioitcore
parents:
diff changeset
480 #print $a[2]-$a[0],",";
adc0f7765d85 planemo upload
bioitcore
parents:
diff changeset
481 print $a[4]-$a[0],"\n";
adc0f7765d85 planemo upload
bioitcore
parents:
diff changeset
482
adc0f7765d85 planemo upload
bioitcore
parents:
diff changeset
483
adc0f7765d85 planemo upload
bioitcore
parents:
diff changeset
484 }
adc0f7765d85 planemo upload
bioitcore
parents:
diff changeset
485
adc0f7765d85 planemo upload
bioitcore
parents:
diff changeset
486 }
adc0f7765d85 planemo upload
bioitcore
parents:
diff changeset
487 return(\%eventids);
adc0f7765d85 planemo upload
bioitcore
parents:
diff changeset
488
adc0f7765d85 planemo upload
bioitcore
parents:
diff changeset
489 }
adc0f7765d85 planemo upload
bioitcore
parents:
diff changeset
490