ID	overlap sum	ten overlap sum	mean	standard deviation	z-score	p-value
$id	$id	$sum	$ten	$mean	$sd	$zscore	$prob

overlap sum

ten overlap sum

mean

standard deviation

z-score

p-value

$id

$sum

$ten

$mean

$sd

$zscore

$prob

bonafide reads

siRNAs

+ bonafide reads of size between $simin and $simax +

Genome

Exons

piRNAs

+ bonafide reads of size between $pimin and $pimax +

Genome

Exons

Uniquely mapped reads

+ +

Reads randomly assigned

+ +

+ "; +} + +sub futurette +{ + my ($file, $name, $png, $hash) = @_; + print $file " +

$name

+ "; + foreach my $k (sort keys %{$hash}) + { + print $file "$k
\n" ; + } + + print $file " +

"; + + foreach my $pn (@{$png}){print $file "

";} + + print $file " +

+ "; +} + +sub fut +{ + my ($file, $name, $hash) = @_; + print $file " +

$name

+ "; + + foreach my $k (sort { ${$hash}{$a} cmp ${$hash}{$b} } keys %{$hash}) + { + print $file "$k
\n" ; + } + + print $file " +

+ "; +}

# Shared worker for get_distri_exon() and get_distri_TE().
#
# Globs "$dir/$name-subgroups-bonafide_reads-$feature-*distribution-*.png"
# and, for every hit, keeps the part of the path that starts at
# "$name-subgroups-bonafide_reads-$feature-" (the last such occurrence in
# the path, because the leading .* is greedy).
#
#   $dir     - directory to search
#   $name    - file-name prefix; quoted with \Q..\E so that characters such
#              as '+' or '(' in it are matched literally
#   $feature - literal feature tag ('exons' or 'TE')
#
# Returns a reference to the array of captured file names, in glob order.
sub _get_distri_pngs
{
    my ($dir, $name, $feature) = @_;

    my $pattern = $dir.'/'.$name.'-subgroups-bonafide_reads-'.$feature.'-*distribution-*.png';
    my $wanted  = qr/.*(\Q$name\E-subgroups-bonafide_reads-\Q$feature\E-.*distribution-.*\.png)/;

    my @out;
    foreach my $path (glob($pattern))
    {
        push @out, $1 if $path =~ $wanted;
    }
    return (\@out);
}

# Lists the "exons" distribution PNG files found in $dir for prefix $name.
# Returns an array reference (empty when nothing matches).
sub get_distri_exon
{
    my ($dir, $name) = @_;
    return _get_distri_pngs($dir, $name, 'exons');
}

# Lists the "TE" distribution PNG files found in $dir for prefix $name.
# Returns an array reference (empty when nothing matches).
sub get_distri_TE
{
    my ($dir, $name) = @_;
    return _get_distri_pngs($dir, $name, 'TE');
}

# Collects the "$name-subgroups-bonafide_reads-TE-PPPartners-*" files of
# $dir, grouped by the text found between "PPPartners-" and the file-type
# suffix.
#
# Returns a hash reference: key => [ six file names ], where an empty
# string marks a file that was not found.  Slots:
#   0  -sens.txt          1  -antisens.txt
#   2  -sensPPP.txt       3  -antisensPPP.txt
#   4  -overlap_size.txt  5  -histogram.png
# Files with any other suffix are ignored.
sub get_PPP
{
    my ($dir, $name) = @_;
    my %distri;

    # Tried in this order; the first pattern that matches decides the slot.
    my @slots = (
        [ qr/PPPartners-(.*?)-sens\.txt$/,         0 ],
        [ qr/PPPartners-(.*?)-antisens\.txt$/,     1 ],
        [ qr/PPPartners-(.*?)-sensPPP\.txt$/,      2 ],
        [ qr/PPPartners-(.*?)-antisensPPP\.txt$/,  3 ],
        [ qr/PPPartners-(.*?)-overlap_size\.txt$/, 4 ],
        [ qr/PPPartners-(.*?)-histogram\.png$/,    5 ],
    );

    # \Q..\E: $name is data, not a pattern.
    my $wanted = qr/.*(\Q$name\E-subgroups-bonafide_reads-TE-PPPartners-.*)/;

    PATH: foreach my $path (glob($dir.'/'.$name.'-subgroups-bonafide_reads-TE-PPPartners-*'))
    {
        next PATH unless $path =~ $wanted;
        my $file = $1;

        foreach my $slot (@slots)
        {
            my ($suffix_re, $index) = @{$slot};
            if ($file =~ $suffix_re)
            {
                my $key = $1;
                $distri{$key} = ['','','','','',''] unless exists $distri{$key};
                $distri{$key}->[$index] = $file;
                next PATH;
            }
        }
    }
    return \%distri;
}

+sub PPPrint +{ + my ($h, $hash) = @_; + my $cmp = 0; + + print $h "

\n"; + print $h "

"; + while ( my ($k,$v) = each %{$hash} ) + { + print $h "

" if $cmp != 0 && $cmp % 2 == 0; + print $h " + +

$k

[5]\"/>

[4]\">ping pong signature

[2]\">sens reads with PPP

[3]\">reverse reads with PPP

[0]\">sens reads without PPP

[1]\">reverse reads without PPP

+ "; + $cmp++; + } + + print $h "

"; +} + +sub printDistri +{ + my ($h, $tab) = @_; + my ($txt, $name); + my $cmp = 0; + print $h "

\n"; + print $h "

"; + foreach my $k (@{$tab}) + { + if ($k =~ /(.*)-(.*)\.png$/) + { + $txt = $1.'-'.$2.'.txt'; + $name = $2; + } + print $h "

" if $cmp != 0 && $cmp % 2 == 0; + print $h " + +

$name

text file

+ "; + $cmp++; + } + + print $h "

"; +} + +sub mapnum +{ + my $dupmapnum = shift; + my $dupnum_genome = shift; + open (my $dupTE, $dupmapnum) || die "cannot open ".$dupmapnum."\n"; + my %dupnum_TE = (); + my $header = <$dupTE>; + while (<$dupTE>) + { + chomp $_; + my @dupline = split /\t/, $_; + $dupnum_TE{$dupline[0]} = $dupline[2]; + } + close $dupTE; + open (my $du_TE, '>'.$dupmapnum) || die "cannot open to write ".$dupmapnum."\n"; + print $du_TE "sequence\tduplicate\tgenome map num\tmap num\n"; + while (my ($k, $v) = each %dupnum_TE ) + { + my $hashRef = ${$dupnum_genome}{$k}; + print $du_TE "$k\t$hashRef->[0]\t$hashRef->[1]\t$v\n"; + } + close $du_TE; +} + +1;

mappers #: $ma

unique mappers #: $ma_uni

$id

bonafide reads

siRNAs

piRNAs

miRNAs

$name

$name

$k

$name