annotate VCFToolsStats/VCFToolsStats.pl @ 3:612066e3f57d draft

Uploaded
author gandres
date Mon, 09 Nov 2015 05:18:45 -0500
parents ac7c9e40d601
children
Ignore whitespace changes - Everywhere: Within whitespace: At end of lines:
rev   line source
2
ac7c9e40d601 Uploaded
gandres
parents:
diff changeset
1
ac7c9e40d601 Uploaded
gandres
parents:
diff changeset
2 #!/usr/bin/perl
ac7c9e40d601 Uploaded
gandres
parents:
diff changeset
3
ac7c9e40d601 Uploaded
gandres
parents:
diff changeset
4 use strict;
ac7c9e40d601 Uploaded
gandres
parents:
diff changeset
5 use Getopt::Long;
ac7c9e40d601 Uploaded
gandres
parents:
diff changeset
6 use Bio::SeqIO;
ac7c9e40d601 Uploaded
gandres
parents:
diff changeset
7
ac7c9e40d601 Uploaded
gandres
parents:
diff changeset
# Help text printed (via die) when a required argument is missing.
my $usage = qq~Usage:$0 <args> [<opts>]

where <args> are:

-i, --input <VCF input>
-o, --out <output basename>
~;
$usage .= "\n";

# $input : path of the VCF file to analyse.
# $out   : basename used for every file this script produces.
my ($input, $out);

# Unknown options are reported on STDERR by Getopt::Long itself; the return
# value is deliberately not made fatal so existing callers keep working.
GetOptions(
    "input=s" => \$input,
    "out=s"   => \$out,
);

# Both arguments are mandatory. --out used to go unchecked, which silently
# produced a file named ".annotation" and passed an empty --out value to
# vcftools.
die $usage
    if ( !$input || !$out );
ac7c9e40d601 Uploaded
gandres
parents:
diff changeset
27
ac7c9e40d601 Uploaded
gandres
parents:
diff changeset
28
ac7c9e40d601 Uploaded
gandres
parents:
diff changeset
29
ac7c9e40d601 Uploaded
gandres
parents:
diff changeset
# Count, for each annotation keyword, the number of lines of the input file
# that contain it (case-sensitive substring match, the same thing the former
# `grep -c KEYWORD $input` calls computed). The file is read once in Perl so
# the file name is never handed to a shell.
my @annotation_keywords = qw(mRNA INTERGENIC INTRON UTR NON_SYNONYMOUS_CODING);
my %nb_lines_with = map { $_ => 0 } @annotation_keywords;

open(my $VCF, '<', $input) or die "Cannot read $input: $!\n";
while (my $line = <$VCF>) {
    for my $keyword (@annotation_keywords) {
        $nb_lines_with{$keyword}++ if index($line, $keyword) >= 0;
    }
}
close($VCF);

my $nb_gene       = $nb_lines_with{mRNA};
my $nb_intergenic = $nb_lines_with{INTERGENIC};

my $nb_intron = $nb_lines_with{INTRON};
my $nb_UTR    = $nb_lines_with{UTR};
# Exon count is derived by subtraction, not counted directly.
# NOTE(review): a line containing both INTRON and UTR is subtracted twice,
# and INTRON/UTR lines lacking "mRNA" are subtracted without having been
# counted as genic - confirm this approximation is acceptable.
my $nb_exon = $nb_gene - $nb_intron - $nb_UTR;

my $nb_ns = $nb_lines_with{NON_SYNONYMOUS_CODING};
# Synonymous count is likewise derived: exonic lines not flagged
# NON_SYNONYMOUS_CODING.
my $nb_s = $nb_exon - $nb_ns;
ac7c9e40d601 Uploaded
gandres
parents:
diff changeset
44
ac7c9e40d601 Uploaded
gandres
parents:
diff changeset
45
ac7c9e40d601 Uploaded
gandres
parents:
diff changeset
46
ac7c9e40d601 Uploaded
gandres
parents:
diff changeset
47
ac7c9e40d601 Uploaded
gandres
parents:
diff changeset
# Wrap a string in single quotes so the shell treats it as exactly one word,
# whatever characters (spaces, quotes, metacharacters) it contains.
sub _shell_quote {
    my ($word) = @_;
    $word = '' unless defined $word;
    $word =~ s/'/'\\''/g;
    return "'$word'";
}

# Disabled upstream: Hardy-Weinberg statistics.
#system("$VCFTOOLS_EXE --vcf $input --remove-filtered-all --out $out --hardy >>vcftools.log 2>&1");

# Run vcftools once per statistic on the same input and output basename.
# Output of every run (stdout and stderr) is appended to vcftools.log in the
# current directory.
my $quoted_input = _shell_quote($input);
my $quoted_out   = _shell_quote($out);
for my $statistic (qw(--het --TsTv-summary --missing-indv)) {
    my $status = system("vcftools --vcf $quoted_input --remove-filtered-all --out $quoted_out $statistic >>vcftools.log 2>&1");

    # Failures used to pass unnoticed; report them but keep going so the
    # remaining statistics and the annotation report are still produced.
    if ($status != 0) {
        warn "vcftools $statistic did not complete successfully (wait status $status); see vcftools.log\n";
    }
}
ac7c9e40d601 Uploaded
gandres
parents:
diff changeset
52
ac7c9e40d601 Uploaded
gandres
parents:
diff changeset
# Write the annotation summary to "<out>.annotation": genic/intergenic
# counts, then intron/exon/UTR counts, then non-synonymous/synonymous counts,
# each group separated by a "========" line.
my $annotation_file = "$out.annotation";

# Three-argument open keeps the file name from being interpreted as a mode,
# and a failure to create the report is now fatal instead of silent.
open(my $G, '>', $annotation_file)
    or die "Cannot write $annotation_file: $!\n";
print $G "Genic $nb_gene\n";
print $G "Intergenic $nb_intergenic\n";
print $G "========\n";
print $G "Intron $nb_intron\n";
print $G "Exon $nb_exon\n";
print $G "UTR $nb_UTR\n";
print $G "========\n";
print $G "Non-syn $nb_ns\n";
print $G "Synonym $nb_s\n";
# Buffered write errors (e.g. a full disk) only surface at close.
close($G)
    or die "Error while closing $annotation_file: $!\n";
ac7c9e40d601 Uploaded
gandres
parents:
diff changeset
64
ac7c9e40d601 Uploaded
gandres
parents:
diff changeset
65
ac7c9e40d601 Uploaded
gandres
parents:
diff changeset
66
ac7c9e40d601 Uploaded
gandres
parents:
diff changeset
67
ac7c9e40d601 Uploaded
gandres
parents:
diff changeset
68
ac7c9e40d601 Uploaded
gandres
parents:
diff changeset
69
ac7c9e40d601 Uploaded
gandres
parents:
diff changeset
70