annotate tools/annovar/annovar.sh @ 0:d3a72e55deca draft

Uploaded
author saskia-hiltemann
date Wed, 18 Sep 2013 10:51:20 -0400
parents
children 565c0e690238
Ignore whitespace changes - Everywhere: Within whitespace: At end of lines:
rev   line source
0
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
1 #!/bin/bash
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
2
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
# Debug switch: the "if [ $test == "Y" ]" blocks further down echo the parsed
# settings and intermediate file contents when this is set to "Y".
test=N
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
4
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
5
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
# Print the (placeholder) usage line for this script on stdout.
# Does not exit; callers decide what happens next.
usage() {
    printf 'usage: %s todo\n' "$0"
}
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
9
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
# runfilter FILE COLUMNNAME THRESHOLD
#
# Filters the tab-separated FILE in place, based on the column whose header
# (field on the first line) equals COLUMNNAME. The header line is always kept.
#
#   THRESHOLD "-1"    no filtering; FILE is left untouched.
#   THRESHOLD "text"  only rows whose value in the column is empty are kept.
#   otherwise         a row is kept when its value is empty or is below
#                     THRESHOLD. Values are compared numerically when both the
#                     value and THRESHOLD look like numbers (so 1e-5 < 0.01),
#                     and as strings otherwise.
#
# If several header fields match COLUMNNAME the last one is used. If none
# matches (or FILE has no header line) a message is printed and FILE is left
# untouched.
#
# Outputs: progress messages on stdout, plus the unfiltered contents of FILE.
# Returns: 0 normally; 1 if the temporary file cannot be created or the
#          filtered result cannot be written.
function runfilter(){
    local ifile=$1
    local columnname=$2
    local threshold=$3
    local column tmp

    if [[ "$threshold" == "-1" ]]
    then
        echo "not filtering"
        return
    fi

    echo "filtering: $columnname, $threshold"
    # NOTE(review): this dumps the whole input file to stdout and looks like
    # leftover debugging; kept so the function's output does not change.
    cat "$ifile"

    # Get the column number corresponding to the column header. The name is
    # passed with -v instead of being spliced into the awk program text, and
    # both sides are forced to strings so "1" never matches "1.0".
    column=$(awk -v name="$columnname" '
        BEGIN { FS = "\t"; col = -1 }
        FNR == 1 {
            for (i = 1; i <= NF; i++)
                if (($i "") == (name ""))
                    col = i
            print col
            exit
        }
    ' "$ifile")

    # An empty result means the file had no header line at all.
    if [[ -z "$column" || "$column" == "-1" ]]
    then
        echo "no such column, exiting"
        return
    fi

    tmp=$(mktemp) || return 1

    # Perform the filtering using the threshold.
    if ! awk -v col="$column" -v thr="$threshold" '
        function isnum(x) {
            return x ~ /^[-+]?([0-9]+\.?[0-9]*|\.[0-9]+)([eE][-+]?[0-9]+)?$/
        }
        BEGIN { FS = "\t"; OFS = "\t"; thr_is_num = isnum(thr) }
        FNR == 1      { print; next }   # header
        $col == ""    { print; next }   # empty column, then print
        thr == "text" { next }          # if set to text dont check threshold
        {
            if (thr_is_num && isnum($col))
                keep = (($col + 0) < (thr + 0))
            else
                keep = (($col "") < (thr ""))
            if (keep)
                print
        }
    ' "$ifile" > "$tmp" || ! cat "$tmp" > "$ifile"
    then
        rm -f -- "$tmp"
        return 1
    fi

    rm -f -- "$tmp"
    return 0
}
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
63
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
64 # arguments: originalfile,resultfile,chrcol,startcol,endcol,refcol,obscol,addcols
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
# joinresults ORIGINALFILE RESULTFILE CHRCOL STARTCOL ENDCOL REFCOL OBSCOL ADDCOLS
#
# Adds columns from RESULTFILE to ORIGINALFILE (both tab-separated with a
# header line) and rewrites ORIGINALFILE in place.
#
#   $1     file to extend ("A" in the cgatools join)
#   $2     file holding the columns to add ("B" in the cgatools join)
#   $3-$7  1-based column numbers, in RESULTFILE, of the chr/start/end/ref/obs
#          columns used as join keys
#   $8     comma-separated list of RESULTFILE columns to add, each prefixed
#          with "B.", e.g. "B.col1,B.col2"
#
# Globals read: chrcol, startcol, endcol, refcol, obscol (1-based column
#               numbers of the join keys in ORIGINALFILE); test (debug output
#               is printed when it is "Y").
#
# When RESULTFILE is missing or empty no join is run: the new column names
# are appended to the header and every other row is padded with one empty
# field per new column.
#
# Returns: 0 on success; 1 if a temporary file cannot be created, the output
#          cannot be written, or cgatools join fails (ORIGINALFILE is then
#          left untouched).
function joinresults(){
    local ofile=$1
    local rfile=$2
    local colchr=$3
    local colstart=$4
    local colend=$5
    local colref=$6
    local colobs=$7
    local addcols=$8    # e.g. "B.col1,B.col2"
    local debug=${test:-N}
    local tmp

    if [[ "$debug" == "Y" ]]
    then
        echo "ofile: $ofile"
        head "$ofile"
        echo "rfile: $rfile"
        head "$rfile"
    fi

    tmp=$(mktemp) || return 1

    # If the results file is empty, just add the header fields.
    if [[ ! -s "$rfile" ]]
    then
        # "B.col1,B.col2" -> "col1<TAB>col2"
        local newnames=${addcols:2}
        newnames=${newnames//,B./$'\t'}
        # One new column per comma, plus one.
        local commas=${addcols//[^,]/}
        local ncols=$(( ${#commas} + 1 ))

        if ! awk -v newnames="$newnames" -v ncols="$ncols" '
            BEGIN {
                FS = "\t"; OFS = "\t"
                pad = ""
                for (i = 0; i < ncols; i++)
                    pad = pad "\t"
            }
            FNR == 1 { print $0, newnames; next }
            # "%s" keeps a literal % in the data from being read as a format.
            { printf "%s%s\n", $0, pad }
        ' "$ofile" > "$tmp" || ! cat "$tmp" > "$ofile"
        then
            rm -f -- "$tmp"
            return 1
        fi

        rm -f -- "$tmp"
        return 0
    fi

    # Join-key column names in the results file (positions come from $3-$7).
    local rheader oheader
    rheader=$(head -n 1 "$rfile")
    oheader=$(head -n 1 "$ofile")

    local col_chr_name col_start_name col_end_name col_ref_name col_obs_name
    col_chr_name=$(printf '%s\n' "$rheader" | cut -f"${colchr}")
    col_start_name=$(printf '%s\n' "$rheader" | cut -f"${colstart}")
    col_end_name=$(printf '%s\n' "$rheader" | cut -f"${colend}")
    col_ref_name=$(printf '%s\n' "$rheader" | cut -f"${colref}")
    col_obs_name=$(printf '%s\n' "$rheader" | cut -f"${colobs}")

    # Join-key column names in the original file (positions come from the
    # global chrcol/startcol/endcol/refcol/obscol settings).
    local chr_name start_name end_name ref_name obs_name
    chr_name=$(printf '%s\n' "$oheader" | cut -f"${chrcol}")
    start_name=$(printf '%s\n' "$oheader" | cut -f"${startcol}")
    end_name=$(printf '%s\n' "$oheader" | cut -f"${endcol}")
    ref_name=$(printf '%s\n' "$oheader" | cut -f"${refcol}")
    obs_name=$(printf '%s\n' "$oheader" | cut -f"${obscol}")

    if [[ "$debug" == "Y" ]]
    then
        echo "input file"
        echo "chr col: $col_chr_name ($colchr)"
        echo "start col: $col_start_name ($colstart)"
        echo "end col: $col_end_name ($colend)"
        echo "ref col: $col_ref_name ($colref)"
        echo "obs col: $col_obs_name ($colobs)"
        echo ""
        echo "annotation file"
        echo "chr col: $chr_name ($chrcol)"
        echo "start col: $start_name ($startcol)"
        echo "end col: $end_name ($endcol)"
        echo "ref col: $ref_name ($refcol)"
        echo "obs col: $obs_name ($obscol)"
    fi

    # Perform the join. The select list is quoted so "A.*" can never be
    # expanded by the shell against files in the working directory.
    if ! cgatools join --beta \
        --input "$ofile" "$rfile" \
        --output "$tmp" \
        --match "${chr_name}:${col_chr_name}" \
        --match "${start_name}:${col_start_name}" \
        --match "${end_name}:${col_end_name}" \
        --match "${ref_name}:${col_ref_name}" \
        --match "${obs_name}:${col_obs_name}" \
        --select "A.*,$addcols" \
        --always-dump \
        --output-mode compact
    then
        echo "joinresults: cgatools join failed for $rfile" >&2
        rm -f -- "$tmp"
        return 1
    fi

    # Replace the original file with the join result; join sometimes adds a
    # '>' symbol to the header, so strip a leading '>' while copying.
    if ! sed 's/^>//' "$tmp" > "$ofile"
    then
        rm -f -- "$tmp"
        return 1
    fi
    rm -f -- "$tmp"

    if [[ "$debug" == "Y" ]]
    then
        echo "joining complete"
        head "$ofile"
        echo ""
    fi

    return 0
}
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
166
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
167
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
168
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
169
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
# parse_options ARGS...
#
# Parses the script's command-line options with getopt and stores each value
# in the global variable named in the case arms below. Long options may also
# be given with a single dash (getopt -a). Whatever follows the options is
# stored in the global array remaining_args.
#
# getopt runs in its default quoting mode and its output is re-read with
# eval, so option values that are empty or contain spaces stay attached to
# their option.
#
# If getopt reports an error, usage is printed and parsing continues with
# whatever getopt could make sense of.
function parse_options(){
    local -a optnames=(
        inputfile buildver humandb varfile VCF
        chrcol startcol endcol refcol obscol vartypecol convertcoords
        geneanno verdbsnp tfbs mce cytoband segdup dgv gwas ver1000g
        cg46 cg69 impactscores esp gerp
        cosmic61 cosmic63 cosmic64 cosmic65
        outall outfilt outinvalid scriptsdir dorunannovar dofilter
        filt_dbsnp
        filt1000GALL filt1000GAFR filt1000GAMR filt1000GASN filt1000GEUR
        filtESP6500ALL filtESP6500EA filtESP6500AA
        filtcg46 filtcg69
        dummy
    )
    local longopts parsed

    # Every long option takes a required argument: "name1:,name2:,..."
    longopts=$(printf '%s:,' "${optnames[@]}")
    longopts=${longopts%,}

    # Assign separately from "local" so a getopt failure is not masked.
    parsed=$(getopt -n "$0" -a --longoptions "$longopts" -o "h:" -- "$@") || usage
    eval set -- "$parsed"

    # getopt output always contains at least "--", so this only fires if the
    # output was empty.
    [ $# -eq 0 ] && usage

    while [ $# -gt 0 ]
    do
        case "$1" in
            --inputfile) infile=$2;shift;;                    # inputfile
            --buildver) buildver=$2;shift;;                   # hg18 or hg19
            --humandb) humandb=$2;shift;;                     # location of humandb database
            --varfile) varfile=$2;shift;;                     # Y or N
            --VCF) vcf=$2;shift;;                             # Y or N
            --chrcol) chrcol=$2;shift;;                       # which column has chr
            --startcol) startcol=$2;shift;;                   # which column has start
            --endcol) endcol=$2;shift;;                       # which column has end
            --refcol) refcol=$2;shift;;                       # which column has ref
            --obscol) obscol=$2;shift;;                       # which column has alt
            --vartypecol) vartypecol=$2;shift;;               # which column has vartype
            --convertcoords) convertcoords=$2;shift;;         # Y or N convert coordinate from CG to 1-based?
            --geneanno) geneanno=$2;shift;;                   # comma-separated list of strings refSeq, knowngene, ensgene
            --verdbsnp) verdbsnp=$2;shift;;                   # comma-separated list of dbsnp versions to annotate with (e.g. "132,135NonFlagged,137")
            --tfbs) tfbs=$2;shift;;                           # Y or N
            --mce) mce=$2;shift;;                             # Y or N
            --cytoband) cytoband=$2;shift;;                   # Y or N
            --segdup) segdup=$2;shift;;                       # Y or N
            --dgv) dgv=$2;shift;;                             # Y or N
            --gwas) gwas=$2;shift;;                           # Y or N
            --ver1000g) ver1000g=$2;shift;;
            --cg46) cg46=$2;shift;;
            --cg69) cg69=$2;shift;;
            --impactscores) impactscores=$2;shift;;
            --scriptsdir) scriptsdir=$2;shift;;
            --esp) esp=$2;shift;;
            --gerp) gerp=$2;shift;;                           # Y or N
            --cosmic61) cosmic61=$2;shift;;                   # Y or N
            --cosmic63) cosmic63=$2;shift;;                   # Y or N
            --cosmic64) cosmic64=$2;shift;;                   # Y or N
            --cosmic65) cosmic65=$2;shift;;                   # Y or N
            --filt_dbsnp) filt_dbsnp=$2;shift;;
            --filt1000GALL) threshold_1000g_ALL=$2;shift;;    # threshold value
            --filt1000GAFR) threshold_1000g_AFR=$2;shift;;    # threshold value
            --filt1000GAMR) threshold_1000g_AMR=$2;shift;;    # threshold value
            --filt1000GASN) threshold_1000g_ASN=$2;shift;;    # threshold value
            --filt1000GEUR) threshold_1000g_EUR=$2;shift;;    # threshold value
            --filtESP6500ALL) threshold_ESP6500_ALL=$2;shift;; # threshold value
            --filtESP6500EA) threshold_ESP6500_EA=$2;shift;;  # threshold value
            --filtESP6500AA) threshold_ESP6500_AA=$2;shift;;  # threshold value
            --filtcg46) threshold_cg46=$2;shift;;
            --filtcg69) threshold_cg69=$2;shift;;
            --outall) outfile_all=$2;shift;;                  # file
            --outfilt) outfile_filt=$2;shift;;                # file
            --outinvalid) outfile_invalid=$2;shift;;          # file
            --dorunannovar) dorunannovar=$2;shift;;           # Y or N
            --dofilter) dofilter=$2;shift;;                   # Y or N
            # Accepted and ignored. Without this arm the option fell through
            # to "-*" and its value then hit "*) break", ending parsing early.
            --dummy) shift;;
            -h) shift;;
            --) shift;break;;
            -*) usage;;
            *) break;;
        esac
        shift
    done

    remaining_args=("$@")
}

parse_options "$@"
# Leave the script's positional parameters as the parsing loop left them.
set -- "${remaining_args[@]}"
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
232
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
233
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
# Print every parsed command-line setting, one "name: value" line each.
# Only called when the debug flag "test" is "Y".
function print_settings(){
    cat <<EOF
dorunannovar: $dorunannovar
infile: $infile
buildver: $buildver
annovardb: $humandb
verdbsnp: $verdbsnp
geneanno: $geneanno
tfbs: $tfbs
mce: $mce
cytoband: $cytoband
segdup: $segdup
dgv: $dgv
gwas: $gwas
ver1000g: $ver1000g
cg46: $cg46
cg69: $cg69
impactscores: $impactscores
esp: $esp
gerp: $gerp
cosmic61: $cosmic61
cosmic63: $cosmic63
cosmic64: $cosmic64
cosmic65: $cosmic65
outfile: $outfile_all
outinvalid: $outfile_invalid
outfiltered: $outfile_filt
varfile: $varfile
vcf: $vcf
chrcol: $chrcol
startcol: $startcol
endcol: $endcol
refcol: $refcol
obscol: $obscol
convertcoords: $convertcoords
vartypecol: $vartypecol
dofilter: $dofilter
threshold_1000g_ALL : $threshold_1000g_ALL
threshold_1000g_AFR : $threshold_1000g_AFR
threshold_1000g_AMR : $threshold_1000g_AMR
threshold_1000g_ASN : $threshold_1000g_ASN
threshold_1000g_EUR : $threshold_1000g_EUR
threshold_ESP6500_ALL: $threshold_ESP6500_ALL
threshold_ESP6500_EA : $threshold_ESP6500_EA
threshold_ESP6500_AA : $threshold_ESP6500_AA
EOF
}

if [[ "$test" == "Y" ]]
then
    print_settings
fi
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
278
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
279
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
# Turn the --geneanno value into one Y/N flag per gene annotation set.
# A flag becomes "Y" when its keyword occurs anywhere in $geneanno.
refgene="N"
knowngene="N"
ensgene="N"
case "$geneanno" in *refSeq*)    refgene="Y" ;; esac
case "$geneanno" in *knowngene*) knowngene="Y" ;; esac
case "$geneanno" in *ensgene*)   ensgene="Y" ;; esac
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
296
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
297
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
298 #parse verdbsnp/1000g/esp strings
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
# Turn the comma-separated verdbsnp / filt_dbsnp / ver1000g / esp values into
# space-separated lists.
dbsnpstr="${verdbsnp//,/ }"
filt_dbsnpstr="${filt_dbsnp//,/ }"
g1000str="${ver1000g//,/ }"
espstr="${esp//,/ }"

if [[ $test == "Y" ]]; then
    printf '%s\n' \
        "annotate dbsnp: $dbsnpstr" \
        "annotate esp: $espstr" \
        "filter dbsnp: $filt_dbsnpstr"
fi
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
310
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
# set_impactscore_flags LIST
#
# Sets the global Y/N flags mutationtaster, avsift, lrt, ljbsift, polyphen2
# and phylop from LIST (the --impactscores value). Each flag starts as "N"
# and becomes "Y" when its keyword occurs in LIST:
#
#   mutationtaster -> mutationtaster      ljbsift -> ljbsift
#   sift           -> avsift              pp2     -> polyphen2
#   lrt            -> lrt                 phylop  -> phylop
#
# "sift" is looked for only after every "ljbsift" has been removed from LIST,
# so asking for ljbsift alone does not also switch on avsift.
function set_impactscore_flags(){
    local requested=$1

    mutationtaster="N"
    avsift="N"
    lrt="N"
    polyphen2="N"
    phylop="N"
    ljbsift="N"

    if [[ $requested == *mutationtaster* ]]
    then
        mutationtaster="Y"
    fi
    if [[ ${requested//ljbsift/} == *sift* ]]
    then
        avsift="Y"
    fi
    if [[ $requested == *lrt* ]]
    then
        lrt="Y"
    fi
    if [[ $requested == *ljbsift* ]]
    then
        ljbsift="Y"
    fi
    if [[ $requested == *pp2* ]]
    then
        polyphen2="Y"
    fi
    if [[ $requested == *phylop* ]]
    then
        phylop="Y"
    fi
    return 0
}

#parse impactscores param
set_impactscore_flags "$impactscores"
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
342
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
# When varfile is "Y", coordinate conversion is switched on regardless of
# what --convertcoords asked for.
case "$varfile" in
    Y) convertcoords="Y" ;;
esac
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
347
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
348 #ljb refers to Liu, Jian, Boerwinkle paper in Human Mutation with pubmed ID 21520341. Cite this paper if you use the scores
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
349
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
350
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
351 #column header names we will be adding
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
352 # ESP 6500
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
353 esp6500si_colheader_ALL="ESP6500si_ALL"
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
354 esp6500si_colheader_EA="ESP6500si_EA"
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
355 esp6500si_colheader_AA="ESP6500si_AA"
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
356 esp6500_colheader_ALL="ESP6500_ALL"
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
357 esp6500_colheader_EA="ESP6500_EA"
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
358 esp6500_colheader_AA="ESP6500_AA"
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
359 esp5400si_colheader_ALL="ESP5400si_ALL"
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
360 esp5400si_colheader_EA="ESP5400si_EA"
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
361 esp5400si_colheader_AA="ESP5400si_AA"
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
362 esp5400_colheader_ALL="ESP5400_ALL"
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
363 esp5400_colheader_EA="ESP5400_EA"
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
364 esp5400_colheader_AA="ESP5400_AA"
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
365
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
366
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
367 # cg46 cg69
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
368 cg46_colheader="CG_46_genomes"
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
369 cg69_colheader="CG_69_genomes"
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
370
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
371 cp $infile originalfile
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
372 #run annovar or filter only?
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
373 if [ $dorunannovar == "Y" ]
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
374 then
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
375
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
376
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
377 ####################################
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
378 #
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
379 # PREPARE INPUT FILE
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
380 #
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
381 ####################################
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
382
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
383 echo "converting input file"
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
384 vcfheader=""
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
385 if [ $vcf == "Y" ] #if VCF file, convert
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
386 then
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
387 # convert vcf to annovarinput
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
388 $scriptsdir/convert2annovar.pl --format vcf4 --includeinfo --outfile annovarinput $infile 2>&1
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
389
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
390 #construct header line from vcf file
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
391 cat $infile | grep "#CHROM" > additionalcols
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
392 sed -i 's/#//g' additionalcols
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
393 vcfheader="\t`cat additionalcols`"
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
394 echo "vcfheader:$vcfheader"
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
395 echo -e "chromosome\tbegin\tend\treference\tobserved\t`cat additionalcols`" > originalfile
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
396 cat annovarinput >> originalfile
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
397
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
398 chrcol=1
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
399 startcol=2
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
400 endcol=3
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
401 refcol=4
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
402 obscol=5
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
403
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
404
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
405 elif [ $varfile == "Y" ] #if CG varfile, convert
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
406 then
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
407 # convert varfile
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
408 $scriptsdir/convert2annovar.pl --format cg --outfile annovarinput $infile 2>&1
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
409 echo -e "chromosome\tbegin\tend\treference\talleleSeq\tvarType\thaplotype" > originalfile
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
410 cat annovarinput | cut -f1-6,8 >> originalfile
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
411 cut -f1-5 annovarinput > annovarinput2 # truncate rather than append: a leftover annovarinput2 would otherwise leak stale rows into the ANNOVAR input
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
412 mv annovarinput2 annovarinput
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
413
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
414 chrcol=1
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
415 startcol=2
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
416 endcol=3
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
417 refcol=4
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
418 obscol=5
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
419
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
420 elif [ $convertcoords == "Y" ] # if CG-coordinates, convert
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
421 then
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
422 #echo "rearranging columns and converting coordinates"
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
423 awk 'BEGIN{
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
424 FS="\t";
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
425 OFS="\t";
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
426 }{
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
427 if(FNR>1) {
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
428 if( $"'"${vartypecol}"'" == "snp" ){ $"'"${startcol}"'" += 1 };
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
429 if( $"'"${vartypecol}"'" == "ins" ){ $"'"${refcol}"'" = "-" };
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
430 if( $"'"${vartypecol}"'" == "del" ){ $"'"${startcol}"'" +=1; $"'"${obscol}"'" = "-" };
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
431 if( $"'"${vartypecol}"'" == "sub" ){ $"'"${startcol}"'" += 1 };
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
432
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
433 printf("%s\t%s\t%s\t%s\t%s\n" ,$"'"${chrcol}"'",$"'"${startcol}"'",$"'"${endcol}"'",$"'"${refcol}"'",$"'"${obscol}"'");
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
434 }
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
435 }
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
436 END{
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
437 }' $infile > annovarinput
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
438
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
439 #remove any "chr" prefixes
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
440 sed -i 's/chr//g' annovarinput
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
441
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
442 awk 'BEGIN{
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
443 FS="\t";
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
444 OFS="\t";
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
445 }{
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
446 if(FNR>=1) {
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
447 if( $"'"${vartypecol}"'" == "snp" ){ $"'"${startcol}"'" += 1 };
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
448 if( $"'"${vartypecol}"'" == "ins" ){ $"'"${refcol}"'" = "-" };
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
449 if( $"'"${vartypecol}"'" == "del" ){ $"'"${startcol}"'" +=1; $"'"${obscol}"'" = "-" };
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
450 if( $"'"${vartypecol}"'" == "sub" ){ $"'"${startcol}"'" += 1 };
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
451
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
452 print $0
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
453 }
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
454 }
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
455 END{
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
456 }' $infile > originalfile
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
457
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
458 #remove every "chr" substring (not only prefixes); the "omosome" sed below restores the "chromosome" header this mangles
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
459 sed -i 's/chr//g' originalfile
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
460 sed -i 's/omosome/chromosome/g' originalfile
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
461
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
462
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
463 else #only rearrange columns if already 1-based coordinates
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
464 echo "rearranging columns "
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
465 awk 'BEGIN{
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
466 FS="\t";
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
467 OFS="\t";
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
468 }{
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
469 if(FNR>1) {
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
470 printf("%s\t%s\t%s\t%s\t%s\n",$"'"${chrcol}"'",$"'"${startcol}"'",$"'"${endcol}"'",$"'"${refcol}"'",$"'"${obscol}"'");
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
471 }
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
472 }
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
473 END{
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
474 }' $infile > annovarinput
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
475
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
476 #remove every "chr" substring (not only prefixes); the "omosome" sed below restores the "chromosome" header in originalfile
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
477 sed -i 's/chr//g' annovarinput
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
478 sed 's/chr//g' $infile > originalfile
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
479 sed -i 's/omosome/chromosome/g' originalfile
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
480 fi
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
481
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
482 echo "...finished conversion"
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
483
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
484
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
485
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
486
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
487 ####################################
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
488 #
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
489 # RUN ANNOVAR COMMANDS
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
490 #
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
491 ####################################
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
492
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
493
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
494
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
495 ###### gene-based annotation #######
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
496
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
497 # RefSeq Gene
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
498 if [ $refgene == "Y" ]
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
499 then
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
500 echo -e "\nrefSeq gene"
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
501 $scriptsdir/annotate_variation.pl --geneanno --buildver $buildver -dbtype gene annovarinput $humandb 2>&1
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
502
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
503 annovarout=annovarinput.variant_function
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
504 sed -i '1i\RefSeq_Func\tRefSeq_Gene\tchromosome\tstart\tend\treference\talleleSeq"'"$vcfheader"'"' $annovarout
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
505 joinresults originalfile $annovarout 3 4 5 6 7 B.RefSeq_Func,B.RefSeq_Gene
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
506
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
507 annovarout=annovarinput.exonic_variant_function
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
508 sed -i '1i\linenum\tRefSeq_ExonicFunc\tRefSeq_AAChange\tchromosome\tstart\tend\treference\talleleSeq"'"$vcfheader"'"' $annovarout
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
509 joinresults originalfile $annovarout 4 5 6 7 8 B.RefSeq_ExonicFunc,B.RefSeq_AAChange
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
510 fi
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
511
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
512
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
513 # UCSC KnownGene
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
514 if [ $knowngene == "Y" ]
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
515 then
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
516 echo -e "\nUCSC known gene"
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
517 $scriptsdir/annotate_variation.pl --geneanno --buildver $buildver -dbtype knowngene annovarinput $humandb 2>&1
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
518
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
519 annovarout=annovarinput.variant_function
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
520 sed -i '1i\UCSCKnownGene_Func\tUCSCKnownGene_Gene\tchromosome\tstart\tend\treference\talleleSeq"'"$vcfheader"'"' $annovarout
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
521 joinresults originalfile $annovarout 3 4 5 6 7 B.UCSCKnownGene_Func,B.UCSCKnownGene_Gene
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
522
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
523 annovarout=annovarinput.exonic_variant_function
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
524 sed -i '1i\linenum\tUCSCKnownGene_ExonicFunc\tUCSCKnownGene_AAChange\tchromosome\tstart\tend\treference\talleleSeq"'"$vcfheader"'"' $annovarout
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
525 joinresults originalfile $annovarout 4 5 6 7 8 B.UCSCKnownGene_ExonicFunc,B.UCSCKnownGene_AAChange
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
526 fi
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
527
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
528
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
529 # Ensembl Gene
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
530 if [ $ensgene == "Y" ]
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
531 then
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
532 echo -e "\nEnsembl gene"
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
533 $scriptsdir/annotate_variation.pl --geneanno --buildver $buildver -dbtype ensgene annovarinput $humandb 2>&1
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
534
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
535 annovarout=annovarinput.variant_function
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
536 sed -i '1i\EnsemblGene_Func\tEnsemblGene_Gene\tchromosome\tstart\tend\treference\talleleSeq"'"$vcfheader"'"' $annovarout
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
537 joinresults originalfile $annovarout 3 4 5 6 7 B.EnsemblGene_Func,B.EnsemblGene_Gene
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
538
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
539 annovarout=annovarinput.exonic_variant_function
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
540 sed -i '1i\linenum\tEnsemblGene_ExonicFunc\tEnsemblGene_AAChange\tchromosome\tstart\tend\treference\talleleSeq"'"$vcfheader"'"' $annovarout
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
541 joinresults originalfile $annovarout 4 5 6 7 8 B.EnsemblGene_ExonicFunc,B.EnsemblGene_AAChange
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
542 fi
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
543
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
544
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
545
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
546 ###### region-based annotation #######
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
547
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
548
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
549 # Most Conserved Elements Annotation (phastCons 44-way for hg18, 46-way otherwise)
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
550 if [ $mce == "Y" ]
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
551 then
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
552 echo -e "\nMost Conserved Elements"
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
553
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
554 if [ $buildver == "hg18" ]
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
555 then
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
556 $scriptsdir/annotate_variation.pl --regionanno --buildver $buildver -dbtype mce44way annovarinput $humandb 2>&1
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
557 annovarout=annovarinput.${buildver}_phastConsElements44way
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
558 sed -i '1i\db\tphastConsElements44way\tchromosome\tstart\tend\treference\talleleSeq"'"$vcfheader"'"' $annovarout
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
559 joinresults originalfile $annovarout 3 4 5 6 7 B.phastConsElements44way
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
560
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
561 else #hg19
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
562 $scriptsdir/annotate_variation.pl --regionanno --buildver $buildver -dbtype mce46way annovarinput $humandb 2>&1
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
563 annovarout=annovarinput.${buildver}_phastConsElements46way
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
564 sed -i '1i\db\tphastConsElements46way\tchromosome\tstart\tend\treference\talleleSeq"'"$vcfheader"'"' $annovarout
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
565 joinresults originalfile $annovarout 3 4 5 6 7 B.phastConsElements46way
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
566 fi
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
567
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
568 fi
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
569
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
570
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
571
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
572 # Transcription Factor Binding Sites Annotation
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
573 if [ $tfbs == "Y" ]
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
574 then
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
575 echo -e "\nTranscription Factor Binding Site Annotation"
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
576 $scriptsdir/annotate_variation.pl --regionanno --buildver $buildver -dbtype tfbs annovarinput $humandb 2>&1
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
577
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
578 # arguments: originalfile, resultfile,chrcol,startcol,endcol,refcol,obscol,selectcolumns
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
579 annovarout=annovarinput.${buildver}_tfbsConsSites
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
580 sed -i '1i\db\tTFBS\tchromosome\tstart\tend\treference\talleleSeq"'"$vcfheader"'"' $annovarout
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
581 joinresults originalfile $annovarout 3 4 5 6 7 B.TFBS
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
582 fi
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
583
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
584
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
585
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
586 # Identify cytogenetic band for genetic variants
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
587 if [ $cytoband == "Y" ]
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
588 then
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
589 echo -e "\nCytogenic band Annotation"
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
590 $scriptsdir/annotate_variation.pl --regionanno --buildver $buildver -dbtype band annovarinput $humandb 2>&1
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
591
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
592 annovarout=annovarinput.${buildver}_cytoBand
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
593 sed -i '1i\db\tBand\tchromosome\tstart\tend\treference\talleleSeq"'"$vcfheader"'"' $annovarout
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
594 joinresults originalfile $annovarout 3 4 5 6 7 B.Band
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
595 fi
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
596
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
597
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
598 # Identify variants located in segmental duplications
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
599 if [ $segdup == "Y" ]
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
600 then
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
601 echo -e "\nSegmental Duplications Annotation"
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
602 $scriptsdir/annotate_variation.pl --regionanno --buildver $buildver -dbtype segdup annovarinput $humandb 2>&1
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
603
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
604 annovarout=annovarinput.${buildver}_genomicSuperDups
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
605 sed -i '1i\db\tSegDup\tchromosome\tstart\tend\treference\talleleSeq"'"$vcfheader"'"' $annovarout
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
606 joinresults originalfile $annovarout 3 4 5 6 7 B.SegDup
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
607 fi
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
608
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
609
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
610
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
611 # Identify previously reported structural variants in DGV
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
612 if [ $dgv == "Y" ]
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
613 then
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
614 echo -e "\nDGV Annotation"
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
615 $scriptsdir/annotate_variation.pl --regionanno --buildver $buildver -dbtype dgv annovarinput $humandb 2>&1
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
616
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
617 annovarout=annovarinput.${buildver}_dgv
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
618 sed -i '1i\db\tDGV\tchromosome\tstart\tend\treference\talleleSeq"'"$vcfheader"'"' $annovarout
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
619 joinresults originalfile $annovarout 3 4 5 6 7 B.DGV
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
620 fi
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
621
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
622
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
623 # Identify variants reported in previously published GWAS studies
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
624 if [ $gwas == "Y" ]
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
625 then
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
626 echo -e "\nGWAS Annotation"
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
627 $scriptsdir/annotate_variation.pl --regionanno --buildver $buildver -dbtype gwascatalog annovarinput $humandb 2>&1
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
628
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
629 annovarout=annovarinput.${buildver}_gwasCatalog
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
630 sed -i '1i\db\tGWAS\tchromosome\tstart\tend\treference\talleleSeq"'"$vcfheader"'"' $annovarout
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
631 joinresults originalfile $annovarout 3 4 5 6 7 B.GWAS
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
632 fi
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
633
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
634
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
635
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
636
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
637 ###### filter-based annotation #######
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
638
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
639 #dbSNP
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
640 for version in $dbsnpstr
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
641 do
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
642 if [ $version == "None" ]
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
643 then
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
644 break
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
645 fi
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
646 echo -e "\ndbSNP region Annotation, version: $version"
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
647 $scriptsdir/annotate_variation.pl --filter --buildver $buildver -dbtype ${version} annovarinput $humandb 2>&1
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
648
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
649 annovarout=annovarinput.${buildver}_${version}_dropped
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
650 sed -i '1i\db\tdb'${version}'\tchromosome\tstart\tend\treference\talleleSeq"'"$vcfheader"'"' $annovarout
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
651 joinresults originalfile $annovarout 3 4 5 6 7 B.db${version}
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
652
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
653
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
654 done
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
655
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
656
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
657
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
658 #1000 Genomes
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
659
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
# 1000 Genomes annotation.
# Runs only when $ver1000g is non-empty and not "None". For every release name
# in $g1000str the block decides which population databases to query for the
# current $buildver, runs the ANNOVAR filter step for each enabled population,
# inserts a header row as line 1 of the corresponding *_dropped file and hands
# that file to joinresults (defined elsewhere in this script).
# Reads:  ver1000g, g1000str, buildver, scriptsdir, humandb, vcfheader
# Writes: version, fileID, annovarout, g1000_colheader_*, do* flags
if [[ -n "$ver1000g" && "$ver1000g" != "None" ]]
then

    # $g1000str is deliberately unquoted: it is iterated word by word.
    for version in $g1000str
    do
        #column headers
        g1000_colheader_ALL="${version}_ALL"
        g1000_colheader_AFR="${version}_AFR"
        g1000_colheader_AMR="${version}_AMR"
        g1000_colheader_ASN="${version}_ASN"
        g1000_colheader_EUR="${version}_EUR"
        g1000_colheader_CEU="${version}_CEU"
        g1000_colheader_YRI="${version}_YRI"
        g1000_colheader_JPTCHB="${version}_JPTCHB"

        # per-population switches, reset for every release
        doALL="N"
        doAMR="N"
        doAFR="N"
        doASN="N"
        doEUR="N"
        doCEU="N"
        doYRI="N"
        doJPTCHB="N"

        # pick the file ID and the populations to run for this release/build pair
        if [[ "$version" == "1000g2012apr" ]]
        then
            fileID="2012_04"
            doALL="Y"
            if [[ "$buildver" == "hg19" ]]
            then
                doAMR="Y"
                doAFR="Y"
                doASN="Y"
                doEUR="Y"
            fi
        elif [[ "$version" == "1000g2012feb" && "$buildver" == "hg19" ]]
        then
            fileID="2012_02"
            doALL="Y"
        elif [[ "$version" == "1000g2010nov" && "$buildver" == "hg19" ]]
        then
            fileID="2010_11"
            doALL="Y"
        elif [[ "$version" == "1000g2010jul" && "$buildver" == "hg18" ]]
        then
            fileID="2010_07"
            doALL="N"
            doCEU="Y"
            doYRI="Y"
            doJPTCHB="Y"
        else
            echo "unrecognized 1000g version, skipping"
            # every do* flag is still "N" here, so nothing below would run anyway
            continue
        fi

        # One pass per population, in the order ALL, AFR, AMR, ASN, EUR, CEU,
        # YRI, JPTCHB. Each entry is "<UPPER>:<lower>": the upper-case form is
        # used in the flag name, column header and output file name, the
        # lower-case form in the -dbtype suffix.
        for g1000_pair in ALL:all AFR:afr AMR:amr ASN:asn EUR:eur CEU:ceu YRI:yri JPTCHB:jptchb
        do
            g1000_pop="${g1000_pair%%:*}"
            g1000_db="${g1000_pair##*:}"

            # indirect lookup of doALL / doAFR / ... for this population
            g1000_flag="do${g1000_pop}"
            [[ "${!g1000_flag}" == "Y" ]] || continue

            # same value as the matching g1000_colheader_<POP> variable above
            g1000_header="${version}_${g1000_pop}"

            echo -e "\n1000Genomes ${g1000_pop}"
            "$scriptsdir/annotate_variation.pl" --filter --buildver "$buildver" -dbtype "${version}_${g1000_db}" annovarinput "$humandb" 2>&1

            annovarout="annovarinput.${buildver}_${g1000_pop}.sites.${fileID}_dropped"
            # Insert the header as line 1. The inserted text contains a literal
            # double quote on each side of the expanded $vcfheader.
            sed -i '1i\db\t'"$g1000_header"'\tchromosome\tstart\tend\treference\talleleSeq"'"$vcfheader"'"' "$annovarout"
            # NOTE(review): 3 4 5 6 7 line up with the chromosome..alleleSeq
            # header columns; their exact meaning is defined by joinresults.
            joinresults originalfile "$annovarout" 3 4 5 6 7 "B.$g1000_header"
        done

    done
fi
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
808
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
809
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
# SIFT
# Enabled when $avsift is "Y": runs the ANNOVAR filter step with -dbtype avsift,
# inserts a header row as line 1 of the *_dropped file and passes that file to
# joinresults (defined elsewhere in this script) with B.AVSIFT as last argument.
if [[ "$avsift" == "Y" ]]
then
    echo -e "\nSIFT Annotation"
    "$scriptsdir/annotate_variation.pl" --filter --buildver "$buildver" -dbtype avsift annovarinput "$humandb" 2>&1

    annovarout="annovarinput.${buildver}_avsift_dropped"
    # The inserted header contains a literal double quote on each side of the
    # expanded $vcfheader.
    sed -i '1i\db\tAVSIFT\tchromosome\tstart\tend\treference\talleleSeq"'"$vcfheader"'"' "$annovarout"
    # NOTE(review): 3 4 5 6 7 line up with the chromosome..alleleSeq header
    # columns; their exact meaning is defined by joinresults.
    joinresults originalfile "$annovarout" 3 4 5 6 7 B.AVSIFT
fi
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
820
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
#ljb refers to Liu, Jian, Boerwinkle paper in Human Mutation with pubmed ID 21520341. Cite this paper if you use the scores
# SIFT2
# Enabled when $ljbsift is "Y": runs the ANNOVAR filter step with -dbtype
# ljb_sift, inserts a header row as line 1 of the *_dropped file and passes that
# file to joinresults (defined elsewhere) with B.LJB_SIFT as last argument.
if [[ "$ljbsift" == "Y" ]]
then
    # NOTE(review): this prints the same banner as the avsift step.
    echo -e "\nSIFT Annotation"
    "$scriptsdir/annotate_variation.pl" --filter --buildver "$buildver" -dbtype ljb_sift annovarinput "$humandb" 2>&1

    annovarout="annovarinput.${buildver}_ljb_sift_dropped"
    # The inserted header contains a literal double quote on each side of the
    # expanded $vcfheader.
    sed -i '1i\db\tLJB_SIFT\tchromosome\tstart\tend\treference\talleleSeq"'"$vcfheader"'"' "$annovarout"
    joinresults originalfile "$annovarout" 3 4 5 6 7 B.LJB_SIFT
fi
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
832
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
833
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
# PolyPhen2
# Enabled when $polyphen2 is "Y": runs the ANNOVAR filter step with -dbtype
# ljb_pp2, inserts a header row as line 1 of the *_dropped file and passes that
# file to joinresults (defined elsewhere) with B.PolyPhen2 as last argument.
if [[ "$polyphen2" == "Y" ]]
then
    echo -e "\nPolyPhen Annotation"
    "$scriptsdir/annotate_variation.pl" --filter --buildver "$buildver" -dbtype ljb_pp2 annovarinput "$humandb" 2>&1

    annovarout="annovarinput.${buildver}_ljb_pp2_dropped"
    # The inserted header contains a literal double quote on each side of the
    # expanded $vcfheader.
    sed -i '1i\db\tPolyPhen2\tchromosome\tstart\tend\treference\talleleSeq"'"$vcfheader"'"' "$annovarout"
    joinresults originalfile "$annovarout" 3 4 5 6 7 B.PolyPhen2
fi
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
844
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
845
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
# MutationTaster
# Enabled when $mutationtaster is "Y": runs the ANNOVAR filter step with -dbtype
# ljb_mt, inserts a header row as line 1 of the *_dropped file and passes that
# file to joinresults (defined elsewhere) with B.MutationTaster as last argument.
if [[ "$mutationtaster" == "Y" ]]
then
    echo -e "\nMutationTaster Annotation"
    "$scriptsdir/annotate_variation.pl" --filter --buildver "$buildver" -dbtype ljb_mt annovarinput "$humandb" 2>&1

    annovarout="annovarinput.${buildver}_ljb_mt_dropped"
    # The inserted header contains a literal double quote on each side of the
    # expanded $vcfheader.
    sed -i '1i\db\tMutationTaster\tchromosome\tstart\tend\treference\talleleSeq"'"$vcfheader"'"' "$annovarout"
    joinresults originalfile "$annovarout" 3 4 5 6 7 B.MutationTaster
fi
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
856
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
857
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
# LRT
# Enabled when $lrt is "Y": runs the ANNOVAR filter step with -dbtype ljb_lrt,
# inserts a header row as line 1 of the *_dropped file and passes that file to
# joinresults (defined elsewhere) with B.LikelihoodRatioTestScore as last
# argument.
if [[ "$lrt" == "Y" ]]
then
    echo -e "\nLRT Annotation"
    "$scriptsdir/annotate_variation.pl" --filter --buildver "$buildver" -dbtype ljb_lrt annovarinput "$humandb" 2>&1

    annovarout="annovarinput.${buildver}_ljb_lrt_dropped"
    # The inserted header contains a literal double quote on each side of the
    # expanded $vcfheader.
    sed -i '1i\db\tLikelihoodRatioTestScore\tchromosome\tstart\tend\treference\talleleSeq"'"$vcfheader"'"' "$annovarout"
    joinresults originalfile "$annovarout" 3 4 5 6 7 B.LikelihoodRatioTestScore
fi
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
868
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
# PhyloP
# Enabled when $phylop is "Y": runs the ANNOVAR filter step with -dbtype
# ljb_phylop, inserts a header row as line 1 of the *_dropped file and passes
# that file to joinresults (defined elsewhere) with B.PhyloP as last argument.
if [[ "$phylop" == "Y" ]]
then
    echo -e "\nPhyloP Annotation"
    "$scriptsdir/annotate_variation.pl" --filter --buildver "$buildver" -dbtype ljb_phylop annovarinput "$humandb" 2>&1

    annovarout="annovarinput.${buildver}_ljb_phylop_dropped"
    # The inserted header contains a literal double quote on each side of the
    # expanded $vcfheader.
    sed -i '1i\db\tPhyloP\tchromosome\tstart\tend\treference\talleleSeq"'"$vcfheader"'"' "$annovarout"
    joinresults originalfile "$annovarout" 3 4 5 6 7 B.PhyloP
fi
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
879
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
880
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
### ESP Exome Variant Server
# Runs only when $esp is non-empty and not "None". For every database name in
# $espstr that is one of the nine recognised ESP sets, the block runs the
# ANNOVAR filter step with that name as -dbtype, inserts a header row as line 1
# of the matching *_dropped file and passes that file to joinresults (defined
# elsewhere in this script). Unrecognised names are only echoed.
# Reads:  esp, espstr, buildver, scriptsdir, humandb, vcfheader and the
#         esp6500si_/esp6500_/esp5400_colheader_{ALL,EA,AA} variables
# Writes: version, annovarout
if [[ -n "$esp" && "$esp" != "None" ]]
then
    echo -e "\nESP Annotation"
    # $espstr is deliberately unquoted: it is iterated word by word.
    for version in $espstr
    do
        echo "version: $version"

        # Map the database name to the column header variable used for it.
        case "$version" in
            # 6500si ALL / European American / African Americans
            esp6500si_all) esp_header=$esp6500si_colheader_ALL ;;
            esp6500si_ea)  esp_header=$esp6500si_colheader_EA ;;
            esp6500si_aa)  esp_header=$esp6500si_colheader_AA ;;
            # 6500 ALL / European American / African Americans
            esp6500_all)   esp_header=$esp6500_colheader_ALL ;;
            esp6500_ea)    esp_header=$esp6500_colheader_EA ;;
            esp6500_aa)    esp_header=$esp6500_colheader_AA ;;
            # 5400 ALL / European American / African Americans
            esp5400_all)   esp_header=$esp5400_colheader_ALL ;;
            esp5400_ea)    esp_header=$esp5400_colheader_EA ;;
            esp5400_aa)    esp_header=$esp5400_colheader_AA ;;
            # anything else: nothing to annotate for this entry
            *) continue ;;
        esac

        "$scriptsdir/annotate_variation.pl" --filter --buildver "$buildver" -dbtype "$version" annovarinput "$humandb" 2>&1

        annovarout="annovarinput.${buildver}_${version}_dropped"
        # Insert the header as line 1. The inserted text contains a literal
        # double quote on each side of the expanded $vcfheader; no trailing
        # space is appended, so all nine databases get the same header shape.
        sed -i '1i\db\t'"$esp_header"'\tchromosome\tstart\tend\treference\talleleSeq"'"$vcfheader"'"' "$annovarout"
        # NOTE(review): 3 4 5 6 7 line up with the chromosome..alleleSeq header
        # columns; their exact meaning is defined by joinresults.
        joinresults originalfile "$annovarout" 3 4 5 6 7 "B.$esp_header"

    done
fi
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
985
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
986
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
#ESP6500
# Legacy ESP path, enabled when $esp is exactly "Y". Runs the ANNOVAR filter
# step against esp6500si_all, esp6500si_ea and esp6500si_aa in that order; for
# each one it inserts a header row as line 1 of the *_dropped file and passes
# that file to joinresults (defined elsewhere in this script).
# NOTE(review): the column headers come from the esp6500_colheader_* variables
# although the databases queried are the esp6500si_* ones - confirm intended.
# NOTE(review): when $esp is "Y" the preceding `$esp != "None"` block also runs.
if [[ "$esp" == "Y" ]]
then
    echo -e "\nESP Annotation OLD"
    # Each entry is "<population suffix>:<column header>":
    # ALL, European American, African Americans.
    for esp_old_pair in "all:$esp6500_colheader_ALL" "ea:$esp6500_colheader_EA" "aa:$esp6500_colheader_AA"
    do
        esp_old_pop="${esp_old_pair%%:*}"
        esp_old_header="${esp_old_pair#*:}"

        "$scriptsdir/annotate_variation.pl" --filter --buildver "$buildver" -dbtype "esp6500si_${esp_old_pop}" annovarinput "$humandb" 2>&1

        annovarout="annovarinput.${buildver}_esp6500si_${esp_old_pop}_dropped"
        # The inserted header contains a literal double quote on each side of
        # the expanded $vcfheader.
        sed -i '1i\db\t'"$esp_old_header"'\tchromosome\tstart\tend\treference\talleleSeq"'"$vcfheader"'"' "$annovarout"
        joinresults originalfile "$annovarout" 3 4 5 6 7 "B.$esp_old_header"
    done
fi
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
1013
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
1014
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
1015
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
#GERP++
# Run ANNOVAR in filter mode against the gerp++gt2 table, prepend a header
# line to the *_dropped output and join the GERP++ column into originalfile
# on columns 3-7.
if [[ "$gerp" == "Y" ]]
then
  echo -e "\nGERP++ Annotation"
  "$scriptsdir/annotate_variation.pl" --filter --buildver "$buildver" -dbtype gerp++gt2 annovarinput "$humandb" 2>&1

  annovarout="annovarinput.${buildver}_gerp++gt2_dropped"
  # The literal double quotes around $vcfheader are part of the inserted
  # header text; kept exactly as before.
  sed -i '1i\db\tGERP++\tchromosome\tstart\tend\treference\talleleSeq"'"$vcfheader"'"' "$annovarout"
  joinresults originalfile "$annovarout" 3 4 5 6 7 B.GERP++
fi
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
1026
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
1027
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
#COSMIC
# COSMIC61 annotation; only attempted when the build version is hg19.
# Runs ANNOVAR in filter mode, prepends a header line to the *_dropped output
# and joins the COSMIC61 column into originalfile on columns 3-7.
if [[ "$cosmic61" == "Y" && "$buildver" == "hg19" ]]
then
  echo -e "\nCOSMIC61 Annotation"
  "$scriptsdir/annotate_variation.pl" --filter --buildver "$buildver" -dbtype cosmic61 annovarinput "$humandb" 2>&1

  annovarout="annovarinput.${buildver}_cosmic61_dropped"
  # The literal double quotes around $vcfheader are part of the inserted
  # header text; kept exactly as before.
  sed -i '1i\db\tCOSMIC61\tchromosome\tstart\tend\treference\talleleSeq"'"$vcfheader"'"' "$annovarout"
  joinresults originalfile "$annovarout" 3 4 5 6 7 B.COSMIC61
fi
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
1039
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
# COSMIC63 annotation; only attempted when the build version is hg19.
# Runs ANNOVAR in filter mode, prepends a header line to the *_dropped output
# and joins the COSMIC63 column into originalfile on columns 3-7.
if [[ "$cosmic63" == "Y" && "$buildver" == "hg19" ]]
then
  echo -e "\nCOSMIC63 Annotation"
  "$scriptsdir/annotate_variation.pl" --filter --buildver "$buildver" -dbtype cosmic63 annovarinput "$humandb" 2>&1

  annovarout="annovarinput.${buildver}_cosmic63_dropped"
  # The literal double quotes around $vcfheader are part of the inserted
  # header text; kept exactly as before.
  sed -i '1i\db\tCOSMIC63\tchromosome\tstart\tend\treference\talleleSeq"'"$vcfheader"'"' "$annovarout"
  joinresults originalfile "$annovarout" 3 4 5 6 7 B.COSMIC63
fi
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
1050
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
# COSMIC64 annotation; only attempted when the build version is hg19.
# Runs ANNOVAR in filter mode, prepends a header line to the *_dropped output
# and joins the COSMIC64 column into originalfile on columns 3-7.
if [[ "$cosmic64" == "Y" && "$buildver" == "hg19" ]]
then
  echo -e "\nCOSMIC64 Annotation"
  "$scriptsdir/annotate_variation.pl" --filter --buildver "$buildver" -dbtype cosmic64 annovarinput "$humandb" 2>&1

  annovarout="annovarinput.${buildver}_cosmic64_dropped"
  # The literal double quotes around $vcfheader are part of the inserted
  # header text; kept exactly as before.
  sed -i '1i\db\tCOSMIC64\tchromosome\tstart\tend\treference\talleleSeq"'"$vcfheader"'"' "$annovarout"
  joinresults originalfile "$annovarout" 3 4 5 6 7 B.COSMIC64
fi
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
1061
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
# COSMIC65 annotation; only attempted when the build version is hg19.
# Runs ANNOVAR in filter mode, prepends a header line to the *_dropped output
# and joins the COSMIC65 column into originalfile on columns 3-7.
if [[ "$cosmic65" == "Y" && "$buildver" == "hg19" ]]
then
  echo -e "\nCOSMIC65 Annotation"
  "$scriptsdir/annotate_variation.pl" --filter --buildver "$buildver" -dbtype cosmic65 annovarinput "$humandb" 2>&1

  annovarout="annovarinput.${buildver}_cosmic65_dropped"
  # The literal double quotes around $vcfheader are part of the inserted
  # header text; kept exactly as before.
  sed -i '1i\db\tCOSMIC65\tchromosome\tstart\tend\treference\talleleSeq"'"$vcfheader"'"' "$annovarout"
  joinresults originalfile "$annovarout" 3 4 5 6 7 B.COSMIC65
fi
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
1072
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
#cg46
# Run ANNOVAR in filter mode against the cg46 table, prepend a header line
# (column named by $cg46_colheader) to the *_dropped output and join that
# column into originalfile on columns 3-7.
if [[ "$cg46" == "Y" ]]
then
  echo -e "\nCG 46 genomes Annotation"
  "$scriptsdir/annotate_variation.pl" --filter --buildver "$buildver" -dbtype cg46 annovarinput "$humandb" 2>&1

  annovarout="annovarinput.${buildver}_cg46_dropped"
  # The literal double quotes around $vcfheader are part of the inserted
  # header text; kept exactly as before.
  sed -i '1i\db\t'"${cg46_colheader}"'\tchromosome\tstart\tend\treference\talleleSeq"'"$vcfheader"'"' "$annovarout"
  joinresults originalfile "$annovarout" 3 4 5 6 7 "B.${cg46_colheader}"
fi
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
1084
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
1085
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
#cg69
# Run ANNOVAR in filter mode against the cg69 table, prepend a header line
# (column named by $cg69_colheader) to the *_dropped output and join that
# column into originalfile on columns 3-7.
if [[ "$cg69" == "Y" ]]
then
  echo -e "\nCG 69 genomes Annotation"
  "$scriptsdir/annotate_variation.pl" --filter --buildver "$buildver" -dbtype cg69 annovarinput "$humandb" 2>&1

  annovarout="annovarinput.${buildver}_cg69_dropped"
  # The literal double quotes around $vcfheader are part of the inserted
  # header text; kept exactly as before.
  sed -i '1i\db\t'"${cg69_colheader}"'\tchromosome\tstart\tend\treference\talleleSeq"'"$vcfheader"'"' "$annovarout"
  joinresults originalfile "$annovarout" 3 4 5 6 7 "B.${cg69_colheader}"
fi
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
1097
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
1098
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
1099
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
# Produce originalfile_coords from originalfile.
# When $convertcoords is "Y", every data row (the first line is passed through
# unchanged as the header) is rewritten:
#   - the chromosome column gets a "chr" prefix
#   - snp / sub: start column is decremented by 1
#   - ins:       reference column is emptied
#   - del:       start column is decremented by 1 and observed column is emptied
# Otherwise originalfile is simply renamed to originalfile_coords.
# NOTE(review): presumably this undoes a coordinate conversion applied earlier
# in the script -- confirm against the forward conversion.
if [[ "$convertcoords" == "Y" ]]
then
  echo "converting back coordinates"
  # Column indexes are handed to awk with -v instead of being spliced into
  # the program text, so the awk source stays a fixed single-quoted string.
  awk -v chrcol="$chrcol" \
      -v startcol="$startcol" \
      -v refcol="$refcol" \
      -v obscol="$obscol" \
      -v vartypecol="$vartypecol" '
    BEGIN {
      FS = "\t"
      OFS = "\t"
    }
    FNR == 1 {
      # header line: copy verbatim
      print $0
      next
    }
    {
      $chrcol = "chr" $chrcol
      if ($vartypecol == "snp") { $startcol -= 1 }
      if ($vartypecol == "ins") { $refcol = "" }
      if ($vartypecol == "del") { $startcol -= 1; $obscol = "" }
      if ($vartypecol == "sub") { $startcol -= 1 }
      print $0
    }' originalfile > originalfile_coords
else
  mv originalfile originalfile_coords
fi
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
1124
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
1125 #restore "chr" prefix?
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
1126
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
#move to outputfile
# If ANNOVAR's invalid-input report is missing or empty, write a placeholder
# message into it so the copy below always has content to deliver.
if [[ ! -s annovarinput.invalid_input ]]
then
  echo "Congrats, your input file contained no invalid lines!" > annovarinput.invalid_input
fi

# Deliver the annotated table and the invalid-input report to the output
# paths; destinations are quoted so paths with spaces survive intact.
cp originalfile_coords "$outfile_all"
cp annovarinput.invalid_input "$outfile_invalid" 2>&1
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
1135 fi #if $dorunannovar
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
1136
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
1137
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
1138
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
1139
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
1140
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
1141 ############################################
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
1142 #
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
1143 # Filter Annotated Variants
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
1144 #
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
1145 ############################################
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
1146
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
1147
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
# Apply the configured frequency/presence filters to the annotated variants
# and copy the result to $outfile_filt.
if [[ "$dofilter" == "Y" ]]
then
  echo "starting filtering"
  # NOTE(review): when the annotation stage above ran with convertcoords != "Y",
  # originalfile has been renamed to originalfile_coords, so this copy would
  # fail -- confirm which file is meant to be the filter input.
  cp originalfile filteredfile

  ### do the filtering
  # usage: runfilter <file> <column name> <threshold>
  #        (threshold: -1=do not filter, 0=filter any value)
  # Arguments are quoted so that an empty column header cannot shift the
  # threshold into the column-name position.

  #1000genomes
  runfilter filteredfile "${g1000_colheader_ALL}" "${threshold_1000g_ALL}"
  runfilter filteredfile "${g1000_colheader_AFR}" "${threshold_1000g_AFR}"
  runfilter filteredfile "${g1000_colheader_AMR}" "${threshold_1000g_AMR}"
  runfilter filteredfile "${g1000_colheader_ASN}" "${threshold_1000g_ASN}"
  runfilter filteredfile "${g1000_colheader_EUR}" "${threshold_1000g_EUR}"

  #esp
  runfilter filteredfile "${esp6500_colheader_ALL}" "${threshold_ESP6500_ALL}"
  runfilter filteredfile "${esp6500_colheader_EA}" "${threshold_ESP6500_EA}"
  runfilter filteredfile "${esp6500_colheader_AA}" "${threshold_ESP6500_AA}"

  #dbsnp
  # $filt_dbsnpstr is deliberately left unquoted: it is split on whitespace
  # into the individual versions to filter on.
  for version in $filt_dbsnpstr
  do
    # "None" ends the loop; any entries after it are not processed
    if [[ "$version" == "None" ]]
    then
      break
    fi
    # The threshold "text" is meant to filter any non-empty string in that
    # field. NOTE(review): the earlier comment here referred to -42 as that
    # sentinel -- confirm which value runfilter actually expects.
    runfilter filteredfile "db$version" "text"
  done

  #complete genomics
  runfilter filteredfile "${cg46_colheader}" "${threshold_cg46}"
  runfilter filteredfile "${cg69_colheader}" "${threshold_cg69}"

  #move filtered output file to galaxy output file
  cp filteredfile "$outfile_filt"
fi
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
1187
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
1188
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
1189
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
1190
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
1191
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
1192
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
1193
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
1194
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
1195
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
1196
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
1197
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
1198
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
1199
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
1200
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
1201
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
1202
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
1203