annotate tools/annovar/annovar.sh @ 8:d6af2a78617f draft

added support for databases upto 4 march 2016
author saskia-hiltemann
date Fri, 04 Mar 2016 11:32:50 -0500
parents 69e2067a120d
children f7ff063c738e
Ignore whitespace changes - Everywhere: Within whitespace: At end of lines:
rev   line source
0
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
#!/bin/bash

# Debug flag: code that checks it prints extra diagnostics when it is "Y".
test='N'

# Default value of the filtering switch (declared as the --dofilter option).
dofilter='N'
0
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
5
2
565c0e690238 Added support for LJB2, COSMIC67, CLINVAR and NCI60.
saskia-hiltemann
parents: 0
diff changeset
6 #########################
8
d6af2a78617f added support for databases upto 4 march 2016
saskia-hiltemann
parents: 7
diff changeset
7 # DEFINE SOME
d6af2a78617f added support for databases upto 4 march 2016
saskia-hiltemann
parents: 7
diff changeset
8 # FUNCTIONS
2
565c0e690238 Added support for LJB2, COSMIC67, CLINVAR and NCI60.
saskia-hiltemann
parents: 0
diff changeset
9 #########################
0
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
10
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
# Print the (placeholder) usage line for this script on stdout.
# Does not exit; the caller carries on after the message.
usage() {
    printf 'usage: %s todo\n' "$0"
}
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
14
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
#######################################
# Filter the data rows of a tab-separated file in place, based on one column
# that is looked up by its header name.
#
# A data row is kept when
#   - its value in the column is empty, or
#   - its value is smaller than the threshold.
# The header row is always kept. With threshold "text" every row that has a
# non-empty value in the column is dropped. With threshold "-1" nothing is
# done at all.
#
# Arguments:
#   $1 - file to filter (rewritten in place via ./tmpfile)
#   $2 - header name of the column to test
#   $3 - threshold: a number, "text", or "-1" to skip filtering
# Outputs:
#   progress messages and a dump of the input file on stdout
# Returns:
#   0 when filtering was skipped or done, non-zero if awk or mv failed
#######################################
function runfilter(){
    local ifile=$1
    local columnname=$2
    local threshold=$3
    local column

    if [[ $threshold == "-1" ]]
    then
        echo "not filtering"
        return
    fi

    echo "filtering: $columnname, $threshold"
    # NOTE(review): dumps the complete input to stdout; looks like leftover
    # debugging but is kept because callers may capture this output.
    cat "$ifile"

    #get column number corresponding to column header
    # The name is handed over with -v instead of being pasted into the awk
    # source, so quotes in the name cannot break or alter the program.
    # Appending "" forces a string comparison of the header cells.
    column=$(awk -v name="$columnname" 'BEGIN{
            FS="\t";
            col=-1
        }
        FNR==1{
            for(i=1;i<=NF;i++){
                if(($i "") == (name ""))
                    col=i
            }
            print col
            exit
        }' "$ifile")

    # column is empty when the file is empty or unreadable; treat that the
    # same as a missing column instead of tripping over an empty test operand.
    if [[ -z $column || $column == -1 ]]
    then
        echo "no such column, exiting"
        return
    fi

    #perform filtering using the threshold
    # thr comes in through -v, so a numeric-looking threshold is compared
    # numerically against numeric-looking fields (10 is not < 9.5, 1e-5 is
    # < 0.05). A quoted literal in the program text would force a string
    # comparison.
    if awk -v col="$column" -v thr="$threshold" 'BEGIN{
            FS="\t";
            OFS="\t";
        }
        FNR==1{
            print $0
            next
        }
        {
            if( $col == "" )                  # empty column, then print
                print $0
            else if ((thr "") == "text"){}    # if set to text dont check threshold
            else if ($col < thr)              # else do check it
                print $0
        }' "$ifile" > tmpfile
    then
        mv -- tmpfile "$ifile"
    else
        # Never replace the input with a partial result.
        rm -f -- tmpfile
        return 1
    fi
}
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
68
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
#######################################
# Add annotation columns from a result file to the original variants file.
#
# arguments: originalfile,resultfile,chrcol,startcol,endcol,refcol,obscol,addcols
#   $1    - original (tab-separated) file; it is replaced by the joined table
#   $2    - result file whose columns are to be added
#   $3-$7 - column numbers in the RESULT file of chr, start, end, ref and obs
#   $8    - columns to add, in cgatools select syntax, e.g. "B.col1,B.col2"
#
# Globals read:
#   chrcol, startcol, endcol, refcol, obscol - column numbers of the same
#     five keys in the ORIGINAL file
# Globals written:
#   test - reset to "N" (debug output of this function off)
#
# When the result file is empty, the new header names are appended to the
# header row and every data row is padded with one empty field per added
# column. Otherwise rows are matched on the five keys with `cgatools join`.
# Scratch files ./tempofile and ./temporiginal are used.
#######################################
function joinresults(){
    local ofile=$1
    local rfile=$2
    local colchr=$3
    local colstart=$4
    local colend=$5
    local colref=$6
    local colobs=$7
    local addcols=$8 #e.g. "B.col1,B.col2"

    # NOTE(review): this overwrites the script-wide debug flag on every call.
    test="N"

    # echo "joining result with original file"
    if [[ $test == "Y" ]]
    then
        echo "ofile: $ofile"
        head "$ofile"
        echo "rfile: $rfile"
        head "$rfile"
    fi

    # if empty results file, just add header fields
    if [[ ! -s $rfile ]]
    then
        local tab=$'\t'
        local dummycol=${addcols:2}              # drop the leading "B."
        local outputcol=${dummycol//,B./$tab}    # one header cell per added column
        local commas=${addcols//[^,]/}
        local ncols=$(( ${#commas} + 1 ))        # number of added columns

        if awk -v header="$outputcol" -v ncols="$ncols" 'BEGIN{FS="\t";OFS="\t"}{
                if(FNR==1)
                    print $0,header;
                else{
                    # "%s" keeps a literal % in the data from being read as a
                    # format directive
                    printf "%s", $0
                    # exactly one empty field per added column, so data rows
                    # are as wide as the header
                    for(i=0;i<ncols;i++)
                        printf "\t"
                    printf "\n"
                }
            }' "$ofile" > tempofile
        then
            mv -- tempofile "$ofile"
        else
            rm -f -- tempofile
            return 1
        fi
        return
    fi

    # header names of the key columns in the result file, for cgatools join
    local col_chr_name col_start_name col_end_name col_ref_name col_obs_name
    col_chr_name=$(head -1 "$rfile" | cut -f"${colchr}")
    col_start_name=$(head -1 "$rfile" | cut -f"${colstart}")
    col_end_name=$(head -1 "$rfile" | cut -f"${colend}")
    col_ref_name=$(head -1 "$rfile" | cut -f"${colref}")
    col_obs_name=$(head -1 "$rfile" | cut -f"${colobs}")

    # header names of the key columns in the original file (positions come
    # from the global chrcol/startcol/endcol/refcol/obscol)
    local chr_name start_name end_name ref_name obs_name
    chr_name=$(head -1 "$ofile" | cut -f"${chrcol}")
    start_name=$(head -1 "$ofile" | cut -f"${startcol}")
    end_name=$(head -1 "$ofile" | cut -f"${endcol}")
    ref_name=$(head -1 "$ofile" | cut -f"${refcol}")
    obs_name=$(head -1 "$ofile" | cut -f"${obscol}")

    if [[ $test == "Y" ]]
    then
        echo "input file"
        echo "chr col: $col_chr_name ($colchr)"
        echo "start col: $col_start_name ($colstart)"
        echo "end col: $col_end_name ($colend)"
        echo "ref col: $col_ref_name ($colref)"
        echo "obs col: $col_obs_name ($colobs)"
        echo ""
        echo "annotation file"
        echo "chr col: $chr_name ($chrcol)"
        echo "start col: $start_name ($startcol)"
        echo "end col: $end_name ($endcol)"
        echo "ref col: $ref_name ($refcol)"
        echo "obs col: $obs_name ($obscol)"
    fi

    #perform join
    # Everything is quoted: "A.*" must reach cgatools literally and must not
    # be expanded by the shell against files in the working directory.
    cgatools join --beta \
        --input "$ofile" "$rfile" \
        --output temporiginal \
        --match "${chr_name}:${col_chr_name}" \
        --match "${start_name}:${col_start_name}" \
        --match "${end_name}:${col_end_name}" \
        --match "${ref_name}:${col_ref_name}" \
        --match "${obs_name}:${col_obs_name}" \
        --select "A.*,$addcols" \
        --always-dump \
        --output-mode compact

    #replace originalfile
    sed -i 's/^>//g' temporiginal #join sometimes adds a '>' symbol to header
    # Write back to the file that was passed in, as the empty-result branch
    # does, rather than to a hard-coded name.
    mv -- temporiginal "$ofile"

    if [[ $test == "Y" ]]
    then
        echo "joining complete"
        head "$ofile"
        echo ""
    fi
}
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
170
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
171
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
172
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
173
2
565c0e690238 Added support for LJB2, COSMIC67, CLINVAR and NCI60.
saskia-hiltemann
parents: 0
diff changeset
174 #################################
565c0e690238 Added support for LJB2, COSMIC67, CLINVAR and NCI60.
saskia-hiltemann
parents: 0
diff changeset
175 #
8
d6af2a78617f added support for databases upto 4 march 2016
saskia-hiltemann
parents: 7
diff changeset
176 # PARSE PARAMETERS
2
565c0e690238 Added support for LJB2, COSMIC67, CLINVAR and NCI60.
saskia-hiltemann
parents: 0
diff changeset
177 #
565c0e690238 Added support for LJB2, COSMIC67, CLINVAR and NCI60.
saskia-hiltemann
parents: 0
diff changeset
178 #################################
565c0e690238 Added support for LJB2, COSMIC67, CLINVAR and NCI60.
saskia-hiltemann
parents: 0
diff changeset
179
565c0e690238 Added support for LJB2, COSMIC67, CLINVAR and NCI60.
saskia-hiltemann
parents: 0
diff changeset
180
8
d6af2a78617f added support for databases upto 4 march 2016
saskia-hiltemann
parents: 7
diff changeset
# Show the usage line when the script is called without any argument. This
# has to be tested before the positional parameters are replaced below:
# afterwards they always contain at least the "--" terminator.
if [ $# -eq 0 ]
then
    usage
fi

# Let getopt normalise the command line (-a also accepts long options that
# are written with a single dash). The output is captured first so that the
# exit status tested by "|| usage" is really getopt's, and it is produced in
# quoted mode and re-read with eval so that values containing blanks or glob
# characters, and empty values, survive unchanged.
parsed_opts=$(getopt -n "$0" -a --longoptions="inputfile: buildver: humandb: varfile: VCF: chrcol: startcol: endcol: refcol: obscol: vartypecol: convertcoords: geneanno: hgvs: verdbsnp: tfbs: mce: cytoband: segdup: dgv: gwas: ver1000g: cg46: cg69: impactscores: newimpactscores: otherinfo: esp: exac03: exac03nonpsych: exac03nontcga: dbscsnv11: kaviar_20150923: hrcr1: mitimpact2: mitimpact24: dbnsfp30a: spidex: gonl: gerp: cosmic61: cosmic63: cosmic64: cosmic65: cosmic67: cosmic68: clinvar: nci60: outall: outfilt: outinvalid: scriptsdir: dorunannovar: dofilter: filt_dbsnp: filt1000GALL: filt1000GAFR: filt1000GAMR: filt1000GASN: filt1000GEUR: filtESP6500ALL: filtESP6500EA: filtESP6500AA: filtcg46: filtcg69: dummy:" "h:" "$@") || usage
eval set -- "$parsed_opts"

# Every option takes exactly one value: the arm stores $2 and shifts once,
# the shift after esac then removes the option name itself.
while [ $# -gt 0 ]
do
    case "$1" in
        --inputfile)        infile=$2;shift;;                # inputfile
        --buildver)         buildvertmp=$2;shift;;           # hg18 or hg19
        --humandb)          humandbtmp=$2;shift;;            # location of humandb database
        --varfile)          varfile=$2;shift;;               # Y or N
        --VCF)              vcf=$2;shift;;                   # Y or N
        --chrcol)           chrcol=$2;shift;;                # which column has chr
        --startcol)         startcol=$2;shift;;              # which column has start coord
        --endcol)           endcol=$2;shift;;                # which column has end coord
        --refcol)           refcol=$2;shift;;                # which column has ref allele
        --obscol)           obscol=$2;shift;;                # which column has alt allele
        --vartypecol)       vartypecol=$2;shift;;            # which column has vartype
        --convertcoords)    convertcoords=$2;shift;;         # Y or N convert coordinate from CG to 1-based?
        --geneanno)         geneanno=$2;shift;;              # comma-separated list of strings refSeq, knowngene, ensgene
        --hgvs)             hgvs=$2;shift;;
        --verdbsnp)         verdbsnp=$2;shift;;              # comma-separated list of dbsnp version to annotate with (e.g. "132,135NonFlagged,137,138")
        --tfbs)             tfbs=$2;shift;;                  # Y or N
        --mce)              mce=$2;shift;;                   # Y or N
        --cytoband)         cytoband=$2;shift;;              # Y or N
        --segdup)           segdup=$2;shift;;                # Y or N
        --dgv)              dgv=$2;shift;;                   # Y or N
        --gwas)             gwas=$2;shift;;                  # Y or N
        --ver1000g)         ver1000g=$2;shift;;              # Y or N
        --cg46)             cg46=$2;shift;;                  # Y or N
        --cg69)             cg69=$2;shift;;                  # Y or N
        --impactscores)     impactscores=$2;shift;;          # Y or N
        --newimpactscores)  newimpactscores=$2;shift;;       # Y or N
        --otherinfo)        otherinfo=$2;shift;;             # display additional columns?
        --scriptsdir)       scriptsdirtmp=$2;shift;;         # scripts directory (kept in scriptsdirtmp)
        --esp)              esp=$2;shift;;                   # Y or N
        --exac03)           exac03=$2;shift;;                # Y or N
        --exac03nonpsych)   exac03nonpsych=$2;shift;;        # Y or N
        --exac03nontcga)    exac03nontcga=$2;shift;;         # Y or N
        --dbscsnv11)        dbscsnv11=$2;shift;;
        --kaviar_20150923)  kaviar_20150923=$2;shift;;
        --hrcr1)            hrcr1=$2;shift;;
        --mitimpact2)       mitimpact2=$2;shift;;
        --mitimpact24)      mitimpact24=$2;shift;;
        --dbnsfp30a)        dbnsfp30a=$2;shift;;
        --gonl)             gonl=$2;shift;;                  # Y or N
        --spidex)           spidex=$2;shift;;                # Y or N
        --gerp)             gerp=$2;shift;;                  # Y or N
        --cosmic61)         cosmic61=$2;shift;;              # Y or N
        --cosmic63)         cosmic63=$2;shift;;              # Y or N
        --cosmic64)         cosmic64=$2;shift;;              # Y or N
        --cosmic65)         cosmic65=$2;shift;;              # Y or N
        --cosmic67)         cosmic67=$2;shift;;              # Y or N
        --cosmic68)         cosmic68=$2;shift;;              # Y or N
        --nci60)            nci60=$2;shift;;                 # Y or N
        --clinvar)          clinvar=$2;shift;;               # Y or N
        --dofilter)         dofilter=$2;shift;;              # Y or N
        --filt_dbsnp)       filt_dbsnp=$2;shift;;            # Y or N
        --filt1000GALL)     threshold_1000g_ALL=$2;shift;;   # threshold value
        --filt1000GAFR)     threshold_1000g_AFR=$2;shift;;   # threshold value
        --filt1000GAMR)     threshold_1000g_AMR=$2;shift;;   # threshold value
        --filt1000GASN)     threshold_1000g_ASN=$2;shift;;   # threshold value
        --filt1000GEUR)     threshold_1000g_EUR=$2;shift;;   # threshold value
        --filtESP6500ALL)   threshold_ESP6500_ALL=$2;shift;; # threshold value
        --filtESP6500EA)    threshold_ESP6500_EA=$2;shift;;  # threshold value
        --filtESP6500AA)    threshold_ESP6500_AA=$2;shift;;  # threshold value
        --filtcg46)         threshold_cg46=$2;shift;;
        --filtcg69)         threshold_cg69=$2;shift;;
        --outall)           outfile_all=$2;shift;;           # file
        --outfilt)          outfile_filt=$2;shift;;          # file
        --outinvalid)       outfile_invalid=$2;shift;;       # file
        --dorunannovar)     dorunannovar=$2;shift;;          # Y or N
        # --dofilter (above) and --dummy are declared in the long option
        # list; without an arm of their own they would reach "-*", their
        # value would become $1 and "*) break" would silently end the parsing.
        --dummy)            shift;;                          # value is accepted and ignored
        -h)                 shift;;                          # declared as "h:", so skip its value
        --)                 shift;break;;
        -*)                 usage;;
        *)                  break;;
    esac
    shift
done
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
260
2
565c0e690238 Added support for LJB2, COSMIC67, CLINVAR and NCI60.
saskia-hiltemann
parents: 0
diff changeset
261 # Galaxy sometimes garbles these variables after updates. If a value is a comma-separated list, strip everything from the last comma onward (with a two-item list this keeps only the first item)
565c0e690238 Added support for LJB2, COSMIC67, CLINVAR and NCI60.
saskia-hiltemann
parents: 0
diff changeset
262 humandb=${humandbtmp%,*}
565c0e690238 Added support for LJB2, COSMIC67, CLINVAR and NCI60.
saskia-hiltemann
parents: 0
diff changeset
263 buildver=${buildvertmp%,*}
565c0e690238 Added support for LJB2, COSMIC67, CLINVAR and NCI60.
saskia-hiltemann
parents: 0
diff changeset
264 scriptsdir=${scriptsdirtmp%,*}
565c0e690238 Added support for LJB2, COSMIC67, CLINVAR and NCI60.
saskia-hiltemann
parents: 0
diff changeset
265
0
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
266
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
267 if [ $test == "Y" ]
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
268 then
8
d6af2a78617f added support for databases upto 4 march 2016
saskia-hiltemann
parents: 7
diff changeset
269 echo "dorunannovar: $dorunannovar"
d6af2a78617f added support for databases upto 4 march 2016
saskia-hiltemann
parents: 7
diff changeset
270 echo "infile: $infile"
d6af2a78617f added support for databases upto 4 march 2016
saskia-hiltemann
parents: 7
diff changeset
271 echo "buildver: $buildver"
d6af2a78617f added support for databases upto 4 march 2016
saskia-hiltemann
parents: 7
diff changeset
272 echo "annovardb: $humandb"
d6af2a78617f added support for databases upto 4 march 2016
saskia-hiltemann
parents: 7
diff changeset
273 echo "verdbnsp: $verdbsnp"
d6af2a78617f added support for databases upto 4 march 2016
saskia-hiltemann
parents: 7
diff changeset
274 echo "geneanno: $geneanno"
d6af2a78617f added support for databases upto 4 march 2016
saskia-hiltemann
parents: 7
diff changeset
275 echo "tfbs: $tfbs"
d6af2a78617f added support for databases upto 4 march 2016
saskia-hiltemann
parents: 7
diff changeset
276 echo "mce: $mce"
d6af2a78617f added support for databases upto 4 march 2016
saskia-hiltemann
parents: 7
diff changeset
277 echo "cytoband: $cytoband"
d6af2a78617f added support for databases upto 4 march 2016
saskia-hiltemann
parents: 7
diff changeset
278 echo "segdup: $segdup"
d6af2a78617f added support for databases upto 4 march 2016
saskia-hiltemann
parents: 7
diff changeset
279 echo "dgv: $dgv"
d6af2a78617f added support for databases upto 4 march 2016
saskia-hiltemann
parents: 7
diff changeset
280 echo "gwas: $gwas"
d6af2a78617f added support for databases upto 4 march 2016
saskia-hiltemann
parents: 7
diff changeset
281 echo "g1000: ${g1000}"
d6af2a78617f added support for databases upto 4 march 2016
saskia-hiltemann
parents: 7
diff changeset
282 echo "cg46: ${cg46}"
d6af2a78617f added support for databases upto 4 march 2016
saskia-hiltemann
parents: 7
diff changeset
283 echo "cg69: ${cg69}"
d6af2a78617f added support for databases upto 4 march 2016
saskia-hiltemann
parents: 7
diff changeset
284 echo "impactscores: $impactscores"
d6af2a78617f added support for databases upto 4 march 2016
saskia-hiltemann
parents: 7
diff changeset
285 echo "impactscores: $newimpactscores"
d6af2a78617f added support for databases upto 4 march 2016
saskia-hiltemann
parents: 7
diff changeset
286 echo "esp: $esp"
d6af2a78617f added support for databases upto 4 march 2016
saskia-hiltemann
parents: 7
diff changeset
287 echo "gerp: $gerp"
d6af2a78617f added support for databases upto 4 march 2016
saskia-hiltemann
parents: 7
diff changeset
288 echo "cosmic: $cosmic"
d6af2a78617f added support for databases upto 4 march 2016
saskia-hiltemann
parents: 7
diff changeset
289 echo "outfile: $outfile_all"
d6af2a78617f added support for databases upto 4 march 2016
saskia-hiltemann
parents: 7
diff changeset
290 echo "outinvalid: $outfile_invalid"
d6af2a78617f added support for databases upto 4 march 2016
saskia-hiltemann
parents: 7
diff changeset
291 echo "outfiltered: $outfile_filt"
d6af2a78617f added support for databases upto 4 march 2016
saskia-hiltemann
parents: 7
diff changeset
292 echo "varfile: $varfile"
d6af2a78617f added support for databases upto 4 march 2016
saskia-hiltemann
parents: 7
diff changeset
293 echo "vcf" $vcf
d6af2a78617f added support for databases upto 4 march 2016
saskia-hiltemann
parents: 7
diff changeset
294 echo "chrcol: $chrcol"
d6af2a78617f added support for databases upto 4 march 2016
saskia-hiltemann
parents: 7
diff changeset
295 echo "startcol: $startcol"
d6af2a78617f added support for databases upto 4 march 2016
saskia-hiltemann
parents: 7
diff changeset
296 echo "endcol: $endcol"
d6af2a78617f added support for databases upto 4 march 2016
saskia-hiltemann
parents: 7
diff changeset
297 echo "refcol: $refcol"
d6af2a78617f added support for databases upto 4 march 2016
saskia-hiltemann
parents: 7
diff changeset
298 echo "obscol: $obscol"
d6af2a78617f added support for databases upto 4 march 2016
saskia-hiltemann
parents: 7
diff changeset
299 echo "convertcoords: $convertcoords"
d6af2a78617f added support for databases upto 4 march 2016
saskia-hiltemann
parents: 7
diff changeset
300 echo "vartypecol: $vartypecol"
d6af2a78617f added support for databases upto 4 march 2016
saskia-hiltemann
parents: 7
diff changeset
301 echo "dofilter: $dofilter"
d6af2a78617f added support for databases upto 4 march 2016
saskia-hiltemann
parents: 7
diff changeset
302 echo "threshold_1000g_ALL : $threshold_1000g_ALL"
d6af2a78617f added support for databases upto 4 march 2016
saskia-hiltemann
parents: 7
diff changeset
303 echo "threshold_1000g_AFR : $threshold_1000g_AFR"
d6af2a78617f added support for databases upto 4 march 2016
saskia-hiltemann
parents: 7
diff changeset
304 echo "threshold_1000g_AMR : $threshold_1000g_AMR"
d6af2a78617f added support for databases upto 4 march 2016
saskia-hiltemann
parents: 7
diff changeset
305 echo "threshold_1000g_ASN : $threshold_1000g_ASN"
d6af2a78617f added support for databases upto 4 march 2016
saskia-hiltemann
parents: 7
diff changeset
306 echo "threshold_1000g_EUR : $threshold_1000g_EUR"
d6af2a78617f added support for databases upto 4 march 2016
saskia-hiltemann
parents: 7
diff changeset
307 echo "threshold_ESP6500_ALL: $threshold_ESP6500_ALL"
d6af2a78617f added support for databases upto 4 march 2016
saskia-hiltemann
parents: 7
diff changeset
308 echo "threshold_ESP6500_EA : $threshold_ESP6500_EA"
d6af2a78617f added support for databases upto 4 march 2016
saskia-hiltemann
parents: 7
diff changeset
309 echo "threshold_ESP6500_AA : $threshold_ESP6500_AA"
0
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
310 fi
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
311
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
312
2
565c0e690238 Added support for LJB2, COSMIC67, CLINVAR and NCI60.
saskia-hiltemann
parents: 0
diff changeset
313
565c0e690238 Added support for LJB2, COSMIC67, CLINVAR and NCI60.
saskia-hiltemann
parents: 0
diff changeset
314 ############################################
565c0e690238 Added support for LJB2, COSMIC67, CLINVAR and NCI60.
saskia-hiltemann
parents: 0
diff changeset
315 #
565c0e690238 Added support for LJB2, COSMIC67, CLINVAR and NCI60.
saskia-hiltemann
parents: 0
diff changeset
316 # Annotate Variants
565c0e690238 Added support for LJB2, COSMIC67, CLINVAR and NCI60.
saskia-hiltemann
parents: 0
diff changeset
317 #
565c0e690238 Added support for LJB2, COSMIC67, CLINVAR and NCI60.
saskia-hiltemann
parents: 0
diff changeset
318 ############################################
565c0e690238 Added support for LJB2, COSMIC67, CLINVAR and NCI60.
saskia-hiltemann
parents: 0
diff changeset
319
8
d6af2a78617f added support for databases upto 4 march 2016
saskia-hiltemann
parents: 7
diff changeset
320 # parse geneanno param
0
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
321 refgene="N"
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
322 knowngene="N"
8
d6af2a78617f added support for databases upto 4 march 2016
saskia-hiltemann
parents: 7
diff changeset
323 ensgene="N"
2
565c0e690238 Added support for LJB2, COSMIC67, CLINVAR and NCI60.
saskia-hiltemann
parents: 0
diff changeset
324
0
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
325 if [[ $geneanno =~ "refSeq" ]]
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
326 then
8
d6af2a78617f added support for databases upto 4 march 2016
saskia-hiltemann
parents: 7
diff changeset
327 refgene="Y"
0
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
328 fi
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
329 if [[ $geneanno =~ "knowngene" ]]
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
330 then
8
d6af2a78617f added support for databases upto 4 march 2016
saskia-hiltemann
parents: 7
diff changeset
331 knowngene="Y"
0
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
332 fi
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
333 if [[ $geneanno =~ "ensgene" ]]
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
334 then
8
d6af2a78617f added support for databases upto 4 march 2016
saskia-hiltemann
parents: 7
diff changeset
335 ensgene="Y"
0
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
336 fi
2
565c0e690238 Added support for LJB2, COSMIC67, CLINVAR and NCI60.
saskia-hiltemann
parents: 0
diff changeset
337 if [ $hgvs == "N" ]
565c0e690238 Added support for LJB2, COSMIC67, CLINVAR and NCI60.
saskia-hiltemann
parents: 0
diff changeset
338 then
8
d6af2a78617f added support for databases upto 4 march 2016
saskia-hiltemann
parents: 7
diff changeset
339 hgvs=""
2
565c0e690238 Added support for LJB2, COSMIC67, CLINVAR and NCI60.
saskia-hiltemann
parents: 0
diff changeset
340 fi
0
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
341
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
342 #parse verdbsnp/1000g/esp strings
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
343 dbsnpstr=${verdbsnp//,/ }
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
344 filt_dbsnpstr=${filt_dbsnp//,/ }
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
345 g1000str=${ver1000g//,/ }
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
346 espstr=${esp//,/ }
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
347
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
348 if [ $test == "Y" ]
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
349 then
8
d6af2a78617f added support for databases upto 4 march 2016
saskia-hiltemann
parents: 7
diff changeset
350 echo "annotate dbsnp: $dbsnpstr"
d6af2a78617f added support for databases upto 4 march 2016
saskia-hiltemann
parents: 7
diff changeset
351 echo "annotate esp: $espstr"
d6af2a78617f added support for databases upto 4 march 2016
saskia-hiltemann
parents: 7
diff changeset
352 echo "filter dbsnp: $filt_dbsnpstr"
0
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
353 fi
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
354
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
355 mutationtaster="N"
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
356 avsift="N"
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
357 lrt="N"
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
358 polyphen2="N"
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
359 phylop="N"
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
360 ljbsift="N"
2
565c0e690238 Added support for LJB2, COSMIC67, CLINVAR and NCI60.
saskia-hiltemann
parents: 0
diff changeset
361
565c0e690238 Added support for LJB2, COSMIC67, CLINVAR and NCI60.
saskia-hiltemann
parents: 0
diff changeset
362 #parse old impactscores param (obsolete)
0
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
363 if [[ $impactscores =~ "mutationtaster" ]]
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
364 then
8
d6af2a78617f added support for databases upto 4 march 2016
saskia-hiltemann
parents: 7
diff changeset
365 mutationtaster="Y"
0
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
366 fi
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
367 if [[ $impactscores =~ "sift" ]]
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
368 then
8
d6af2a78617f added support for databases upto 4 march 2016
saskia-hiltemann
parents: 7
diff changeset
369 avsift="Y"
0
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
370 fi
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
371 if [[ $impactscores =~ "lrt" ]]
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
372 then
8
d6af2a78617f added support for databases upto 4 march 2016
saskia-hiltemann
parents: 7
diff changeset
373 lrt="Y"
0
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
374 fi
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
375 if [[ $impactscores =~ "ljbsift" ]]
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
376 then
8
d6af2a78617f added support for databases upto 4 march 2016
saskia-hiltemann
parents: 7
diff changeset
377 ljbsift="Y"
0
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
378 fi
2
565c0e690238 Added support for LJB2, COSMIC67, CLINVAR and NCI60.
saskia-hiltemann
parents: 0
diff changeset
379 if [[ $impactscores =~ "ljb2sift" ]]
565c0e690238 Added support for LJB2, COSMIC67, CLINVAR and NCI60.
saskia-hiltemann
parents: 0
diff changeset
380 then
8
d6af2a78617f added support for databases upto 4 march 2016
saskia-hiltemann
parents: 7
diff changeset
381 ljb2sift="Y"
2
565c0e690238 Added support for LJB2, COSMIC67, CLINVAR and NCI60.
saskia-hiltemann
parents: 0
diff changeset
382 fi
0
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
383 if [[ $impactscores =~ "pp2" ]]
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
384 then
8
d6af2a78617f added support for databases upto 4 march 2016
saskia-hiltemann
parents: 7
diff changeset
385 polyphen2="Y"
0
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
386 fi
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
387 if [[ $impactscores =~ "phylop" ]]
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
388 then
8
d6af2a78617f added support for databases upto 4 march 2016
saskia-hiltemann
parents: 7
diff changeset
389 phylop="Y"
0
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
390 fi
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
391
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
392 if [[ $varfile == "Y" ]]
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
393 then
8
d6af2a78617f added support for databases upto 4 march 2016
saskia-hiltemann
parents: 7
diff changeset
394 convertcoords="Y"
0
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
395 fi
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
396
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
397 # ljb refers to the Liu, Jian, Boerwinkle paper in Human Mutation (PubMed ID 21520341). Cite this paper if you use the scores.
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
398
2
565c0e690238 Added support for LJB2, COSMIC67, CLINVAR and NCI60.
saskia-hiltemann
parents: 0
diff changeset
399 ljb2_sift="N"
565c0e690238 Added support for LJB2, COSMIC67, CLINVAR and NCI60.
saskia-hiltemann
parents: 0
diff changeset
400 ljb2_pp2hdiv="N"
565c0e690238 Added support for LJB2, COSMIC67, CLINVAR and NCI60.
saskia-hiltemann
parents: 0
diff changeset
401 ljb2_pp2hvar="N"
565c0e690238 Added support for LJB2, COSMIC67, CLINVAR and NCI60.
saskia-hiltemann
parents: 0
diff changeset
402 ljb2_lrt="N"
565c0e690238 Added support for LJB2, COSMIC67, CLINVAR and NCI60.
saskia-hiltemann
parents: 0
diff changeset
403 ljb2_mt="N"
565c0e690238 Added support for LJB2, COSMIC67, CLINVAR and NCI60.
saskia-hiltemann
parents: 0
diff changeset
404 ljb2_ma="N"
565c0e690238 Added support for LJB2, COSMIC67, CLINVAR and NCI60.
saskia-hiltemann
parents: 0
diff changeset
405 ljb2_fathmm="N"
565c0e690238 Added support for LJB2, COSMIC67, CLINVAR and NCI60.
saskia-hiltemann
parents: 0
diff changeset
406 ljb2_gerp="N"
565c0e690238 Added support for LJB2, COSMIC67, CLINVAR and NCI60.
saskia-hiltemann
parents: 0
diff changeset
407 ljb2_phylop="N"
565c0e690238 Added support for LJB2, COSMIC67, CLINVAR and NCI60.
saskia-hiltemann
parents: 0
diff changeset
408 ljb2_siphy="N"
565c0e690238 Added support for LJB2, COSMIC67, CLINVAR and NCI60.
saskia-hiltemann
parents: 0
diff changeset
409
565c0e690238 Added support for LJB2, COSMIC67, CLINVAR and NCI60.
saskia-hiltemann
parents: 0
diff changeset
410 # parse ljb2 newimpactscores param
565c0e690238 Added support for LJB2, COSMIC67, CLINVAR and NCI60.
saskia-hiltemann
parents: 0
diff changeset
411 # ljb2_sift, ljb2_pp2hdiv, ljb2_pp2hvar, ljb2_lrt, ljb2_mt, ljb2_ma, ljb2_fathmm, ljb2_gerp++, ljb2_phylop, ljb2_siphy
565c0e690238 Added support for LJB2, COSMIC67, CLINVAR and NCI60.
saskia-hiltemann
parents: 0
diff changeset
412 if [[ $newimpactscores =~ "ljb2_sift" ]]
565c0e690238 Added support for LJB2, COSMIC67, CLINVAR and NCI60.
saskia-hiltemann
parents: 0
diff changeset
413 then
8
d6af2a78617f added support for databases upto 4 march 2016
saskia-hiltemann
parents: 7
diff changeset
414 ljb2_sift="Y"
2
565c0e690238 Added support for LJB2, COSMIC67, CLINVAR and NCI60.
saskia-hiltemann
parents: 0
diff changeset
415 fi
565c0e690238 Added support for LJB2, COSMIC67, CLINVAR and NCI60.
saskia-hiltemann
parents: 0
diff changeset
416 if [[ $newimpactscores =~ "ljb2_pp2hdiv" ]]
565c0e690238 Added support for LJB2, COSMIC67, CLINVAR and NCI60.
saskia-hiltemann
parents: 0
diff changeset
417 then
8
d6af2a78617f added support for databases upto 4 march 2016
saskia-hiltemann
parents: 7
diff changeset
418 ljb2_pp2hdiv="Y"
2
565c0e690238 Added support for LJB2, COSMIC67, CLINVAR and NCI60.
saskia-hiltemann
parents: 0
diff changeset
419 fi
565c0e690238 Added support for LJB2, COSMIC67, CLINVAR and NCI60.
saskia-hiltemann
parents: 0
diff changeset
420 if [[ $newimpactscores =~ "ljb2_pp2hvar" ]]
565c0e690238 Added support for LJB2, COSMIC67, CLINVAR and NCI60.
saskia-hiltemann
parents: 0
diff changeset
421 then
8
d6af2a78617f added support for databases upto 4 march 2016
saskia-hiltemann
parents: 7
diff changeset
422 ljb2_pp2hvar="Y"
2
565c0e690238 Added support for LJB2, COSMIC67, CLINVAR and NCI60.
saskia-hiltemann
parents: 0
diff changeset
423 fi
565c0e690238 Added support for LJB2, COSMIC67, CLINVAR and NCI60.
saskia-hiltemann
parents: 0
diff changeset
424 if [[ $newimpactscores =~ "ljb2_lrt" ]]
565c0e690238 Added support for LJB2, COSMIC67, CLINVAR and NCI60.
saskia-hiltemann
parents: 0
diff changeset
425 then
8
d6af2a78617f added support for databases upto 4 march 2016
saskia-hiltemann
parents: 7
diff changeset
426 ljb2_lrt="Y"
2
565c0e690238 Added support for LJB2, COSMIC67, CLINVAR and NCI60.
saskia-hiltemann
parents: 0
diff changeset
427 fi
565c0e690238 Added support for LJB2, COSMIC67, CLINVAR and NCI60.
saskia-hiltemann
parents: 0
diff changeset
428 if [[ $newimpactscores =~ "ljb2_mt" ]]
565c0e690238 Added support for LJB2, COSMIC67, CLINVAR and NCI60.
saskia-hiltemann
parents: 0
diff changeset
429 then
8
d6af2a78617f added support for databases upto 4 march 2016
saskia-hiltemann
parents: 7
diff changeset
430 ljb2_mt="Y"
2
565c0e690238 Added support for LJB2, COSMIC67, CLINVAR and NCI60.
saskia-hiltemann
parents: 0
diff changeset
431 fi
565c0e690238 Added support for LJB2, COSMIC67, CLINVAR and NCI60.
saskia-hiltemann
parents: 0
diff changeset
432 if [[ $newimpactscores =~ "ljb2_ma" ]]
565c0e690238 Added support for LJB2, COSMIC67, CLINVAR and NCI60.
saskia-hiltemann
parents: 0
diff changeset
433 then
8
d6af2a78617f added support for databases upto 4 march 2016
saskia-hiltemann
parents: 7
diff changeset
434 ljb2_ma="Y"
2
565c0e690238 Added support for LJB2, COSMIC67, CLINVAR and NCI60.
saskia-hiltemann
parents: 0
diff changeset
435 fi
565c0e690238 Added support for LJB2, COSMIC67, CLINVAR and NCI60.
saskia-hiltemann
parents: 0
diff changeset
436 if [[ $newimpactscores =~ "ljb2_fathmm" ]]
565c0e690238 Added support for LJB2, COSMIC67, CLINVAR and NCI60.
saskia-hiltemann
parents: 0
diff changeset
437 then
8
d6af2a78617f added support for databases upto 4 march 2016
saskia-hiltemann
parents: 7
diff changeset
438 ljb2_fathmm="Y"
2
565c0e690238 Added support for LJB2, COSMIC67, CLINVAR and NCI60.
saskia-hiltemann
parents: 0
diff changeset
439 fi
565c0e690238 Added support for LJB2, COSMIC67, CLINVAR and NCI60.
saskia-hiltemann
parents: 0
diff changeset
440 if [[ $newimpactscores =~ "ljb2_gerp" ]]
565c0e690238 Added support for LJB2, COSMIC67, CLINVAR and NCI60.
saskia-hiltemann
parents: 0
diff changeset
441 then
8
d6af2a78617f added support for databases upto 4 march 2016
saskia-hiltemann
parents: 7
diff changeset
442 ljb2_gerp="Y"
2
565c0e690238 Added support for LJB2, COSMIC67, CLINVAR and NCI60.
saskia-hiltemann
parents: 0
diff changeset
443 fi
565c0e690238 Added support for LJB2, COSMIC67, CLINVAR and NCI60.
saskia-hiltemann
parents: 0
diff changeset
444 if [[ $newimpactscores =~ "ljb2_phylop" ]]
565c0e690238 Added support for LJB2, COSMIC67, CLINVAR and NCI60.
saskia-hiltemann
parents: 0
diff changeset
445 then
8
d6af2a78617f added support for databases upto 4 march 2016
saskia-hiltemann
parents: 7
diff changeset
446 ljb2_phylop="Y"
2
565c0e690238 Added support for LJB2, COSMIC67, CLINVAR and NCI60.
saskia-hiltemann
parents: 0
diff changeset
447 fi
565c0e690238 Added support for LJB2, COSMIC67, CLINVAR and NCI60.
saskia-hiltemann
parents: 0
diff changeset
448 if [[ $newimpactscores =~ "ljb2_siphy" ]]
565c0e690238 Added support for LJB2, COSMIC67, CLINVAR and NCI60.
saskia-hiltemann
parents: 0
diff changeset
449 then
8
d6af2a78617f added support for databases upto 4 march 2016
saskia-hiltemann
parents: 7
diff changeset
450 ljb2_siphy="Y"
2
565c0e690238 Added support for LJB2, COSMIC67, CLINVAR and NCI60.
saskia-hiltemann
parents: 0
diff changeset
451 fi
565c0e690238 Added support for LJB2, COSMIC67, CLINVAR and NCI60.
saskia-hiltemann
parents: 0
diff changeset
452
565c0e690238 Added support for LJB2, COSMIC67, CLINVAR and NCI60.
saskia-hiltemann
parents: 0
diff changeset
453 if [ $otherinfo == "N" ]
565c0e690238 Added support for LJB2, COSMIC67, CLINVAR and NCI60.
saskia-hiltemann
parents: 0
diff changeset
454 then
8
d6af2a78617f added support for databases upto 4 march 2016
saskia-hiltemann
parents: 7
diff changeset
455 otherinfo=""
2
565c0e690238 Added support for LJB2, COSMIC67, CLINVAR and NCI60.
saskia-hiltemann
parents: 0
diff changeset
456 fi
565c0e690238 Added support for LJB2, COSMIC67, CLINVAR and NCI60.
saskia-hiltemann
parents: 0
diff changeset
457
0
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
458
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
459 #column header names we will be adding
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
460 # ESP 6500
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
461 esp6500si_colheader_ALL="ESP6500si_ALL"
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
462 esp6500si_colheader_EA="ESP6500si_EA"
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
463 esp6500si_colheader_AA="ESP6500si_AA"
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
464 esp6500_colheader_ALL="ESP6500_ALL"
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
465 esp6500_colheader_EA="ESP6500_EA"
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
466 esp6500_colheader_AA="ESP6500_AA"
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
467 esp5400si_colheader_ALL="ESP5400si_ALL"
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
468 esp5400si_colheader_EA="ESP5400si_EA"
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
469 esp5400si_colheader_AA="ESP5400si_AA"
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
470 esp5400_colheader_ALL="ESP5400_ALL"
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
471 esp5400_colheader_EA="ESP5400_EA"
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
472 esp5400_colheader_AA="ESP5400_AA"
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
473
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
474
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
475 # cg46 cg69
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
476 cg46_colheader="CG_46_genomes"
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
477 cg69_colheader="CG_69_genomes"
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
478
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
479 cp $infile originalfile
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
480 #run annovar or filter only?
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
481 if [ $dorunannovar == "Y" ]
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
482 then
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
483
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
484
8
d6af2a78617f added support for databases upto 4 march 2016
saskia-hiltemann
parents: 7
diff changeset
485 ####################################
d6af2a78617f added support for databases upto 4 march 2016
saskia-hiltemann
parents: 7
diff changeset
486 #
d6af2a78617f added support for databases upto 4 march 2016
saskia-hiltemann
parents: 7
diff changeset
487 # PREPARE INPUT FILE
d6af2a78617f added support for databases upto 4 march 2016
saskia-hiltemann
parents: 7
diff changeset
488 #
d6af2a78617f added support for databases upto 4 march 2016
saskia-hiltemann
parents: 7
diff changeset
489 ####################################
d6af2a78617f added support for databases upto 4 march 2016
saskia-hiltemann
parents: 7
diff changeset
490
d6af2a78617f added support for databases upto 4 march 2016
saskia-hiltemann
parents: 7
diff changeset
491 echo "converting input file"
d6af2a78617f added support for databases upto 4 march 2016
saskia-hiltemann
parents: 7
diff changeset
492 vcfheader=""
d6af2a78617f added support for databases upto 4 march 2016
saskia-hiltemann
parents: 7
diff changeset
493 if [ $vcf == "Y" ] #if VCF file, convert
d6af2a78617f added support for databases upto 4 march 2016
saskia-hiltemann
parents: 7
diff changeset
494 then
d6af2a78617f added support for databases upto 4 march 2016
saskia-hiltemann
parents: 7
diff changeset
495 # convert vcf to annovarinput
d6af2a78617f added support for databases upto 4 march 2016
saskia-hiltemann
parents: 7
diff changeset
496 $scriptsdir/convert2annovar.pl --format vcf4old --allallele --includeinfo --outfile annovarinput $infile 2>&1
d6af2a78617f added support for databases upto 4 march 2016
saskia-hiltemann
parents: 7
diff changeset
497
d6af2a78617f added support for databases upto 4 march 2016
saskia-hiltemann
parents: 7
diff changeset
498 #construct header line from vcf file
d6af2a78617f added support for databases upto 4 march 2016
saskia-hiltemann
parents: 7
diff changeset
499 cat $infile | grep "#CHROM" > additionalcols
d6af2a78617f added support for databases upto 4 march 2016
saskia-hiltemann
parents: 7
diff changeset
500 sed -i 's/#//g' additionalcols
d6af2a78617f added support for databases upto 4 march 2016
saskia-hiltemann
parents: 7
diff changeset
501 vcfheader="\t`cat additionalcols`"
d6af2a78617f added support for databases upto 4 march 2016
saskia-hiltemann
parents: 7
diff changeset
502 echo "vcfheader:$vcfheader"
d6af2a78617f added support for databases upto 4 march 2016
saskia-hiltemann
parents: 7
diff changeset
503 echo -e "chromosome\tbegin\tend\treference\tobserved\t`cat additionalcols`" > originalfile
d6af2a78617f added support for databases upto 4 march 2016
saskia-hiltemann
parents: 7
diff changeset
504 cat annovarinput >> originalfile
d6af2a78617f added support for databases upto 4 march 2016
saskia-hiltemann
parents: 7
diff changeset
505
d6af2a78617f added support for databases upto 4 march 2016
saskia-hiltemann
parents: 7
diff changeset
506 chrcol=1
d6af2a78617f added support for databases upto 4 march 2016
saskia-hiltemann
parents: 7
diff changeset
507 startcol=2
d6af2a78617f added support for databases upto 4 march 2016
saskia-hiltemann
parents: 7
diff changeset
508 endcol=3
d6af2a78617f added support for databases upto 4 march 2016
saskia-hiltemann
parents: 7
diff changeset
509 refcol=4
d6af2a78617f added support for databases upto 4 march 2016
saskia-hiltemann
parents: 7
diff changeset
510 obscol=5
0
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
511
8
d6af2a78617f added support for databases upto 4 march 2016
saskia-hiltemann
parents: 7
diff changeset
512
d6af2a78617f added support for databases upto 4 march 2016
saskia-hiltemann
parents: 7
diff changeset
513 elif [ $varfile == "Y" ] #if CG varfile, convert
d6af2a78617f added support for databases upto 4 march 2016
saskia-hiltemann
parents: 7
diff changeset
514 then
d6af2a78617f added support for databases upto 4 march 2016
saskia-hiltemann
parents: 7
diff changeset
515 # convert varfile
d6af2a78617f added support for databases upto 4 march 2016
saskia-hiltemann
parents: 7
diff changeset
516 $scriptsdir/convert2annovar.pl --format cg --outfile annovarinput $infile 2>&1
d6af2a78617f added support for databases upto 4 march 2016
saskia-hiltemann
parents: 7
diff changeset
517 echo -e "chromosome\tbegin\tend\treference\talleleSeq\tvarType\thaplotype" > originalfile
d6af2a78617f added support for databases upto 4 march 2016
saskia-hiltemann
parents: 7
diff changeset
518 cat annovarinput | cut -f1-6,8 >> originalfile
d6af2a78617f added support for databases upto 4 march 2016
saskia-hiltemann
parents: 7
diff changeset
519 cat annovarinput | cut -f1-5 >> annovarinput2
d6af2a78617f added support for databases upto 4 march 2016
saskia-hiltemann
parents: 7
diff changeset
520 mv annovarinput2 annovarinput
0
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
521
8
d6af2a78617f added support for databases upto 4 march 2016
saskia-hiltemann
parents: 7
diff changeset
522 chrcol=1
d6af2a78617f added support for databases upto 4 march 2016
saskia-hiltemann
parents: 7
diff changeset
523 startcol=2
d6af2a78617f added support for databases upto 4 march 2016
saskia-hiltemann
parents: 7
diff changeset
524 endcol=3
d6af2a78617f added support for databases upto 4 march 2016
saskia-hiltemann
parents: 7
diff changeset
525 refcol=4
d6af2a78617f added support for databases upto 4 march 2016
saskia-hiltemann
parents: 7
diff changeset
526 obscol=5
0
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
527
8
d6af2a78617f added support for databases upto 4 march 2016
saskia-hiltemann
parents: 7
diff changeset
528 elif [ $convertcoords == "Y" ] # if CG-coordinates, convert
d6af2a78617f added support for databases upto 4 march 2016
saskia-hiltemann
parents: 7
diff changeset
529 then
d6af2a78617f added support for databases upto 4 march 2016
saskia-hiltemann
parents: 7
diff changeset
530 #echo "rearranging columns and converting coordinates"
d6af2a78617f added support for databases upto 4 march 2016
saskia-hiltemann
parents: 7
diff changeset
531 awk 'BEGIN{
d6af2a78617f added support for databases upto 4 march 2016
saskia-hiltemann
parents: 7
diff changeset
532 FS="\t";
d6af2a78617f added support for databases upto 4 march 2016
saskia-hiltemann
parents: 7
diff changeset
533 OFS="\t";
d6af2a78617f added support for databases upto 4 march 2016
saskia-hiltemann
parents: 7
diff changeset
534 }{
d6af2a78617f added support for databases upto 4 march 2016
saskia-hiltemann
parents: 7
diff changeset
535 if(FNR>1) {
5
4600be69b96f Added databases 1000g2015aug, SPIDEX, avsnp138, avsnp142, exac03
saskia-hiltemann
parents: 3
diff changeset
536 gsub(/chr/,"",$"'"${chrcol}"'")
8
d6af2a78617f added support for databases upto 4 march 2016
saskia-hiltemann
parents: 7
diff changeset
537 if( $"'"${vartypecol}"'" == "snp" ){ $"'"${startcol}"'" += 1 };
d6af2a78617f added support for databases upto 4 march 2016
saskia-hiltemann
parents: 7
diff changeset
538 if( $"'"${vartypecol}"'" == "ins" ){ $"'"${refcol}"'" = "-" };
d6af2a78617f added support for databases upto 4 march 2016
saskia-hiltemann
parents: 7
diff changeset
539 if( $"'"${vartypecol}"'" == "del" ){ $"'"${startcol}"'" +=1; $"'"${obscol}"'" = "-" };
d6af2a78617f added support for databases upto 4 march 2016
saskia-hiltemann
parents: 7
diff changeset
540 if( $"'"${vartypecol}"'" == "sub" ){ $"'"${startcol}"'" += 1 };
d6af2a78617f added support for databases upto 4 march 2016
saskia-hiltemann
parents: 7
diff changeset
541
d6af2a78617f added support for databases upto 4 march 2016
saskia-hiltemann
parents: 7
diff changeset
542 printf("%s\t%s\t%s\t%s\t%s\n" ,$"'"${chrcol}"'",$"'"${startcol}"'",$"'"${endcol}"'",$"'"${refcol}"'",$"'"${obscol}"'");
d6af2a78617f added support for databases upto 4 march 2016
saskia-hiltemann
parents: 7
diff changeset
543 }
d6af2a78617f added support for databases upto 4 march 2016
saskia-hiltemann
parents: 7
diff changeset
544 }
d6af2a78617f added support for databases upto 4 march 2016
saskia-hiltemann
parents: 7
diff changeset
545 END{
d6af2a78617f added support for databases upto 4 march 2016
saskia-hiltemann
parents: 7
diff changeset
546 }' $infile > annovarinput
0
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
547
8
d6af2a78617f added support for databases upto 4 march 2016
saskia-hiltemann
parents: 7
diff changeset
548 #remove any "chr" prefixes
d6af2a78617f added support for databases upto 4 march 2016
saskia-hiltemann
parents: 7
diff changeset
549 #sed -i '2,$s/chr//g' annovarinput
d6af2a78617f added support for databases upto 4 march 2016
saskia-hiltemann
parents: 7
diff changeset
550
d6af2a78617f added support for databases upto 4 march 2016
saskia-hiltemann
parents: 7
diff changeset
551 awk 'BEGIN{
d6af2a78617f added support for databases upto 4 march 2016
saskia-hiltemann
parents: 7
diff changeset
552 FS="\t";
d6af2a78617f added support for databases upto 4 march 2016
saskia-hiltemann
parents: 7
diff changeset
553 OFS="\t";
d6af2a78617f added support for databases upto 4 march 2016
saskia-hiltemann
parents: 7
diff changeset
554 }{
0
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
555
8
d6af2a78617f added support for databases upto 4 march 2016
saskia-hiltemann
parents: 7
diff changeset
556 if(FNR>=1) {
d6af2a78617f added support for databases upto 4 march 2016
saskia-hiltemann
parents: 7
diff changeset
557 gsub(/chr/,"",$"'"${chrcol}"'")
d6af2a78617f added support for databases upto 4 march 2016
saskia-hiltemann
parents: 7
diff changeset
558 if( $"'"${vartypecol}"'" == "snp" ){ $"'"${startcol}"'" += 1 };
d6af2a78617f added support for databases upto 4 march 2016
saskia-hiltemann
parents: 7
diff changeset
559 if( $"'"${vartypecol}"'" == "ins" ){ $"'"${refcol}"'" = "-" };
d6af2a78617f added support for databases upto 4 march 2016
saskia-hiltemann
parents: 7
diff changeset
560 if( $"'"${vartypecol}"'" == "del" ){ $"'"${startcol}"'" +=1; $"'"${obscol}"'" = "-" };
d6af2a78617f added support for databases upto 4 march 2016
saskia-hiltemann
parents: 7
diff changeset
561 if( $"'"${vartypecol}"'" == "sub" ){ $"'"${startcol}"'" += 1 };
d6af2a78617f added support for databases upto 4 march 2016
saskia-hiltemann
parents: 7
diff changeset
562
d6af2a78617f added support for databases upto 4 march 2016
saskia-hiltemann
parents: 7
diff changeset
563 print $0
d6af2a78617f added support for databases upto 4 march 2016
saskia-hiltemann
parents: 7
diff changeset
564 }
d6af2a78617f added support for databases upto 4 march 2016
saskia-hiltemann
parents: 7
diff changeset
565 }
d6af2a78617f added support for databases upto 4 march 2016
saskia-hiltemann
parents: 7
diff changeset
566 END{
d6af2a78617f added support for databases upto 4 march 2016
saskia-hiltemann
parents: 7
diff changeset
567 }' $infile > originalfile
0
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
568
8
d6af2a78617f added support for databases upto 4 march 2016
saskia-hiltemann
parents: 7
diff changeset
569 #remove any "chr" prefixes
d6af2a78617f added support for databases upto 4 march 2016
saskia-hiltemann
parents: 7
diff changeset
570 #sed -i '2,$s/chr//g' originalfile
d6af2a78617f added support for databases upto 4 march 2016
saskia-hiltemann
parents: 7
diff changeset
571 sed -i 's/omosome/chromosome/g' originalfile
0
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
572
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
573
8
d6af2a78617f added support for databases upto 4 march 2016
saskia-hiltemann
parents: 7
diff changeset
574 else #only rearrange columns if already 1-based coordinates
d6af2a78617f added support for databases upto 4 march 2016
saskia-hiltemann
parents: 7
diff changeset
575 echo "rearranging columns "
d6af2a78617f added support for databases upto 4 march 2016
saskia-hiltemann
parents: 7
diff changeset
576 awk 'BEGIN{
d6af2a78617f added support for databases upto 4 march 2016
saskia-hiltemann
parents: 7
diff changeset
577 FS="\t";
d6af2a78617f added support for databases upto 4 march 2016
saskia-hiltemann
parents: 7
diff changeset
578 OFS="\t";
d6af2a78617f added support for databases upto 4 march 2016
saskia-hiltemann
parents: 7
diff changeset
579 }{
d6af2a78617f added support for databases upto 4 march 2016
saskia-hiltemann
parents: 7
diff changeset
580 if(FNR>1) {
d6af2a78617f added support for databases upto 4 march 2016
saskia-hiltemann
parents: 7
diff changeset
581 printf("%s\t%s\t%s\t%s\t%s\n",$"'"${chrcol}"'",$"'"${startcol}"'",$"'"${endcol}"'",$"'"${refcol}"'",$"'"${obscol}"'");
d6af2a78617f added support for databases upto 4 march 2016
saskia-hiltemann
parents: 7
diff changeset
582 }
d6af2a78617f added support for databases upto 4 march 2016
saskia-hiltemann
parents: 7
diff changeset
583 }
d6af2a78617f added support for databases upto 4 march 2016
saskia-hiltemann
parents: 7
diff changeset
584 END{
d6af2a78617f added support for databases upto 4 march 2016
saskia-hiltemann
parents: 7
diff changeset
585 }' $infile > annovarinput
0
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
586
8
d6af2a78617f added support for databases upto 4 march 2016
saskia-hiltemann
parents: 7
diff changeset
587 #remove any "chr" prefixes
d6af2a78617f added support for databases upto 4 march 2016
saskia-hiltemann
parents: 7
diff changeset
588 sed -i '2,$s/chr//g' annovarinput
d6af2a78617f added support for databases upto 4 march 2016
saskia-hiltemann
parents: 7
diff changeset
589 sed '2,$s/chr//g' $infile > originalfile
d6af2a78617f added support for databases upto 4 march 2016
saskia-hiltemann
parents: 7
diff changeset
590 sed -i 's/omosome/chromosome/g' originalfile
d6af2a78617f added support for databases upto 4 march 2016
saskia-hiltemann
parents: 7
diff changeset
591 fi
0
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
592
8
d6af2a78617f added support for databases upto 4 march 2016
saskia-hiltemann
parents: 7
diff changeset
593 echo "...finished conversion"
0
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
594
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
595
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
596
8
d6af2a78617f added support for databases upto 4 march 2016
saskia-hiltemann
parents: 7
diff changeset
597 ####################################
d6af2a78617f added support for databases upto 4 march 2016
saskia-hiltemann
parents: 7
diff changeset
598 #
d6af2a78617f added support for databases upto 4 march 2016
saskia-hiltemann
parents: 7
diff changeset
599 # RUN ANNOVAR COMMANDS
d6af2a78617f added support for databases upto 4 march 2016
saskia-hiltemann
parents: 7
diff changeset
600 #
d6af2a78617f added support for databases upto 4 march 2016
saskia-hiltemann
parents: 7
diff changeset
601 ####################################
0
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
602
8
d6af2a78617f added support for databases upto 4 march 2016
saskia-hiltemann
parents: 7
diff changeset
603
0
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
604
8
d6af2a78617f added support for databases upto 4 march 2016
saskia-hiltemann
parents: 7
diff changeset
605 ###### gene-based annotation #######
0
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
606
8
d6af2a78617f added support for databases upto 4 march 2016
saskia-hiltemann
parents: 7
diff changeset
607 # RefSeq Gene
d6af2a78617f added support for databases upto 4 march 2016
saskia-hiltemann
parents: 7
diff changeset
608 if [ $refgene == "Y" ]
d6af2a78617f added support for databases upto 4 march 2016
saskia-hiltemann
parents: 7
diff changeset
609 then
d6af2a78617f added support for databases upto 4 march 2016
saskia-hiltemann
parents: 7
diff changeset
610 echo -e "\nrefSeq gene"
d6af2a78617f added support for databases upto 4 march 2016
saskia-hiltemann
parents: 7
diff changeset
611 $scriptsdir/annotate_variation.pl --geneanno --buildver $buildver -dbtype gene ${hgvs} annovarinput $humandb 2>&1
d6af2a78617f added support for databases upto 4 march 2016
saskia-hiltemann
parents: 7
diff changeset
612
d6af2a78617f added support for databases upto 4 march 2016
saskia-hiltemann
parents: 7
diff changeset
613 annovarout=annovarinput.variant_function
d6af2a78617f added support for databases upto 4 march 2016
saskia-hiltemann
parents: 7
diff changeset
614 sed -i '1i\RefSeq_Func\tRefSeq_Gene\tchromosome\tstart\tend\treference\talleleSeq"'"$vcfheader"'"' $annovarout
d6af2a78617f added support for databases upto 4 march 2016
saskia-hiltemann
parents: 7
diff changeset
615 joinresults originalfile $annovarout 3 4 5 6 7 B.RefSeq_Func,B.RefSeq_Gene
0
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
616
8
d6af2a78617f added support for databases upto 4 march 2016
saskia-hiltemann
parents: 7
diff changeset
617 annovarout=annovarinput.exonic_variant_function
d6af2a78617f added support for databases upto 4 march 2016
saskia-hiltemann
parents: 7
diff changeset
618 sed -i '1i\linenum\tRefSeq_ExonicFunc\tRefSeq_AAChange\tchromosome\tstart\tend\treference\talleleSeq"'"$vcfheader"'"' $annovarout
d6af2a78617f added support for databases upto 4 march 2016
saskia-hiltemann
parents: 7
diff changeset
619 joinresults originalfile $annovarout 4 5 6 7 8 B.RefSeq_ExonicFunc,B.RefSeq_AAChange
d6af2a78617f added support for databases upto 4 march 2016
saskia-hiltemann
parents: 7
diff changeset
620 fi
0
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
621
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
622
8
d6af2a78617f added support for databases upto 4 march 2016
saskia-hiltemann
parents: 7
diff changeset
623 # UCSC KnownGene
d6af2a78617f added support for databases upto 4 march 2016
saskia-hiltemann
parents: 7
diff changeset
624 if [ $knowngene == "Y" ]
d6af2a78617f added support for databases upto 4 march 2016
saskia-hiltemann
parents: 7
diff changeset
625 then
d6af2a78617f added support for databases upto 4 march 2016
saskia-hiltemann
parents: 7
diff changeset
626 echo -e "\nUCSC known gene"
d6af2a78617f added support for databases upto 4 march 2016
saskia-hiltemann
parents: 7
diff changeset
627 $scriptsdir/annotate_variation.pl --geneanno --buildver $buildver -dbtype knowngene annovarinput $humandb 2>&1
d6af2a78617f added support for databases upto 4 march 2016
saskia-hiltemann
parents: 7
diff changeset
628
d6af2a78617f added support for databases upto 4 march 2016
saskia-hiltemann
parents: 7
diff changeset
629 annovarout=annovarinput.variant_function
d6af2a78617f added support for databases upto 4 march 2016
saskia-hiltemann
parents: 7
diff changeset
630 sed -i '1i\UCSCKnownGene_Func\tUCSCKnownGene_Gene\tchromosome\tstart\tend\treference\talleleSeq"'"$vcfheader"'"' $annovarout
d6af2a78617f added support for databases upto 4 march 2016
saskia-hiltemann
parents: 7
diff changeset
631 joinresults originalfile $annovarout 3 4 5 6 7 B.UCSCKnownGene_Func,B.UCSCKnownGene_Gene
0
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
632
8
d6af2a78617f added support for databases upto 4 march 2016
saskia-hiltemann
parents: 7
diff changeset
633 annovarout=annovarinput.exonic_variant_function
d6af2a78617f added support for databases upto 4 march 2016
saskia-hiltemann
parents: 7
diff changeset
634 sed -i '1i\linenum\tUCSCKnownGene_ExonicFunc\tUCSCKnownGene_AAChange\tchromosome\tstart\tend\treference\talleleSeq"'"$vcfheader"'"' $annovarout
d6af2a78617f added support for databases upto 4 march 2016
saskia-hiltemann
parents: 7
diff changeset
635 joinresults originalfile $annovarout 4 5 6 7 8 B.UCSCKnownGene_ExonicFunc,B.UCSCKnownGene_AAChange
d6af2a78617f added support for databases upto 4 march 2016
saskia-hiltemann
parents: 7
diff changeset
636 fi
0
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
637
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
638
8
d6af2a78617f added support for databases upto 4 march 2016
saskia-hiltemann
parents: 7
diff changeset
639 # Ensembl Gene
d6af2a78617f added support for databases upto 4 march 2016
saskia-hiltemann
parents: 7
diff changeset
640 if [ $ensgene == "Y" ]
d6af2a78617f added support for databases upto 4 march 2016
saskia-hiltemann
parents: 7
diff changeset
641 then
d6af2a78617f added support for databases upto 4 march 2016
saskia-hiltemann
parents: 7
diff changeset
642 echo -e "\nEnsembl gene"
d6af2a78617f added support for databases upto 4 march 2016
saskia-hiltemann
parents: 7
diff changeset
643 $scriptsdir/annotate_variation.pl --geneanno --buildver $buildver -dbtype ensgene annovarinput $humandb 2>&1
d6af2a78617f added support for databases upto 4 march 2016
saskia-hiltemann
parents: 7
diff changeset
644
d6af2a78617f added support for databases upto 4 march 2016
saskia-hiltemann
parents: 7
diff changeset
645 annovarout=annovarinput.variant_function
d6af2a78617f added support for databases upto 4 march 2016
saskia-hiltemann
parents: 7
diff changeset
646 sed -i '1i\EnsemblGene_Func\tEnsemblGene_Gene\tchromosome\tstart\tend\treference\talleleSeq"'"$vcfheader"'"' $annovarout
d6af2a78617f added support for databases upto 4 march 2016
saskia-hiltemann
parents: 7
diff changeset
647 joinresults originalfile $annovarout 3 4 5 6 7 B.EnsemblGene_Func,B.EnsemblGene_Gene
0
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
648
8
d6af2a78617f added support for databases upto 4 march 2016
saskia-hiltemann
parents: 7
diff changeset
649 annovarout=annovarinput.exonic_variant_function
d6af2a78617f added support for databases upto 4 march 2016
saskia-hiltemann
parents: 7
diff changeset
650 sed -i '1i\linenum\tEnsemblGene_ExonicFunc\tEnsemblGene_AAChange\tchromosome\tstart\tend\treference\talleleSeq"'"$vcfheader"'"' $annovarout
d6af2a78617f added support for databases upto 4 march 2016
saskia-hiltemann
parents: 7
diff changeset
651 joinresults originalfile $annovarout 4 5 6 7 8 B.EnsemblGene_ExonicFunc,B.EnsemblGene_AAChange
d6af2a78617f added support for databases upto 4 march 2016
saskia-hiltemann
parents: 7
diff changeset
652 fi
0
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
653
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
654
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
655
8
d6af2a78617f added support for databases upto 4 march 2016
saskia-hiltemann
parents: 7
diff changeset
656 ###### region-based annotation #######
0
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
657
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
658
8
d6af2a78617f added support for databases upto 4 march 2016
saskia-hiltemann
parents: 7
diff changeset
659 # Most Conserved Elements Annotation
d6af2a78617f added support for databases upto 4 march 2016
saskia-hiltemann
parents: 7
diff changeset
660 if [ $mce == "Y" ]
d6af2a78617f added support for databases upto 4 march 2016
saskia-hiltemann
parents: 7
diff changeset
661 then
d6af2a78617f added support for databases upto 4 march 2016
saskia-hiltemann
parents: 7
diff changeset
662 echo -e "\nMost Conserved Elements"
d6af2a78617f added support for databases upto 4 march 2016
saskia-hiltemann
parents: 7
diff changeset
663
d6af2a78617f added support for databases upto 4 march 2016
saskia-hiltemann
parents: 7
diff changeset
664 if [ $buildver == "hg18" ]
d6af2a78617f added support for databases upto 4 march 2016
saskia-hiltemann
parents: 7
diff changeset
665 then
d6af2a78617f added support for databases upto 4 march 2016
saskia-hiltemann
parents: 7
diff changeset
666 $scriptsdir/annotate_variation.pl --regionanno --buildver $buildver -dbtype mce44way annovarinput $humandb 2>&1
d6af2a78617f added support for databases upto 4 march 2016
saskia-hiltemann
parents: 7
diff changeset
667 annovarout=annovarinput.${buildver}_phastConsElements44way
d6af2a78617f added support for databases upto 4 march 2016
saskia-hiltemann
parents: 7
diff changeset
668 sed -i '1i\db\tphastConsElements44way\tchromosome\tstart\tend\treference\talleleSeq"'"$vcfheader"'"' $annovarout
d6af2a78617f added support for databases upto 4 march 2016
saskia-hiltemann
parents: 7
diff changeset
669 joinresults originalfile $annovarout 3 4 5 6 7 B.phastConsElements44way
0
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
670
8
d6af2a78617f added support for databases upto 4 march 2016
saskia-hiltemann
parents: 7
diff changeset
671 else #hg19
d6af2a78617f added support for databases upto 4 march 2016
saskia-hiltemann
parents: 7
diff changeset
672 $scriptsdir/annotate_variation.pl --regionanno --buildver $buildver -dbtype mce46way annovarinput $humandb 2>&1
d6af2a78617f added support for databases upto 4 march 2016
saskia-hiltemann
parents: 7
diff changeset
673 annovarout=annovarinput.${buildver}_phastConsElements46way
d6af2a78617f added support for databases upto 4 march 2016
saskia-hiltemann
parents: 7
diff changeset
674 sed -i '1i\db\tphastConsElements46way\tchromosome\tstart\tend\treference\talleleSeq"'"$vcfheader"'"' $annovarout
d6af2a78617f added support for databases upto 4 march 2016
saskia-hiltemann
parents: 7
diff changeset
675 joinresults originalfile $annovarout 3 4 5 6 7 B.phastConsElements46way
d6af2a78617f added support for databases upto 4 march 2016
saskia-hiltemann
parents: 7
diff changeset
676 fi
d6af2a78617f added support for databases upto 4 march 2016
saskia-hiltemann
parents: 7
diff changeset
677
d6af2a78617f added support for databases upto 4 march 2016
saskia-hiltemann
parents: 7
diff changeset
678 fi
0
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
679
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
680
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
681
8
d6af2a78617f added support for databases upto 4 march 2016
saskia-hiltemann
parents: 7
diff changeset
682 # Transcription Factor Binding Sites Annotation
d6af2a78617f added support for databases upto 4 march 2016
saskia-hiltemann
parents: 7
diff changeset
683 if [ $tfbs == "Y" ]
d6af2a78617f added support for databases upto 4 march 2016
saskia-hiltemann
parents: 7
diff changeset
684 then
d6af2a78617f added support for databases upto 4 march 2016
saskia-hiltemann
parents: 7
diff changeset
685 echo -e "\nTranscription Factor Binding Site Annotation"
d6af2a78617f added support for databases upto 4 march 2016
saskia-hiltemann
parents: 7
diff changeset
686 $scriptsdir/annotate_variation.pl --regionanno --buildver $buildver -dbtype tfbs annovarinput $humandb 2>&1
d6af2a78617f added support for databases upto 4 march 2016
saskia-hiltemann
parents: 7
diff changeset
687
d6af2a78617f added support for databases upto 4 march 2016
saskia-hiltemann
parents: 7
diff changeset
688 # arguments: originalfile, resultfile,chrcol,startcol,endcol,refcol,obscol,selectcolumns
d6af2a78617f added support for databases upto 4 march 2016
saskia-hiltemann
parents: 7
diff changeset
689 annovarout=annovarinput.${buildver}_tfbsConsSites
d6af2a78617f added support for databases upto 4 march 2016
saskia-hiltemann
parents: 7
diff changeset
690 sed -i '1i\db\tTFBS\tchromosome\tstart\tend\treference\talleleSeq"'"$vcfheader"'"' $annovarout
d6af2a78617f added support for databases upto 4 march 2016
saskia-hiltemann
parents: 7
diff changeset
691 joinresults originalfile $annovarout 3 4 5 6 7 B.TFBS
d6af2a78617f added support for databases upto 4 march 2016
saskia-hiltemann
parents: 7
diff changeset
692 fi
0
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
693
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
694
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
695
8
d6af2a78617f added support for databases upto 4 march 2016
saskia-hiltemann
parents: 7
diff changeset
696 # Identify cytogenetic band for genetic variants
d6af2a78617f added support for databases upto 4 march 2016
saskia-hiltemann
parents: 7
diff changeset
697 if [ $cytoband == "Y" ]
d6af2a78617f added support for databases upto 4 march 2016
saskia-hiltemann
parents: 7
diff changeset
698 then
d6af2a78617f added support for databases upto 4 march 2016
saskia-hiltemann
parents: 7
diff changeset
699 echo -e "\nCytogenic band Annotation"
d6af2a78617f added support for databases upto 4 march 2016
saskia-hiltemann
parents: 7
diff changeset
700 $scriptsdir/annotate_variation.pl --regionanno --buildver $buildver -dbtype band annovarinput $humandb 2>&1
d6af2a78617f added support for databases upto 4 march 2016
saskia-hiltemann
parents: 7
diff changeset
701
d6af2a78617f added support for databases upto 4 march 2016
saskia-hiltemann
parents: 7
diff changeset
702 annovarout=annovarinput.${buildver}_cytoBand
d6af2a78617f added support for databases upto 4 march 2016
saskia-hiltemann
parents: 7
diff changeset
703 sed -i '1i\db\tBand\tchromosome\tstart\tend\treference\talleleSeq"'"$vcfheader"'"' $annovarout
d6af2a78617f added support for databases upto 4 march 2016
saskia-hiltemann
parents: 7
diff changeset
704 joinresults originalfile $annovarout 3 4 5 6 7 B.Band
d6af2a78617f added support for databases upto 4 march 2016
saskia-hiltemann
parents: 7
diff changeset
705 fi
0
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
706
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
707
8
d6af2a78617f added support for databases upto 4 march 2016
saskia-hiltemann
parents: 7
diff changeset
708 # Identify variants located in segmental duplications
d6af2a78617f added support for databases upto 4 march 2016
saskia-hiltemann
parents: 7
diff changeset
709 if [ $segdup == "Y" ]
d6af2a78617f added support for databases upto 4 march 2016
saskia-hiltemann
parents: 7
diff changeset
710 then
d6af2a78617f added support for databases upto 4 march 2016
saskia-hiltemann
parents: 7
diff changeset
711 echo -e "\nSegmental Duplications Annotation"
d6af2a78617f added support for databases upto 4 march 2016
saskia-hiltemann
parents: 7
diff changeset
712 $scriptsdir/annotate_variation.pl --regionanno --buildver $buildver -dbtype segdup annovarinput $humandb 2>&1
d6af2a78617f added support for databases upto 4 march 2016
saskia-hiltemann
parents: 7
diff changeset
713
d6af2a78617f added support for databases upto 4 march 2016
saskia-hiltemann
parents: 7
diff changeset
714 annovarout=annovarinput.${buildver}_genomicSuperDups
d6af2a78617f added support for databases upto 4 march 2016
saskia-hiltemann
parents: 7
diff changeset
715 sed -i '1i\db\tSegDup\tchromosome\tstart\tend\treference\talleleSeq"'"$vcfheader"'"' $annovarout
d6af2a78617f added support for databases upto 4 march 2016
saskia-hiltemann
parents: 7
diff changeset
716 joinresults originalfile $annovarout 3 4 5 6 7 B.SegDup
d6af2a78617f added support for databases upto 4 march 2016
saskia-hiltemann
parents: 7
diff changeset
717 fi
0
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
718
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
719
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
720
8
d6af2a78617f added support for databases upto 4 march 2016
saskia-hiltemann
parents: 7
diff changeset
721 # Identify previously reported structural variants in DGV
d6af2a78617f added support for databases upto 4 march 2016
saskia-hiltemann
parents: 7
diff changeset
722 if [ $dgv == "Y" ]
d6af2a78617f added support for databases upto 4 march 2016
saskia-hiltemann
parents: 7
diff changeset
723 then
d6af2a78617f added support for databases upto 4 march 2016
saskia-hiltemann
parents: 7
diff changeset
724 echo -e "\nDGV Annotation"
d6af2a78617f added support for databases upto 4 march 2016
saskia-hiltemann
parents: 7
diff changeset
725 $scriptsdir/annotate_variation.pl --regionanno --buildver $buildver -dbtype dgvMerged annovarinput $humandb 2>&1
d6af2a78617f added support for databases upto 4 march 2016
saskia-hiltemann
parents: 7
diff changeset
726
d6af2a78617f added support for databases upto 4 march 2016
saskia-hiltemann
parents: 7
diff changeset
727 annovarout=annovarinput.${buildver}_dgvMerged
d6af2a78617f added support for databases upto 4 march 2016
saskia-hiltemann
parents: 7
diff changeset
728 sed -i '1i\db\tDGV\tchromosome\tstart\tend\treference\talleleSeq"'"$vcfheader"'"' $annovarout
d6af2a78617f added support for databases upto 4 march 2016
saskia-hiltemann
parents: 7
diff changeset
729 joinresults originalfile $annovarout 3 4 5 6 7 B.DGV
d6af2a78617f added support for databases upto 4 march 2016
saskia-hiltemann
parents: 7
diff changeset
730 fi
0
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
731
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
732
8
d6af2a78617f added support for databases upto 4 march 2016
saskia-hiltemann
parents: 7
diff changeset
733 # Identify variants reported in previously published GWAS studies
d6af2a78617f added support for databases upto 4 march 2016
saskia-hiltemann
parents: 7
diff changeset
734 if [ $gwas == "Y" ]
d6af2a78617f added support for databases upto 4 march 2016
saskia-hiltemann
parents: 7
diff changeset
735 then
d6af2a78617f added support for databases upto 4 march 2016
saskia-hiltemann
parents: 7
diff changeset
736 echo -e "\nGWAS Annotation"
d6af2a78617f added support for databases upto 4 march 2016
saskia-hiltemann
parents: 7
diff changeset
737 $scriptsdir/annotate_variation.pl --regionanno --buildver $buildver -dbtype gwascatalog annovarinput $humandb 2>&1
d6af2a78617f added support for databases upto 4 march 2016
saskia-hiltemann
parents: 7
diff changeset
738
d6af2a78617f added support for databases upto 4 march 2016
saskia-hiltemann
parents: 7
diff changeset
739 annovarout=annovarinput.${buildver}_gwasCatalog
d6af2a78617f added support for databases upto 4 march 2016
saskia-hiltemann
parents: 7
diff changeset
740 sed -i '1i\db\tGWAS\tchromosome\tstart\tend\treference\talleleSeq"'"$vcfheader"'"' $annovarout
d6af2a78617f added support for databases upto 4 march 2016
saskia-hiltemann
parents: 7
diff changeset
741 joinresults originalfile $annovarout 3 4 5 6 7 B.GWAS
d6af2a78617f added support for databases upto 4 march 2016
saskia-hiltemann
parents: 7
diff changeset
742 fi
0
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
743
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
744
8
d6af2a78617f added support for databases upto 4 march 2016
saskia-hiltemann
parents: 7
diff changeset
745
d6af2a78617f added support for databases upto 4 march 2016
saskia-hiltemann
parents: 7
diff changeset
746
d6af2a78617f added support for databases upto 4 march 2016
saskia-hiltemann
parents: 7
diff changeset
747 ###### filter-based annotation #######
0
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
748
8
d6af2a78617f added support for databases upto 4 march 2016
saskia-hiltemann
parents: 7
diff changeset
749 #dbSNP
d6af2a78617f added support for databases upto 4 march 2016
saskia-hiltemann
parents: 7
diff changeset
750 for version in $dbsnpstr
d6af2a78617f added support for databases upto 4 march 2016
saskia-hiltemann
parents: 7
diff changeset
751 do
d6af2a78617f added support for databases upto 4 march 2016
saskia-hiltemann
parents: 7
diff changeset
752 if [ $version == "None" ]
d6af2a78617f added support for databases upto 4 march 2016
saskia-hiltemann
parents: 7
diff changeset
753 then
d6af2a78617f added support for databases upto 4 march 2016
saskia-hiltemann
parents: 7
diff changeset
754 break
d6af2a78617f added support for databases upto 4 march 2016
saskia-hiltemann
parents: 7
diff changeset
755 fi
d6af2a78617f added support for databases upto 4 march 2016
saskia-hiltemann
parents: 7
diff changeset
756 echo -e "\ndbSNP region Annotation, version: $version"
d6af2a78617f added support for databases upto 4 march 2016
saskia-hiltemann
parents: 7
diff changeset
757 $scriptsdir/annotate_variation.pl --filter --buildver $buildver -dbtype ${version} annovarinput $humandb 2>&1
d6af2a78617f added support for databases upto 4 march 2016
saskia-hiltemann
parents: 7
diff changeset
758
d6af2a78617f added support for databases upto 4 march 2016
saskia-hiltemann
parents: 7
diff changeset
759 columnname=${version}
d6af2a78617f added support for databases upto 4 march 2016
saskia-hiltemann
parents: 7
diff changeset
760 if [[ $columnname == snp* ]]
d6af2a78617f added support for databases upto 4 march 2016
saskia-hiltemann
parents: 7
diff changeset
761 then
d6af2a78617f added support for databases upto 4 march 2016
saskia-hiltemann
parents: 7
diff changeset
762 columnname="db${version}"
d6af2a78617f added support for databases upto 4 march 2016
saskia-hiltemann
parents: 7
diff changeset
763 fi
5
4600be69b96f Added databases 1000g2015aug, SPIDEX, avsnp138, avsnp142, exac03
saskia-hiltemann
parents: 3
diff changeset
764
8
d6af2a78617f added support for databases upto 4 march 2016
saskia-hiltemann
parents: 7
diff changeset
765 annovarout=annovarinput.${buildver}_${version}_dropped
d6af2a78617f added support for databases upto 4 march 2016
saskia-hiltemann
parents: 7
diff changeset
766 sed -i '1i\db\t'${columnname}'\tchromosome\tstart\tend\treference\talleleSeq"'"$vcfheader"'"' $annovarout
d6af2a78617f added support for databases upto 4 march 2016
saskia-hiltemann
parents: 7
diff changeset
767 joinresults originalfile $annovarout 3 4 5 6 7 B.${columnname}
0
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
768
8
d6af2a78617f added support for databases upto 4 march 2016
saskia-hiltemann
parents: 7
diff changeset
769 done
0
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
770
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
771
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
772
8
d6af2a78617f added support for databases upto 4 march 2016
saskia-hiltemann
parents: 7
diff changeset
#########################
# 1000 Genomes
#########################
# Runs annotate_variation.pl once per selected population for every
# 1000 Genomes release listed in $g1000str, prepends a header row to each
# "_dropped" output file and hands it to joinresults (defined elsewhere in
# this file) together with the new column name.
#
# Reads:  ver1000g, g1000str, buildver, scriptsdir, humandb, vcfheader
# Writes: version, fileID, annovarout, g1000_colheader_<POP>, do<POP>
#
# The section is skipped when $ver1000g is "None" (or empty/unset).
if [[ -n "${ver1000g:-}" && "$ver1000g" != "None" ]]
then

    # $g1000str is intentionally unquoted: it is word-split into one
    # release name per iteration.
    for version in $g1000str
    do
        # Column headers, one per population. The loop below derives the
        # same "<release>_<POP>" value directly; the variables are still
        # assigned in case later sections of the script read them (not
        # visible from here).
        g1000_colheader_ALL="${version}_ALL"
        g1000_colheader_AFR="${version}_AFR"
        g1000_colheader_AMR="${version}_AMR"
        g1000_colheader_ASN="${version}_ASN"
        g1000_colheader_EUR="${version}_EUR"
        g1000_colheader_EAS="${version}_EAS"
        g1000_colheader_SAS="${version}_SAS"
        g1000_colheader_CEU="${version}_CEU"
        g1000_colheader_YRI="${version}_YRI"
        g1000_colheader_JPTCHB="${version}_JPTCHB"

        # Per-population switches, reset for every release.
        doALL="N"
        doAMR="N"
        doAFR="N"
        doASN="N"
        doEAS="N"
        doSAS="N"
        doEUR="N"
        doCEU="N"
        doYRI="N"
        doJPTCHB="N"

        # Select the file ID and the populations to annotate for this release.
        case "$version" in
            1000g2012apr)
                fileID="2012_04"
                doALL="Y"
                # Sub-populations are only enabled for hg19 in this release.
                if [[ "$buildver" == "hg19" ]]
                then
                    doAMR="Y"
                    doAFR="Y"
                    doASN="Y"
                    doEUR="Y"
                fi
                ;;
            1000g2014oct)
                fileID="2014_10"
                doALL="Y"
                doAMR="Y"
                doAFR="Y"
                doEUR="Y"
                doEAS="Y"
                # SAS is only enabled for hg19 in this release.
                if [[ "$buildver" == "hg19" ]]
                then
                    doSAS="Y"
                fi
                ;;
            1000g2015aug)
                fileID="2015_08"
                doALL="Y"
                doAMR="Y"
                doAFR="Y"
                doEUR="Y"
                doEAS="Y"
                doSAS="Y"
                ;;
            1000g2012feb)
                fileID="2012_02"
                doALL="Y"
                ;;
            1000g2010nov)
                fileID="2010_11"
                doALL="Y"
                ;;
            1000g2010jul)
                fileID="2010_07"
                doALL="N"
                doCEU="Y"
                doYRI="Y"
                doJPTCHB="Y"
                ;;
            *)
                echo "unrecognized 1000g version, skipping"
                # Really skip: no population is enabled and fileID would
                # be stale (or unset) for this release.
                continue
                ;;
        esac

        # One pass per enabled population. The order matches the original
        # sequence of stanzas, so result columns are appended in the same
        # order as before.
        for g1000_pop in ALL AFR AMR ASN EAS SAS EUR CEU YRI JPTCHB
        do
            # Look up the matching do<POP> switch by name.
            g1000_flag="do${g1000_pop}"
            if [[ "${!g1000_flag}" != "Y" ]]
            then
                continue
            fi

            g1000_col="${version}_${g1000_pop}"
            # -dbtype takes the population in lower case, while the output
            # file name and the column header use upper case.
            g1000_dbpop=$(printf '%s' "$g1000_pop" | tr '[:upper:]' '[:lower:]')

            echo -e "\n1000Genomes ${g1000_pop}"
            "$scriptsdir/annotate_variation.pl" --filter --buildver "$buildver" -dbtype "${version}_${g1000_dbpop}" annovarinput "$humandb" 2>&1

            annovarout="annovarinput.${buildver}_${g1000_pop}.sites.${fileID}_dropped"
            # Insert the header row before line 1 of the output file.
            sed -i '1i\db\t'"${g1000_col}"'\tchromosome\tstart\tend\treference\talleleSeq"'"$vcfheader"'"' "$annovarout"
            joinresults originalfile "$annovarout" 3 4 5 6 7 "B.${g1000_col}"
        done

    done
fi
0
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
972
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
973
8
d6af2a78617f added support for databases upto 4 march 2016
saskia-hiltemann
parents: 7
diff changeset
974
d6af2a78617f added support for databases upto 4 march 2016
saskia-hiltemann
parents: 7
diff changeset
975
d6af2a78617f added support for databases upto 4 march 2016
saskia-hiltemann
parents: 7
diff changeset
976 #### IMPACT SCORE ANNOTATIONS
2
565c0e690238 Added support for LJB2, COSMIC67, CLINVAR and NCI60.
saskia-hiltemann
parents: 0
diff changeset
977
565c0e690238 Added support for LJB2, COSMIC67, CLINVAR and NCI60.
saskia-hiltemann
parents: 0
diff changeset
978
8
d6af2a78617f added support for databases upto 4 march 2016
saskia-hiltemann
parents: 7
diff changeset
# LJB2 SIFT: runs only when $ljb2_sift is "Y". Annotates annovarinput with
# the ljb2_sift database, prepends a header row to the "_dropped" output
# and passes it to joinresults (defined elsewhere in this file) with the
# new column name LJB2_SIFT.
if [[ "${ljb2_sift:-}" == "Y" ]]
then
    echo -e "\nLJB2 SIFT Annotation"
    # $otherinfo stays unquoted so that an empty value adds no argument.
    # NOTE(review): presumably it holds an optional flag - confirm where it is set.
    "$scriptsdir/annotate_variation.pl" --filter --buildver "$buildver" $otherinfo -dbtype ljb2_sift annovarinput "$humandb" 2>&1

    annovarout="annovarinput.${buildver}_ljb2_sift_dropped"
    # Insert the header row before line 1 of the output file.
    sed -i '1i\db\tLJB2_SIFT\tchromosome\tstart\tend\treference\talleleSeq"'"$vcfheader"'"' "$annovarout"
    joinresults originalfile "$annovarout" 3 4 5 6 7 B.LJB2_SIFT
fi
d6af2a78617f added support for databases upto 4 march 2016
saskia-hiltemann
parents: 7
diff changeset
988
d6af2a78617f added support for databases upto 4 march 2016
saskia-hiltemann
parents: 7
diff changeset
# LJB2 PolyPhen2 HDIV: runs only when $ljb2_pp2hdiv is "Y". Annotates
# annovarinput with the ljb2_pp2hdiv database, prepends a header row to the
# "_dropped" output and passes it to joinresults (defined elsewhere in this
# file) with the new column name LJB2_PolyPhen2_HDIV.
if [[ "${ljb2_pp2hdiv:-}" == "Y" ]]
then
    echo -e "\nLJB2 pp2hdiv Annotation"
    # $otherinfo stays unquoted so that an empty value adds no argument.
    # NOTE(review): presumably it holds an optional flag - confirm where it is set.
    "$scriptsdir/annotate_variation.pl" --filter --buildver "$buildver" $otherinfo -dbtype ljb2_pp2hdiv annovarinput "$humandb" 2>&1

    annovarout="annovarinput.${buildver}_ljb2_pp2hdiv_dropped"
    # Insert the header row before line 1 of the output file.
    sed -i '1i\db\tLJB2_PolyPhen2_HDIV\tchromosome\tstart\tend\treference\talleleSeq"'"$vcfheader"'"' "$annovarout"
    joinresults originalfile "$annovarout" 3 4 5 6 7 B.LJB2_PolyPhen2_HDIV
fi
d6af2a78617f added support for databases upto 4 march 2016
saskia-hiltemann
parents: 7
diff changeset
998
d6af2a78617f added support for databases upto 4 march 2016
saskia-hiltemann
parents: 7
diff changeset
# LJB2 PolyPhen2 HVAR: runs only when $ljb2_pp2hvar is "Y". Annotates
# annovarinput with the ljb2_pp2hvar database, prepends a header row to the
# "_dropped" output and passes it to joinresults (defined elsewhere in this
# file) with the new column name LJB2_PolyPhen2_HVAR.
if [[ "${ljb2_pp2hvar:-}" == "Y" ]]
then
    echo -e "\nLJB2 pp2hvar Annotation"
    # $otherinfo stays unquoted so that an empty value adds no argument.
    # NOTE(review): presumably it holds an optional flag - confirm where it is set.
    "$scriptsdir/annotate_variation.pl" --filter --buildver "$buildver" $otherinfo -dbtype ljb2_pp2hvar annovarinput "$humandb" 2>&1

    annovarout="annovarinput.${buildver}_ljb2_pp2hvar_dropped"

    # NOTE(review): prints the first lines of the raw output to stdout before
    # the header is added; looks like leftover debugging, but it is kept
    # because it is part of the tool's log output - confirm before removing.
    head "$annovarout"
    # Insert the header row before line 1 of the output file.
    sed -i '1i\db\tLJB2_PolyPhen2_HVAR\tchromosome\tstart\tend\treference\talleleSeq"'"$vcfheader"'"' "$annovarout"
    joinresults originalfile "$annovarout" 3 4 5 6 7 B.LJB2_PolyPhen2_HVAR
fi
d6af2a78617f added support for databases upto 4 march 2016
saskia-hiltemann
parents: 7
diff changeset
1010
d6af2a78617f added support for databases upto 4 march 2016
saskia-hiltemann
parents: 7
diff changeset
1011 if [ $ljb2_lrt == "Y" ]
d6af2a78617f added support for databases upto 4 march 2016
saskia-hiltemann
parents: 7
diff changeset
1012 then
d6af2a78617f added support for databases upto 4 march 2016
saskia-hiltemann
parents: 7
diff changeset
1013 echo -e "\nLJB2 LRT Annotation"
d6af2a78617f added support for databases upto 4 march 2016
saskia-hiltemann
parents: 7
diff changeset
1014 $scriptsdir/annotate_variation.pl --filter --buildver $buildver $otherinfo -dbtype ljb2_lrt annovarinput $humandb 2>&1
d6af2a78617f added support for databases upto 4 march 2016
saskia-hiltemann
parents: 7
diff changeset
1015
d6af2a78617f added support for databases upto 4 march 2016
saskia-hiltemann
parents: 7
diff changeset
1016 annovarout=annovarinput.${buildver}_ljb2_lrt_dropped
d6af2a78617f added support for databases upto 4 march 2016
saskia-hiltemann
parents: 7
diff changeset
1017 sed -i '1i\db\tLJB2_LRT\tchromosome\tstart\tend\treference\talleleSeq"'"$vcfheader"'"' $annovarout
d6af2a78617f added support for databases upto 4 march 2016
saskia-hiltemann
parents: 7
diff changeset
1018 joinresults originalfile $annovarout 3 4 5 6 7 B.LJB2_LRT
d6af2a78617f added support for databases upto 4 march 2016
saskia-hiltemann
parents: 7
diff changeset
1019 fi
d6af2a78617f added support for databases upto 4 march 2016
saskia-hiltemann
parents: 7
diff changeset
1020
d6af2a78617f added support for databases upto 4 march 2016
saskia-hiltemann
parents: 7
diff changeset
1021 if [ $ljb2_mt == "Y" ]
d6af2a78617f added support for databases upto 4 march 2016
saskia-hiltemann
parents: 7
diff changeset
1022 then
d6af2a78617f added support for databases upto 4 march 2016
saskia-hiltemann
parents: 7
diff changeset
1023 echo -e "\nLJB2 mutationtaster Annotation"
d6af2a78617f added support for databases upto 4 march 2016
saskia-hiltemann
parents: 7
diff changeset
1024 $scriptsdir/annotate_variation.pl --filter --buildver $buildver $otherinfo -dbtype ljb2_mt annovarinput $humandb 2>&1
d6af2a78617f added support for databases upto 4 march 2016
saskia-hiltemann
parents: 7
diff changeset
1025
d6af2a78617f added support for databases upto 4 march 2016
saskia-hiltemann
parents: 7
diff changeset
1026 annovarout=annovarinput.${buildver}_ljb2_mt_dropped
d6af2a78617f added support for databases upto 4 march 2016
saskia-hiltemann
parents: 7
diff changeset
1027 sed -i '1i\db\tLJB2_MutationTaster\tchromosome\tstart\tend\treference\talleleSeq"'"$vcfheader"'"' $annovarout
d6af2a78617f added support for databases upto 4 march 2016
saskia-hiltemann
parents: 7
diff changeset
1028 joinresults originalfile $annovarout 3 4 5 6 7 B.LJB2_MutationTaster
d6af2a78617f added support for databases upto 4 march 2016
saskia-hiltemann
parents: 7
diff changeset
1029 fi
d6af2a78617f added support for databases upto 4 march 2016
saskia-hiltemann
parents: 7
diff changeset
1030
d6af2a78617f added support for databases upto 4 march 2016
saskia-hiltemann
parents: 7
diff changeset
1031 if [ $ljb2_ma == "Y" ]
d6af2a78617f added support for databases upto 4 march 2016
saskia-hiltemann
parents: 7
diff changeset
1032 then
d6af2a78617f added support for databases upto 4 march 2016
saskia-hiltemann
parents: 7
diff changeset
1033 echo -e "\nLJB2 mutationassessor Annotation"
d6af2a78617f added support for databases upto 4 march 2016
saskia-hiltemann
parents: 7
diff changeset
1034 $scriptsdir/annotate_variation.pl --filter --buildver $buildver $otherinfo -dbtype ljb2_ma annovarinput $humandb 2>&1
d6af2a78617f added support for databases upto 4 march 2016
saskia-hiltemann
parents: 7
diff changeset
1035
d6af2a78617f added support for databases upto 4 march 2016
saskia-hiltemann
parents: 7
diff changeset
1036 annovarout=annovarinput.${buildver}_ljb2_ma_dropped
d6af2a78617f added support for databases upto 4 march 2016
saskia-hiltemann
parents: 7
diff changeset
1037 sed -i '1i\db\tLJB2_MutationAssessor\tchromosome\tstart\tend\treference\talleleSeq"'"$vcfheader"'"' $annovarout
d6af2a78617f added support for databases upto 4 march 2016
saskia-hiltemann
parents: 7
diff changeset
1038 joinresults originalfile $annovarout 3 4 5 6 7 B.LJB2_MutationAssessor
d6af2a78617f added support for databases upto 4 march 2016
saskia-hiltemann
parents: 7
diff changeset
1039 fi
d6af2a78617f added support for databases upto 4 march 2016
saskia-hiltemann
parents: 7
diff changeset
1040
d6af2a78617f added support for databases upto 4 march 2016
saskia-hiltemann
parents: 7
diff changeset
1041 if [ $ljb2_fathmm == "Y" ]
d6af2a78617f added support for databases upto 4 march 2016
saskia-hiltemann
parents: 7
diff changeset
1042 then
d6af2a78617f added support for databases upto 4 march 2016
saskia-hiltemann
parents: 7
diff changeset
1043 echo -e "\nLJB2 FATHMM Annotation"
d6af2a78617f added support for databases upto 4 march 2016
saskia-hiltemann
parents: 7
diff changeset
1044 $scriptsdir/annotate_variation.pl --filter --buildver $buildver $otherinfo -dbtype ljb2_fathmm annovarinput $humandb 2>&1
d6af2a78617f added support for databases upto 4 march 2016
saskia-hiltemann
parents: 7
diff changeset
1045
d6af2a78617f added support for databases upto 4 march 2016
saskia-hiltemann
parents: 7
diff changeset
1046 annovarout=annovarinput.${buildver}_ljb2_fathmm_dropped
d6af2a78617f added support for databases upto 4 march 2016
saskia-hiltemann
parents: 7
diff changeset
1047 sed -i '1i\db\tLJB2_FATHMM\tchromosome\tstart\tend\treference\talleleSeq"'"$vcfheader"'"' $annovarout
d6af2a78617f added support for databases upto 4 march 2016
saskia-hiltemann
parents: 7
diff changeset
1048 joinresults originalfile $annovarout 3 4 5 6 7 B.LJB2_FATHMM
d6af2a78617f added support for databases upto 4 march 2016
saskia-hiltemann
parents: 7
diff changeset
1049 fi
d6af2a78617f added support for databases upto 4 march 2016
saskia-hiltemann
parents: 7
diff changeset
1050
d6af2a78617f added support for databases upto 4 march 2016
saskia-hiltemann
parents: 7
diff changeset
1051 if [ $ljb2_gerp == "Y" ]
d6af2a78617f added support for databases upto 4 march 2016
saskia-hiltemann
parents: 7
diff changeset
1052 then
d6af2a78617f added support for databases upto 4 march 2016
saskia-hiltemann
parents: 7
diff changeset
1053 echo -e "\nLJB2 GERP++ Annotation"
d6af2a78617f added support for databases upto 4 march 2016
saskia-hiltemann
parents: 7
diff changeset
1054 $scriptsdir/annotate_variation.pl --filter --buildver $buildver $otherinfo -dbtype ljb2_gerp++ annovarinput $humandb 2>&1
d6af2a78617f added support for databases upto 4 march 2016
saskia-hiltemann
parents: 7
diff changeset
1055
d6af2a78617f added support for databases upto 4 march 2016
saskia-hiltemann
parents: 7
diff changeset
1056 annovarout=annovarinput.${buildver}_ljb2_gerp++_dropped
d6af2a78617f added support for databases upto 4 march 2016
saskia-hiltemann
parents: 7
diff changeset
1057 sed -i '1i\db\tLJB2_GERP++\tchromosome\tstart\tend\treference\talleleSeq"'"$vcfheader"'"' $annovarout
d6af2a78617f added support for databases upto 4 march 2016
saskia-hiltemann
parents: 7
diff changeset
1058 joinresults originalfile $annovarout 3 4 5 6 7 B.LJB2_GERP++
d6af2a78617f added support for databases upto 4 march 2016
saskia-hiltemann
parents: 7
diff changeset
1059 fi
d6af2a78617f added support for databases upto 4 march 2016
saskia-hiltemann
parents: 7
diff changeset
1060
d6af2a78617f added support for databases upto 4 march 2016
saskia-hiltemann
parents: 7
diff changeset
1061 if [ $ljb2_phylop == "Y" ]
d6af2a78617f added support for databases upto 4 march 2016
saskia-hiltemann
parents: 7
diff changeset
1062 then
d6af2a78617f added support for databases upto 4 march 2016
saskia-hiltemann
parents: 7
diff changeset
1063 echo -e "\nLJB2 PhyloP Annotation"
d6af2a78617f added support for databases upto 4 march 2016
saskia-hiltemann
parents: 7
diff changeset
1064 $scriptsdir/annotate_variation.pl --filter --buildver $buildver $otherinfo -dbtype ljb2_phylop annovarinput $humandb 2>&1
d6af2a78617f added support for databases upto 4 march 2016
saskia-hiltemann
parents: 7
diff changeset
1065
d6af2a78617f added support for databases upto 4 march 2016
saskia-hiltemann
parents: 7
diff changeset
1066 annovarout=annovarinput.${buildver}_ljb2_phylop_dropped
d6af2a78617f added support for databases upto 4 march 2016
saskia-hiltemann
parents: 7
diff changeset
1067 sed -i '1i\db\tLJB2_PhyloP\tchromosome\tstart\tend\treference\talleleSeq"'"$vcfheader"'"' $annovarout
d6af2a78617f added support for databases upto 4 march 2016
saskia-hiltemann
parents: 7
diff changeset
1068 joinresults originalfile $annovarout 3 4 5 6 7 B.LJB2_PhyloP
d6af2a78617f added support for databases upto 4 march 2016
saskia-hiltemann
parents: 7
diff changeset
1069 fi
d6af2a78617f added support for databases upto 4 march 2016
saskia-hiltemann
parents: 7
diff changeset
1070
d6af2a78617f added support for databases upto 4 march 2016
saskia-hiltemann
parents: 7
diff changeset
1071 if [ $ljb2_siphy == "Y" ]
d6af2a78617f added support for databases upto 4 march 2016
saskia-hiltemann
parents: 7
diff changeset
1072 then
d6af2a78617f added support for databases upto 4 march 2016
saskia-hiltemann
parents: 7
diff changeset
1073 echo -e "\nLJB2 SiPhy Annotation"
d6af2a78617f added support for databases upto 4 march 2016
saskia-hiltemann
parents: 7
diff changeset
1074 $scriptsdir/annotate_variation.pl --filter --buildver $buildver $otherinfo -dbtype ljb2_siphy annovarinput $humandb 2>&1
d6af2a78617f added support for databases upto 4 march 2016
saskia-hiltemann
parents: 7
diff changeset
1075
d6af2a78617f added support for databases upto 4 march 2016
saskia-hiltemann
parents: 7
diff changeset
1076 annovarout=annovarinput.${buildver}_ljb2_siphy_dropped
d6af2a78617f added support for databases upto 4 march 2016
saskia-hiltemann
parents: 7
diff changeset
1077 sed -i '1i\db\tLJB2_SiPhy\tchromosome\tstart\tend\treference\talleleSeq"'"$vcfheader"'"' $annovarout
d6af2a78617f added support for databases upto 4 march 2016
saskia-hiltemann
parents: 7
diff changeset
1078 joinresults originalfile $annovarout 3 4 5 6 7 B.LJB2_SiPhy
d6af2a78617f added support for databases upto 4 march 2016
saskia-hiltemann
parents: 7
diff changeset
1079 fi
2
565c0e690238 Added support for LJB2, COSMIC67, CLINVAR and NCI60.
saskia-hiltemann
parents: 0
diff changeset
1080
565c0e690238 Added support for LJB2, COSMIC67, CLINVAR and NCI60.
saskia-hiltemann
parents: 0
diff changeset
1081
565c0e690238 Added support for LJB2, COSMIC67, CLINVAR and NCI60.
saskia-hiltemann
parents: 0
diff changeset
1082
8
d6af2a78617f added support for databases upto 4 march 2016
saskia-hiltemann
parents: 7
diff changeset
1083 ### OLD IMPACT SCORE ANNOTATIONS
d6af2a78617f added support for databases upto 4 march 2016
saskia-hiltemann
parents: 7
diff changeset
1084
d6af2a78617f added support for databases upto 4 march 2016
saskia-hiltemann
parents: 7
diff changeset
1085 # SIFT
d6af2a78617f added support for databases upto 4 march 2016
saskia-hiltemann
parents: 7
diff changeset
1086 if [ $avsift == "Y" ]
d6af2a78617f added support for databases upto 4 march 2016
saskia-hiltemann
parents: 7
diff changeset
1087 then
d6af2a78617f added support for databases upto 4 march 2016
saskia-hiltemann
parents: 7
diff changeset
1088 echo -e "\nSIFT Annotation"
d6af2a78617f added support for databases upto 4 march 2016
saskia-hiltemann
parents: 7
diff changeset
1089 $scriptsdir/annotate_variation.pl --filter --buildver $buildver -dbtype avsift annovarinput $humandb 2>&1
d6af2a78617f added support for databases upto 4 march 2016
saskia-hiltemann
parents: 7
diff changeset
1090
d6af2a78617f added support for databases upto 4 march 2016
saskia-hiltemann
parents: 7
diff changeset
1091 annovarout=annovarinput.${buildver}_avsift_dropped
d6af2a78617f added support for databases upto 4 march 2016
saskia-hiltemann
parents: 7
diff changeset
1092 sed -i '1i\db\tAVSIFT\tchromosome\tstart\tend\treference\talleleSeq"'"$vcfheader"'"' $annovarout
d6af2a78617f added support for databases upto 4 march 2016
saskia-hiltemann
parents: 7
diff changeset
1093 joinresults originalfile $annovarout 3 4 5 6 7 B.AVSIFT
d6af2a78617f added support for databases upto 4 march 2016
saskia-hiltemann
parents: 7
diff changeset
1094 fi
2
565c0e690238 Added support for LJB2, COSMIC67, CLINVAR and NCI60.
saskia-hiltemann
parents: 0
diff changeset
1095
8
d6af2a78617f added support for databases upto 4 march 2016
saskia-hiltemann
parents: 7
diff changeset
1096 #ljb refers to Liu, Jian, Boerwinkle paper in Human Mutation with pubmed ID 21520341. Cite this paper if you use the scores
d6af2a78617f added support for databases upto 4 march 2016
saskia-hiltemann
parents: 7
diff changeset
1097 # SIFT2
d6af2a78617f added support for databases upto 4 march 2016
saskia-hiltemann
parents: 7
diff changeset
1098 if [ $ljbsift == "Y" ]
d6af2a78617f added support for databases upto 4 march 2016
saskia-hiltemann
parents: 7
diff changeset
1099 then
d6af2a78617f added support for databases upto 4 march 2016
saskia-hiltemann
parents: 7
diff changeset
1100 echo -e "\nLJB SIFT Annotation"
d6af2a78617f added support for databases upto 4 march 2016
saskia-hiltemann
parents: 7
diff changeset
1101 $scriptsdir/annotate_variation.pl --filter --buildver $buildver -dbtype ljb_sift annovarinput $humandb 2>&1
d6af2a78617f added support for databases upto 4 march 2016
saskia-hiltemann
parents: 7
diff changeset
1102
d6af2a78617f added support for databases upto 4 march 2016
saskia-hiltemann
parents: 7
diff changeset
1103 annovarout=annovarinput.${buildver}_ljb_sift_dropped
d6af2a78617f added support for databases upto 4 march 2016
saskia-hiltemann
parents: 7
diff changeset
1104 sed -i '1i\db\tLJB_SIFT\tchromosome\tstart\tend\treference\talleleSeq"'"$vcfheader"'"' $annovarout
d6af2a78617f added support for databases upto 4 march 2016
saskia-hiltemann
parents: 7
diff changeset
1105 joinresults originalfile $annovarout 3 4 5 6 7 B.LJB_SIFT
d6af2a78617f added support for databases upto 4 march 2016
saskia-hiltemann
parents: 7
diff changeset
1106 fi
d6af2a78617f added support for databases upto 4 march 2016
saskia-hiltemann
parents: 7
diff changeset
1107
0
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
1108
8
d6af2a78617f added support for databases upto 4 march 2016
saskia-hiltemann
parents: 7
diff changeset
1109 # PolyPhen2
d6af2a78617f added support for databases upto 4 march 2016
saskia-hiltemann
parents: 7
diff changeset
1110 if [ $polyphen2 == "Y" ]
d6af2a78617f added support for databases upto 4 march 2016
saskia-hiltemann
parents: 7
diff changeset
1111 then
d6af2a78617f added support for databases upto 4 march 2016
saskia-hiltemann
parents: 7
diff changeset
1112 echo -e "\nPolyPhen Annotation"
d6af2a78617f added support for databases upto 4 march 2016
saskia-hiltemann
parents: 7
diff changeset
1113 $scriptsdir/annotate_variation.pl --filter --buildver $buildver -dbtype ljb_pp2 annovarinput $humandb 2>&1
d6af2a78617f added support for databases upto 4 march 2016
saskia-hiltemann
parents: 7
diff changeset
1114
d6af2a78617f added support for databases upto 4 march 2016
saskia-hiltemann
parents: 7
diff changeset
1115 annovarout=annovarinput.${buildver}_ljb_pp2_dropped
d6af2a78617f added support for databases upto 4 march 2016
saskia-hiltemann
parents: 7
diff changeset
1116 sed -i '1i\db\tPolyPhen2\tchromosome\tstart\tend\treference\talleleSeq"'"$vcfheader"'"' $annovarout
d6af2a78617f added support for databases upto 4 march 2016
saskia-hiltemann
parents: 7
diff changeset
1117 joinresults originalfile $annovarout 3 4 5 6 7 B.PolyPhen2
d6af2a78617f added support for databases upto 4 march 2016
saskia-hiltemann
parents: 7
diff changeset
1118 fi
d6af2a78617f added support for databases upto 4 march 2016
saskia-hiltemann
parents: 7
diff changeset
1119
d6af2a78617f added support for databases upto 4 march 2016
saskia-hiltemann
parents: 7
diff changeset
1120
d6af2a78617f added support for databases upto 4 march 2016
saskia-hiltemann
parents: 7
diff changeset
1121 # MutationTaster
d6af2a78617f added support for databases upto 4 march 2016
saskia-hiltemann
parents: 7
diff changeset
1122 if [ $mutationtaster == "Y" ]
d6af2a78617f added support for databases upto 4 march 2016
saskia-hiltemann
parents: 7
diff changeset
1123 then
d6af2a78617f added support for databases upto 4 march 2016
saskia-hiltemann
parents: 7
diff changeset
1124 echo -e "\nMutationTaster Annotation"
d6af2a78617f added support for databases upto 4 march 2016
saskia-hiltemann
parents: 7
diff changeset
1125 $scriptsdir/annotate_variation.pl --filter --buildver $buildver -dbtype ljb_mt annovarinput $humandb 2>&1
d6af2a78617f added support for databases upto 4 march 2016
saskia-hiltemann
parents: 7
diff changeset
1126
d6af2a78617f added support for databases upto 4 march 2016
saskia-hiltemann
parents: 7
diff changeset
1127 annovarout=annovarinput.${buildver}_ljb_mt_dropped
d6af2a78617f added support for databases upto 4 march 2016
saskia-hiltemann
parents: 7
diff changeset
1128 sed -i '1i\db\tMutationTaster\tchromosome\tstart\tend\treference\talleleSeq"'"$vcfheader"'"' $annovarout
d6af2a78617f added support for databases upto 4 march 2016
saskia-hiltemann
parents: 7
diff changeset
1129 joinresults originalfile $annovarout 3 4 5 6 7 B.MutationTaster
d6af2a78617f added support for databases upto 4 march 2016
saskia-hiltemann
parents: 7
diff changeset
1130 fi
0
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
1131
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
1132
8
d6af2a78617f added support for databases upto 4 march 2016
saskia-hiltemann
parents: 7
diff changeset
1133 # LRT
d6af2a78617f added support for databases upto 4 march 2016
saskia-hiltemann
parents: 7
diff changeset
1134 if [ $lrt == "Y" ]
d6af2a78617f added support for databases upto 4 march 2016
saskia-hiltemann
parents: 7
diff changeset
1135 then
d6af2a78617f added support for databases upto 4 march 2016
saskia-hiltemann
parents: 7
diff changeset
1136 echo -e "\nLRT Annotation"
d6af2a78617f added support for databases upto 4 march 2016
saskia-hiltemann
parents: 7
diff changeset
1137 $scriptsdir/annotate_variation.pl --filter --buildver $buildver -dbtype ljb_lrt annovarinput $humandb 2>&1
d6af2a78617f added support for databases upto 4 march 2016
saskia-hiltemann
parents: 7
diff changeset
1138
d6af2a78617f added support for databases upto 4 march 2016
saskia-hiltemann
parents: 7
diff changeset
1139 annovarout=annovarinput.${buildver}_ljb_lrt_dropped
d6af2a78617f added support for databases upto 4 march 2016
saskia-hiltemann
parents: 7
diff changeset
1140 sed -i '1i\db\tLikelihoodRatioTestScore\tchromosome\tstart\tend\treference\talleleSeq"'"$vcfheader"'"' $annovarout
d6af2a78617f added support for databases upto 4 march 2016
saskia-hiltemann
parents: 7
diff changeset
1141 joinresults originalfile $annovarout 3 4 5 6 7 B.LikelihoodRatioTestScore
d6af2a78617f added support for databases upto 4 march 2016
saskia-hiltemann
parents: 7
diff changeset
1142 fi
d6af2a78617f added support for databases upto 4 march 2016
saskia-hiltemann
parents: 7
diff changeset
1143
d6af2a78617f added support for databases upto 4 march 2016
saskia-hiltemann
parents: 7
diff changeset
1144 # PhyloP
d6af2a78617f added support for databases upto 4 march 2016
saskia-hiltemann
parents: 7
diff changeset
1145 if [ $phylop == "Y" ]
d6af2a78617f added support for databases upto 4 march 2016
saskia-hiltemann
parents: 7
diff changeset
1146 then
d6af2a78617f added support for databases upto 4 march 2016
saskia-hiltemann
parents: 7
diff changeset
1147 echo -e "\nPhyloP Annotation"
d6af2a78617f added support for databases upto 4 march 2016
saskia-hiltemann
parents: 7
diff changeset
1148 $scriptsdir/annotate_variation.pl --filter --buildver $buildver -dbtype ljb_phylop annovarinput $humandb 2>&1
d6af2a78617f added support for databases upto 4 march 2016
saskia-hiltemann
parents: 7
diff changeset
1149
d6af2a78617f added support for databases upto 4 march 2016
saskia-hiltemann
parents: 7
diff changeset
1150 annovarout=annovarinput.${buildver}_ljb_phylop_dropped
d6af2a78617f added support for databases upto 4 march 2016
saskia-hiltemann
parents: 7
diff changeset
1151 sed -i '1i\db\tPhyloP\tchromosome\tstart\tend\treference\talleleSeq"'"$vcfheader"'"' $annovarout
d6af2a78617f added support for databases upto 4 march 2016
saskia-hiltemann
parents: 7
diff changeset
1152 joinresults originalfile $annovarout 3 4 5 6 7 B.PhyloP
d6af2a78617f added support for databases upto 4 march 2016
saskia-hiltemann
parents: 7
diff changeset
1153 fi
0
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
1154
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
1155
8
d6af2a78617f added support for databases upto 4 march 2016
saskia-hiltemann
parents: 7
diff changeset
1156 ### ESP Exome Variant Server
d6af2a78617f added support for databases upto 4 march 2016
saskia-hiltemann
parents: 7
diff changeset
1157 if [ $esp != "None" ]
d6af2a78617f added support for databases upto 4 march 2016
saskia-hiltemann
parents: 7
diff changeset
1158 then
d6af2a78617f added support for databases upto 4 march 2016
saskia-hiltemann
parents: 7
diff changeset
1159 echo -e "\nESP Annotation"
d6af2a78617f added support for databases upto 4 march 2016
saskia-hiltemann
parents: 7
diff changeset
1160 for version in $espstr
d6af2a78617f added support for databases upto 4 march 2016
saskia-hiltemann
parents: 7
diff changeset
1161 do
d6af2a78617f added support for databases upto 4 march 2016
saskia-hiltemann
parents: 7
diff changeset
1162 echo "version: $version"
d6af2a78617f added support for databases upto 4 march 2016
saskia-hiltemann
parents: 7
diff changeset
1163 # 6500si ALL
d6af2a78617f added support for databases upto 4 march 2016
saskia-hiltemann
parents: 7
diff changeset
1164 if [ $version == "esp6500si_all" ]
d6af2a78617f added support for databases upto 4 march 2016
saskia-hiltemann
parents: 7
diff changeset
1165 then
d6af2a78617f added support for databases upto 4 march 2016
saskia-hiltemann
parents: 7
diff changeset
1166 $scriptsdir/annotate_variation.pl --filter --buildver $buildver -dbtype esp6500si_all annovarinput $humandb 2>&1
d6af2a78617f added support for databases upto 4 march 2016
saskia-hiltemann
parents: 7
diff changeset
1167
d6af2a78617f added support for databases upto 4 march 2016
saskia-hiltemann
parents: 7
diff changeset
1168 annovarout=annovarinput.${buildver}_esp6500si_all_dropped
d6af2a78617f added support for databases upto 4 march 2016
saskia-hiltemann
parents: 7
diff changeset
1169 sed -i '1i\db\t'$esp6500si_colheader_ALL'\tchromosome\tstart\tend\treference\talleleSeq"'"$vcfheader"'"' $annovarout
d6af2a78617f added support for databases upto 4 march 2016
saskia-hiltemann
parents: 7
diff changeset
1170 joinresults originalfile $annovarout 3 4 5 6 7 B.$esp6500si_colheader_ALL
d6af2a78617f added support for databases upto 4 march 2016
saskia-hiltemann
parents: 7
diff changeset
1171 fi
d6af2a78617f added support for databases upto 4 march 2016
saskia-hiltemann
parents: 7
diff changeset
1172
d6af2a78617f added support for databases upto 4 march 2016
saskia-hiltemann
parents: 7
diff changeset
1173
d6af2a78617f added support for databases upto 4 march 2016
saskia-hiltemann
parents: 7
diff changeset
1174 # 6500si European American
d6af2a78617f added support for databases upto 4 march 2016
saskia-hiltemann
parents: 7
diff changeset
1175 if [ $version == "esp6500si_ea" ]
d6af2a78617f added support for databases upto 4 march 2016
saskia-hiltemann
parents: 7
diff changeset
1176 then
d6af2a78617f added support for databases upto 4 march 2016
saskia-hiltemann
parents: 7
diff changeset
1177 $scriptsdir/annotate_variation.pl --filter --buildver $buildver -dbtype esp6500si_ea annovarinput $humandb 2>&1
d6af2a78617f added support for databases upto 4 march 2016
saskia-hiltemann
parents: 7
diff changeset
1178
d6af2a78617f added support for databases upto 4 march 2016
saskia-hiltemann
parents: 7
diff changeset
1179 annovarout=annovarinput.${buildver}_esp6500si_ea_dropped
d6af2a78617f added support for databases upto 4 march 2016
saskia-hiltemann
parents: 7
diff changeset
1180 sed -i '1i\db\t'$esp6500si_colheader_EA'\tchromosome\tstart\tend\treference\talleleSeq"'"$vcfheader"'" ' $annovarout
d6af2a78617f added support for databases upto 4 march 2016
saskia-hiltemann
parents: 7
diff changeset
1181 joinresults originalfile $annovarout 3 4 5 6 7 B.$esp6500si_colheader_EA
d6af2a78617f added support for databases upto 4 march 2016
saskia-hiltemann
parents: 7
diff changeset
1182 fi
d6af2a78617f added support for databases upto 4 march 2016
saskia-hiltemann
parents: 7
diff changeset
1183
d6af2a78617f added support for databases upto 4 march 2016
saskia-hiltemann
parents: 7
diff changeset
1184 # 6500si African Americans
d6af2a78617f added support for databases upto 4 march 2016
saskia-hiltemann
parents: 7
diff changeset
1185 if [ $version == "esp6500si_aa" ]
d6af2a78617f added support for databases upto 4 march 2016
saskia-hiltemann
parents: 7
diff changeset
1186 then
d6af2a78617f added support for databases upto 4 march 2016
saskia-hiltemann
parents: 7
diff changeset
1187 $scriptsdir/annotate_variation.pl --filter --buildver $buildver -dbtype esp6500si_aa annovarinput $humandb 2>&1
d6af2a78617f added support for databases upto 4 march 2016
saskia-hiltemann
parents: 7
diff changeset
1188
d6af2a78617f added support for databases upto 4 march 2016
saskia-hiltemann
parents: 7
diff changeset
1189 annovarout=annovarinput.${buildver}_esp6500si_aa_dropped
d6af2a78617f added support for databases upto 4 march 2016
saskia-hiltemann
parents: 7
diff changeset
1190 sed -i '1i\db\t'$esp6500si_colheader_AA'\tchromosome\tstart\tend\treference\talleleSeq"'"$vcfheader"'" ' $annovarout
d6af2a78617f added support for databases upto 4 march 2016
saskia-hiltemann
parents: 7
diff changeset
1191 joinresults originalfile $annovarout 3 4 5 6 7 B.$esp6500si_colheader_AA
d6af2a78617f added support for databases upto 4 march 2016
saskia-hiltemann
parents: 7
diff changeset
1192 fi
0
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
1193
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
1194
8
d6af2a78617f added support for databases upto 4 march 2016
saskia-hiltemann
parents: 7
diff changeset
1195 # 6500 ALL
d6af2a78617f added support for databases upto 4 march 2016
saskia-hiltemann
parents: 7
diff changeset
1196 if [ $version == "esp6500_all" ]
d6af2a78617f added support for databases upto 4 march 2016
saskia-hiltemann
parents: 7
diff changeset
1197 then
d6af2a78617f added support for databases upto 4 march 2016
saskia-hiltemann
parents: 7
diff changeset
1198 ls
d6af2a78617f added support for databases upto 4 march 2016
saskia-hiltemann
parents: 7
diff changeset
1199 $scriptsdir/annotate_variation.pl --filter --buildver $buildver -dbtype esp6500_all annovarinput $humandb 2>&1
d6af2a78617f added support for databases upto 4 march 2016
saskia-hiltemann
parents: 7
diff changeset
1200
d6af2a78617f added support for databases upto 4 march 2016
saskia-hiltemann
parents: 7
diff changeset
1201 annovarout=annovarinput.${buildver}_esp6500_all_dropped
d6af2a78617f added support for databases upto 4 march 2016
saskia-hiltemann
parents: 7
diff changeset
1202 sed -i '1i\db\t'$esp6500_colheader_ALL'\tchromosome\tstart\tend\treference\talleleSeq"'"$vcfheader"'" ' $annovarout
d6af2a78617f added support for databases upto 4 march 2016
saskia-hiltemann
parents: 7
diff changeset
1203 joinresults originalfile $annovarout 3 4 5 6 7 B.$esp6500_colheader_ALL
d6af2a78617f added support for databases upto 4 march 2016
saskia-hiltemann
parents: 7
diff changeset
1204 fi
0
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
1205
8
d6af2a78617f added support for databases upto 4 march 2016
saskia-hiltemann
parents: 7
diff changeset
1206
d6af2a78617f added support for databases upto 4 march 2016
saskia-hiltemann
parents: 7
diff changeset
1207 # 6500 European American
d6af2a78617f added support for databases upto 4 march 2016
saskia-hiltemann
parents: 7
diff changeset
1208 if [ $version == "esp6500_ea" ]
d6af2a78617f added support for databases upto 4 march 2016
saskia-hiltemann
parents: 7
diff changeset
1209 then
d6af2a78617f added support for databases upto 4 march 2016
saskia-hiltemann
parents: 7
diff changeset
1210 $scriptsdir/annotate_variation.pl --filter --buildver $buildver -dbtype esp6500_ea annovarinput $humandb 2>&1
d6af2a78617f added support for databases upto 4 march 2016
saskia-hiltemann
parents: 7
diff changeset
1211 annovarout=annovarinput.${buildver}_esp6500_ea_dropped
d6af2a78617f added support for databases upto 4 march 2016
saskia-hiltemann
parents: 7
diff changeset
1212 sed -i '1i\db\t'$esp6500_colheader_EA'\tchromosome\tstart\tend\treference\talleleSeq"'"$vcfheader"'"' $annovarout
d6af2a78617f added support for databases upto 4 march 2016
saskia-hiltemann
parents: 7
diff changeset
1213 joinresults originalfile $annovarout 3 4 5 6 7 B.$esp6500_colheader_EA
d6af2a78617f added support for databases upto 4 march 2016
saskia-hiltemann
parents: 7
diff changeset
1214 fi
d6af2a78617f added support for databases upto 4 march 2016
saskia-hiltemann
parents: 7
diff changeset
1215
d6af2a78617f added support for databases upto 4 march 2016
saskia-hiltemann
parents: 7
diff changeset
1216 # 6500 African Americans
d6af2a78617f added support for databases upto 4 march 2016
saskia-hiltemann
parents: 7
diff changeset
1217 if [ $version == "esp6500_aa" ]
d6af2a78617f added support for databases upto 4 march 2016
saskia-hiltemann
parents: 7
diff changeset
1218 then
d6af2a78617f added support for databases upto 4 march 2016
saskia-hiltemann
parents: 7
diff changeset
1219 $scriptsdir/annotate_variation.pl --filter --buildver $buildver -dbtype esp6500_aa annovarinput $humandb 2>&1
d6af2a78617f added support for databases upto 4 march 2016
saskia-hiltemann
parents: 7
diff changeset
1220
d6af2a78617f added support for databases upto 4 march 2016
saskia-hiltemann
parents: 7
diff changeset
1221 annovarout=annovarinput.${buildver}_esp6500_aa_dropped
d6af2a78617f added support for databases upto 4 march 2016
saskia-hiltemann
parents: 7
diff changeset
1222 sed -i '1i\db\t'$esp6500_colheader_AA'\tchromosome\tstart\tend\treference\talleleSeq"'"$vcfheader"'"' $annovarout
d6af2a78617f added support for databases upto 4 march 2016
saskia-hiltemann
parents: 7
diff changeset
1223 joinresults originalfile $annovarout 3 4 5 6 7 B.$esp6500_colheader_AA
d6af2a78617f added support for databases upto 4 march 2016
saskia-hiltemann
parents: 7
diff changeset
1224 fi
0
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
1225
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
1226
8
d6af2a78617f added support for databases upto 4 march 2016
saskia-hiltemann
parents: 7
diff changeset
1227 # 5400 ALL
d6af2a78617f added support for databases upto 4 march 2016
saskia-hiltemann
parents: 7
diff changeset
1228 if [ $version == "esp5400_all" ]
d6af2a78617f added support for databases upto 4 march 2016
saskia-hiltemann
parents: 7
diff changeset
1229 then
d6af2a78617f added support for databases upto 4 march 2016
saskia-hiltemann
parents: 7
diff changeset
1230 $scriptsdir/annotate_variation.pl --filter --buildver $buildver -dbtype esp5400_all annovarinput $humandb 2>&1
d6af2a78617f added support for databases upto 4 march 2016
saskia-hiltemann
parents: 7
diff changeset
1231
d6af2a78617f added support for databases upto 4 march 2016
saskia-hiltemann
parents: 7
diff changeset
1232 annovarout=annovarinput.${buildver}_esp5400_all_dropped
d6af2a78617f added support for databases upto 4 march 2016
saskia-hiltemann
parents: 7
diff changeset
1233 sed -i '1i\db\t'$esp5400_colheader_ALL'\tchromosome\tstart\tend\treference\talleleSeq"'"$vcfheader"'"' $annovarout
d6af2a78617f added support for databases upto 4 march 2016
saskia-hiltemann
parents: 7
diff changeset
1234 joinresults originalfile $annovarout 3 4 5 6 7 B.$esp5400_colheader_ALL
d6af2a78617f added support for databases upto 4 march 2016
saskia-hiltemann
parents: 7
diff changeset
1235 fi
0
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
1236
8
d6af2a78617f added support for databases upto 4 march 2016
saskia-hiltemann
parents: 7
diff changeset
1237
d6af2a78617f added support for databases upto 4 march 2016
saskia-hiltemann
parents: 7
diff changeset
1238 # 5400 European American
d6af2a78617f added support for databases upto 4 march 2016
saskia-hiltemann
parents: 7
diff changeset
1239 if [ $version == "esp5400_ea" ]
d6af2a78617f added support for databases upto 4 march 2016
saskia-hiltemann
parents: 7
diff changeset
1240 then
d6af2a78617f added support for databases upto 4 march 2016
saskia-hiltemann
parents: 7
diff changeset
1241 $scriptsdir/annotate_variation.pl --filter --buildver $buildver -dbtype esp5400_ea annovarinput $humandb 2>&1
d6af2a78617f added support for databases upto 4 march 2016
saskia-hiltemann
parents: 7
diff changeset
1242
d6af2a78617f added support for databases upto 4 march 2016
saskia-hiltemann
parents: 7
diff changeset
1243 annovarout=annovarinput.${buildver}_esp5400_ea_dropped
d6af2a78617f added support for databases upto 4 march 2016
saskia-hiltemann
parents: 7
diff changeset
1244 sed -i '1i\db\t'$esp5400_colheader_EA'\tchromosome\tstart\tend\treference\talleleSeq"'"$vcfheader"'"' $annovarout
d6af2a78617f added support for databases upto 4 march 2016
saskia-hiltemann
parents: 7
diff changeset
1245 joinresults originalfile $annovarout 3 4 5 6 7 B.$esp5400_colheader_EA
d6af2a78617f added support for databases upto 4 march 2016
saskia-hiltemann
parents: 7
diff changeset
1246 fi
0
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
1247
8
d6af2a78617f added support for databases upto 4 march 2016
saskia-hiltemann
parents: 7
diff changeset
1248 # 5400 African Americans
d6af2a78617f added support for databases upto 4 march 2016
saskia-hiltemann
parents: 7
diff changeset
1249 if [ $version == "esp5400_aa" ]
d6af2a78617f added support for databases upto 4 march 2016
saskia-hiltemann
parents: 7
diff changeset
1250 then
d6af2a78617f added support for databases upto 4 march 2016
saskia-hiltemann
parents: 7
diff changeset
1251 $scriptsdir/annotate_variation.pl --filter --buildver $buildver -dbtype esp5400_aa annovarinput $humandb 2>&1
d6af2a78617f added support for databases upto 4 march 2016
saskia-hiltemann
parents: 7
diff changeset
1252
d6af2a78617f added support for databases upto 4 march 2016
saskia-hiltemann
parents: 7
diff changeset
1253 annovarout=annovarinput.${buildver}_esp5400_aa_dropped
d6af2a78617f added support for databases upto 4 march 2016
saskia-hiltemann
parents: 7
diff changeset
1254 sed -i '1i\db\t'$esp5400_colheader_AA'\tchromosome\tstart\tend\treference\talleleSeq"'"$vcfheader"'"' $annovarout
d6af2a78617f added support for databases upto 4 march 2016
saskia-hiltemann
parents: 7
diff changeset
1255 joinresults originalfile $annovarout 3 4 5 6 7 B.$esp5400_colheader_AA
d6af2a78617f added support for databases upto 4 march 2016
saskia-hiltemann
parents: 7
diff changeset
1256 fi
0
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
1257
8
d6af2a78617f added support for databases upto 4 march 2016
saskia-hiltemann
parents: 7
diff changeset
1258 done
d6af2a78617f added support for databases upto 4 march 2016
saskia-hiltemann
parents: 7
diff changeset
1259 fi
0
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
1260
8
d6af2a78617f added support for databases upto 4 march 2016
saskia-hiltemann
parents: 7
diff changeset
1261 #ExAC-03 database
d6af2a78617f added support for databases upto 4 march 2016
saskia-hiltemann
parents: 7
diff changeset
1262 if [ "$exac03" == "Y" ]
d6af2a78617f added support for databases upto 4 march 2016
saskia-hiltemann
parents: 7
diff changeset
1263 then
d6af2a78617f added support for databases upto 4 march 2016
saskia-hiltemann
parents: 7
diff changeset
1264 echo -e "\nExAC03 Annotation"
d6af2a78617f added support for databases upto 4 march 2016
saskia-hiltemann
parents: 7
diff changeset
1265 $scriptsdir/annotate_variation.pl --filter -otherinfo --buildver $buildver --otherinfo -dbtype exac03 annovarinput $humandb 2>&1
d6af2a78617f added support for databases upto 4 march 2016
saskia-hiltemann
parents: 7
diff changeset
1266
d6af2a78617f added support for databases upto 4 march 2016
saskia-hiltemann
parents: 7
diff changeset
1267 #annovarout=annovarinput.${buildver}_exac03_dropped
d6af2a78617f added support for databases upto 4 march 2016
saskia-hiltemann
parents: 7
diff changeset
1268
d6af2a78617f added support for databases upto 4 march 2016
saskia-hiltemann
parents: 7
diff changeset
1269 # split allelefrequency column into several columns, one per population
d6af2a78617f added support for databases upto 4 march 2016
saskia-hiltemann
parents: 7
diff changeset
1270 awk 'BEGIN{FS="\t"
d6af2a78617f added support for databases upto 4 march 2016
saskia-hiltemann
parents: 7
diff changeset
1271 OFS="\t"
d6af2a78617f added support for databases upto 4 march 2016
saskia-hiltemann
parents: 7
diff changeset
1272 }{
d6af2a78617f added support for databases upto 4 march 2016
saskia-hiltemann
parents: 7
diff changeset
1273 gsub(",","\t",$2)
d6af2a78617f added support for databases upto 4 march 2016
saskia-hiltemann
parents: 7
diff changeset
1274 print $0
d6af2a78617f added support for databases upto 4 march 2016
saskia-hiltemann
parents: 7
diff changeset
1275 }END{}' annovarinput.${buildver}_exac03_dropped > $annovarout
d6af2a78617f added support for databases upto 4 march 2016
saskia-hiltemann
parents: 7
diff changeset
1276
d6af2a78617f added support for databases upto 4 march 2016
saskia-hiltemann
parents: 7
diff changeset
1277 sed -i '1i\db\tExAC_ALL\tExAC_AFR\tExAC_AMR\tExAC_EAS\tExAC_FIN\tExAC_NFE\tExAC_OTH\tExAC_SAS\tchromosome\tstart\tend\treference\talleleSeq"'"$vcfheader"'"' $annovarout
d6af2a78617f added support for databases upto 4 march 2016
saskia-hiltemann
parents: 7
diff changeset
1278 joinresults originalfile $annovarout 10 11 12 13 14 B.ExAC_ALL,B.ExAC_AFR,B.ExAC_AMR,B.ExAC_EAS,B.ExAC_FIN,B.ExAC_NFE,B.ExAC_OTH,B.ExAC_SAS
d6af2a78617f added support for databases upto 4 march 2016
saskia-hiltemann
parents: 7
diff changeset
1279 fi
0
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
1280
8
d6af2a78617f added support for databases upto 4 march 2016
saskia-hiltemann
parents: 7
diff changeset
1281 #ExAC-03 non-psych database
d6af2a78617f added support for databases upto 4 march 2016
saskia-hiltemann
parents: 7
diff changeset
1282 if [ "$exac03nonpsych" == "Y" ]
d6af2a78617f added support for databases upto 4 march 2016
saskia-hiltemann
parents: 7
diff changeset
1283 then
d6af2a78617f added support for databases upto 4 march 2016
saskia-hiltemann
parents: 7
diff changeset
1284 echo -e "\nExAC03 non-psych Annotation"
d6af2a78617f added support for databases upto 4 march 2016
saskia-hiltemann
parents: 7
diff changeset
1285 $scriptsdir/annotate_variation.pl --filter -otherinfo --buildver $buildver --otherinfo -dbtype exac03nonpsych annovarinput $humandb 2>&1
d6af2a78617f added support for databases upto 4 march 2016
saskia-hiltemann
parents: 7
diff changeset
1286
d6af2a78617f added support for databases upto 4 march 2016
saskia-hiltemann
parents: 7
diff changeset
1287 #annovarout=annovarinput.${buildver}_exac03_dropped
d6af2a78617f added support for databases upto 4 march 2016
saskia-hiltemann
parents: 7
diff changeset
1288
d6af2a78617f added support for databases upto 4 march 2016
saskia-hiltemann
parents: 7
diff changeset
1289 # split allelefrequency column into several columns, one per population
d6af2a78617f added support for databases upto 4 march 2016
saskia-hiltemann
parents: 7
diff changeset
1290 awk 'BEGIN{FS="\t"
d6af2a78617f added support for databases upto 4 march 2016
saskia-hiltemann
parents: 7
diff changeset
1291 OFS="\t"
d6af2a78617f added support for databases upto 4 march 2016
saskia-hiltemann
parents: 7
diff changeset
1292 }{
d6af2a78617f added support for databases upto 4 march 2016
saskia-hiltemann
parents: 7
diff changeset
1293 gsub(",","\t",$2)
d6af2a78617f added support for databases upto 4 march 2016
saskia-hiltemann
parents: 7
diff changeset
1294 print $0
d6af2a78617f added support for databases upto 4 march 2016
saskia-hiltemann
parents: 7
diff changeset
1295 }END{}' annovarinput.${buildver}_exac03nonpsych_dropped > $annovarout
d6af2a78617f added support for databases upto 4 march 2016
saskia-hiltemann
parents: 7
diff changeset
1296
d6af2a78617f added support for databases upto 4 march 2016
saskia-hiltemann
parents: 7
diff changeset
1297 sed -i '1i\db\tExAC_non-phsych_ALL\tExAC_non-phsych_AFR\tExAC_non-phsych_AMR\tExAC_non-phsych_EAS\tExAC_non-phsych_FIN\tExAC_non-phsych_NFE\tExAC_non-phsych_OTH\tExAC_non-phsych_SAS\tchromosome\tstart\tend\treference\talleleSeq"'"$vcfheader"'"' $annovarout
d6af2a78617f added support for databases upto 4 march 2016
saskia-hiltemann
parents: 7
diff changeset
1298 joinresults originalfile $annovarout 10 11 12 13 14 B.ExAC_non-phsych_ALL,B.ExAC_non-phsych_AFR,B.ExAC_non-phsych_AMR,B.ExAC_non-phsych_EAS,B.ExAC_non-phsych_FIN,B.ExAC_non-phsych_NFE,B.ExAC_non-phsych_OTH,B.ExAC_non-phsych_SAS
d6af2a78617f added support for databases upto 4 march 2016
saskia-hiltemann
parents: 7
diff changeset
1299 fi
d6af2a78617f added support for databases upto 4 march 2016
saskia-hiltemann
parents: 7
diff changeset
1300
d6af2a78617f added support for databases upto 4 march 2016
saskia-hiltemann
parents: 7
diff changeset
1301 #ExAC-03 non-TCGA database
d6af2a78617f added support for databases upto 4 march 2016
saskia-hiltemann
parents: 7
diff changeset
1302 if [ "$exac03nontcga" == "Y" ]
d6af2a78617f added support for databases upto 4 march 2016
saskia-hiltemann
parents: 7
diff changeset
1303 then
d6af2a78617f added support for databases upto 4 march 2016
saskia-hiltemann
parents: 7
diff changeset
1304 echo -e "\nExAC03 non-tcga Annotation"
d6af2a78617f added support for databases upto 4 march 2016
saskia-hiltemann
parents: 7
diff changeset
1305 $scriptsdir/annotate_variation.pl --filter -otherinfo --buildver $buildver --otherinfo -dbtype exac03nontcga annovarinput $humandb 2>&1
d6af2a78617f added support for databases upto 4 march 2016
saskia-hiltemann
parents: 7
diff changeset
1306
d6af2a78617f added support for databases upto 4 march 2016
saskia-hiltemann
parents: 7
diff changeset
1307 #annovarout=annovarinput.${buildver}_exac03_dropped
d6af2a78617f added support for databases upto 4 march 2016
saskia-hiltemann
parents: 7
diff changeset
1308
d6af2a78617f added support for databases upto 4 march 2016
saskia-hiltemann
parents: 7
diff changeset
1309 # split allelefrequency column into several columns, one per population
d6af2a78617f added support for databases upto 4 march 2016
saskia-hiltemann
parents: 7
diff changeset
1310 awk 'BEGIN{FS="\t"
d6af2a78617f added support for databases upto 4 march 2016
saskia-hiltemann
parents: 7
diff changeset
1311 OFS="\t"
d6af2a78617f added support for databases upto 4 march 2016
saskia-hiltemann
parents: 7
diff changeset
1312 }{
d6af2a78617f added support for databases upto 4 march 2016
saskia-hiltemann
parents: 7
diff changeset
1313 gsub(",","\t",$2)
d6af2a78617f added support for databases upto 4 march 2016
saskia-hiltemann
parents: 7
diff changeset
1314 print $0
d6af2a78617f added support for databases upto 4 march 2016
saskia-hiltemann
parents: 7
diff changeset
1315 }END{}' annovarinput.${buildver}_exac03nontcga_dropped > $annovarout
d6af2a78617f added support for databases upto 4 march 2016
saskia-hiltemann
parents: 7
diff changeset
1316
d6af2a78617f added support for databases upto 4 march 2016
saskia-hiltemann
parents: 7
diff changeset
1317 sed -i '1i\db\tExAC_non-TCGA_ALL\tExAC_non-TCGA_AFR\tExAC_non-TCGA_AMR\tExAC_non-TCGA_EAS\tExAC_non-TCGA_FIN\tExAC_non-TCGA_NFE\tExAC_non-TCGA_OTH\tExAC_non-TCGA_SAS\tchromosome\tstart\tend\treference\talleleSeq"'"$vcfheader"'"' $annovarout
d6af2a78617f added support for databases upto 4 march 2016
saskia-hiltemann
parents: 7
diff changeset
1318 joinresults originalfile $annovarout 10 11 12 13 14 B.ExAC_non-TCGA_ALL,B.ExAC_non-TCGA_AFR,B.ExAC_non-TCGA_AMR,B.ExAC_non-TCGA_EAS,B.ExAC_non-TCGA_FIN,B.ExAC_non-TCGA_NFE,B.ExAC_non-TCGA_OTH,B.ExAC_non-TCGA_SAS
d6af2a78617f added support for databases upto 4 march 2016
saskia-hiltemann
parents: 7
diff changeset
1319 fi
d6af2a78617f added support for databases upto 4 march 2016
saskia-hiltemann
parents: 7
diff changeset
1320
d6af2a78617f added support for databases upto 4 march 2016
saskia-hiltemann
parents: 7
diff changeset
1321 #dbscSNV 1.1
d6af2a78617f added support for databases upto 4 march 2016
saskia-hiltemann
parents: 7
diff changeset
1322 if [ "$dbscsnv11" == "Y" ]
d6af2a78617f added support for databases upto 4 march 2016
saskia-hiltemann
parents: 7
diff changeset
1323 then
d6af2a78617f added support for databases upto 4 march 2016
saskia-hiltemann
parents: 7
diff changeset
1324 echo -e "\ndbscSNV11 Annotation"
d6af2a78617f added support for databases upto 4 march 2016
saskia-hiltemann
parents: 7
diff changeset
1325 $scriptsdir/annotate_variation.pl --filter -otherinfo --buildver $buildver -dbtype dbscsnv11 annovarinput $humandb 2>&1
d6af2a78617f added support for databases upto 4 march 2016
saskia-hiltemann
parents: 7
diff changeset
1326
d6af2a78617f added support for databases upto 4 march 2016
saskia-hiltemann
parents: 7
diff changeset
1327 #annovarout="annovarinput.${buildver}_dbscsnv11_dropped"
d6af2a78617f added support for databases upto 4 march 2016
saskia-hiltemann
parents: 7
diff changeset
1328 awk 'BEGIN{FS="\t"
d6af2a78617f added support for databases upto 4 march 2016
saskia-hiltemann
parents: 7
diff changeset
1329 OFS="\t"
d6af2a78617f added support for databases upto 4 march 2016
saskia-hiltemann
parents: 7
diff changeset
1330 }{
d6af2a78617f added support for databases upto 4 march 2016
saskia-hiltemann
parents: 7
diff changeset
1331 gsub(",","\t",$2)
d6af2a78617f added support for databases upto 4 march 2016
saskia-hiltemann
parents: 7
diff changeset
1332 print $0
d6af2a78617f added support for databases upto 4 march 2016
saskia-hiltemann
parents: 7
diff changeset
1333 }END{}' annovarinput.${buildver}_dbscsnv11_dropped > $annovarout
d6af2a78617f added support for databases upto 4 march 2016
saskia-hiltemann
parents: 7
diff changeset
1334
d6af2a78617f added support for databases upto 4 march 2016
saskia-hiltemann
parents: 7
diff changeset
1335 sed -i '1i\db\tdbscSNV11_ADA_SCORE\tdbscSNV11_RF_SCORE\tchromosome\tstart\tend\treference\talleleSeq"'"$vcfheader"'"' $annovarout
d6af2a78617f added support for databases upto 4 march 2016
saskia-hiltemann
parents: 7
diff changeset
1336 joinresults originalfile $annovarout 4 5 6 7 8 B.dbscSNV11_ADA_SCORE,B.dbscSNV11_RF_SCORE
d6af2a78617f added support for databases upto 4 march 2016
saskia-hiltemann
parents: 7
diff changeset
1337 fi
d6af2a78617f added support for databases upto 4 march 2016
saskia-hiltemann
parents: 7
diff changeset
1338
d6af2a78617f added support for databases upto 4 march 2016
saskia-hiltemann
parents: 7
diff changeset
1339
d6af2a78617f added support for databases upto 4 march 2016
saskia-hiltemann
parents: 7
diff changeset
1340 #kaviar_20150923
d6af2a78617f added support for databases upto 4 march 2016
saskia-hiltemann
parents: 7
diff changeset
1341 if [ "$kaviar_20150923" == "Y" ]
d6af2a78617f added support for databases upto 4 march 2016
saskia-hiltemann
parents: 7
diff changeset
1342 then
d6af2a78617f added support for databases upto 4 march 2016
saskia-hiltemann
parents: 7
diff changeset
1343 echo -e "\nkaviar_20150923 Annotation"
d6af2a78617f added support for databases upto 4 march 2016
saskia-hiltemann
parents: 7
diff changeset
1344 $scriptsdir/annotate_variation.pl --filter -otherinfo --buildver $buildver -dbtype kaviar_20150923 annovarinput $humandb 2>&1
d6af2a78617f added support for databases upto 4 march 2016
saskia-hiltemann
parents: 7
diff changeset
1345
d6af2a78617f added support for databases upto 4 march 2016
saskia-hiltemann
parents: 7
diff changeset
1346 #annovarout="annovarinput.${buildver}_kaviar_20150923_dropped"
d6af2a78617f added support for databases upto 4 march 2016
saskia-hiltemann
parents: 7
diff changeset
1347 awk 'BEGIN{FS="\t"
d6af2a78617f added support for databases upto 4 march 2016
saskia-hiltemann
parents: 7
diff changeset
1348 OFS="\t"
d6af2a78617f added support for databases upto 4 march 2016
saskia-hiltemann
parents: 7
diff changeset
1349 }{
d6af2a78617f added support for databases upto 4 march 2016
saskia-hiltemann
parents: 7
diff changeset
1350 gsub(",","\t",$2)
d6af2a78617f added support for databases upto 4 march 2016
saskia-hiltemann
parents: 7
diff changeset
1351 print $0
d6af2a78617f added support for databases upto 4 march 2016
saskia-hiltemann
parents: 7
diff changeset
1352 }END{}' annovarinput.${buildver}_kaviar_20150923_dropped > $annovarout
d6af2a78617f added support for databases upto 4 march 2016
saskia-hiltemann
parents: 7
diff changeset
1353
d6af2a78617f added support for databases upto 4 march 2016
saskia-hiltemann
parents: 7
diff changeset
1354 sed -i '1i\db\tKaviar_AF\tKaviar_AC\tKaviar_AN\tchromosome\tstart\tend\treference\talleleSeq"'"$vcfheader"'"' $annovarout
d6af2a78617f added support for databases upto 4 march 2016
saskia-hiltemann
parents: 7
diff changeset
1355 joinresults originalfile $annovarout 5 6 7 8 9 B.Kaviar_AF,B.Kaviar_AC,B.Kaviar_AN
d6af2a78617f added support for databases upto 4 march 2016
saskia-hiltemann
parents: 7
diff changeset
1356 fi
d6af2a78617f added support for databases upto 4 march 2016
saskia-hiltemann
parents: 7
diff changeset
1357
d6af2a78617f added support for databases upto 4 march 2016
saskia-hiltemann
parents: 7
diff changeset
1358 #hrcr1
d6af2a78617f added support for databases upto 4 march 2016
saskia-hiltemann
parents: 7
diff changeset
1359 if [ "$hrcr1" == "Y" ]
d6af2a78617f added support for databases upto 4 march 2016
saskia-hiltemann
parents: 7
diff changeset
1360 then
d6af2a78617f added support for databases upto 4 march 2016
saskia-hiltemann
parents: 7
diff changeset
1361 echo -e "\nhrcr1 Annotation"
d6af2a78617f added support for databases upto 4 march 2016
saskia-hiltemann
parents: 7
diff changeset
1362 $scriptsdir/annotate_variation.pl --filter -otherinfo --buildver $buildver -dbtype hrcr1 annovarinput $humandb 2>&1
d6af2a78617f added support for databases upto 4 march 2016
saskia-hiltemann
parents: 7
diff changeset
1363
d6af2a78617f added support for databases upto 4 march 2016
saskia-hiltemann
parents: 7
diff changeset
1364 #annovarout="annovarinput.${buildver}_dbscsnv11_dropped"
d6af2a78617f added support for databases upto 4 march 2016
saskia-hiltemann
parents: 7
diff changeset
1365 awk 'BEGIN{FS="\t"
d6af2a78617f added support for databases upto 4 march 2016
saskia-hiltemann
parents: 7
diff changeset
1366 OFS="\t"
d6af2a78617f added support for databases upto 4 march 2016
saskia-hiltemann
parents: 7
diff changeset
1367 }{
d6af2a78617f added support for databases upto 4 march 2016
saskia-hiltemann
parents: 7
diff changeset
1368 gsub(",","\t",$2)
d6af2a78617f added support for databases upto 4 march 2016
saskia-hiltemann
parents: 7
diff changeset
1369 print $0
d6af2a78617f added support for databases upto 4 march 2016
saskia-hiltemann
parents: 7
diff changeset
1370 }END{}' annovarinput.${buildver}_hrcr1_dropped > $annovarout
d6af2a78617f added support for databases upto 4 march 2016
saskia-hiltemann
parents: 7
diff changeset
1371 sed -i '1i\db\tHRC_AF\tHRC_AC\tHRC_AN\tHRC_non1000g_AF\tHRC_non1000g_AC\tHRC_non1000g_AN\tchromosome\tstart\tend\treference\talleleSeq"'"$vcfheader"'"' $annovarout
d6af2a78617f added support for databases upto 4 march 2016
saskia-hiltemann
parents: 7
diff changeset
1372 joinresults originalfile $annovarout 8 9 10 11 12 B.HRC_AF,B.HRC_AC,B.HRC_AN,B.HRC_non1000g_AF,B.HRC_non1000g_AC,B.HRC_non1000g_AN
d6af2a78617f added support for databases upto 4 march 2016
saskia-hiltemann
parents: 7
diff changeset
1373 fi
d6af2a78617f added support for databases upto 4 march 2016
saskia-hiltemann
parents: 7
diff changeset
1374
d6af2a78617f added support for databases upto 4 march 2016
saskia-hiltemann
parents: 7
diff changeset
1375 #dbnsfp30a
d6af2a78617f added support for databases upto 4 march 2016
saskia-hiltemann
parents: 7
diff changeset
1376 if [ "$dbnsfp30a" == "Y" ]
d6af2a78617f added support for databases upto 4 march 2016
saskia-hiltemann
parents: 7
diff changeset
1377 then
d6af2a78617f added support for databases upto 4 march 2016
saskia-hiltemann
parents: 7
diff changeset
1378 echo -e "\ndbnsfp30a Annotation"
d6af2a78617f added support for databases upto 4 march 2016
saskia-hiltemann
parents: 7
diff changeset
1379 $scriptsdir/annotate_variation.pl --filter -otherinfo --buildver $buildver -dbtype dbnsfp30a annovarinput $humandb 2>&1
d6af2a78617f added support for databases upto 4 march 2016
saskia-hiltemann
parents: 7
diff changeset
1380
d6af2a78617f added support for databases upto 4 march 2016
saskia-hiltemann
parents: 7
diff changeset
1381 #annovarout="annovarinput.${buildver}_dbnsfp30a_dropped"
d6af2a78617f added support for databases upto 4 march 2016
saskia-hiltemann
parents: 7
diff changeset
1382 awk 'BEGIN{FS="\t"
d6af2a78617f added support for databases upto 4 march 2016
saskia-hiltemann
parents: 7
diff changeset
1383 OFS="\t"
d6af2a78617f added support for databases upto 4 march 2016
saskia-hiltemann
parents: 7
diff changeset
1384 }{
d6af2a78617f added support for databases upto 4 march 2016
saskia-hiltemann
parents: 7
diff changeset
1385 gsub(",","\t",$2)
d6af2a78617f added support for databases upto 4 march 2016
saskia-hiltemann
parents: 7
diff changeset
1386 print $0
d6af2a78617f added support for databases upto 4 march 2016
saskia-hiltemann
parents: 7
diff changeset
1387 }END{}' annovarinput.${buildver}_dbnsfp30a_dropped > $annovarout
0
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
1388
8
d6af2a78617f added support for databases upto 4 march 2016
saskia-hiltemann
parents: 7
diff changeset
1389 sed -i '1i\db\tdbNSFP_SIFT_score\tdbNSFP_SIFT_pred\tdbNSFP_Polyphen2_HDIV_score\tdbNSFP_Polyphen2_HDIV_pred\tdbNSFP_Polyphen2_HVAR_score\tdbNSFP_Polyphen2_HVAR_pred\tdbNSFP_LRT_score\tdbNSFP_LRT_pred\tdbNSFP_MutationTaster_score\tdbNSFP_MutationTaster_pred\tdbNSFP_MutationAssessor_score\tdbNSFP_MutationAssessor_pred\tdbNSFP_FATHMM_score\tdbNSFP_FATHMM_pred\tdbNSFP_PROVEAN_score\tdbNSFP_PROVEAN_pred\tdbNSFP_VEST3_score\tdbNSFP_CADD_raw\tdbNSFP_CADD_phred\tdbNSFP_DANN_score\tdbNSFP_fathmm-MKL_coding_score\tdbNSFP_fathmm-MKL_coding_pred\tdbNSFP_MetaSVM_score\tdbNSFP_MetaSVM_pred\tdbNSFP_MetaLR_score\tdbNSFP_MetaLR_pred\tdbNSFP_integrated_fitCons_score\tdbNSFP_integrated_confidence_value\tdbNSFP_GERP_RS\tdbNSFP_phyloP7way_vertebrate\tdbNSFP_phyloP20way_mammalian\tdbNSFP_phastCons7way_vertebrate\tdbNSFP_phastCons20way_mammalian\tdbNSFP_SiPhy_29way_logOdds\tchromosome\tstart\tend\treference\talleleSeq"'"$vcfheader"'"' $annovarout
d6af2a78617f added support for databases upto 4 march 2016
saskia-hiltemann
parents: 7
diff changeset
1390 joinresults originalfile $annovarout 36 37 38 39 40 B.dbNSFP_SIFT_score,B.dbNSFP_SIFT_pred,B.dbNSFP_Polyphen2_HDIV_score,B.dbNSFP_Polyphen2_HDIV_pred,B.dbNSFP_Polyphen2_HVAR_score,B.dbNSFP_Polyphen2_HVAR_pred,B.dbNSFP_LRT_score,B.dbNSFP_LRT_pred,B.dbNSFP_MutationTaster_score,B.dbNSFP_MutationTaster_pred,B.dbNSFP_MutationAssessor_score,B.dbNSFP_MutationAssessor_pred,B.dbNSFP_FATHMM_score,B.dbNSFP_FATHMM_pred,B.dbNSFP_PROVEAN_score,B.dbNSFP_PROVEAN_pred,B.dbNSFP_VEST3_score,B.dbNSFP_CADD_raw,B.dbNSFP_CADD_phred,B.dbNSFP_DANN_score,B.dbNSFP_fathmm-MKL_coding_score,B.dbNSFP_fathmm-MKL_coding_pred,B.dbNSFP_MetaSVM_score,B.dbNSFP_MetaSVM_pred,B.dbNSFP_MetaLR_score,B.dbNSFP_MetaLR_pred,B.dbNSFP_integrated_fitCons_score,B.dbNSFP_integrated_confidence_value,B.dbNSFP_GERP_RS,B.dbNSFP_phyloP7way_vertebrate,B.dbNSFP_phyloP20way_mammalian,B.dbNSFP_phastCons7way_vertebrate,B.dbNSFP_phastCons20way_mammalian,B.dbNSFP_SiPhy_29way_logOdds
d6af2a78617f added support for databases upto 4 march 2016
saskia-hiltemann
parents: 7
diff changeset
1391
d6af2a78617f added support for databases upto 4 march 2016
saskia-hiltemann
parents: 7
diff changeset
1392 fi
d6af2a78617f added support for databases upto 4 march 2016
saskia-hiltemann
parents: 7
diff changeset
1393
d6af2a78617f added support for databases upto 4 march 2016
saskia-hiltemann
parents: 7
diff changeset
1394 #mitimpact2
d6af2a78617f added support for databases upto 4 march 2016
saskia-hiltemann
parents: 7
diff changeset
1395 if [ "$mitimpact2" == "Y" ]
d6af2a78617f added support for databases upto 4 march 2016
saskia-hiltemann
parents: 7
diff changeset
1396 then
d6af2a78617f added support for databases upto 4 march 2016
saskia-hiltemann
parents: 7
diff changeset
1397 echo -e "\nmitimpact2 Annotation"
d6af2a78617f added support for databases upto 4 march 2016
saskia-hiltemann
parents: 7
diff changeset
1398 $scriptsdir/annotate_variation.pl --filter -otherinfo --buildver $buildver -dbtype mitimpact2 annovarinput $humandb 2>&1
d6af2a78617f added support for databases upto 4 march 2016
saskia-hiltemann
parents: 7
diff changeset
1399
d6af2a78617f added support for databases upto 4 march 2016
saskia-hiltemann
parents: 7
diff changeset
1400 #annovarout="annovarinput.${buildver}_mitimpact2_dropped"
d6af2a78617f added support for databases upto 4 march 2016
saskia-hiltemann
parents: 7
diff changeset
1401 awk 'BEGIN{FS="\t"
d6af2a78617f added support for databases upto 4 march 2016
saskia-hiltemann
parents: 7
diff changeset
1402 OFS="\t"
d6af2a78617f added support for databases upto 4 march 2016
saskia-hiltemann
parents: 7
diff changeset
1403 }{
d6af2a78617f added support for databases upto 4 march 2016
saskia-hiltemann
parents: 7
diff changeset
1404 gsub(",","\t",$2)
d6af2a78617f added support for databases upto 4 march 2016
saskia-hiltemann
parents: 7
diff changeset
1405 print $0
d6af2a78617f added support for databases upto 4 march 2016
saskia-hiltemann
parents: 7
diff changeset
1406 }END{}' annovarinput.${buildver}_mitimpact2_dropped > $annovarout
d6af2a78617f added support for databases upto 4 march 2016
saskia-hiltemann
parents: 7
diff changeset
1407
d6af2a78617f added support for databases upto 4 march 2016
saskia-hiltemann
parents: 7
diff changeset
1408 sed -i '1i\db\tMITimpact2_Gene_symbol\tMITimpact2_OXPHOS_Complex\tMITimpact2_Ensembl_Gene_ID\tMITimpact2_Ensembl_Protein_ID\tMITimpact2_Uniprot_Name\tMITimpact2_Uniprot_ID\tMITimpact2_NCBI_Gene_ID\tMITimpact2_NCBI_Protein_ID\tMITimpact2_Gene_pos\tMITimpact2_AA_pos\tMITimpact2_AA_sub\tMITimpact2_Codon_sub\tMITimpact2_dbSNP_ID\tMITimpact2_PhyloP_46V\tMITimpact2_PhastCons_46V\tMITimpact2_PhyloP_100V\tMITimpact2_PhastCons_100V\tMITimpact2_SiteVar\tMITimpact2_PolyPhen2_prediction\tMITimpact2_PolyPhen2_score\tMITimpact2_SIFT_prediction\tMITimpact2_SIFT_score\tMITimpact2_FatHmm_prediction\tMITimpact2_FatHmm_score\tMITimpact2_PROVEAN_prediction\tMITimpact2_PROVEAN_score\tMITimpact2_MutAss_prediction\tMITimpact2_MutAss_score\tMITimpact2_EFIN_Swiss_Prot_Score\tMITimpact2_EFIN_Swiss_Prot_Prediction\tMITimpact2_EFIN_HumDiv_Score\tMITimpact2_EFIN_HumDiv_Prediction\tMITimpact2_CADD_score\tMITimpact2_CADD_Phred_score\tMITimpact2_CADD_prediction\tMITimpact2_Carol_prediction\tMITimpact2_Carol_score\tMITimpact2_Condel_score\tMITimpact2_Condel_pred\tMITimpact2_COVEC_WMV\tMITimpact2_COVEC_WMV_prediction\tMITimpact2_PolyPhen2_score_transf\tMITimpact2_PolyPhen2_pred_transf\tMITimpact2_SIFT_score_transf\tMITimpact2_SIFT_pred_transf\tMITimpact2_MutAss_score_transf\tMITimpact2_MutAss_pred_transf\tMITimpact2_Perc_coevo_Sites\tMITimpact2_Mean_MI_score\tMITimpact2_COSMIC_ID\tMITimpact2_Tumor_site\tMITimpact2_Examined_samples\tMITimpact2_Mutation_frequency\tMITimpact2_US\tMITimpact2_Status\tMITimpact2_Associated_disease\tMITimpact2_Presence_in_TD\tMITimpact2_Class_predicted\tMITimpact2_Prob_N\tMITimpact2_Prob_P\tchromosome\tstart\tend\treference\talleleSeq"'"$vcfheader"'"' $annovarout
d6af2a78617f added support for databases upto 4 march 2016
saskia-hiltemann
parents: 7
diff changeset
1409 joinresults originalfile $annovarout 62 63 64 65 66 B.MITimpact2_Gene_symbol,B.MITimpact2_OXPHOS_Complex,B.MITimpact2_Ensembl_Gene_ID,B.MITimpact2_Ensembl_Protein_ID,B.MITimpact2_Uniprot_Name,B.MITimpact2_Uniprot_ID,B.MITimpact2_NCBI_Gene_ID,B.MITimpact2_NCBI_Protein_ID,B.MITimpact2_Gene_pos,B.MITimpact2_AA_pos,B.MITimpact2_AA_sub,B.MITimpact2_Codon_sub,B.MITimpact2_dbSNP_ID,B.MITimpact2_PhyloP_46V,B.MITimpact2_PhastCons_46V,B.MITimpact2_PhyloP_100V,B.MITimpact2_PhastCons_100V,B.MITimpact2_SiteVar,B.MITimpact2_PolyPhen2_prediction,B.MITimpact2_PolyPhen2_score,B.MITimpact2_SIFT_prediction,B.MITimpact2_SIFT_score,B.MITimpact2_FatHmm_prediction,B.MITimpact2_FatHmm_score,B.MITimpact2_PROVEAN_prediction,B.MITimpact2_PROVEAN_score,B.MITimpact2_MutAss_prediction,B.MITimpact2_MutAss_score,B.MITimpact2_EFIN_Swiss_Prot_Score,B.MITimpact2_EFIN_Swiss_Prot_Prediction,B.MITimpact2_EFIN_HumDiv_Score,B.MITimpact2_EFIN_HumDiv_Prediction,B.MITimpact2_CADD_score,B.MITimpact2_CADD_Phred_score,B.MITimpact2_CADD_prediction,B.MITimpact2_Carol_prediction,B.MITimpact2_Carol_score,B.MITimpact2_Condel_score,B.MITimpact2_Condel_pred,B.MITimpact2_COVEC_WMV,B.MITimpact2_COVEC_WMV_prediction,B.MITimpact2_PolyPhen2_score_transf,B.MITimpact2_PolyPhen2_pred_transf,B.MITimpact2_SIFT_score_transf,B.MITimpact2_SIFT_pred_transf,B.MITimpact2_MutAss_score_transf,B.MITimpact2_MutAss_pred_transf,B.MITimpact2_Perc_coevo_Sites,B.MITimpact2_Mean_MI_score,B.MITimpact2_COSMIC_ID,B.MITimpact2_Tumor_site,B.MITimpact2_Examined_samples,B.MITimpact2_Mutation_frequency,B.MITimpact2_US,B.MITimpact2_Status,B.MITimpact2_Associated_disease,B.MITimpact2_Presence_in_TD,B.MITimpact2_Class_predicted,B.MITimpact2_Prob_N,B.MITimpact2_Prob_P
d6af2a78617f added support for databases upto 4 march 2016
saskia-hiltemann
parents: 7
diff changeset
1410 fi
d6af2a78617f added support for databases upto 4 march 2016
saskia-hiltemann
parents: 7
diff changeset
1411
d6af2a78617f added support for databases upto 4 march 2016
saskia-hiltemann
parents: 7
diff changeset
1412 #mitimpact24
d6af2a78617f added support for databases upto 4 march 2016
saskia-hiltemann
parents: 7
diff changeset
1413 if [ $mitimpact24 == "Y" ]
d6af2a78617f added support for databases upto 4 march 2016
saskia-hiltemann
parents: 7
diff changeset
1414 then
d6af2a78617f added support for databases upto 4 march 2016
saskia-hiltemann
parents: 7
diff changeset
1415 echo -e "\nmitimpact24 Annotation"
d6af2a78617f added support for databases upto 4 march 2016
saskia-hiltemann
parents: 7
diff changeset
1416 $scriptsdir/annotate_variation.pl --filter -otherinfo --buildver $buildver -dbtype mitimpact24 annovarinput $humandb 2>&1
d6af2a78617f added support for databases upto 4 march 2016
saskia-hiltemann
parents: 7
diff changeset
1417
d6af2a78617f added support for databases upto 4 march 2016
saskia-hiltemann
parents: 7
diff changeset
1418 #annovarout="annovarinput.${buildver}_mitimpact24_dropped"
d6af2a78617f added support for databases upto 4 march 2016
saskia-hiltemann
parents: 7
diff changeset
1419 awk 'BEGIN{FS="\t"
d6af2a78617f added support for databases upto 4 march 2016
saskia-hiltemann
parents: 7
diff changeset
1420 OFS="\t"
d6af2a78617f added support for databases upto 4 march 2016
saskia-hiltemann
parents: 7
diff changeset
1421 }{
d6af2a78617f added support for databases upto 4 march 2016
saskia-hiltemann
parents: 7
diff changeset
1422 gsub(",","\t",$2)
d6af2a78617f added support for databases upto 4 march 2016
saskia-hiltemann
parents: 7
diff changeset
1423 print $0
d6af2a78617f added support for databases upto 4 march 2016
saskia-hiltemann
parents: 7
diff changeset
1424 }END{}' annovarinput.${buildver}_mitimpact24_dropped > $annovarout
d6af2a78617f added support for databases upto 4 march 2016
saskia-hiltemann
parents: 7
diff changeset
1425
d6af2a78617f added support for databases upto 4 march 2016
saskia-hiltemann
parents: 7
diff changeset
1426 sed -i '1i\db\tMITimpact24_Gene_symbol\tMITimpact24_OXPHOS_Complex\tMITimpact24_Ensembl_Gene_ID\tMITimpact24_Ensembl_Protein_ID\tMITimpact24_Uniprot_Name\tMITimpact24_Uniprot_ID\tMITimpact24_NCBI_Gene_ID\tMITimpact24_NCBI_Protein_ID\tMITimpact24_Gene_pos\tMITimpact24_AA_pos\tMITimpact24_AA_sub\tMITimpact24_Codon_sub\tMITimpact24_dbSNP_ID\tMITimpact24_PhyloP_46V\tMITimpact24_PhastCons_46V\tMITimpact24_PhyloP_100V\tMITimpact24_PhastCons_100V\tMITimpact24_SiteVar\tMITimpact24_PolyPhen24_prediction\tMITimpact24_PolyPhen24_score\tMITimpact24_SIFT_prediction\tMITimpact24_SIFT_score\tMITimpact24_FatHmm_prediction\tMITimpact24_FatHmm_score\tMITimpact24_PROVEAN_prediction\tMITimpact24_PROVEAN_score\tMITimpact24_MutAss_prediction\tMITimpact24_MutAss_score\tMITimpact24_EFIN_Swiss_Prot_Score\tMITimpact24_EFIN_Swiss_Prot_Prediction\tMITimpact24_EFIN_HumDiv_Score\tMITimpact24_EFIN_HumDiv_Prediction\tMITimpact24_CADD_score\tMITimpact24_CADD_Phred_score\tMITimpact24_CADD_prediction\tMITimpact24_Carol_prediction\tMITimpact24_Carol_score\tMITimpact24_Condel_score\tMITimpact24_Condel_pred\tMITimpact24_COVEC_WMV\tMITimpact24_COVEC_WMV_prediction\tMITimpact24_PolyPhen24_score_transf\tMITimpact24_PolyPhen24_pred_transf\tMITimpact24_SIFT_score_transf\tMITimpact24_SIFT_pred_transf\tMITimpact24_MutAss_score_transf\tMITimpact24_MutAss_pred_transf\tMITimpact24_Perc_coevo_Sites\tMITimpact24_Mean_MI_score\tMITimpact24_COSMIC_ID\tMITimpact24_Tumor_site\tMITimpact24_Examined_samples\tMITimpact24_Mutation_frequency\tMITimpact24_US\tMITimpact24_Status\tMITimpact24_Associated_disease\tMITimpact24_Presence_in_TD\tMITimpact24_Class_predicted\tMITimpact24_Prob_N\tMITimpact24_Prob_P\tchromosome\tstart\tend\treference\talleleSeq"'"$vcfheader"'"' $annovarout
d6af2a78617f added support for databases upto 4 march 2016
saskia-hiltemann
parents: 7
diff changeset
1427 joinresults originalfile $annovarout 62 63 64 65 66 B.MITimpact24_Gene_symbol,B.MITimpact24_OXPHOS_Complex,B.MITimpact24_Ensembl_Gene_ID,B.MITimpact24_Ensembl_Protein_ID,B.MITimpact24_Uniprot_Name,B.MITimpact24_Uniprot_ID,B.MITimpact24_NCBI_Gene_ID,B.MITimpact24_NCBI_Protein_ID,B.MITimpact24_Gene_pos,B.MITimpact24_AA_pos,B.MITimpact24_AA_sub,B.MITimpact24_Codon_sub,B.MITimpact24_dbSNP_ID,B.MITimpact24_PhyloP_46V,B.MITimpact24_PhastCons_46V,B.MITimpact24_PhyloP_100V,B.MITimpact24_PhastCons_100V,B.MITimpact24_SiteVar,B.MITimpact24_PolyPhen24_prediction,B.MITimpact24_PolyPhen24_score,B.MITimpact24_SIFT_prediction,B.MITimpact24_SIFT_score,B.MITimpact24_FatHmm_prediction,B.MITimpact24_FatHmm_score,B.MITimpact24_PROVEAN_prediction,B.MITimpact24_PROVEAN_score,B.MITimpact24_MutAss_prediction,B.MITimpact24_MutAss_score,B.MITimpact24_EFIN_Swiss_Prot_Score,B.MITimpact24_EFIN_Swiss_Prot_Prediction,B.MITimpact24_EFIN_HumDiv_Score,B.MITimpact24_EFIN_HumDiv_Prediction,B.MITimpact24_CADD_score,B.MITimpact24_CADD_Phred_score,B.MITimpact24_CADD_prediction,B.MITimpact24_Carol_prediction,B.MITimpact24_Carol_score,B.MITimpact24_Condel_score,B.MITimpact24_Condel_pred,B.MITimpact24_COVEC_WMV,B.MITimpact24_COVEC_WMV_prediction,B.MITimpact24_PolyPhen24_score_transf,B.MITimpact24_PolyPhen24_pred_transf,B.MITimpact24_SIFT_score_transf,B.MITimpact24_SIFT_pred_transf,B.MITimpact24_MutAss_score_transf,B.MITimpact24_MutAss_pred_transf,B.MITimpact24_Perc_coevo_Sites,B.MITimpact24_Mean_MI_score,B.MITimpact24_COSMIC_ID,B.MITimpact24_Tumor_site,B.MITimpact24_Examined_samples,B.MITimpact24_Mutation_frequency,B.MITimpact24_US,B.MITimpact24_Status,B.MITimpact24_Associated_disease,B.MITimpact24_Presence_in_TD,B.MITimpact24_Class_predicted,B.MITimpact24_Prob_N,B.MITimpact24_Prob_P
d6af2a78617f added support for databases upto 4 march 2016
saskia-hiltemann
parents: 7
diff changeset
1428 fi
d6af2a78617f added support for databases upto 4 march 2016
saskia-hiltemann
parents: 7
diff changeset
1429
d6af2a78617f added support for databases upto 4 march 2016
saskia-hiltemann
parents: 7
diff changeset
1430
5
4600be69b96f Added databases 1000g2015aug, SPIDEX, avsnp138, avsnp142, exac03
saskia-hiltemann
parents: 3
diff changeset
#GoNL database
# Filter-annotate annovarinput against the GoNL table, which is loaded as an
# ANNOVAR "generic" database from ${buildver}_gonl.txt. Runs only when the gonl
# flag is "Y" and the build is hg19; the result column is merged into
# originalfile as GoNL.
if [[ "$gonl" == "Y" && "$buildver" == "hg19" ]]
then
    echo -e "\nGoNL Annotation"
    "$scriptsdir"/annotate_variation.pl --filter --buildver "$buildver" --otherinfo -dbtype generic -genericdbfile "${buildver}_gonl.txt" annovarinput "$humandb" 2>&1

    # A generic database always produces a "_generic_dropped" file.
    annovarout="annovarinput.${buildver}_generic_dropped"

    # Leftover debugging output (a bare `ls` and `head` of the result) was
    # removed here; it only dumped the working directory into the tool log.
    sed -i '1i\db\tGoNL\tchromosome\tstart\tend\treference\talleleSeq"'"$vcfheader"'"' "$annovarout"
    joinresults originalfile "$annovarout" 3 4 5 6 7 B.GoNL
fi
d6af2a78617f added support for databases upto 4 march 2016
saskia-hiltemann
parents: 7
diff changeset
1451
d6af2a78617f added support for databases upto 4 march 2016
saskia-hiltemann
parents: 7
diff changeset
#SPIDEX database
# Filter-annotate annovarinput against the spidex database (hg19 only), expand
# the packed annotation value into its two columns and merge them into
# originalfile as SPIDEX_dpsi_max_tissue and SPIDEX_dpsi_zscore.
if [[ "$spidex" == "Y" && "$buildver" == "hg19" ]]
then
    echo -e "\nSPIDEX Annotation"
    "$scriptsdir"/annotate_variation.pl --filter --buildver "$buildver" --otherinfo -dbtype spidex annovarinput "$humandb" 2>&1

    # Write the expanded table to a file owned by this step instead of reusing
    # whatever $annovarout was left over from an earlier database block.
    annovarout="annovarinput.${buildver}_spidex_split"

    # Field 2 holds both SPIDEX values separated by a comma; turn the comma into
    # a tab so each value gets its own column (shifting the join keys to 4-8).
    awk 'BEGIN{
        FS="\t"
        OFS="\t"
    }{
        gsub(",","\t",$2)
        print $0
    }' "annovarinput.${buildver}_spidex_dropped" > "$annovarout"

    sed -i '1i\db\tSPIDEX_dpsi_max_tissue\tSPIDEX_dpsi_zscore\tchromosome\tstart\tend\treference\talleleSeq"'"$vcfheader"'"' "$annovarout"
    joinresults originalfile "$annovarout" 4 5 6 7 8 B.SPIDEX_dpsi_max_tissue,B.SPIDEX_dpsi_zscore
fi
d6af2a78617f added support for databases upto 4 march 2016
saskia-hiltemann
parents: 7
diff changeset
1477
d6af2a78617f added support for databases upto 4 march 2016
saskia-hiltemann
parents: 7
diff changeset
#GERP++
# Filter-annotate annovarinput against the gerp++gt2 database and merge the
# resulting column into originalfile as GERP++.
# [[ ]] is used so an unset/empty $gerp simply skips the step instead of
# raising "unary operator expected".
if [[ "$gerp" == "Y" ]]
then
    echo -e "\nGERP++ Annotation"
    "$scriptsdir"/annotate_variation.pl --filter --buildver "$buildver" -dbtype gerp++gt2 annovarinput "$humandb" 2>&1

    annovarout="annovarinput.${buildver}_gerp++gt2_dropped"
    # NOTE(review): the quoting below emits literal double-quote characters
    # around the expanded $vcfheader in the header line; kept byte-for-byte
    # because every database step does the same - confirm this is intended.
    sed -i '1i\db\tGERP++\tchromosome\tstart\tend\treference\talleleSeq"'"$vcfheader"'"' "$annovarout"
    joinresults originalfile "$annovarout" 3 4 5 6 7 B.GERP++
fi
0
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
1488
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
1489
8
d6af2a78617f added support for databases upto 4 march 2016
saskia-hiltemann
parents: 7
diff changeset
#COSMIC
# All COSMIC releases are annotated the same way and only for hg19. Each release
# is switched on by its own flag variable (cosmic61, cosmic63, ...), so the
# releases are handled in one loop, in the same order as before, instead of
# seven copy-pasted blocks.
for cosmic_release in 61 63 64 65 67 68 70
do
    # Name of the flag variable for this release; ${!cosmic_flag} below is bash
    # indirect expansion, i.e. the value of the variable named by cosmic_flag.
    cosmic_flag="cosmic${cosmic_release}"

    if [[ "${!cosmic_flag}" == "Y" && "$buildver" == "hg19" ]]
    then
        echo -e "\nCOSMIC${cosmic_release} Annotation"
        "$scriptsdir"/annotate_variation.pl --filter --buildver "$buildver" -dbtype "cosmic${cosmic_release}" annovarinput "$humandb" 2>&1

        annovarout="annovarinput.${buildver}_cosmic${cosmic_release}_dropped"
        # Prepend the header line, then merge the COSMIC<release> column into
        # originalfile using columns 3-7 of the dropped file as join keys.
        sed -i '1i\db\tCOSMIC'"${cosmic_release}"'\tchromosome\tstart\tend\treference\talleleSeq"'"$vcfheader"'"' "$annovarout"
        joinresults originalfile "$annovarout" 3 4 5 6 7 "B.COSMIC${cosmic_release}"
    fi
done
3
ff5325029a8e Uploaded
saskia-hiltemann
parents: 2
diff changeset
1567
8
d6af2a78617f added support for databases upto 4 march 2016
saskia-hiltemann
parents: 7
diff changeset
# ClinVar annotation (hg19 only): filter-annotate annovarinput against the
# clinvar_20140211 database and merge the result into originalfile as CLINVAR.
# Path-like expansions are quoted so directories containing spaces still work.
if [[ "$clinvar" == "Y" && "$buildver" == "hg19" ]]
then
    echo -e "\nCLINVAR Annotation"
    "$scriptsdir"/annotate_variation.pl --filter --buildver "$buildver" -dbtype clinvar_20140211 annovarinput "$humandb" 2>&1

    annovarout="annovarinput.${buildver}_clinvar_20140211_dropped"
    sed -i '1i\db\tCLINVAR\tchromosome\tstart\tend\treference\talleleSeq"'"$vcfheader"'"' "$annovarout"
    joinresults originalfile "$annovarout" 3 4 5 6 7 B.CLINVAR
fi
d6af2a78617f added support for databases upto 4 march 2016
saskia-hiltemann
parents: 7
diff changeset
1578
d6af2a78617f added support for databases upto 4 march 2016
saskia-hiltemann
parents: 7
diff changeset
# NCI60 annotation (hg19 only): filter-annotate annovarinput against the nci60
# database and merge the result into originalfile as NCI60.
# Path-like expansions are quoted so directories containing spaces still work.
if [[ "$nci60" == "Y" && "$buildver" == "hg19" ]]
then
    echo -e "\nNCI60 Annotation"
    "$scriptsdir"/annotate_variation.pl --filter --buildver "$buildver" -dbtype nci60 annovarinput "$humandb" 2>&1

    annovarout="annovarinput.${buildver}_nci60_dropped"
    sed -i '1i\db\tNCI60\tchromosome\tstart\tend\treference\talleleSeq"'"$vcfheader"'"' "$annovarout"
    joinresults originalfile "$annovarout" 3 4 5 6 7 B.NCI60
fi
d6af2a78617f added support for databases upto 4 march 2016
saskia-hiltemann
parents: 7
diff changeset
1589
d6af2a78617f added support for databases upto 4 march 2016
saskia-hiltemann
parents: 7
diff changeset
#cg46
# Filter-annotate annovarinput against the cg46 database and merge the result
# into originalfile. The output column is named by $cg46_colheader, which is set
# outside this block.
if [[ "$cg46" == "Y" ]]
then
    echo -e "\nCG 46 genomes Annotation"
    "$scriptsdir"/annotate_variation.pl --filter --buildver "$buildver" -dbtype cg46 annovarinput "$humandb" 2>&1

    annovarout="annovarinput.${buildver}_cg46_dropped"
    # The column header is spliced into the sed script inside double quotes so a
    # header containing whitespace cannot split the script into several words.
    sed -i '1i\db\t'"${cg46_colheader}"'\tchromosome\tstart\tend\treference\talleleSeq"'"$vcfheader"'"' "$annovarout"
    joinresults originalfile "$annovarout" 3 4 5 6 7 "B.${cg46_colheader}"
fi
0
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
1601
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
1602
8
d6af2a78617f added support for databases upto 4 march 2016
saskia-hiltemann
parents: 7
diff changeset
#cg69
# Filter-annotate annovarinput against the cg69 database and merge the result
# into originalfile. The output column is named by $cg69_colheader, which is set
# outside this block.
if [[ "$cg69" == "Y" ]]
then
    echo -e "\nCG 69 genomes Annotation"
    "$scriptsdir"/annotate_variation.pl --filter --buildver "$buildver" -dbtype cg69 annovarinput "$humandb" 2>&1

    annovarout="annovarinput.${buildver}_cg69_dropped"
    # The column header is spliced into the sed script inside double quotes so a
    # header containing whitespace cannot split the script into several words.
    sed -i '1i\db\t'"${cg69_colheader}"'\tchromosome\tstart\tend\treference\talleleSeq"'"$vcfheader"'"' "$annovarout"
    joinresults originalfile "$annovarout" 3 4 5 6 7 "B.${cg69_colheader}"
fi
0
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
1614
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
1615
8
d6af2a78617f added support for databases upto 4 march 2016
saskia-hiltemann
parents: 7
diff changeset
1616
d6af2a78617f added support for databases upto 4 march 2016
saskia-hiltemann
parents: 7
diff changeset
# Produce originalfile_coords from originalfile.
# When convertcoords is "Y" every data row is rewritten: the chromosome column
# gets a "chr" prefix and start/reference/observed columns are adjusted per
# variant type; otherwise the file is just renamed.
# NOTE(review): presumably this reverses a conversion applied earlier in the
# script - confirm against that step.
if [[ "$convertcoords" == "Y" ]]
then
    echo "converting back coordinates"
    # Column numbers are handed to awk with -v rather than being pasted into the
    # program text, so the awk source stays a single literal string.
    awk -v chrcol="$chrcol" \
        -v vartypecol="$vartypecol" \
        -v startcol="$startcol" \
        -v refcol="$refcol" \
        -v obscol="$obscol" '
    BEGIN{
        FS="\t";
        OFS="\t";
    }
    FNR==1 {
        # header line is passed through unchanged
        print $0
        next
    }
    {
        $chrcol = "chr" $chrcol
        if ($vartypecol == "snp") { $startcol -= 1 }
        if ($vartypecol == "ins") { $refcol = "" }
        if ($vartypecol == "del") { $startcol -= 1; $obscol = "" }
        if ($vartypecol == "sub") { $startcol -= 1 }
        print $0
    }' originalfile > originalfile_coords
else
    mv originalfile originalfile_coords
fi
0
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
1640
8
d6af2a78617f added support for databases upto 4 march 2016
saskia-hiltemann
parents: 7
diff changeset
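1641 #restore "chr" prefix? (the awk conversion branch above prepends "chr" to the chromosome column; the sed calls below collapse any resulting "chrchr" to "chr")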
0
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
1642
8
d6af2a78617f added support for databases upto 4 march 2016
saskia-hiltemann
parents: 7
diff changeset
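1643 #if the invalid-input file is missing or empty, write a placeholder message into it; then copy the results to the output files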
d6af2a78617f added support for databases upto 4 march 2016
saskia-hiltemann
parents: 7
diff changeset
1644 if [ ! -s annovarinput.invalid_input ]
d6af2a78617f added support for databases upto 4 march 2016
saskia-hiltemann
parents: 7
diff changeset
1645 then
d6af2a78617f added support for databases upto 4 march 2016
saskia-hiltemann
parents: 7
diff changeset
1646 echo "Congrats, your input file contained no invalid lines!" > annovarinput.invalid_input
d6af2a78617f added support for databases upto 4 march 2016
saskia-hiltemann
parents: 7
diff changeset
1647 fi
d6af2a78617f added support for databases upto 4 march 2016
saskia-hiltemann
parents: 7
diff changeset
1648
d6af2a78617f added support for databases upto 4 march 2016
saskia-hiltemann
parents: 7
diff changeset
1649 cp originalfile_coords $outfile_all
d6af2a78617f added support for databases upto 4 march 2016
saskia-hiltemann
parents: 7
diff changeset
1650 cp annovarinput.invalid_input $outfile_invalid 2>&1
d6af2a78617f added support for databases upto 4 march 2016
saskia-hiltemann
parents: 7
diff changeset
1651
d6af2a78617f added support for databases upto 4 march 2016
saskia-hiltemann
parents: 7
diff changeset
1652 sed -i 's/chrchr/chr/g' $outfile_all
d6af2a78617f added support for databases upto 4 march 2016
saskia-hiltemann
parents: 7
diff changeset
1653 sed -i 's/chrchr/chr/g' $outfile_invalid
d6af2a78617f added support for databases upto 4 march 2016
saskia-hiltemann
parents: 7
diff changeset
1654
0
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
1655 fi #if $dorunannovar
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
1656
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
1657
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
1658
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
1659
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
1660
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
1661
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
1662
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
1663
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
1664
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
1665
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
1666
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
1667
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
1668
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
1669
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
1670
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
1671
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
1672
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
1673
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
1674
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
1675
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
1676
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
1677
2
565c0e690238 Added support for LJB2, COSMIC67, CLINVAR and NCI60.
saskia-hiltemann
parents: 0
diff changeset
1678