annotate tools/annovar/annovar.sh @ 5:4600be69b96f draft

Added databases 1000g2015aug, SPIDEX, avsnp138, avsnp142, exac03
author saskia-hiltemann
date Thu, 01 Oct 2015 04:24:45 -0400
parents ff5325029a8e
children 69e2067a120d
Ignore whitespace changes - Everywhere: Within whitespace: At end of lines:
rev   line source
0
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
1 #!/bin/bash
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
2
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
# Debug switch: the "$test" == "Y" guards further down print diagnostics.
test='N'
# Default for the filtering flag.
dofilter='N'
0
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
5
2
565c0e690238 Added support for LJB2, COSMIC67, CLINVAR and NCI60.
saskia-hiltemann
parents: 0
diff changeset
6 #########################
565c0e690238 Added support for LJB2, COSMIC67, CLINVAR and NCI60.
saskia-hiltemann
parents: 0
diff changeset
7 # DEFINE SOME
565c0e690238 Added support for LJB2, COSMIC67, CLINVAR and NCI60.
saskia-hiltemann
parents: 0
diff changeset
8 # FUNCTIONS
565c0e690238 Added support for LJB2, COSMIC67, CLINVAR and NCI60.
saskia-hiltemann
parents: 0
diff changeset
9 #########################
0
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
10
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
# Print the (placeholder) usage line to stdout.
# Returns normally; it does not terminate the script.
usage() {
  printf '%s\n' "usage: $0 todo"
}
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
14
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
# runfilter FILE COLUMNNAME THRESHOLD
#
# Filter the tab-separated FILE in place on the column whose header equals
# COLUMNNAME (if the header repeats, the last matching column is used).
#
#   THRESHOLD == -1    : do nothing.
#   THRESHOLD == text  : keep only rows whose value in that column is empty.
#   otherwise          : keep rows whose value is empty or less than THRESHOLD.
#
# The header line is always kept. Progress messages and a dump of FILE are
# written to stdout. The filtered copy is staged in ./tmpfile.
function runfilter(){
  local ifile=$1
  local columnname=$2
  local threshold=$3
  local column

  if [[ "$threshold" == "-1" ]]; then
    echo "not filtering"
    return
  fi

  echo "filtering: $columnname, $threshold"
  cat "$ifile"

  #get column number corresponding to column header
  # (name "") forces a string comparison even if the header looks numeric.
  column=$(awk -v name="$columnname" 'BEGIN{
      FS="\t";
      col=-1
    }
    FNR==1{
      for(i=1;i<=NF;i++){
        if($i == (name ""))
          col=i
      }
      print col
      exit
    }' "$ifile")

  # An empty result means the file had no header line at all.
  if [[ -z "$column" || "$column" == "-1" ]]; then
    echo "no such column, exiting"
    return
  fi

  #perform filtering using the threshold
  # thr is passed with -v so that a numeric-looking threshold is compared
  # numerically against numeric-looking fields (e.g. 1e-5 < 0.01); a string
  # constant spliced into the program would force a string comparison.
  awk -v col="$column" -v thr="$threshold" 'BEGIN{
      FS="\t";
      OFS="\t";
    }
    FNR==1{ print $0; next }
    {
      if( $col == "" )          # empty column, then print
        print $0
      else if (thr == "text"){} # if set to text dont check threshold
      else if ($col < thr)      # else do check it
        print $0
    }' "$ifile" > tmpfile && mv tmpfile "$ifile"
}
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
68
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
# joinresults ORIGINALFILE RESULTFILE CHRCOL STARTCOL ENDCOL REFCOL OBSCOL ADDCOLS
#
# Add the columns listed in ADDCOLS (e.g. "B.col1,B.col2") from RESULTFILE to
# ORIGINALFILE, rewriting ORIGINALFILE in place.
#
#   $3..$7  column numbers of chr/start/end/ref/obs in RESULTFILE
#   globals chrcol, startcol, endcol, refcol, obscol
#           column numbers of the same fields in ORIGINALFILE
#
# If RESULTFILE is empty, only the new header fields and empty cells are
# appended. Otherwise the two files are matched with `cgatools join` on the
# five key columns. Scratch files tempofile / temporiginal are created in the
# current directory.
function joinresults(){
  local ofile=$1
  local rfile=$2
  local colchr=$3
  local colstart=$4
  local colend=$5
  local colref=$6
  local colobs=$7
  local addcols=$8  #e.g. "B.col1,B.col2"

  # Debug output is forced off inside this function. This assignment is
  # deliberately left global, as in the original, so the script-wide flag is
  # reset as well.
  test="N"

  # echo "joining result with original file"
  if [[ "$test" == "Y" ]]; then
    echo "ofile: $ofile"
    head "$ofile"
    echo "rfile: $rfile"
    head "$rfile"
  fi

  # if empty results file, just add header fields
  if [[ ! -s "$rfile" ]]; then
    local dummycol=${addcols:2}           # drop the leading "B."
    # NOTE(review): names are joined with a single space as shown in the
    # source; confirm whether a tab was intended for the header.
    local outputcol=${dummycol//,B./ }
    local commas=${addcols//[^,]/}
    local numcommas=${#commas}

    # NOTE(review): the loop emits numcommas+2 tabs per data row, one more
    # than the number of added columns; kept as-is, confirm downstream needs.
    awk -v newcols="$outputcol" -v n="$numcommas" 'BEGIN{FS="\t";OFS="\t"}{
      if(FNR==1)
        print $0,newcols;
      else{
        printf "%s", $0       # never use the data itself as a format string
        for(i=0;i<=n+1;i++)
          printf "\t"
        printf "\n"
      }
    }' "$ofile" > tempofile

    mv tempofile "$ofile"
    return
  fi

  #get RESULTFILE column names for cgatools join
  local col_chr_name col_start_name col_end_name col_ref_name col_obs_name
  col_chr_name=$(head -n 1 "$rfile" | cut -f"${colchr}")
  col_start_name=$(head -n 1 "$rfile" | cut -f"${colstart}")
  col_end_name=$(head -n 1 "$rfile" | cut -f"${colend}")
  col_ref_name=$(head -n 1 "$rfile" | cut -f"${colref}")
  col_obs_name=$(head -n 1 "$rfile" | cut -f"${colobs}")

  #get ORIGINALFILE column names for cgatools join (global column numbers)
  local chr_name start_name end_name ref_name obs_name
  chr_name=$(head -n 1 "$ofile" | cut -f"${chrcol}")
  start_name=$(head -n 1 "$ofile" | cut -f"${startcol}")
  end_name=$(head -n 1 "$ofile" | cut -f"${endcol}")
  ref_name=$(head -n 1 "$ofile" | cut -f"${refcol}")
  obs_name=$(head -n 1 "$ofile" | cut -f"${obscol}")

  if [[ "$test" == "Y" ]]; then
    echo "input file"
    echo "chr col: $col_chr_name ($colchr)"
    echo "start col: $col_start_name ($colstart)"
    echo "end col: $col_end_name ($colend)"
    echo "ref col: $col_ref_name ($colref)"
    echo "obs col: $col_obs_name ($colobs)"
    echo ""
    echo "annotation file"
    echo "chr col: $chr_name ($chrcol)"
    echo "start col: $start_name ($startcol)"
    echo "end col: $end_name ($endcol)"
    echo "ref col: $ref_name ($refcol)"
    echo "obs col: $obs_name ($obscol)"
  fi

  #perform join
  # "A.*" is quoted so the shell cannot glob-expand it against local files.
  cgatools join --beta \
    --input "$ofile" "$rfile" \
    --output temporiginal \
    --match "${chr_name}:${col_chr_name}" \
    --match "${start_name}:${col_start_name}" \
    --match "${end_name}:${col_end_name}" \
    --match "${ref_name}:${col_ref_name}" \
    --match "${obs_name}:${col_obs_name}" \
    --select "A.*,${addcols}" \
    --always-dump \
    --output-mode compact

  #replace originalfile
  sed -i 's/^>//g' temporiginal  #join sometimes adds a '>' symbol to header
  # Write back to the file that was passed in, not a hard-coded name.
  mv temporiginal "$ofile"

  if [[ "$test" == "Y" ]]; then
    echo "joining complete"
    head "$ofile"
    echo ""
  fi
}
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
171
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
172
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
173
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
174
2
565c0e690238 Added support for LJB2, COSMIC67, CLINVAR and NCI60.
saskia-hiltemann
parents: 0
diff changeset
175 #################################
565c0e690238 Added support for LJB2, COSMIC67, CLINVAR and NCI60.
saskia-hiltemann
parents: 0
diff changeset
176 #
565c0e690238 Added support for LJB2, COSMIC67, CLINVAR and NCI60.
saskia-hiltemann
parents: 0
diff changeset
177 # PARSE PARAMETERS
565c0e690238 Added support for LJB2, COSMIC67, CLINVAR and NCI60.
saskia-hiltemann
parents: 0
diff changeset
178 #
565c0e690238 Added support for LJB2, COSMIC67, CLINVAR and NCI60.
saskia-hiltemann
parents: 0
diff changeset
179 #################################
565c0e690238 Added support for LJB2, COSMIC67, CLINVAR and NCI60.
saskia-hiltemann
parents: 0
diff changeset
180
565c0e690238 Added support for LJB2, COSMIC67, CLINVAR and NCI60.
saskia-hiltemann
parents: 0
diff changeset
181
5
4600be69b96f Added databases 1000g2015aug, SPIDEX, avsnp138, avsnp142, exac03
saskia-hiltemann
parents: 3
diff changeset
# Normalise the command line with getopt(1) and load each option value into
# its shell variable.
#
# getopt runs in unquoted (-u) mode and its output is word-split on purpose,
# so option values must not contain whitespace and must not be empty.
# The getopt status is checked on the assignment: with `set -- $(getopt ...)`
# the status seen by `||` is that of `set`, so usage could never be reached.
parsed_opts=$(getopt -n "$0" -u -a --longoptions="inputfile: buildver: humandb: varfile: VCF: chrcol: startcol: endcol: refcol: obscol: vartypecol: convertcoords: geneanno: hgvs: verdbsnp: tfbs: mce: cytoband: segdup: dgv: gwas: ver1000g: cg46: cg69: impactscores: newimpactscores: otherinfo: esp: exac03: spidex: gonl: gerp: cosmic61: cosmic63: cosmic64: cosmic65: cosmic67: cosmic68: clinvar: nci60: outall: outfilt: outinvalid: scriptsdir: dorunannovar: dofilter: filt_dbsnp: filt1000GALL: filt1000GAFR: filt1000GAMR: filt1000GASN: filt1000GEUR: filtESP6500ALL: filtESP6500EA: filtESP6500AA: filtcg46: filtcg69: dummy:" "h:" "$@") || usage
# shellcheck disable=SC2086 # word-splitting of the -u output is intended
set -- $parsed_opts
[ $# -eq 0 ] && usage

while [ $# -gt 0 ]
do
  case "$1" in
    --inputfile)        infile=$2; shift ;;                 # inputfile
    --buildver)         buildvertmp=$2; shift ;;            # hg18 or hg19
    --humandb)          humandbtmp=$2; shift ;;             # location of humandb database
    --varfile)          varfile=$2; shift ;;                # Y or N
    --VCF)              vcf=$2; shift ;;                    # Y or N
    --chrcol)           chrcol=$2; shift ;;                 # which column has chr
    --startcol)         startcol=$2; shift ;;               # which column has start
    --endcol)           endcol=$2; shift ;;                 # which column has end
    --refcol)           refcol=$2; shift ;;                 # which column has ref
    --obscol)           obscol=$2; shift ;;                 # which column has alt
    --vartypecol)       vartypecol=$2; shift ;;             # which column has vartype
    --convertcoords)    convertcoords=$2; shift ;;          # Y or N convert coordinate from CG to 1-based?
    --geneanno)         geneanno=$2; shift ;;               # comma-separated list of strings refSeq, knowngene, ensgene
    --hgvs)             hgvs=$2; shift ;;
    --verdbsnp)         verdbsnp=$2; shift ;;               # comma-separated list of dbsnp versions (e.g. "132,135NonFlagged,137,138")
    --tfbs)             tfbs=$2; shift ;;                   # Y or N
    --mce)              mce=$2; shift ;;                    # Y or N
    --cytoband)         cytoband=$2; shift ;;               # Y or N
    --segdup)           segdup=$2; shift ;;                 # Y or N
    --dgv)              dgv=$2; shift ;;                    # Y or N
    --gwas)             gwas=$2; shift ;;                   # Y or N
    --ver1000g)         ver1000g=$2; shift ;;               # comma-separated list (split into g1000str below)
    --cg46)             cg46=$2; shift ;;
    --cg69)             cg69=$2; shift ;;
    --impactscores)     impactscores=$2; shift ;;           # Y or N
    --newimpactscores)  newimpactscores=$2; shift ;;        # Y or N
    --otherinfo)        otherinfo=$2; shift ;;
    --scriptsdir)       scriptsdirtmp=$2; shift ;;          # presumably the helper-scripts directory; confirm
    --esp)              esp=$2; shift ;;                    # comma-separated list (split into espstr below)
    --exac03)           exac03=$2; shift ;;
    --gonl)             gonl=$2; shift ;;
    --spidex)           spidex=$2; shift ;;
    --gerp)             gerp=$2; shift ;;                   # Y or N
    --cosmic61)         cosmic61=$2; shift ;;               # Y or N
    --cosmic63)         cosmic63=$2; shift ;;               # Y or N
    --cosmic64)         cosmic64=$2; shift ;;               # Y or N
    --cosmic65)         cosmic65=$2; shift ;;               # Y or N
    --cosmic67)         cosmic67=$2; shift ;;               # Y or N
    --cosmic68)         cosmic68=$2; shift ;;               # Y or N
    --nci60)            nci60=$2; shift ;;                  # Y or N
    --clinvar)          clinvar=$2; shift ;;                # Y or N
    --filt_dbsnp)       filt_dbsnp=$2; shift ;;
    --filt1000GALL)     threshold_1000g_ALL=$2; shift ;;    # threshold value
    --filt1000GAFR)     threshold_1000g_AFR=$2; shift ;;    # threshold value
    --filt1000GAMR)     threshold_1000g_AMR=$2; shift ;;    # threshold value
    --filt1000GASN)     threshold_1000g_ASN=$2; shift ;;    # threshold value
    --filt1000GEUR)     threshold_1000g_EUR=$2; shift ;;    # threshold value
    --filtESP6500ALL)   threshold_ESP6500_ALL=$2; shift ;;  # threshold value
    --filtESP6500EA)    threshold_ESP6500_EA=$2; shift ;;   # threshold value
    --filtESP6500AA)    threshold_ESP6500_AA=$2; shift ;;   # threshold value
    --filtcg46)         threshold_cg46=$2; shift ;;
    --filtcg69)         threshold_cg69=$2; shift ;;
    --outall)           outfile_all=$2; shift ;;            # file
    --outfilt)          outfile_filt=$2; shift ;;           # file
    --outinvalid)       outfile_invalid=$2; shift ;;        # file
    --dorunannovar)     dorunannovar=$2; shift ;;           # Y or N
    # Both options below are declared to getopt; without an arm they fell
    # through to "-*" and their value then hit "*) break", which silently
    # stopped parsing of every later option.
    --dofilter)         dofilter=$2; shift ;;
    --dummy)            shift ;;                            # value is ignored
    -h)                 shift ;;
    --)                 shift; break ;;
    -*)                 usage ;;
    *)                  break ;;
  esac
  shift
done
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
253
2
565c0e690238 Added support for LJB2, COSMIC67, CLINVAR and NCI60.
saskia-hiltemann
parents: 0
diff changeset
# Galaxy sometimes hands these parameters over as a comma-separated list after
# updates; keep only what precedes the FIRST comma. "%%" strips the longest
# ",*" suffix; a single "%" would only drop the last item of a longer list.
humandb=${humandbtmp%%,*}
buildver=${buildvertmp%%,*}
scriptsdir=${scriptsdirtmp%%,*}
565c0e690238 Added support for LJB2, COSMIC67, CLINVAR and NCI60.
saskia-hiltemann
parents: 0
diff changeset
258
0
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
259
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
# Debug aid: when the global test flag is "Y", print every parsed parameter.
# Each line prints the variable that the option parser actually assigns.
if [[ "$test" == "Y" ]]
then
  echo "dorunannovar: $dorunannovar"
  echo "infile: $infile"
  echo "buildver: $buildver"
  echo "annovardb: $humandb"
  echo "verdbsnp: $verdbsnp"
  echo "geneanno: $geneanno"
  echo "tfbs: $tfbs"
  echo "mce: $mce"
  echo "cytoband: $cytoband"
  echo "segdup: $segdup"
  echo "dgv: $dgv"
  echo "gwas: $gwas"
  echo "ver1000g: ${ver1000g}"
  echo "cg46: ${cg46}"
  echo "cg69: ${cg69}"
  echo "impactscores: $impactscores"
  echo "newimpactscores: $newimpactscores"
  echo "esp: $esp"
  echo "gerp: $gerp"
  echo "cosmic61: $cosmic61"
  echo "cosmic63: $cosmic63"
  echo "cosmic64: $cosmic64"
  echo "cosmic65: $cosmic65"
  echo "cosmic67: $cosmic67"
  echo "cosmic68: $cosmic68"
  echo "outfile: $outfile_all"
  echo "outinvalid: $outfile_invalid"
  echo "outfiltered: $outfile_filt"
  echo "varfile: $varfile"
  echo "vcf" "$vcf"
  echo "chrcol: $chrcol"
  echo "startcol: $startcol"
  echo "endcol: $endcol"
  echo "refcol: $refcol"
  echo "obscol: $obscol"
  echo "convertcoords: $convertcoords"
  echo "vartypecol: $vartypecol"
  echo "dofilter: $dofilter"
  echo "threshold_1000g_ALL : $threshold_1000g_ALL"
  echo "threshold_1000g_AFR : $threshold_1000g_AFR"
  echo "threshold_1000g_AMR : $threshold_1000g_AMR"
  echo "threshold_1000g_ASN : $threshold_1000g_ASN"
  echo "threshold_1000g_EUR : $threshold_1000g_EUR"
  echo "threshold_ESP6500_ALL: $threshold_ESP6500_ALL"
  echo "threshold_ESP6500_EA : $threshold_ESP6500_EA"
  echo "threshold_ESP6500_AA : $threshold_ESP6500_AA"
fi
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
305
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
306
2
565c0e690238 Added support for LJB2, COSMIC67, CLINVAR and NCI60.
saskia-hiltemann
parents: 0
diff changeset
307
565c0e690238 Added support for LJB2, COSMIC67, CLINVAR and NCI60.
saskia-hiltemann
parents: 0
diff changeset
308 ############################################
565c0e690238 Added support for LJB2, COSMIC67, CLINVAR and NCI60.
saskia-hiltemann
parents: 0
diff changeset
309 #
565c0e690238 Added support for LJB2, COSMIC67, CLINVAR and NCI60.
saskia-hiltemann
parents: 0
diff changeset
310 # Annotate Variants
565c0e690238 Added support for LJB2, COSMIC67, CLINVAR and NCI60.
saskia-hiltemann
parents: 0
diff changeset
311 #
565c0e690238 Added support for LJB2, COSMIC67, CLINVAR and NCI60.
saskia-hiltemann
parents: 0
diff changeset
312 ############################################
565c0e690238 Added support for LJB2, COSMIC67, CLINVAR and NCI60.
saskia-hiltemann
parents: 0
diff changeset
313
565c0e690238 Added support for LJB2, COSMIC67, CLINVAR and NCI60.
saskia-hiltemann
parents: 0
diff changeset
# Parse the geneanno parameter: switch on a gene model when its name occurs
# anywhere in the comma-separated $geneanno value.
refgene="N"
knowngene="N"
ensgene="N"

if [[ "$geneanno" == *refSeq* ]]; then
  refgene="Y"
fi
if [[ "$geneanno" == *knowngene* ]]; then
  knowngene="Y"
fi
if [[ "$geneanno" == *ensgene* ]]; then
  ensgene="Y"
fi

# hgvs "N" is mapped to an empty string. [[ ]] with a quoted operand avoids
# the "unary operator expected" error when hgvs is unset or empty.
if [[ "$hgvs" == "N" ]]; then
  hgvs=""
fi
0
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
335
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
336 #parse verdbsnp/1000g/esp strings
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
337 dbsnpstr=${verdbsnp//,/ }
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
338 filt_dbsnpstr=${filt_dbsnp//,/ }
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
339 g1000str=${ver1000g//,/ }
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
340 espstr=${esp//,/ }
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
341
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
342 if [ $test == "Y" ]
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
343 then
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
344 echo "annotate dbsnp: $dbsnpstr"
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
345 echo "annotate esp: $espstr"
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
346 echo "filter dbsnp: $filt_dbsnpstr"
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
347 fi
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
348
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
349 mutationtaster="N"
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
350 avsift="N"
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
351 lrt="N"
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
352 polyphen2="N"
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
353 phylop="N"
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
354 ljbsift="N"
2
565c0e690238 Added support for LJB2, COSMIC67, CLINVAR and NCI60.
saskia-hiltemann
parents: 0
diff changeset
355
565c0e690238 Added support for LJB2, COSMIC67, CLINVAR and NCI60.
saskia-hiltemann
parents: 0
diff changeset
356 #parse old impactscores param (obsolete)
0
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
357 if [[ $impactscores =~ "mutationtaster" ]]
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
358 then
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
359 mutationtaster="Y"
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
360 fi
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
361 if [[ $impactscores =~ "sift" ]]
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
362 then
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
363 avsift="Y"
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
364 fi
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
365 if [[ $impactscores =~ "lrt" ]]
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
366 then
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
367 lrt="Y"
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
368 fi
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
369 if [[ $impactscores =~ "ljbsift" ]]
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
370 then
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
371 ljbsift="Y"
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
372 fi
2
565c0e690238 Added support for LJB2, COSMIC67, CLINVAR and NCI60.
saskia-hiltemann
parents: 0
diff changeset
373 if [[ $impactscores =~ "ljb2sift" ]]
565c0e690238 Added support for LJB2, COSMIC67, CLINVAR and NCI60.
saskia-hiltemann
parents: 0
diff changeset
374 then
565c0e690238 Added support for LJB2, COSMIC67, CLINVAR and NCI60.
saskia-hiltemann
parents: 0
diff changeset
375 ljb2sift="Y"
565c0e690238 Added support for LJB2, COSMIC67, CLINVAR and NCI60.
saskia-hiltemann
parents: 0
diff changeset
376 fi
0
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
377 if [[ $impactscores =~ "pp2" ]]
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
378 then
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
379 polyphen2="Y"
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
380 fi
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
381 if [[ $impactscores =~ "phylop" ]]
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
382 then
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
383 phylop="Y"
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
384 fi
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
385
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
386 if [[ $varfile == "Y" ]]
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
387 then
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
388 convertcoords="Y"
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
389 fi
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
390
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
391 #ljb refers to the Liu, Jian and Boerwinkle paper in Human Mutation (PubMed ID 21520341). Cite this paper if you use the scores.
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
392
2
565c0e690238 Added support for LJB2, COSMIC67, CLINVAR and NCI60.
saskia-hiltemann
parents: 0
diff changeset
393 ljb2_sift="N"
565c0e690238 Added support for LJB2, COSMIC67, CLINVAR and NCI60.
saskia-hiltemann
parents: 0
diff changeset
394 ljb2_pp2hdiv="N"
565c0e690238 Added support for LJB2, COSMIC67, CLINVAR and NCI60.
saskia-hiltemann
parents: 0
diff changeset
395 ljb2_pp2hvar="N"
565c0e690238 Added support for LJB2, COSMIC67, CLINVAR and NCI60.
saskia-hiltemann
parents: 0
diff changeset
396 ljb2_lrt="N"
565c0e690238 Added support for LJB2, COSMIC67, CLINVAR and NCI60.
saskia-hiltemann
parents: 0
diff changeset
397 ljb2_mt="N"
565c0e690238 Added support for LJB2, COSMIC67, CLINVAR and NCI60.
saskia-hiltemann
parents: 0
diff changeset
398 ljb2_ma="N"
565c0e690238 Added support for LJB2, COSMIC67, CLINVAR and NCI60.
saskia-hiltemann
parents: 0
diff changeset
399 ljb2_fathmm="N"
565c0e690238 Added support for LJB2, COSMIC67, CLINVAR and NCI60.
saskia-hiltemann
parents: 0
diff changeset
400 ljb2_gerp="N"
565c0e690238 Added support for LJB2, COSMIC67, CLINVAR and NCI60.
saskia-hiltemann
parents: 0
diff changeset
401 ljb2_phylop="N"
565c0e690238 Added support for LJB2, COSMIC67, CLINVAR and NCI60.
saskia-hiltemann
parents: 0
diff changeset
402 ljb2_siphy="N"
565c0e690238 Added support for LJB2, COSMIC67, CLINVAR and NCI60.
saskia-hiltemann
parents: 0
diff changeset
403
565c0e690238 Added support for LJB2, COSMIC67, CLINVAR and NCI60.
saskia-hiltemann
parents: 0
diff changeset
404 # parse ljb2 newimpactscores param
565c0e690238 Added support for LJB2, COSMIC67, CLINVAR and NCI60.
saskia-hiltemann
parents: 0
diff changeset
405 # ljb2_sift, ljb2_pp2hdiv, ljb2_pp2hvar, ljb2_lrt, ljb2_mt, ljb2_ma, ljb2_fathmm, ljb2_gerp++, ljb2_phylop, ljb2_siphy
565c0e690238 Added support for LJB2, COSMIC67, CLINVAR and NCI60.
saskia-hiltemann
parents: 0
diff changeset
406 if [[ $newimpactscores =~ "ljb2_sift" ]]
565c0e690238 Added support for LJB2, COSMIC67, CLINVAR and NCI60.
saskia-hiltemann
parents: 0
diff changeset
407 then
565c0e690238 Added support for LJB2, COSMIC67, CLINVAR and NCI60.
saskia-hiltemann
parents: 0
diff changeset
408 ljb2_sift="Y"
565c0e690238 Added support for LJB2, COSMIC67, CLINVAR and NCI60.
saskia-hiltemann
parents: 0
diff changeset
409 fi
565c0e690238 Added support for LJB2, COSMIC67, CLINVAR and NCI60.
saskia-hiltemann
parents: 0
diff changeset
410 if [[ $newimpactscores =~ "ljb2_pp2hdiv" ]]
565c0e690238 Added support for LJB2, COSMIC67, CLINVAR and NCI60.
saskia-hiltemann
parents: 0
diff changeset
411 then
565c0e690238 Added support for LJB2, COSMIC67, CLINVAR and NCI60.
saskia-hiltemann
parents: 0
diff changeset
412 ljb2_pp2hdiv="Y"
565c0e690238 Added support for LJB2, COSMIC67, CLINVAR and NCI60.
saskia-hiltemann
parents: 0
diff changeset
413 fi
565c0e690238 Added support for LJB2, COSMIC67, CLINVAR and NCI60.
saskia-hiltemann
parents: 0
diff changeset
414 if [[ $newimpactscores =~ "ljb2_pp2hvar" ]]
565c0e690238 Added support for LJB2, COSMIC67, CLINVAR and NCI60.
saskia-hiltemann
parents: 0
diff changeset
415 then
565c0e690238 Added support for LJB2, COSMIC67, CLINVAR and NCI60.
saskia-hiltemann
parents: 0
diff changeset
416 ljb2_pp2hvar="Y"
565c0e690238 Added support for LJB2, COSMIC67, CLINVAR and NCI60.
saskia-hiltemann
parents: 0
diff changeset
417 fi
565c0e690238 Added support for LJB2, COSMIC67, CLINVAR and NCI60.
saskia-hiltemann
parents: 0
diff changeset
418 if [[ $newimpactscores =~ "ljb2_lrt" ]]
565c0e690238 Added support for LJB2, COSMIC67, CLINVAR and NCI60.
saskia-hiltemann
parents: 0
diff changeset
419 then
565c0e690238 Added support for LJB2, COSMIC67, CLINVAR and NCI60.
saskia-hiltemann
parents: 0
diff changeset
420 ljb2_lrt="Y"
565c0e690238 Added support for LJB2, COSMIC67, CLINVAR and NCI60.
saskia-hiltemann
parents: 0
diff changeset
421 fi
565c0e690238 Added support for LJB2, COSMIC67, CLINVAR and NCI60.
saskia-hiltemann
parents: 0
diff changeset
422 if [[ $newimpactscores =~ "ljb2_mt" ]]
565c0e690238 Added support for LJB2, COSMIC67, CLINVAR and NCI60.
saskia-hiltemann
parents: 0
diff changeset
423 then
565c0e690238 Added support for LJB2, COSMIC67, CLINVAR and NCI60.
saskia-hiltemann
parents: 0
diff changeset
424 ljb2_mt="Y"
565c0e690238 Added support for LJB2, COSMIC67, CLINVAR and NCI60.
saskia-hiltemann
parents: 0
diff changeset
425 fi
565c0e690238 Added support for LJB2, COSMIC67, CLINVAR and NCI60.
saskia-hiltemann
parents: 0
diff changeset
426 if [[ $newimpactscores =~ "ljb2_ma" ]]
565c0e690238 Added support for LJB2, COSMIC67, CLINVAR and NCI60.
saskia-hiltemann
parents: 0
diff changeset
427 then
565c0e690238 Added support for LJB2, COSMIC67, CLINVAR and NCI60.
saskia-hiltemann
parents: 0
diff changeset
428 ljb2_ma="Y"
565c0e690238 Added support for LJB2, COSMIC67, CLINVAR and NCI60.
saskia-hiltemann
parents: 0
diff changeset
429 fi
565c0e690238 Added support for LJB2, COSMIC67, CLINVAR and NCI60.
saskia-hiltemann
parents: 0
diff changeset
430 if [[ $newimpactscores =~ "ljb2_fathmm" ]]
565c0e690238 Added support for LJB2, COSMIC67, CLINVAR and NCI60.
saskia-hiltemann
parents: 0
diff changeset
431 then
565c0e690238 Added support for LJB2, COSMIC67, CLINVAR and NCI60.
saskia-hiltemann
parents: 0
diff changeset
432 ljb2_fathmm="Y"
565c0e690238 Added support for LJB2, COSMIC67, CLINVAR and NCI60.
saskia-hiltemann
parents: 0
diff changeset
433 fi
565c0e690238 Added support for LJB2, COSMIC67, CLINVAR and NCI60.
saskia-hiltemann
parents: 0
diff changeset
434 if [[ $newimpactscores =~ "ljb2_gerp" ]]
565c0e690238 Added support for LJB2, COSMIC67, CLINVAR and NCI60.
saskia-hiltemann
parents: 0
diff changeset
435 then
565c0e690238 Added support for LJB2, COSMIC67, CLINVAR and NCI60.
saskia-hiltemann
parents: 0
diff changeset
436 ljb2_gerp="Y"
565c0e690238 Added support for LJB2, COSMIC67, CLINVAR and NCI60.
saskia-hiltemann
parents: 0
diff changeset
437 fi
565c0e690238 Added support for LJB2, COSMIC67, CLINVAR and NCI60.
saskia-hiltemann
parents: 0
diff changeset
438 if [[ $newimpactscores =~ "ljb2_phylop" ]]
565c0e690238 Added support for LJB2, COSMIC67, CLINVAR and NCI60.
saskia-hiltemann
parents: 0
diff changeset
439 then
565c0e690238 Added support for LJB2, COSMIC67, CLINVAR and NCI60.
saskia-hiltemann
parents: 0
diff changeset
440 ljb2_phylop="Y"
565c0e690238 Added support for LJB2, COSMIC67, CLINVAR and NCI60.
saskia-hiltemann
parents: 0
diff changeset
441 fi
565c0e690238 Added support for LJB2, COSMIC67, CLINVAR and NCI60.
saskia-hiltemann
parents: 0
diff changeset
442 if [[ $newimpactscores =~ "ljb2_siphy" ]]
565c0e690238 Added support for LJB2, COSMIC67, CLINVAR and NCI60.
saskia-hiltemann
parents: 0
diff changeset
443 then
565c0e690238 Added support for LJB2, COSMIC67, CLINVAR and NCI60.
saskia-hiltemann
parents: 0
diff changeset
444 ljb2_siphy="Y"
565c0e690238 Added support for LJB2, COSMIC67, CLINVAR and NCI60.
saskia-hiltemann
parents: 0
diff changeset
445 fi
565c0e690238 Added support for LJB2, COSMIC67, CLINVAR and NCI60.
saskia-hiltemann
parents: 0
diff changeset
446
565c0e690238 Added support for LJB2, COSMIC67, CLINVAR and NCI60.
saskia-hiltemann
parents: 0
diff changeset
447 if [ $otherinfo == "N" ]
565c0e690238 Added support for LJB2, COSMIC67, CLINVAR and NCI60.
saskia-hiltemann
parents: 0
diff changeset
448 then
565c0e690238 Added support for LJB2, COSMIC67, CLINVAR and NCI60.
saskia-hiltemann
parents: 0
diff changeset
449 otherinfo=""
565c0e690238 Added support for LJB2, COSMIC67, CLINVAR and NCI60.
saskia-hiltemann
parents: 0
diff changeset
450 fi
565c0e690238 Added support for LJB2, COSMIC67, CLINVAR and NCI60.
saskia-hiltemann
parents: 0
diff changeset
451
0
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
452
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
453 #column header names we will be adding
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
454 # ESP 6500
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
455 esp6500si_colheader_ALL="ESP6500si_ALL"
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
456 esp6500si_colheader_EA="ESP6500si_EA"
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
457 esp6500si_colheader_AA="ESP6500si_AA"
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
458 esp6500_colheader_ALL="ESP6500_ALL"
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
459 esp6500_colheader_EA="ESP6500_EA"
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
460 esp6500_colheader_AA="ESP6500_AA"
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
461 esp5400si_colheader_ALL="ESP5400si_ALL"
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
462 esp5400si_colheader_EA="ESP5400si_EA"
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
463 esp5400si_colheader_AA="ESP5400si_AA"
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
464 esp5400_colheader_ALL="ESP5400_ALL"
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
465 esp5400_colheader_EA="ESP5400_EA"
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
466 esp5400_colheader_AA="ESP5400_AA"
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
467
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
468
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
469 # cg46 cg69
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
470 cg46_colheader="CG_46_genomes"
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
471 cg69_colheader="CG_69_genomes"
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
472
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
473 cp $infile originalfile
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
474 #run annovar or filter only?
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
475 if [ $dorunannovar == "Y" ]
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
476 then
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
477
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
478
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
479 ####################################
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
480 #
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
481 # PREPARE INPUT FILE
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
482 #
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
483 ####################################
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
484
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
485 echo "converting input file"
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
486 vcfheader=""
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
487 if [ $vcf == "Y" ] #if VCF file, convert
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
488 then
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
489 # convert vcf to annovarinput
3
ff5325029a8e Uploaded
saskia-hiltemann
parents: 2
diff changeset
490 $scriptsdir/convert2annovar.pl --format vcf4old --allallele --includeinfo --outfile annovarinput $infile 2>&1
0
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
491
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
492 #construct header line from vcf file
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
493 cat $infile | grep "#CHROM" > additionalcols
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
494 sed -i 's/#//g' additionalcols
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
495 vcfheader="\t`cat additionalcols`"
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
496 echo "vcfheader:$vcfheader"
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
497 echo -e "chromosome\tbegin\tend\treference\tobserved\t`cat additionalcols`" > originalfile
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
498 cat annovarinput >> originalfile
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
499
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
500 chrcol=1
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
501 startcol=2
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
502 endcol=3
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
503 refcol=4
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
504 obscol=5
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
505
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
506
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
507 elif [ $varfile == "Y" ] #if CG varfile, convert
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
508 then
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
509 # convert varfile
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
510 $scriptsdir/convert2annovar.pl --format cg --outfile annovarinput $infile 2>&1
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
511 echo -e "chromosome\tbegin\tend\treference\talleleSeq\tvarType\thaplotype" > originalfile
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
512 cat annovarinput | cut -f1-6,8 >> originalfile
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
513 cat annovarinput | cut -f1-5 >> annovarinput2
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
514 mv annovarinput2 annovarinput
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
515
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
516 chrcol=1
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
517 startcol=2
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
518 endcol=3
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
519 refcol=4
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
520 obscol=5
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
521
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
522 elif [ $convertcoords == "Y" ] # if CG-coordinates, convert
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
523 then
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
524 #echo "rearranging columns and converting coordinates"
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
525 awk 'BEGIN{
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
526 FS="\t";
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
527 OFS="\t";
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
528 }{
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
529 if(FNR>1) {
5
4600be69b96f Added databases 1000g2015aug, SPIDEX, avsnp138, avsnp142, exac03
saskia-hiltemann
parents: 3
diff changeset
530 gsub(/chr/,"",$"'"${chrcol}"'")
0
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
531 if( $"'"${vartypecol}"'" == "snp" ){ $"'"${startcol}"'" += 1 };
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
532 if( $"'"${vartypecol}"'" == "ins" ){ $"'"${refcol}"'" = "-" };
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
533 if( $"'"${vartypecol}"'" == "del" ){ $"'"${startcol}"'" +=1; $"'"${obscol}"'" = "-" };
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
534 if( $"'"${vartypecol}"'" == "sub" ){ $"'"${startcol}"'" += 1 };
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
535
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
536 printf("%s\t%s\t%s\t%s\t%s\n" ,$"'"${chrcol}"'",$"'"${startcol}"'",$"'"${endcol}"'",$"'"${refcol}"'",$"'"${obscol}"'");
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
537 }
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
538 }
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
539 END{
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
540 }' $infile > annovarinput
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
541
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
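542 #"chr" prefixes are now removed from the chromosome column by the gsub in the awk script above; the old sed command is kept below for reference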
5
4600be69b96f Added databases 1000g2015aug, SPIDEX, avsnp138, avsnp142, exac03
saskia-hiltemann
parents: 3
diff changeset
543 #sed -i '2,$s/chr//g' annovarinput
0
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
544
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
545 awk 'BEGIN{
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
546 FS="\t";
5
4600be69b96f Added databases 1000g2015aug, SPIDEX, avsnp138, avsnp142, exac03
saskia-hiltemann
parents: 3
diff changeset
547 OFS="\t";
0
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
548 }{
5
4600be69b96f Added databases 1000g2015aug, SPIDEX, avsnp138, avsnp142, exac03
saskia-hiltemann
parents: 3
diff changeset
549
0
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
550 if(FNR>=1) {
5
4600be69b96f Added databases 1000g2015aug, SPIDEX, avsnp138, avsnp142, exac03
saskia-hiltemann
parents: 3
diff changeset
551 gsub(/chr/,"",$"'"${chrcol}"'")
0
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
552 if( $"'"${vartypecol}"'" == "snp" ){ $"'"${startcol}"'" += 1 };
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
553 if( $"'"${vartypecol}"'" == "ins" ){ $"'"${refcol}"'" = "-" };
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
554 if( $"'"${vartypecol}"'" == "del" ){ $"'"${startcol}"'" +=1; $"'"${obscol}"'" = "-" };
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
555 if( $"'"${vartypecol}"'" == "sub" ){ $"'"${startcol}"'" += 1 };
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
556
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
557 print $0
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
558 }
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
559 }
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
560 END{
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
561 }' $infile > originalfile
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
562
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
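563 #"chr" prefixes are now removed by the gsub in the awk script above (which also turns the header word "chromosome" into "omosome"); the old sed command is kept for reference and the header is restored below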
5
4600be69b96f Added databases 1000g2015aug, SPIDEX, avsnp138, avsnp142, exac03
saskia-hiltemann
parents: 3
diff changeset
564 #sed -i '2,$s/chr//g' originalfile
0
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
565 sed -i 's/omosome/chromosome/g' originalfile
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
566
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
567
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
568 else #only rearrange columns if already 1-based coordinates
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
569 echo "rearranging columns "
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
570 awk 'BEGIN{
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
571 FS="\t";
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
572 OFS="\t";
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
573 }{
5
4600be69b96f Added databases 1000g2015aug, SPIDEX, avsnp138, avsnp142, exac03
saskia-hiltemann
parents: 3
diff changeset
574 if(FNR>1) {
4600be69b96f Added databases 1000g2015aug, SPIDEX, avsnp138, avsnp142, exac03
saskia-hiltemann
parents: 3
diff changeset
575 printf("%s\t%s\t%s\t%s\t%s\n",$"'"${chrcol}"'",$"'"${startcol}"'",$"'"${endcol}"'",$"'"${refcol}"'",$"'"${obscol}"'");
0
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
576 }
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
577 }
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
578 END{
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
579 }' $infile > annovarinput
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
580
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
581 #remove any "chr" prefixes
5
4600be69b96f Added databases 1000g2015aug, SPIDEX, avsnp138, avsnp142, exac03
saskia-hiltemann
parents: 3
diff changeset
582 sed -i '2,$s/chr//g' annovarinput
4600be69b96f Added databases 1000g2015aug, SPIDEX, avsnp138, avsnp142, exac03
saskia-hiltemann
parents: 3
diff changeset
583 sed '2,$s/chr//g' $infile > originalfile
0
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
584 sed -i 's/omosome/chromosome/g' originalfile
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
585 fi
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
586
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
587 echo "...finished conversion"
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
588
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
589
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
590
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
591
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
592 ####################################
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
593 #
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
594 # RUN ANNOVAR COMMANDS
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
595 #
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
596 ####################################
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
597
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
598
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
599
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
600 ###### gene-based annotation #######
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
601
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
602 # RefSeq Gene
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
603 if [ $refgene == "Y" ]
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
604 then
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
605 echo -e "\nrefSeq gene"
2
565c0e690238 Added support for LJB2, COSMIC67, CLINVAR and NCI60.
saskia-hiltemann
parents: 0
diff changeset
606 $scriptsdir/annotate_variation.pl --geneanno --buildver $buildver -dbtype gene ${hgvs} annovarinput $humandb 2>&1
0
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
607
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
608 annovarout=annovarinput.variant_function
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
609 sed -i '1i\RefSeq_Func\tRefSeq_Gene\tchromosome\tstart\tend\treference\talleleSeq"'"$vcfheader"'"' $annovarout
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
610 joinresults originalfile $annovarout 3 4 5 6 7 B.RefSeq_Func,B.RefSeq_Gene
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
611
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
612 annovarout=annovarinput.exonic_variant_function
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
613 sed -i '1i\linenum\tRefSeq_ExonicFunc\tRefSeq_AAChange\tchromosome\tstart\tend\treference\talleleSeq"'"$vcfheader"'"' $annovarout
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
614 joinresults originalfile $annovarout 4 5 6 7 8 B.RefSeq_ExonicFunc,B.RefSeq_AAChange
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
615 fi
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
616
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
617
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
618 # UCSC KnownGene
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
619 if [ $knowngene == "Y" ]
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
620 then
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
621 echo -e "\nUCSC known gene"
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
622 $scriptsdir/annotate_variation.pl --geneanno --buildver $buildver -dbtype knowngene annovarinput $humandb 2>&1
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
623
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
624 annovarout=annovarinput.variant_function
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
625 sed -i '1i\UCSCKnownGene_Func\tUCSCKnownGene_Gene\tchromosome\tstart\tend\treference\talleleSeq"'"$vcfheader"'"' $annovarout
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
626 joinresults originalfile $annovarout 3 4 5 6 7 B.UCSCKnownGene_Func,B.UCSCKnownGene_Gene
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
627
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
628 annovarout=annovarinput.exonic_variant_function
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
629 sed -i '1i\linenum\tUCSCKnownGene_ExonicFunc\tUCSCKnownGene_AAChange\tchromosome\tstart\tend\treference\talleleSeq"'"$vcfheader"'"' $annovarout
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
630 joinresults originalfile $annovarout 4 5 6 7 8 B.UCSCKnownGene_ExonicFunc,B.UCSCKnownGene_AAChange
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
631 fi
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
632
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
633
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
634 # Ensembl Gene
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
635 if [ $ensgene == "Y" ]
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
636 then
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
637 echo -e "\nEnsembl gene"
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
638 $scriptsdir/annotate_variation.pl --geneanno --buildver $buildver -dbtype ensgene annovarinput $humandb 2>&1
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
639
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
640 annovarout=annovarinput.variant_function
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
641 sed -i '1i\EnsemblGene_Func\tEnsemblGene_Gene\tchromosome\tstart\tend\treference\talleleSeq"'"$vcfheader"'"' $annovarout
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
642 joinresults originalfile $annovarout 3 4 5 6 7 B.EnsemblGene_Func,B.EnsemblGene_Gene
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
643
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
644 annovarout=annovarinput.exonic_variant_function
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
645 sed -i '1i\linenum\tEnsemblGene_ExonicFunc\tEnsemblGene_AAChange\tchromosome\tstart\tend\treference\talleleSeq"'"$vcfheader"'"' $annovarout
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
646 joinresults originalfile $annovarout 4 5 6 7 8 B.EnsemblGene_ExonicFunc,B.EnsemblGene_AAChange
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
647 fi
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
648
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
649
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
650
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
651 ###### region-based annotation #######
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
652
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
653
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
654 # Most Conserved Elements Annotation
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
655 if [ $mce == "Y" ]
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
656 then
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
657 echo -e "\nMost Conserved Elements"
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
658
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
659 if [ $buildver == "hg18" ]
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
660 then
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
661 $scriptsdir/annotate_variation.pl --regionanno --buildver $buildver -dbtype mce44way annovarinput $humandb 2>&1
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
662 annovarout=annovarinput.${buildver}_phastConsElements44way
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
663 sed -i '1i\db\tphastConsElements44way\tchromosome\tstart\tend\treference\talleleSeq"'"$vcfheader"'"' $annovarout
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
664 joinresults originalfile $annovarout 3 4 5 6 7 B.phastConsElements44way
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
665
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
666 else #hg19
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
667 $scriptsdir/annotate_variation.pl --regionanno --buildver $buildver -dbtype mce46way annovarinput $humandb 2>&1
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
668 annovarout=annovarinput.${buildver}_phastConsElements46way
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
669 sed -i '1i\db\tphastConsElements46way\tchromosome\tstart\tend\treference\talleleSeq"'"$vcfheader"'"' $annovarout
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
670 joinresults originalfile $annovarout 3 4 5 6 7 B.phastConsElements46way
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
671 fi
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
672
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
673 fi
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
674
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
675
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
676
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
677 # Transcription Factor Binding Sites Annotation
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
678 if [ $tfbs == "Y" ]
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
679 then
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
680 echo -e "\nTranscription Factor Binding Site Annotation"
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
681 $scriptsdir/annotate_variation.pl --regionanno --buildver $buildver -dbtype tfbs annovarinput $humandb 2>&1
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
682
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
683 # arguments: originalfile, resultfile,chrcol,startcol,endcol,refcol,obscol,selectcolumns
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
684 annovarout=annovarinput.${buildver}_tfbsConsSites
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
685 sed -i '1i\db\tTFBS\tchromosome\tstart\tend\treference\talleleSeq"'"$vcfheader"'"' $annovarout
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
686 joinresults originalfile $annovarout 3 4 5 6 7 B.TFBS
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
687 fi
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
688
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
689
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
690
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
691 # Identify cytogenetic band for genetic variants
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
692 if [ $cytoband == "Y" ]
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
693 then
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
694 echo -e "\nCytogenic band Annotation"
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
695 $scriptsdir/annotate_variation.pl --regionanno --buildver $buildver -dbtype band annovarinput $humandb 2>&1
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
696
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
697 annovarout=annovarinput.${buildver}_cytoBand
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
698 sed -i '1i\db\tBand\tchromosome\tstart\tend\treference\talleleSeq"'"$vcfheader"'"' $annovarout
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
699 joinresults originalfile $annovarout 3 4 5 6 7 B.Band
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
700 fi
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
701
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
702
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
703 # Identify variants located in segmental duplications
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
704 if [ $segdup == "Y" ]
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
705 then
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
706 echo -e "\nSegmental Duplications Annotation"
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
707 $scriptsdir/annotate_variation.pl --regionanno --buildver $buildver -dbtype segdup annovarinput $humandb 2>&1
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
708
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
709 annovarout=annovarinput.${buildver}_genomicSuperDups
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
710 sed -i '1i\db\tSegDup\tchromosome\tstart\tend\treference\talleleSeq"'"$vcfheader"'"' $annovarout
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
711 joinresults originalfile $annovarout 3 4 5 6 7 B.SegDup
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
712 fi
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
713
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
714
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
715
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
716 # Identify previously reported structural variants in DGV
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
717 if [ $dgv == "Y" ]
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
718 then
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
719 echo -e "\nDGV Annotation"
2
565c0e690238 Added support for LJB2, COSMIC67, CLINVAR and NCI60.
saskia-hiltemann
parents: 0
diff changeset
720 $scriptsdir/annotate_variation.pl --regionanno --buildver $buildver -dbtype dgvMerged annovarinput $humandb 2>&1
0
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
721
2
565c0e690238 Added support for LJB2, COSMIC67, CLINVAR and NCI60.
saskia-hiltemann
parents: 0
diff changeset
722 annovarout=annovarinput.${buildver}_dgvMerged
0
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
723 sed -i '1i\db\tDGV\tchromosome\tstart\tend\treference\talleleSeq"'"$vcfheader"'"' $annovarout
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
724 joinresults originalfile $annovarout 3 4 5 6 7 B.DGV
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
725 fi
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
726
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
727
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
728 # Identify variants reported in previously published GWAS studies
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
729 if [ $gwas == "Y" ]
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
730 then
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
731 echo -e "\nGWAS Annotation"
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
732 $scriptsdir/annotate_variation.pl --regionanno --buildver $buildver -dbtype gwascatalog annovarinput $humandb 2>&1
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
733
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
734 annovarout=annovarinput.${buildver}_gwasCatalog
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
735 sed -i '1i\db\tGWAS\tchromosome\tstart\tend\treference\talleleSeq"'"$vcfheader"'"' $annovarout
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
736 joinresults originalfile $annovarout 3 4 5 6 7 B.GWAS
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
737 fi
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
738
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
739
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
740
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
741
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
742 ###### filter-based annotation #######
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
743
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
744 #dbSNP
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
745 for version in $dbsnpstr
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
746 do
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
747 if [ $version == "None" ]
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
748 then
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
749 break
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
750 fi
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
751 echo -e "\ndbSNP region Annotation, version: $version"
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
752 $scriptsdir/annotate_variation.pl --filter --buildver $buildver -dbtype ${version} annovarinput $humandb 2>&1
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
753
5
4600be69b96f Added databases 1000g2015aug, SPIDEX, avsnp138, avsnp142, exac03
saskia-hiltemann
parents: 3
diff changeset
754 columnname=${version}
4600be69b96f Added databases 1000g2015aug, SPIDEX, avsnp138, avsnp142, exac03
saskia-hiltemann
parents: 3
diff changeset
755 if [[ $columnname == snp* ]]
4600be69b96f Added databases 1000g2015aug, SPIDEX, avsnp138, avsnp142, exac03
saskia-hiltemann
parents: 3
diff changeset
756 then
4600be69b96f Added databases 1000g2015aug, SPIDEX, avsnp138, avsnp142, exac03
saskia-hiltemann
parents: 3
diff changeset
757 columnname="db${version}"
4600be69b96f Added databases 1000g2015aug, SPIDEX, avsnp138, avsnp142, exac03
saskia-hiltemann
parents: 3
diff changeset
758 fi
4600be69b96f Added databases 1000g2015aug, SPIDEX, avsnp138, avsnp142, exac03
saskia-hiltemann
parents: 3
diff changeset
759
0
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
760 annovarout=annovarinput.${buildver}_${version}_dropped
5
4600be69b96f Added databases 1000g2015aug, SPIDEX, avsnp138, avsnp142, exac03
saskia-hiltemann
parents: 3
diff changeset
761 sed -i '1i\db\t'${columnname}'\tchromosome\tstart\tend\treference\talleleSeq"'"$vcfheader"'"' $annovarout
4600be69b96f Added databases 1000g2015aug, SPIDEX, avsnp138, avsnp142, exac03
saskia-hiltemann
parents: 3
diff changeset
762 joinresults originalfile $annovarout 3 4 5 6 7 B.${columnname}
0
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
763
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
764
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
765 done
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
766
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
767
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
768
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
769 #1000 Genomes
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
770
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
771 if [ $ver1000g != "None" ]
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
772 then
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
773
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
774 for version in $g1000str
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
775 do
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
776 #column headers
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
777 g1000_colheader_ALL="${version}_ALL"
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
778 g1000_colheader_AFR="${version}_AFR"
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
779 g1000_colheader_AMR="${version}_AMR"
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
780 g1000_colheader_ASN="${version}_ASN"
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
781 g1000_colheader_EUR="${version}_EUR"
5
4600be69b96f Added databases 1000g2015aug, SPIDEX, avsnp138, avsnp142, exac03
saskia-hiltemann
parents: 3
diff changeset
782 g1000_colheader_EAS="${version}_EAS"
4600be69b96f Added databases 1000g2015aug, SPIDEX, avsnp138, avsnp142, exac03
saskia-hiltemann
parents: 3
diff changeset
783 g1000_colheader_SAS="${version}_SAS"
0
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
784 g1000_colheader_CEU="${version}_CEU"
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
785 g1000_colheader_YRI="${version}_YRI"
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
786 g1000_colheader_JPTCHB="${version}_JPTCHB"
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
787
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
788 doALL="N"
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
789 doAMR="N"
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
790 doAFR="N"
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
791 doASN="N"
5
4600be69b96f Added databases 1000g2015aug, SPIDEX, avsnp138, avsnp142, exac03
saskia-hiltemann
parents: 3
diff changeset
792 doEAS="N"
4600be69b96f Added databases 1000g2015aug, SPIDEX, avsnp138, avsnp142, exac03
saskia-hiltemann
parents: 3
diff changeset
793 doSAS="N"
0
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
794 doEUR="N"
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
795 doCEU="N"
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
796 doYRI="N"
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
797 doJPTCHB="N"
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
798
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
799
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
800 if [ $version == "1000g2012apr" ]
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
801 then
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
802 fileID="2012_04"
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
803 doALL="Y"
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
804 if [ $buildver == "hg19" ]
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
805 then
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
806 doAMR="Y"
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
807 doAFR="Y"
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
808 doASN="Y"
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
809 doEUR="Y"
5
4600be69b96f Added databases 1000g2015aug, SPIDEX, avsnp138, avsnp142, exac03
saskia-hiltemann
parents: 3
diff changeset
810 fi
4600be69b96f Added databases 1000g2015aug, SPIDEX, avsnp138, avsnp142, exac03
saskia-hiltemann
parents: 3
diff changeset
811 elif [ $version == "1000g2014oct" ]
4600be69b96f Added databases 1000g2015aug, SPIDEX, avsnp138, avsnp142, exac03
saskia-hiltemann
parents: 3
diff changeset
812 then
4600be69b96f Added databases 1000g2015aug, SPIDEX, avsnp138, avsnp142, exac03
saskia-hiltemann
parents: 3
diff changeset
813 fileID="2014_10"
4600be69b96f Added databases 1000g2015aug, SPIDEX, avsnp138, avsnp142, exac03
saskia-hiltemann
parents: 3
diff changeset
814 doALL="Y"
4600be69b96f Added databases 1000g2015aug, SPIDEX, avsnp138, avsnp142, exac03
saskia-hiltemann
parents: 3
diff changeset
815 doAMR="Y"
4600be69b96f Added databases 1000g2015aug, SPIDEX, avsnp138, avsnp142, exac03
saskia-hiltemann
parents: 3
diff changeset
816 doAFR="Y"
4600be69b96f Added databases 1000g2015aug, SPIDEX, avsnp138, avsnp142, exac03
saskia-hiltemann
parents: 3
diff changeset
817 doEUR="Y"
4600be69b96f Added databases 1000g2015aug, SPIDEX, avsnp138, avsnp142, exac03
saskia-hiltemann
parents: 3
diff changeset
818 doEAS="Y"
4600be69b96f Added databases 1000g2015aug, SPIDEX, avsnp138, avsnp142, exac03
saskia-hiltemann
parents: 3
diff changeset
819 if [ $buildver == "hg19" ]
4600be69b96f Added databases 1000g2015aug, SPIDEX, avsnp138, avsnp142, exac03
saskia-hiltemann
parents: 3
diff changeset
820 then
4600be69b96f Added databases 1000g2015aug, SPIDEX, avsnp138, avsnp142, exac03
saskia-hiltemann
parents: 3
diff changeset
821 doSAS="Y"
4600be69b96f Added databases 1000g2015aug, SPIDEX, avsnp138, avsnp142, exac03
saskia-hiltemann
parents: 3
diff changeset
822 fi
4600be69b96f Added databases 1000g2015aug, SPIDEX, avsnp138, avsnp142, exac03
saskia-hiltemann
parents: 3
diff changeset
823
4600be69b96f Added databases 1000g2015aug, SPIDEX, avsnp138, avsnp142, exac03
saskia-hiltemann
parents: 3
diff changeset
824 elif [[ $version == "1000g2015aug" && $buildver == "hg19" ]]
4600be69b96f Added databases 1000g2015aug, SPIDEX, avsnp138, avsnp142, exac03
saskia-hiltemann
parents: 3
diff changeset
825 then
4600be69b96f Added databases 1000g2015aug, SPIDEX, avsnp138, avsnp142, exac03
saskia-hiltemann
parents: 3
diff changeset
826 fileID="2015_08"
4600be69b96f Added databases 1000g2015aug, SPIDEX, avsnp138, avsnp142, exac03
saskia-hiltemann
parents: 3
diff changeset
827 doALL="Y"
4600be69b96f Added databases 1000g2015aug, SPIDEX, avsnp138, avsnp142, exac03
saskia-hiltemann
parents: 3
diff changeset
828 doAMR="Y"
4600be69b96f Added databases 1000g2015aug, SPIDEX, avsnp138, avsnp142, exac03
saskia-hiltemann
parents: 3
diff changeset
829 doAFR="Y"
4600be69b96f Added databases 1000g2015aug, SPIDEX, avsnp138, avsnp142, exac03
saskia-hiltemann
parents: 3
diff changeset
830 doEUR="Y"
4600be69b96f Added databases 1000g2015aug, SPIDEX, avsnp138, avsnp142, exac03
saskia-hiltemann
parents: 3
diff changeset
831 doEAS="Y"
4600be69b96f Added databases 1000g2015aug, SPIDEX, avsnp138, avsnp142, exac03
saskia-hiltemann
parents: 3
diff changeset
832 doSAS="Y"
4600be69b96f Added databases 1000g2015aug, SPIDEX, avsnp138, avsnp142, exac03
saskia-hiltemann
parents: 3
diff changeset
833
0
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
834 elif [[ $version == "1000g2012feb" && $buildver == "hg19" ]]
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
835 then
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
836 fileID="2012_02"
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
837 doALL="Y"
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
838 elif [[ $version == "1000g2010nov" && $buildver == "hg19" ]]
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
839 then
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
840 fileID="2010_11"
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
841 doALL="Y"
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
842 elif [[ $version == "1000g2010jul" && $buildver == "hg18" ]]
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
843 then
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
844 fileID="2010_07"
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
845 doALL="N"
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
846 doCEU="Y"
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
847 doYRI="Y"
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
848 doJPTCHB="Y"
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
849 else
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
850 echo "unrecognized 1000g version, skipping"
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
851 fi
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
852
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
853 #ALL
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
854 if [ $doALL == "Y" ]
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
855 then
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
856 echo -e "\n1000Genomes ALL"
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
857 $scriptsdir/annotate_variation.pl --filter --buildver $buildver -dbtype "${version}_all" annovarinput $humandb 2>&1
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
858
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
859 annovarout=annovarinput.${buildver}_ALL.sites.${fileID}_dropped
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
860 sed -i '1i\db\t'$g1000_colheader_ALL'\tchromosome\tstart\tend\treference\talleleSeq"'"$vcfheader"'"' $annovarout
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
861 joinresults originalfile $annovarout 3 4 5 6 7 B.$g1000_colheader_ALL
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
862 fi
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
863
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
864 # AFR
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
865 if [ $doAFR == "Y" ]
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
866 then
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
867 echo -e "\n1000Genomes AFR"
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
868 $scriptsdir/annotate_variation.pl --filter --buildver $buildver -dbtype "${version}_afr" annovarinput $humandb 2>&1
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
869
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
870 annovarout=annovarinput.${buildver}_AFR.sites.${fileID}_dropped
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
871 sed -i '1i\db\t'$g1000_colheader_AFR'\tchromosome\tstart\tend\treference\talleleSeq"'"$vcfheader"'"' $annovarout
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
872 joinresults originalfile $annovarout 3 4 5 6 7 B.$g1000_colheader_AFR
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
873 fi
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
874
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
875
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
876 # AMR
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
877 if [ $doAMR == "Y" ]
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
878 then
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
879 echo -e "\n1000Genomes AMR"
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
880 $scriptsdir/annotate_variation.pl --filter --buildver $buildver -dbtype "${version}_amr" annovarinput $humandb 2>&1
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
881
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
882 annovarout=annovarinput.${buildver}_AMR.sites.${fileID}_dropped
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
883 sed -i '1i\db\t'$g1000_colheader_AMR'\tchromosome\tstart\tend\treference\talleleSeq"'"$vcfheader"'"' $annovarout
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
884 joinresults originalfile $annovarout 3 4 5 6 7 B.$g1000_colheader_AMR
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
885 fi
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
886
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
887 # ASN
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
888 if [ $doASN == "Y" ]
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
889 then
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
890 echo -e "\n1000Genomes ASN"
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
891 $scriptsdir/annotate_variation.pl --filter --buildver $buildver -dbtype "${version}_asn" annovarinput $humandb 2>&1
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
892
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
893 annovarout=annovarinput.${buildver}_ASN.sites.${fileID}_dropped
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
894 sed -i '1i\db\t'$g1000_colheader_ASN'\tchromosome\tstart\tend\treference\talleleSeq"'"$vcfheader"'"' $annovarout
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
895 joinresults originalfile $annovarout 3 4 5 6 7 B.$g1000_colheader_ASN
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
896 fi
5
4600be69b96f Added databases 1000g2015aug, SPIDEX, avsnp138, avsnp142, exac03
saskia-hiltemann
parents: 3
diff changeset
897
4600be69b96f Added databases 1000g2015aug, SPIDEX, avsnp138, avsnp142, exac03
saskia-hiltemann
parents: 3
diff changeset
898 # EAS
4600be69b96f Added databases 1000g2015aug, SPIDEX, avsnp138, avsnp142, exac03
saskia-hiltemann
parents: 3
diff changeset
899 if [ $doEAS == "Y" ]
4600be69b96f Added databases 1000g2015aug, SPIDEX, avsnp138, avsnp142, exac03
saskia-hiltemann
parents: 3
diff changeset
900 then
4600be69b96f Added databases 1000g2015aug, SPIDEX, avsnp138, avsnp142, exac03
saskia-hiltemann
parents: 3
diff changeset
901 echo -e "\n1000Genomes EAS"
4600be69b96f Added databases 1000g2015aug, SPIDEX, avsnp138, avsnp142, exac03
saskia-hiltemann
parents: 3
diff changeset
902 $scriptsdir/annotate_variation.pl --filter --buildver $buildver -dbtype "${version}_eas" annovarinput $humandb 2>&1
4600be69b96f Added databases 1000g2015aug, SPIDEX, avsnp138, avsnp142, exac03
saskia-hiltemann
parents: 3
diff changeset
903
4600be69b96f Added databases 1000g2015aug, SPIDEX, avsnp138, avsnp142, exac03
saskia-hiltemann
parents: 3
diff changeset
904 annovarout=annovarinput.${buildver}_EAS.sites.${fileID}_dropped
4600be69b96f Added databases 1000g2015aug, SPIDEX, avsnp138, avsnp142, exac03
saskia-hiltemann
parents: 3
diff changeset
905 sed -i '1i\db\t'$g1000_colheader_EAS'\tchromosome\tstart\tend\treference\talleleSeq"'"$vcfheader"'"' $annovarout
4600be69b96f Added databases 1000g2015aug, SPIDEX, avsnp138, avsnp142, exac03
saskia-hiltemann
parents: 3
diff changeset
906 joinresults originalfile $annovarout 3 4 5 6 7 B.$g1000_colheader_EAS
4600be69b96f Added databases 1000g2015aug, SPIDEX, avsnp138, avsnp142, exac03
saskia-hiltemann
parents: 3
diff changeset
907 fi
4600be69b96f Added databases 1000g2015aug, SPIDEX, avsnp138, avsnp142, exac03
saskia-hiltemann
parents: 3
diff changeset
908
4600be69b96f Added databases 1000g2015aug, SPIDEX, avsnp138, avsnp142, exac03
saskia-hiltemann
parents: 3
diff changeset
909 # SAS
4600be69b96f Added databases 1000g2015aug, SPIDEX, avsnp138, avsnp142, exac03
saskia-hiltemann
parents: 3
diff changeset
910 if [ $doSAS == "Y" ]
4600be69b96f Added databases 1000g2015aug, SPIDEX, avsnp138, avsnp142, exac03
saskia-hiltemann
parents: 3
diff changeset
911 then
4600be69b96f Added databases 1000g2015aug, SPIDEX, avsnp138, avsnp142, exac03
saskia-hiltemann
parents: 3
diff changeset
912 echo -e "\n1000Genomes SAS"
4600be69b96f Added databases 1000g2015aug, SPIDEX, avsnp138, avsnp142, exac03
saskia-hiltemann
parents: 3
diff changeset
913 $scriptsdir/annotate_variation.pl --filter --buildver $buildver -dbtype "${version}_sas" annovarinput $humandb 2>&1
4600be69b96f Added databases 1000g2015aug, SPIDEX, avsnp138, avsnp142, exac03
saskia-hiltemann
parents: 3
diff changeset
914
4600be69b96f Added databases 1000g2015aug, SPIDEX, avsnp138, avsnp142, exac03
saskia-hiltemann
parents: 3
diff changeset
915 annovarout=annovarinput.${buildver}_SAS.sites.${fileID}_dropped
4600be69b96f Added databases 1000g2015aug, SPIDEX, avsnp138, avsnp142, exac03
saskia-hiltemann
parents: 3
diff changeset
916 sed -i '1i\db\t'$g1000_colheader_SAS'\tchromosome\tstart\tend\treference\talleleSeq"'"$vcfheader"'"' $annovarout
4600be69b96f Added databases 1000g2015aug, SPIDEX, avsnp138, avsnp142, exac03
saskia-hiltemann
parents: 3
diff changeset
917 joinresults originalfile $annovarout 3 4 5 6 7 B.$g1000_colheader_SAS
4600be69b96f Added databases 1000g2015aug, SPIDEX, avsnp138, avsnp142, exac03
saskia-hiltemann
parents: 3
diff changeset
918 fi
4600be69b96f Added databases 1000g2015aug, SPIDEX, avsnp138, avsnp142, exac03
saskia-hiltemann
parents: 3
diff changeset
919
0
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
920 # EUR
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
921 if [ $doEUR == "Y" ]
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
922 then
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
923 echo -e "\n1000Genomes EUR"
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
924 $scriptsdir/annotate_variation.pl --filter --buildver $buildver -dbtype "${version}_eur" annovarinput $humandb 2>&1
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
925
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
926 annovarout=annovarinput.${buildver}_EUR.sites.${fileID}_dropped
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
927 sed -i '1i\db\t'$g1000_colheader_EUR'\tchromosome\tstart\tend\treference\talleleSeq"'"$vcfheader"'"' $annovarout
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
928 joinresults originalfile $annovarout 3 4 5 6 7 B.$g1000_colheader_EUR
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
929 fi
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
930
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
931 # CEU
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
932 if [ $doCEU == "Y" ]
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
933 then
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
934 echo -e "\n1000Genomes CEU"
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
935 $scriptsdir/annotate_variation.pl --filter --buildver $buildver -dbtype "${version}_ceu" annovarinput $humandb 2>&1
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
936
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
937 annovarout=annovarinput.${buildver}_CEU.sites.${fileID}_dropped
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
938 sed -i '1i\db\t'$g1000_colheader_CEU'\tchromosome\tstart\tend\treference\talleleSeq"'"$vcfheader"'"' $annovarout
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
939 joinresults originalfile $annovarout 3 4 5 6 7 B.$g1000_colheader_CEU
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
940 fi
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
941
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
942 # YRI
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
943 if [ $doYRI == "Y" ]
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
944 then
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
945 echo -e "\n1000Genomes YRI"
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
946 $scriptsdir/annotate_variation.pl --filter --buildver $buildver -dbtype "${version}_yri" annovarinput $humandb 2>&1
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
947
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
948 annovarout=annovarinput.${buildver}_YRI.sites.${fileID}_dropped
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
949 sed -i '1i\db\t'$g1000_colheader_YRI'\tchromosome\tstart\tend\treference\talleleSeq"'"$vcfheader"'"' $annovarout
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
950 joinresults originalfile $annovarout 3 4 5 6 7 B.$g1000_colheader_YRI
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
951
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
952
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
953 fi
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
954
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
955 #JPTCHB
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
956 if [ $doJPTCHB == "Y" ]
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
957 then
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
958 echo -e "\n1000Genomes JPTCHB"
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
959 $scriptsdir/annotate_variation.pl --filter --buildver $buildver -dbtype "${version}_jptchb" annovarinput $humandb 2>&1
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
960
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
961 annovarout=annovarinput.${buildver}_JPTCHB.sites.${fileID}_dropped
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
962 sed -i '1i\db\t'$g1000_colheader_JPTCHB'\tchromosome\tstart\tend\treference\talleleSeq"'"$vcfheader"'"' $annovarout
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
963 joinresults originalfile $annovarout 3 4 5 6 7 B.$g1000_colheader_JPTCHB
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
964 fi
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
965
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
966 done
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
967 fi
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
968
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
969
2
565c0e690238 Added support for LJB2, COSMIC67, CLINVAR and NCI60.
saskia-hiltemann
parents: 0
diff changeset
970
565c0e690238 Added support for LJB2, COSMIC67, CLINVAR and NCI60.
saskia-hiltemann
parents: 0
diff changeset
971
565c0e690238 Added support for LJB2, COSMIC67, CLINVAR and NCI60.
saskia-hiltemann
parents: 0
diff changeset
972 #### IMPACT SCORE ANNOTATIONS
565c0e690238 Added support for LJB2, COSMIC67, CLINVAR and NCI60.
saskia-hiltemann
parents: 0
diff changeset
973
565c0e690238 Added support for LJB2, COSMIC67, CLINVAR and NCI60.
saskia-hiltemann
parents: 0
diff changeset
974
565c0e690238 Added support for LJB2, COSMIC67, CLINVAR and NCI60.
saskia-hiltemann
parents: 0
diff changeset
975 if [ $ljb2_sift == "Y" ]
565c0e690238 Added support for LJB2, COSMIC67, CLINVAR and NCI60.
saskia-hiltemann
parents: 0
diff changeset
976 then
565c0e690238 Added support for LJB2, COSMIC67, CLINVAR and NCI60.
saskia-hiltemann
parents: 0
diff changeset
977 echo -e "\nLJB2 SIFT Annotation"
565c0e690238 Added support for LJB2, COSMIC67, CLINVAR and NCI60.
saskia-hiltemann
parents: 0
diff changeset
978 $scriptsdir/annotate_variation.pl --filter --buildver $buildver $otherinfo -dbtype ljb2_sift annovarinput $humandb 2>&1
565c0e690238 Added support for LJB2, COSMIC67, CLINVAR and NCI60.
saskia-hiltemann
parents: 0
diff changeset
979
565c0e690238 Added support for LJB2, COSMIC67, CLINVAR and NCI60.
saskia-hiltemann
parents: 0
diff changeset
980 annovarout=annovarinput.${buildver}_ljb2_sift_dropped
565c0e690238 Added support for LJB2, COSMIC67, CLINVAR and NCI60.
saskia-hiltemann
parents: 0
diff changeset
981 sed -i '1i\db\tLJB2_SIFT\tchromosome\tstart\tend\treference\talleleSeq"'"$vcfheader"'"' $annovarout
565c0e690238 Added support for LJB2, COSMIC67, CLINVAR and NCI60.
saskia-hiltemann
parents: 0
diff changeset
982 joinresults originalfile $annovarout 3 4 5 6 7 B.LJB2_SIFT
565c0e690238 Added support for LJB2, COSMIC67, CLINVAR and NCI60.
saskia-hiltemann
parents: 0
diff changeset
983 fi
565c0e690238 Added support for LJB2, COSMIC67, CLINVAR and NCI60.
saskia-hiltemann
parents: 0
diff changeset
984
565c0e690238 Added support for LJB2, COSMIC67, CLINVAR and NCI60.
saskia-hiltemann
parents: 0
diff changeset
985 if [ $ljb2_pp2hdiv == "Y" ]
565c0e690238 Added support for LJB2, COSMIC67, CLINVAR and NCI60.
saskia-hiltemann
parents: 0
diff changeset
986 then
565c0e690238 Added support for LJB2, COSMIC67, CLINVAR and NCI60.
saskia-hiltemann
parents: 0
diff changeset
987 echo -e "\nLJB2 pp2hdiv Annotation"
565c0e690238 Added support for LJB2, COSMIC67, CLINVAR and NCI60.
saskia-hiltemann
parents: 0
diff changeset
988 $scriptsdir/annotate_variation.pl --filter --buildver $buildver $otherinfo -dbtype ljb2_pp2hdiv annovarinput $humandb 2>&1
565c0e690238 Added support for LJB2, COSMIC67, CLINVAR and NCI60.
saskia-hiltemann
parents: 0
diff changeset
989
565c0e690238 Added support for LJB2, COSMIC67, CLINVAR and NCI60.
saskia-hiltemann
parents: 0
diff changeset
990 annovarout=annovarinput.${buildver}_ljb2_pp2hdiv_dropped
565c0e690238 Added support for LJB2, COSMIC67, CLINVAR and NCI60.
saskia-hiltemann
parents: 0
diff changeset
991 sed -i '1i\db\tLJB2_PolyPhen2_HDIV\tchromosome\tstart\tend\treference\talleleSeq"'"$vcfheader"'"' $annovarout
565c0e690238 Added support for LJB2, COSMIC67, CLINVAR and NCI60.
saskia-hiltemann
parents: 0
diff changeset
992 joinresults originalfile $annovarout 3 4 5 6 7 B.LJB2_PolyPhen2_HDIV
565c0e690238 Added support for LJB2, COSMIC67, CLINVAR and NCI60.
saskia-hiltemann
parents: 0
diff changeset
993 fi
565c0e690238 Added support for LJB2, COSMIC67, CLINVAR and NCI60.
saskia-hiltemann
parents: 0
diff changeset
994
565c0e690238 Added support for LJB2, COSMIC67, CLINVAR and NCI60.
saskia-hiltemann
parents: 0
diff changeset
995 if [ $ljb2_pp2hvar == "Y" ]
565c0e690238 Added support for LJB2, COSMIC67, CLINVAR and NCI60.
saskia-hiltemann
parents: 0
diff changeset
996 then
565c0e690238 Added support for LJB2, COSMIC67, CLINVAR and NCI60.
saskia-hiltemann
parents: 0
diff changeset
997 echo -e "\nLJB2 pp2hvar Annotation"
565c0e690238 Added support for LJB2, COSMIC67, CLINVAR and NCI60.
saskia-hiltemann
parents: 0
diff changeset
998 $scriptsdir/annotate_variation.pl --filter --buildver $buildver $otherinfo -dbtype ljb2_pp2hvar annovarinput $humandb 2>&1
565c0e690238 Added support for LJB2, COSMIC67, CLINVAR and NCI60.
saskia-hiltemann
parents: 0
diff changeset
999
565c0e690238 Added support for LJB2, COSMIC67, CLINVAR and NCI60.
saskia-hiltemann
parents: 0
diff changeset
1000 annovarout=annovarinput.${buildver}_ljb2_pp2hvar_dropped
5
4600be69b96f Added databases 1000g2015aug, SPIDEX, avsnp138, avsnp142, exac03
saskia-hiltemann
parents: 3
diff changeset
1001
4600be69b96f Added databases 1000g2015aug, SPIDEX, avsnp138, avsnp142, exac03
saskia-hiltemann
parents: 3
diff changeset
1002 head $annovarout
2
565c0e690238 Added support for LJB2, COSMIC67, CLINVAR and NCI60.
saskia-hiltemann
parents: 0
diff changeset
1003 sed -i '1i\db\tLJB2_PolyPhen2_HVAR\tchromosome\tstart\tend\treference\talleleSeq"'"$vcfheader"'"' $annovarout
565c0e690238 Added support for LJB2, COSMIC67, CLINVAR and NCI60.
saskia-hiltemann
parents: 0
diff changeset
1004 joinresults originalfile $annovarout 3 4 5 6 7 B.LJB2_PolyPhen2_HVAR
565c0e690238 Added support for LJB2, COSMIC67, CLINVAR and NCI60.
saskia-hiltemann
parents: 0
diff changeset
1005 fi
565c0e690238 Added support for LJB2, COSMIC67, CLINVAR and NCI60.
saskia-hiltemann
parents: 0
diff changeset
1006
565c0e690238 Added support for LJB2, COSMIC67, CLINVAR and NCI60.
saskia-hiltemann
parents: 0
diff changeset
1007 if [ $ljb2_lrt == "Y" ]
565c0e690238 Added support for LJB2, COSMIC67, CLINVAR and NCI60.
saskia-hiltemann
parents: 0
diff changeset
1008 then
565c0e690238 Added support for LJB2, COSMIC67, CLINVAR and NCI60.
saskia-hiltemann
parents: 0
diff changeset
1009 echo -e "\nLJB2 LRT Annotation"
565c0e690238 Added support for LJB2, COSMIC67, CLINVAR and NCI60.
saskia-hiltemann
parents: 0
diff changeset
1010 $scriptsdir/annotate_variation.pl --filter --buildver $buildver $otherinfo -dbtype ljb2_lrt annovarinput $humandb 2>&1
565c0e690238 Added support for LJB2, COSMIC67, CLINVAR and NCI60.
saskia-hiltemann
parents: 0
diff changeset
1011
565c0e690238 Added support for LJB2, COSMIC67, CLINVAR and NCI60.
saskia-hiltemann
parents: 0
diff changeset
1012 annovarout=annovarinput.${buildver}_ljb2_lrt_dropped
565c0e690238 Added support for LJB2, COSMIC67, CLINVAR and NCI60.
saskia-hiltemann
parents: 0
diff changeset
1013 sed -i '1i\db\tLJB2_LRT\tchromosome\tstart\tend\treference\talleleSeq"'"$vcfheader"'"' $annovarout
565c0e690238 Added support for LJB2, COSMIC67, CLINVAR and NCI60.
saskia-hiltemann
parents: 0
diff changeset
1014 joinresults originalfile $annovarout 3 4 5 6 7 B.LJB2_LRT
565c0e690238 Added support for LJB2, COSMIC67, CLINVAR and NCI60.
saskia-hiltemann
parents: 0
diff changeset
1015 fi
565c0e690238 Added support for LJB2, COSMIC67, CLINVAR and NCI60.
saskia-hiltemann
parents: 0
diff changeset
1016
565c0e690238 Added support for LJB2, COSMIC67, CLINVAR and NCI60.
saskia-hiltemann
parents: 0
diff changeset
1017 if [ $ljb2_mt == "Y" ]
565c0e690238 Added support for LJB2, COSMIC67, CLINVAR and NCI60.
saskia-hiltemann
parents: 0
diff changeset
1018 then
565c0e690238 Added support for LJB2, COSMIC67, CLINVAR and NCI60.
saskia-hiltemann
parents: 0
diff changeset
1019 echo -e "\nLJB2 mutationtaster Annotation"
565c0e690238 Added support for LJB2, COSMIC67, CLINVAR and NCI60.
saskia-hiltemann
parents: 0
diff changeset
1020 $scriptsdir/annotate_variation.pl --filter --buildver $buildver $otherinfo -dbtype ljb2_mt annovarinput $humandb 2>&1
565c0e690238 Added support for LJB2, COSMIC67, CLINVAR and NCI60.
saskia-hiltemann
parents: 0
diff changeset
1021
565c0e690238 Added support for LJB2, COSMIC67, CLINVAR and NCI60.
saskia-hiltemann
parents: 0
diff changeset
1022 annovarout=annovarinput.${buildver}_ljb2_mt_dropped
565c0e690238 Added support for LJB2, COSMIC67, CLINVAR and NCI60.
saskia-hiltemann
parents: 0
diff changeset
1023 sed -i '1i\db\tLJB2_MutationTaster\tchromosome\tstart\tend\treference\talleleSeq"'"$vcfheader"'"' $annovarout
565c0e690238 Added support for LJB2, COSMIC67, CLINVAR and NCI60.
saskia-hiltemann
parents: 0
diff changeset
1024 joinresults originalfile $annovarout 3 4 5 6 7 B.LJB2_MutationTaster
565c0e690238 Added support for LJB2, COSMIC67, CLINVAR and NCI60.
saskia-hiltemann
parents: 0
diff changeset
1025 fi
565c0e690238 Added support for LJB2, COSMIC67, CLINVAR and NCI60.
saskia-hiltemann
parents: 0
diff changeset
1026
565c0e690238 Added support for LJB2, COSMIC67, CLINVAR and NCI60.
saskia-hiltemann
parents: 0
diff changeset
1027 if [ $ljb2_ma == "Y" ]
565c0e690238 Added support for LJB2, COSMIC67, CLINVAR and NCI60.
saskia-hiltemann
parents: 0
diff changeset
1028 then
565c0e690238 Added support for LJB2, COSMIC67, CLINVAR and NCI60.
saskia-hiltemann
parents: 0
diff changeset
1029 echo -e "\nLJB2 mutationassessor Annotation"
565c0e690238 Added support for LJB2, COSMIC67, CLINVAR and NCI60.
saskia-hiltemann
parents: 0
diff changeset
1030 $scriptsdir/annotate_variation.pl --filter --buildver $buildver $otherinfo -dbtype ljb2_ma annovarinput $humandb 2>&1
565c0e690238 Added support for LJB2, COSMIC67, CLINVAR and NCI60.
saskia-hiltemann
parents: 0
diff changeset
1031
565c0e690238 Added support for LJB2, COSMIC67, CLINVAR and NCI60.
saskia-hiltemann
parents: 0
diff changeset
1032 annovarout=annovarinput.${buildver}_ljb2_ma_dropped
565c0e690238 Added support for LJB2, COSMIC67, CLINVAR and NCI60.
saskia-hiltemann
parents: 0
diff changeset
1033 sed -i '1i\db\tLJB2_MutationAssessor\tchromosome\tstart\tend\treference\talleleSeq"'"$vcfheader"'"' $annovarout
565c0e690238 Added support for LJB2, COSMIC67, CLINVAR and NCI60.
saskia-hiltemann
parents: 0
diff changeset
1034 joinresults originalfile $annovarout 3 4 5 6 7 B.LJB2_MutationAssessor
565c0e690238 Added support for LJB2, COSMIC67, CLINVAR and NCI60.
saskia-hiltemann
parents: 0
diff changeset
1035 fi
565c0e690238 Added support for LJB2, COSMIC67, CLINVAR and NCI60.
saskia-hiltemann
parents: 0
diff changeset
1036
565c0e690238 Added support for LJB2, COSMIC67, CLINVAR and NCI60.
saskia-hiltemann
parents: 0
diff changeset
1037 if [ $ljb2_fathmm == "Y" ]
565c0e690238 Added support for LJB2, COSMIC67, CLINVAR and NCI60.
saskia-hiltemann
parents: 0
diff changeset
1038 then
565c0e690238 Added support for LJB2, COSMIC67, CLINVAR and NCI60.
saskia-hiltemann
parents: 0
diff changeset
1039 echo -e "\nLJB2 FATHMM Annotation"
565c0e690238 Added support for LJB2, COSMIC67, CLINVAR and NCI60.
saskia-hiltemann
parents: 0
diff changeset
1040 $scriptsdir/annotate_variation.pl --filter --buildver $buildver $otherinfo -dbtype ljb2_fathmm annovarinput $humandb 2>&1
565c0e690238 Added support for LJB2, COSMIC67, CLINVAR and NCI60.
saskia-hiltemann
parents: 0
diff changeset
1041
565c0e690238 Added support for LJB2, COSMIC67, CLINVAR and NCI60.
saskia-hiltemann
parents: 0
diff changeset
1042 annovarout=annovarinput.${buildver}_ljb2_fathmm_dropped
565c0e690238 Added support for LJB2, COSMIC67, CLINVAR and NCI60.
saskia-hiltemann
parents: 0
diff changeset
1043 sed -i '1i\db\tLJB2_FATHMM\tchromosome\tstart\tend\treference\talleleSeq"'"$vcfheader"'"' $annovarout
565c0e690238 Added support for LJB2, COSMIC67, CLINVAR and NCI60.
saskia-hiltemann
parents: 0
diff changeset
1044 joinresults originalfile $annovarout 3 4 5 6 7 B.LJB2_FATHMM
565c0e690238 Added support for LJB2, COSMIC67, CLINVAR and NCI60.
saskia-hiltemann
parents: 0
diff changeset
1045 fi
565c0e690238 Added support for LJB2, COSMIC67, CLINVAR and NCI60.
saskia-hiltemann
parents: 0
diff changeset
1046
565c0e690238 Added support for LJB2, COSMIC67, CLINVAR and NCI60.
saskia-hiltemann
parents: 0
diff changeset
1047 if [ $ljb2_gerp == "Y" ]
565c0e690238 Added support for LJB2, COSMIC67, CLINVAR and NCI60.
saskia-hiltemann
parents: 0
diff changeset
1048 then
565c0e690238 Added support for LJB2, COSMIC67, CLINVAR and NCI60.
saskia-hiltemann
parents: 0
diff changeset
1049 echo -e "\nLJB2 GERP++ Annotation"
565c0e690238 Added support for LJB2, COSMIC67, CLINVAR and NCI60.
saskia-hiltemann
parents: 0
diff changeset
1050 $scriptsdir/annotate_variation.pl --filter --buildver $buildver $otherinfo -dbtype ljb2_gerp++ annovarinput $humandb 2>&1
565c0e690238 Added support for LJB2, COSMIC67, CLINVAR and NCI60.
saskia-hiltemann
parents: 0
diff changeset
1051
565c0e690238 Added support for LJB2, COSMIC67, CLINVAR and NCI60.
saskia-hiltemann
parents: 0
diff changeset
1052 annovarout=annovarinput.${buildver}_ljb2_gerp++_dropped
565c0e690238 Added support for LJB2, COSMIC67, CLINVAR and NCI60.
saskia-hiltemann
parents: 0
diff changeset
1053 sed -i '1i\db\tLJB2_GERP++\tchromosome\tstart\tend\treference\talleleSeq"'"$vcfheader"'"' $annovarout
565c0e690238 Added support for LJB2, COSMIC67, CLINVAR and NCI60.
saskia-hiltemann
parents: 0
diff changeset
1054 joinresults originalfile $annovarout 3 4 5 6 7 B.LJB2_GERP++
565c0e690238 Added support for LJB2, COSMIC67, CLINVAR and NCI60.
saskia-hiltemann
parents: 0
diff changeset
1055 fi
565c0e690238 Added support for LJB2, COSMIC67, CLINVAR and NCI60.
saskia-hiltemann
parents: 0
diff changeset
1056
565c0e690238 Added support for LJB2, COSMIC67, CLINVAR and NCI60.
saskia-hiltemann
parents: 0
diff changeset
1057 if [ $ljb2_phylop == "Y" ]
565c0e690238 Added support for LJB2, COSMIC67, CLINVAR and NCI60.
saskia-hiltemann
parents: 0
diff changeset
1058 then
565c0e690238 Added support for LJB2, COSMIC67, CLINVAR and NCI60.
saskia-hiltemann
parents: 0
diff changeset
1059 echo -e "\nLJB2 PhyloP Annotation"
565c0e690238 Added support for LJB2, COSMIC67, CLINVAR and NCI60.
saskia-hiltemann
parents: 0
diff changeset
1060 $scriptsdir/annotate_variation.pl --filter --buildver $buildver $otherinfo -dbtype ljb2_phylop annovarinput $humandb 2>&1
565c0e690238 Added support for LJB2, COSMIC67, CLINVAR and NCI60.
saskia-hiltemann
parents: 0
diff changeset
1061
565c0e690238 Added support for LJB2, COSMIC67, CLINVAR and NCI60.
saskia-hiltemann
parents: 0
diff changeset
1062 annovarout=annovarinput.${buildver}_ljb2_phylop_dropped
565c0e690238 Added support for LJB2, COSMIC67, CLINVAR and NCI60.
saskia-hiltemann
parents: 0
diff changeset
1063 sed -i '1i\db\tLJB2_PhyloP\tchromosome\tstart\tend\treference\talleleSeq"'"$vcfheader"'"' $annovarout
565c0e690238 Added support for LJB2, COSMIC67, CLINVAR and NCI60.
saskia-hiltemann
parents: 0
diff changeset
1064 joinresults originalfile $annovarout 3 4 5 6 7 B.LJB2_PhyloP
565c0e690238 Added support for LJB2, COSMIC67, CLINVAR and NCI60.
saskia-hiltemann
parents: 0
diff changeset
1065 fi
565c0e690238 Added support for LJB2, COSMIC67, CLINVAR and NCI60.
saskia-hiltemann
parents: 0
diff changeset
1066
565c0e690238 Added support for LJB2, COSMIC67, CLINVAR and NCI60.
saskia-hiltemann
parents: 0
diff changeset
1067 if [ $ljb2_siphy == "Y" ]
565c0e690238 Added support for LJB2, COSMIC67, CLINVAR and NCI60.
saskia-hiltemann
parents: 0
diff changeset
1068 then
565c0e690238 Added support for LJB2, COSMIC67, CLINVAR and NCI60.
saskia-hiltemann
parents: 0
diff changeset
1069 echo -e "\nLJB2 SiPhy Annotation"
565c0e690238 Added support for LJB2, COSMIC67, CLINVAR and NCI60.
saskia-hiltemann
parents: 0
diff changeset
1070 $scriptsdir/annotate_variation.pl --filter --buildver $buildver $otherinfo -dbtype ljb2_siphy annovarinput $humandb 2>&1
565c0e690238 Added support for LJB2, COSMIC67, CLINVAR and NCI60.
saskia-hiltemann
parents: 0
diff changeset
1071
565c0e690238 Added support for LJB2, COSMIC67, CLINVAR and NCI60.
saskia-hiltemann
parents: 0
diff changeset
1072 annovarout=annovarinput.${buildver}_ljb2_siphy_dropped
565c0e690238 Added support for LJB2, COSMIC67, CLINVAR and NCI60.
saskia-hiltemann
parents: 0
diff changeset
1073 sed -i '1i\db\tLJB2_SiPhy\tchromosome\tstart\tend\treference\talleleSeq"'"$vcfheader"'"' $annovarout
565c0e690238 Added support for LJB2, COSMIC67, CLINVAR and NCI60.
saskia-hiltemann
parents: 0
diff changeset
1074 joinresults originalfile $annovarout 3 4 5 6 7 B.LJB2_SiPhy
565c0e690238 Added support for LJB2, COSMIC67, CLINVAR and NCI60.
saskia-hiltemann
parents: 0
diff changeset
1075 fi
565c0e690238 Added support for LJB2, COSMIC67, CLINVAR and NCI60.
saskia-hiltemann
parents: 0
diff changeset
1076
565c0e690238 Added support for LJB2, COSMIC67, CLINVAR and NCI60.
saskia-hiltemann
parents: 0
diff changeset
1077
565c0e690238 Added support for LJB2, COSMIC67, CLINVAR and NCI60.
saskia-hiltemann
parents: 0
diff changeset
1078
565c0e690238 Added support for LJB2, COSMIC67, CLINVAR and NCI60.
saskia-hiltemann
parents: 0
diff changeset
1079 ### OLD IMPACT SCORE ANNOTATIONS
565c0e690238 Added support for LJB2, COSMIC67, CLINVAR and NCI60.
saskia-hiltemann
parents: 0
diff changeset
1080
0
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
1081 # SIFT
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
1082 if [ $avsift == "Y" ]
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
1083 then
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
1084 echo -e "\nSIFT Annotation"
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
1085 $scriptsdir/annotate_variation.pl --filter --buildver $buildver -dbtype avsift annovarinput $humandb 2>&1
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
1086
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
1087 annovarout=annovarinput.${buildver}_avsift_dropped
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
1088 sed -i '1i\db\tAVSIFT\tchromosome\tstart\tend\treference\talleleSeq"'"$vcfheader"'"' $annovarout
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
1089 joinresults originalfile $annovarout 3 4 5 6 7 B.AVSIFT
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
1090 fi
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
1091
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
1092 # "ljb" refers to the Liu, Jian and Boerwinkle paper in Human Mutation (PubMed ID 21520341). Cite this paper if you use these scores.
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
1093 # LJB SIFT
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
1094 if [ $ljbsift == "Y" ]
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
1095 then
2
565c0e690238 Added support for LJB2, COSMIC67, CLINVAR and NCI60.
saskia-hiltemann
parents: 0
diff changeset
1096 echo -e "\nLJB SIFT Annotation"
0
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
1097 $scriptsdir/annotate_variation.pl --filter --buildver $buildver -dbtype ljb_sift annovarinput $humandb 2>&1
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
1098
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
1099 annovarout=annovarinput.${buildver}_ljb_sift_dropped
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
1100 sed -i '1i\db\tLJB_SIFT\tchromosome\tstart\tend\treference\talleleSeq"'"$vcfheader"'"' $annovarout
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
1101 joinresults originalfile $annovarout 3 4 5 6 7 B.LJB_SIFT
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
1102 fi
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
1103
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
1104
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
1105 # PolyPhen2
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
1106 if [ $polyphen2 == "Y" ]
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
1107 then
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
1108 echo -e "\nPolyPhen Annotation"
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
1109 $scriptsdir/annotate_variation.pl --filter --buildver $buildver -dbtype ljb_pp2 annovarinput $humandb 2>&1
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
1110
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
1111 annovarout=annovarinput.${buildver}_ljb_pp2_dropped
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
1112 sed -i '1i\db\tPolyPhen2\tchromosome\tstart\tend\treference\talleleSeq"'"$vcfheader"'"' $annovarout
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
1113 joinresults originalfile $annovarout 3 4 5 6 7 B.PolyPhen2
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
1114 fi
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
1115
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
1116
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
1117 # MutationTaster
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
1118 if [ $mutationtaster == "Y" ]
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
1119 then
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
1120 echo -e "\nMutationTaster Annotation"
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
1121 $scriptsdir/annotate_variation.pl --filter --buildver $buildver -dbtype ljb_mt annovarinput $humandb 2>&1
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
1122
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
1123 annovarout=annovarinput.${buildver}_ljb_mt_dropped
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
1124 sed -i '1i\db\tMutationTaster\tchromosome\tstart\tend\treference\talleleSeq"'"$vcfheader"'"' $annovarout
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
1125 joinresults originalfile $annovarout 3 4 5 6 7 B.MutationTaster
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
1126 fi
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
1127
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
1128
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
1129 # LRT
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
1130 if [ $lrt == "Y" ]
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
1131 then
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
1132 echo -e "\nLRT Annotation"
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
1133 $scriptsdir/annotate_variation.pl --filter --buildver $buildver -dbtype ljb_lrt annovarinput $humandb 2>&1
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
1134
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
1135 annovarout=annovarinput.${buildver}_ljb_lrt_dropped
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
1136 sed -i '1i\db\tLikelihoodRatioTestScore\tchromosome\tstart\tend\treference\talleleSeq"'"$vcfheader"'"' $annovarout
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
1137 joinresults originalfile $annovarout 3 4 5 6 7 B.LikelihoodRatioTestScore
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
1138 fi
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
1139
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
1140 # PhyloP
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
1141 if [ $phylop == "Y" ]
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
1142 then
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
1143 echo -e "\nPhyloP Annotation"
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
1144 $scriptsdir/annotate_variation.pl --filter --buildver $buildver -dbtype ljb_phylop annovarinput $humandb 2>&1
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
1145
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
1146 annovarout=annovarinput.${buildver}_ljb_phylop_dropped
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
1147 sed -i '1i\db\tPhyloP\tchromosome\tstart\tend\treference\talleleSeq"'"$vcfheader"'"' $annovarout
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
1148 joinresults originalfile $annovarout 3 4 5 6 7 B.PhyloP
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
1149 fi
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
1150
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
1151
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
1152 ### ESP Exome Variant Server
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
1153 if [ $esp != "None" ]
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
1154 then
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
1155 echo -e "\nESP Annotation"
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
1156 for version in $espstr
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
1157 do
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
1158 echo "version: $version"
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
1159 # 6500si ALL
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
1160 if [ $version == "esp6500si_all" ]
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
1161 then
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
1162 $scriptsdir/annotate_variation.pl --filter --buildver $buildver -dbtype esp6500si_all annovarinput $humandb 2>&1
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
1163
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
1164 annovarout=annovarinput.${buildver}_esp6500si_all_dropped
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
1165 sed -i '1i\db\t'$esp6500si_colheader_ALL'\tchromosome\tstart\tend\treference\talleleSeq"'"$vcfheader"'"' $annovarout
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
1166 joinresults originalfile $annovarout 3 4 5 6 7 B.$esp6500si_colheader_ALL
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
1167 fi
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
1168
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
1169
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
1170 # 6500si European American
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
1171 if [ $version == "esp6500si_ea" ]
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
1172 then
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
1173 $scriptsdir/annotate_variation.pl --filter --buildver $buildver -dbtype esp6500si_ea annovarinput $humandb 2>&1
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
1174
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
1175 annovarout=annovarinput.${buildver}_esp6500si_ea_dropped
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
1176 sed -i '1i\db\t'$esp6500si_colheader_EA'\tchromosome\tstart\tend\treference\talleleSeq"'"$vcfheader"'" ' $annovarout
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
1177 joinresults originalfile $annovarout 3 4 5 6 7 B.$esp6500si_colheader_EA
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
1178 fi
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
1179
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
1180 # 6500si African American
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
1181 if [ $version == "esp6500si_aa" ]
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
1182 then
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
1183 $scriptsdir/annotate_variation.pl --filter --buildver $buildver -dbtype esp6500si_aa annovarinput $humandb 2>&1
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
1184
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
1185 annovarout=annovarinput.${buildver}_esp6500si_aa_dropped
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
1186 sed -i '1i\db\t'$esp6500si_colheader_AA'\tchromosome\tstart\tend\treference\talleleSeq"'"$vcfheader"'" ' $annovarout
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
1187 joinresults originalfile $annovarout 3 4 5 6 7 B.$esp6500si_colheader_AA
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
1188 fi
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
1189
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
1190
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
# ESP 6500 -- all populations (dbtype esp6500_all)
# Runs the ANNOVAR filter step for this database, prepends a header row to
# the resulting "dropped" file and hands it to joinresults (defined elsewhere
# in this script).
if [ $version == "esp6500_all" ]
then
	# NOTE: a leftover debugging `ls` used to run here and dumped the working
	# directory listing into the tool's output; it has been removed.
	$scriptsdir/annotate_variation.pl --filter --buildver $buildver -dbtype esp6500_all annovarinput $humandb 2>&1

	# File post-processed below (presumably written by the call above).
	annovarout=annovarinput.${buildver}_esp6500_all_dropped

	# Insert the header as line 1; columns 3-7 of it (chromosome .. alleleSeq)
	# are the ones passed to joinresults.
	sed -i '1i\db\t'$esp6500_colheader_ALL'\tchromosome\tstart\tend\treference\talleleSeq"'"$vcfheader"'" ' $annovarout
	joinresults originalfile $annovarout 3 4 5 6 7 B.$esp6500_colheader_ALL
fi
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
1201
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
1202
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
# ESP 6500 -- European American subset (dbtype esp6500_ea)
if [ $version == "esp6500_ea" ]; then
	# Filter-annotate annovarinput against the esp6500_ea table;
	# stderr is folded into stdout.
	${scriptsdir}/annotate_variation.pl \
		--filter \
		--buildver ${buildver} \
		-dbtype esp6500_ea \
		annovarinput ${humandb} 2>&1

	# File post-processed below (presumably written by the call above).
	annovarout=annovarinput.${buildver}_esp6500_ea_dropped

	# Insert a header row as line 1, then pass the file to joinresults
	# (defined elsewhere in this script) with columns 3-7 of that header
	# (chromosome .. alleleSeq) and the annotation column to carry over.
	sed -i '1i\db\t'${esp6500_colheader_EA}'\tchromosome\tstart\tend\treference\talleleSeq"'"$vcfheader"'"' ${annovarout}
	joinresults originalfile ${annovarout} 3 4 5 6 7 B.${esp6500_colheader_EA}
fi
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
1211
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
# ESP 6500 -- African American subset (dbtype esp6500_aa)
if [ $version == "esp6500_aa" ]; then
	# Filter-annotate annovarinput against the esp6500_aa table;
	# stderr is folded into stdout.
	${scriptsdir}/annotate_variation.pl \
		--filter \
		--buildver ${buildver} \
		-dbtype esp6500_aa \
		annovarinput ${humandb} 2>&1

	# File post-processed below (presumably written by the call above).
	annovarout=annovarinput.${buildver}_esp6500_aa_dropped

	# Insert a header row as line 1, then pass the file to joinresults
	# (defined elsewhere in this script) with columns 3-7 of that header
	# (chromosome .. alleleSeq) and the annotation column to carry over.
	sed -i '1i\db\t'${esp6500_colheader_AA}'\tchromosome\tstart\tend\treference\talleleSeq"'"$vcfheader"'"' ${annovarout}
	joinresults originalfile ${annovarout} 3 4 5 6 7 B.${esp6500_colheader_AA}
fi
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
1221
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
1222
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
# ESP 5400 -- all populations (dbtype esp5400_all)
if [ $version == "esp5400_all" ]; then
	# Filter-annotate annovarinput against the esp5400_all table;
	# stderr is folded into stdout.
	${scriptsdir}/annotate_variation.pl \
		--filter \
		--buildver ${buildver} \
		-dbtype esp5400_all \
		annovarinput ${humandb} 2>&1

	# File post-processed below (presumably written by the call above).
	annovarout=annovarinput.${buildver}_esp5400_all_dropped

	# Insert a header row as line 1, then pass the file to joinresults
	# (defined elsewhere in this script) with columns 3-7 of that header
	# (chromosome .. alleleSeq) and the annotation column to carry over.
	sed -i '1i\db\t'${esp5400_colheader_ALL}'\tchromosome\tstart\tend\treference\talleleSeq"'"$vcfheader"'"' ${annovarout}
	joinresults originalfile ${annovarout} 3 4 5 6 7 B.${esp5400_colheader_ALL}
fi
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
1232
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
1233
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
# ESP 5400 -- European American subset (dbtype esp5400_ea)
if [ $version == "esp5400_ea" ]; then
	# Filter-annotate annovarinput against the esp5400_ea table;
	# stderr is folded into stdout.
	${scriptsdir}/annotate_variation.pl \
		--filter \
		--buildver ${buildver} \
		-dbtype esp5400_ea \
		annovarinput ${humandb} 2>&1

	# File post-processed below (presumably written by the call above).
	annovarout=annovarinput.${buildver}_esp5400_ea_dropped

	# Insert a header row as line 1, then pass the file to joinresults
	# (defined elsewhere in this script) with columns 3-7 of that header
	# (chromosome .. alleleSeq) and the annotation column to carry over.
	sed -i '1i\db\t'${esp5400_colheader_EA}'\tchromosome\tstart\tend\treference\talleleSeq"'"$vcfheader"'"' ${annovarout}
	joinresults originalfile ${annovarout} 3 4 5 6 7 B.${esp5400_colheader_EA}
fi
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
1243
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
# ESP 5400 -- African American subset (dbtype esp5400_aa)
if [ $version == "esp5400_aa" ]; then
	# Filter-annotate annovarinput against the esp5400_aa table;
	# stderr is folded into stdout.
	${scriptsdir}/annotate_variation.pl \
		--filter \
		--buildver ${buildver} \
		-dbtype esp5400_aa \
		annovarinput ${humandb} 2>&1

	# File post-processed below (presumably written by the call above).
	annovarout=annovarinput.${buildver}_esp5400_aa_dropped

	# Insert a header row as line 1, then pass the file to joinresults
	# (defined elsewhere in this script) with columns 3-7 of that header
	# (chromosome .. alleleSeq) and the annotation column to carry over.
	sed -i '1i\db\t'${esp5400_colheader_AA}'\tchromosome\tstart\tend\treference\talleleSeq"'"$vcfheader"'"' ${annovarout}
	joinresults originalfile ${annovarout} 3 4 5 6 7 B.${esp5400_colheader_AA}
fi
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
1253
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
1254 done
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
1255 fi
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
1256
5
4600be69b96f Added databases 1000g2015aug, SPIDEX, avsnp138, avsnp142, exac03
saskia-hiltemann
parents: 3
diff changeset
1257
4600be69b96f Added databases 1000g2015aug, SPIDEX, avsnp138, avsnp142, exac03
saskia-hiltemann
parents: 3
diff changeset
# ExAC-03 database
# Runs the ANNOVAR filter step against dbtype exac03, splits the
# comma-separated value in column 2 into one column per population, prepends
# a header row and hands the result to joinresults (defined elsewhere in this
# script).
# [[ ]] is used so an unset/empty $exac03 simply skips the block instead of
# making `[` print a "unary operator expected" error.
if [[ $exac03 == "Y" ]]
then
	echo -e "\nExAC03 Annotation"
	# --otherinfo was previously passed twice (-otherinfo and --otherinfo);
	# once is enough.
	$scriptsdir/annotate_variation.pl --filter --otherinfo --buildver $buildver -dbtype exac03 annovarinput $humandb 2>&1

	# The split table must go to its own file. Previously annovarout was never
	# assigned in this block, so the awk output was redirected to whatever
	# file an earlier database step had left in $annovarout (or the redirect
	# failed outright when it was unset). It cannot be the *_dropped file
	# itself either, because awk reads that file while the shell truncates
	# the redirect target.
	annovarout="annovarinput.${buildver}_exac03_dropped.split"

	# split allele frequency column (column 2) into several columns, one per population
	awk 'BEGIN{
		FS="\t"
		OFS="\t"
	}{
		gsub(",","\t",$2)
		print $0
	}' "annovarinput.${buildver}_exac03_dropped" > "$annovarout"

	# Header: db, eight ExAC columns, then chromosome..alleleSeq, which are
	# therefore columns 10-14 -- the ones passed to joinresults.
	sed -i '1i\db\tExAC_Freq\tExAC_AFR\tExAC_AMR\tExAC_EAS\tExAC_FIN\tExAC_NFE\tExAC_OTH\tExAC_SAS\tchromosome\tstart\tend\treference\talleleSeq"'"$vcfheader"'"' "$annovarout"
	joinresults originalfile "$annovarout" 10 11 12 13 14 B.ExAC_Freq,B.ExAC_AFR,B.ExAC_AMR,B.ExAC_EAS,B.ExAC_FIN,B.ExAC_NFE,B.ExAC_OTH,B.ExAC_SAS
fi
0
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
1277
5
4600be69b96f Added databases 1000g2015aug, SPIDEX, avsnp138, avsnp142, exac03
saskia-hiltemann
parents: 3
diff changeset
# GoNL database (only run for build hg19)
# Runs the ANNOVAR filter step with a generic database file
# (${buildver}_gonl.txt), prepends a header row to the resulting "dropped"
# file and hands it to joinresults (defined elsewhere in this script).
# The two nested, unquoted `[ ]` tests were merged into a single [[ ]] test,
# matching the style of the COSMIC/CLINVAR blocks in this script; an
# unset/empty flag now just skips the block.
if [[ $gonl == "Y" && $buildver == "hg19" ]]
then
	echo -e "\nGoNL Annotation"
	$scriptsdir/annotate_variation.pl --filter --buildver $buildver --otherinfo -dbtype generic -genericdbfile ${buildver}_gonl.txt annovarinput $humandb 2>&1

	# NOTE: leftover debugging commands (`ls` and `head $annovarout`) used to
	# run here and dumped a directory listing and raw table rows into the
	# tool's output; they have been removed.
	annovarout=annovarinput.${buildver}_generic_dropped

	# Insert the header as line 1; columns 3-7 of it (chromosome .. alleleSeq)
	# are the ones passed to joinresults.
	sed -i '1i\db\tGoNL\tchromosome\tstart\tend\treference\talleleSeq"'"$vcfheader"'"' $annovarout
	joinresults originalfile $annovarout 3 4 5 6 7 B.GoNL
fi
4600be69b96f Added databases 1000g2015aug, SPIDEX, avsnp138, avsnp142, exac03
saskia-hiltemann
parents: 3
diff changeset
1298
4600be69b96f Added databases 1000g2015aug, SPIDEX, avsnp138, avsnp142, exac03
saskia-hiltemann
parents: 3
diff changeset
# SPIDEX database (only run for build hg19)
# Runs the ANNOVAR filter step against dbtype spidex, splits the
# comma-separated value in column 2 into two columns, prepends a header row
# and hands the result to joinresults (defined elsewhere in this script).
# The two nested, unquoted `[ ]` tests were merged into a single [[ ]] test,
# matching the style of the COSMIC/CLINVAR blocks in this script.
if [[ $spidex == "Y" && $buildver == "hg19" ]]
then
	echo -e "\nSPIDEX Annotation"
	$scriptsdir/annotate_variation.pl --filter --buildver $buildver --otherinfo -dbtype spidex annovarinput $humandb 2>&1

	# The split table must go to its own file. Previously annovarout was never
	# assigned in this block, so the awk output was redirected to whatever
	# file an earlier database step had left in $annovarout (or the redirect
	# failed outright when it was unset). It cannot be the *_dropped file
	# itself either, because awk reads that file while the shell truncates
	# the redirect target.
	annovarout="annovarinput.${buildver}_spidex_dropped.split"

	# split the comma-separated SPIDEX value (column 2) into separate columns
	# (named SPIDEX_dpsi_max_tissue and SPIDEX_dpsi_zscore by the header below)
	awk 'BEGIN{
		FS="\t"
		OFS="\t"
	}{
		gsub(",","\t",$2)
		print $0
	}' "annovarinput.${buildver}_spidex_dropped" > "$annovarout"

	# Header: db, two SPIDEX columns, then chromosome..alleleSeq, which are
	# therefore columns 4-8 -- the ones passed to joinresults.
	sed -i '1i\db\tSPIDEX_dpsi_max_tissue\tSPIDEX_dpsi_zscore\tchromosome\tstart\tend\treference\talleleSeq"'"$vcfheader"'"' "$annovarout"
	joinresults originalfile "$annovarout" 4 5 6 7 8 B.SPIDEX_dpsi_max_tissue,B.SPIDEX_dpsi_zscore
fi
4600be69b96f Added databases 1000g2015aug, SPIDEX, avsnp138, avsnp142, exac03
saskia-hiltemann
parents: 3
diff changeset
1325
4600be69b96f Added databases 1000g2015aug, SPIDEX, avsnp138, avsnp142, exac03
saskia-hiltemann
parents: 3
diff changeset
1326
0
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
# GERP++ annotation (dbtype gerp++gt2)
if [ $gerp == "Y" ]; then
	echo -e "\nGERP++ Annotation"

	# Filter-annotate annovarinput; stderr is folded into stdout.
	${scriptsdir}/annotate_variation.pl \
		--filter \
		--buildver ${buildver} \
		-dbtype gerp++gt2 \
		annovarinput ${humandb} 2>&1

	# File post-processed below (presumably written by the call above).
	annovarout="annovarinput.${buildver}_gerp++gt2_dropped"

	# Insert a header row as line 1, then pass the file to joinresults
	# (defined elsewhere in this script) with columns 3-7 of that header
	# (chromosome .. alleleSeq) and the GERP++ column to carry over.
	sed -i '1i\db\tGERP++\tchromosome\tstart\tend\treference\talleleSeq"'"$vcfheader"'"' ${annovarout}
	joinresults originalfile ${annovarout} 3 4 5 6 7 B.GERP++
fi
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
1337
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
1338
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
# COSMIC
# Version 61 -- only run when requested and the build is hg19.
if [[ ${buildver} == "hg19" && ${cosmic61} == "Y" ]]; then
	echo -e "\nCOSMIC61 Annotation"

	# Filter-annotate annovarinput; stderr is folded into stdout.
	${scriptsdir}/annotate_variation.pl \
		--filter \
		--buildver ${buildver} \
		-dbtype cosmic61 \
		annovarinput ${humandb} 2>&1

	# File post-processed below (presumably written by the call above).
	annovarout="annovarinput.${buildver}_cosmic61_dropped"

	# Insert a header row as line 1, then pass the file to joinresults
	# (defined elsewhere in this script) with columns 3-7 of that header
	# (chromosome .. alleleSeq) and the COSMIC61 column to carry over.
	sed -i '1i\db\tCOSMIC61\tchromosome\tstart\tend\treference\talleleSeq"'"$vcfheader"'"' ${annovarout}
	joinresults originalfile ${annovarout} 3 4 5 6 7 B.COSMIC61
fi
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
1350
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
# COSMIC version 63 -- only run when requested and the build is hg19.
if [[ ${buildver} == "hg19" && ${cosmic63} == "Y" ]]; then
	echo -e "\nCOSMIC63 Annotation"

	# Filter-annotate annovarinput; stderr is folded into stdout.
	${scriptsdir}/annotate_variation.pl \
		--filter \
		--buildver ${buildver} \
		-dbtype cosmic63 \
		annovarinput ${humandb} 2>&1

	# File post-processed below (presumably written by the call above).
	annovarout="annovarinput.${buildver}_cosmic63_dropped"

	# Insert a header row as line 1, then pass the file to joinresults
	# (defined elsewhere in this script) with columns 3-7 of that header
	# (chromosome .. alleleSeq) and the COSMIC63 column to carry over.
	sed -i '1i\db\tCOSMIC63\tchromosome\tstart\tend\treference\talleleSeq"'"$vcfheader"'"' ${annovarout}
	joinresults originalfile ${annovarout} 3 4 5 6 7 B.COSMIC63
fi
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
1361
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
# COSMIC version 64 -- only run when requested and the build is hg19.
if [[ ${buildver} == "hg19" && ${cosmic64} == "Y" ]]; then
	echo -e "\nCOSMIC64 Annotation"

	# Filter-annotate annovarinput; stderr is folded into stdout.
	${scriptsdir}/annotate_variation.pl \
		--filter \
		--buildver ${buildver} \
		-dbtype cosmic64 \
		annovarinput ${humandb} 2>&1

	# File post-processed below (presumably written by the call above).
	annovarout="annovarinput.${buildver}_cosmic64_dropped"

	# Insert a header row as line 1, then pass the file to joinresults
	# (defined elsewhere in this script) with columns 3-7 of that header
	# (chromosome .. alleleSeq) and the COSMIC64 column to carry over.
	sed -i '1i\db\tCOSMIC64\tchromosome\tstart\tend\treference\talleleSeq"'"$vcfheader"'"' ${annovarout}
	joinresults originalfile ${annovarout} 3 4 5 6 7 B.COSMIC64
fi
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
1372
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
# COSMIC version 65 -- only run when requested and the build is hg19.
if [[ ${buildver} == "hg19" && ${cosmic65} == "Y" ]]; then
	echo -e "\nCOSMIC65 Annotation"

	# Filter-annotate annovarinput; stderr is folded into stdout.
	${scriptsdir}/annotate_variation.pl \
		--filter \
		--buildver ${buildver} \
		-dbtype cosmic65 \
		annovarinput ${humandb} 2>&1

	# File post-processed below (presumably written by the call above).
	annovarout="annovarinput.${buildver}_cosmic65_dropped"

	# Insert a header row as line 1, then pass the file to joinresults
	# (defined elsewhere in this script) with columns 3-7 of that header
	# (chromosome .. alleleSeq) and the COSMIC65 column to carry over.
	sed -i '1i\db\tCOSMIC65\tchromosome\tstart\tend\treference\talleleSeq"'"$vcfheader"'"' ${annovarout}
	joinresults originalfile ${annovarout} 3 4 5 6 7 B.COSMIC65
fi
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
1383
2
565c0e690238 Added support for LJB2, COSMIC67, CLINVAR and NCI60.
saskia-hiltemann
parents: 0
diff changeset
# COSMIC version 67 -- only run when requested and the build is hg19.
if [[ ${buildver} == "hg19" && ${cosmic67} == "Y" ]]; then
	echo -e "\nCOSMIC67 Annotation"

	# Filter-annotate annovarinput; stderr is folded into stdout.
	${scriptsdir}/annotate_variation.pl \
		--filter \
		--buildver ${buildver} \
		-dbtype cosmic67 \
		annovarinput ${humandb} 2>&1

	# File post-processed below (presumably written by the call above).
	annovarout="annovarinput.${buildver}_cosmic67_dropped"

	# Insert a header row as line 1, then pass the file to joinresults
	# (defined elsewhere in this script) with columns 3-7 of that header
	# (chromosome .. alleleSeq) and the COSMIC67 column to carry over.
	sed -i '1i\db\tCOSMIC67\tchromosome\tstart\tend\treference\talleleSeq"'"$vcfheader"'"' ${annovarout}
	joinresults originalfile ${annovarout} 3 4 5 6 7 B.COSMIC67
fi
565c0e690238 Added support for LJB2, COSMIC67, CLINVAR and NCI60.
saskia-hiltemann
parents: 0
diff changeset
1394
3
ff5325029a8e Uploaded
saskia-hiltemann
parents: 2
diff changeset
# COSMIC version 68 -- only run when requested and the build is hg19.
if [[ ${buildver} == "hg19" && ${cosmic68} == "Y" ]]; then
	echo -e "\nCOSMIC68 Annotation"

	# Filter-annotate annovarinput; stderr is folded into stdout.
	${scriptsdir}/annotate_variation.pl \
		--filter \
		--buildver ${buildver} \
		-dbtype cosmic68 \
		annovarinput ${humandb} 2>&1

	# File post-processed below (presumably written by the call above).
	annovarout="annovarinput.${buildver}_cosmic68_dropped"

	# Insert a header row as line 1, then pass the file to joinresults
	# (defined elsewhere in this script) with columns 3-7 of that header
	# (chromosome .. alleleSeq) and the COSMIC68 column to carry over.
	sed -i '1i\db\tCOSMIC68\tchromosome\tstart\tend\treference\talleleSeq"'"$vcfheader"'"' ${annovarout}
	joinresults originalfile ${annovarout} 3 4 5 6 7 B.COSMIC68
fi
ff5325029a8e Uploaded
saskia-hiltemann
parents: 2
diff changeset
1405
5
4600be69b96f Added databases 1000g2015aug, SPIDEX, avsnp138, avsnp142, exac03
saskia-hiltemann
parents: 3
diff changeset
# COSMIC version 70 -- only run when requested and the build is hg19.
if [[ ${buildver} == "hg19" && ${cosmic70} == "Y" ]]; then
	echo -e "\nCOSMIC70 Annotation"

	# Filter-annotate annovarinput; stderr is folded into stdout.
	${scriptsdir}/annotate_variation.pl \
		--filter \
		--buildver ${buildver} \
		-dbtype cosmic70 \
		annovarinput ${humandb} 2>&1

	# File post-processed below (presumably written by the call above).
	annovarout="annovarinput.${buildver}_cosmic70_dropped"

	# Insert a header row as line 1, then pass the file to joinresults
	# (defined elsewhere in this script) with columns 3-7 of that header
	# (chromosome .. alleleSeq) and the COSMIC70 column to carry over.
	sed -i '1i\db\tCOSMIC70\tchromosome\tstart\tend\treference\talleleSeq"'"$vcfheader"'"' ${annovarout}
	joinresults originalfile ${annovarout} 3 4 5 6 7 B.COSMIC70
fi
3
ff5325029a8e Uploaded
saskia-hiltemann
parents: 2
diff changeset
1416
2
565c0e690238 Added support for LJB2, COSMIC67, CLINVAR and NCI60.
saskia-hiltemann
parents: 0
diff changeset
# CLINVAR (dbtype clinvar_20140211) -- only run when requested and the build is hg19.
if [[ ${buildver} == "hg19" && ${clinvar} == "Y" ]]; then
	echo -e "\nCLINVAR Annotation"

	# Filter-annotate annovarinput; stderr is folded into stdout.
	${scriptsdir}/annotate_variation.pl \
		--filter \
		--buildver ${buildver} \
		-dbtype clinvar_20140211 \
		annovarinput ${humandb} 2>&1

	# File post-processed below (presumably written by the call above).
	annovarout="annovarinput.${buildver}_clinvar_20140211_dropped"

	# Insert a header row as line 1, then pass the file to joinresults
	# (defined elsewhere in this script) with columns 3-7 of that header
	# (chromosome .. alleleSeq) and the CLINVAR column to carry over.
	sed -i '1i\db\tCLINVAR\tchromosome\tstart\tend\treference\talleleSeq"'"$vcfheader"'"' ${annovarout}
	joinresults originalfile ${annovarout} 3 4 5 6 7 B.CLINVAR
fi
565c0e690238 Added support for LJB2, COSMIC67, CLINVAR and NCI60.
saskia-hiltemann
parents: 0
diff changeset
1427
565c0e690238 Added support for LJB2, COSMIC67, CLINVAR and NCI60.
saskia-hiltemann
parents: 0
diff changeset
# NCI60 (dbtype nci60) -- only run when requested and the build is hg19.
if [[ ${buildver} == "hg19" && ${nci60} == "Y" ]]; then
	echo -e "\nNCI60 Annotation"

	# Filter-annotate annovarinput; stderr is folded into stdout.
	${scriptsdir}/annotate_variation.pl \
		--filter \
		--buildver ${buildver} \
		-dbtype nci60 \
		annovarinput ${humandb} 2>&1

	# File post-processed below (presumably written by the call above).
	annovarout="annovarinput.${buildver}_nci60_dropped"

	# Insert a header row as line 1, then pass the file to joinresults
	# (defined elsewhere in this script) with columns 3-7 of that header
	# (chromosome .. alleleSeq) and the NCI60 column to carry over.
	sed -i '1i\db\tNCI60\tchromosome\tstart\tend\treference\talleleSeq"'"$vcfheader"'"' ${annovarout}
	joinresults originalfile ${annovarout} 3 4 5 6 7 B.NCI60
fi
565c0e690238 Added support for LJB2, COSMIC67, CLINVAR and NCI60.
saskia-hiltemann
parents: 0
diff changeset
1438
0
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
# cg46 (dbtype cg46)
if [[ ${cg46} == "Y" ]]; then
	echo -e "\nCG 46 genomes Annotation"

	# Filter-annotate annovarinput; stderr is folded into stdout.
	${scriptsdir}/annotate_variation.pl \
		--filter \
		--buildver ${buildver} \
		-dbtype cg46 \
		annovarinput ${humandb} 2>&1

	# File post-processed below (presumably written by the call above).
	annovarout="annovarinput.${buildver}_cg46_dropped"

	# Insert a header row as line 1, then pass the file to joinresults
	# (defined elsewhere in this script) with columns 3-7 of that header
	# (chromosome .. alleleSeq) and the annotation column to carry over.
	sed -i '1i\db\t'${cg46_colheader}'\tchromosome\tstart\tend\treference\talleleSeq"'"$vcfheader"'"' ${annovarout}
	joinresults originalfile ${annovarout} 3 4 5 6 7 B.${cg46_colheader}
fi
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
1450
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
1451
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
#cg69
# Complete Genomics 69 genomes annotation, run when $cg69 == "Y".
# ANNOVAR is run in --filter mode against the cg69 database; the script then
# post-processes "annovarinput.<buildver>_cg69_dropped", the file the filter
# run is expected to leave behind.
if [[ $cg69 == "Y" ]]
then
    echo -e "\nCG 69 genomes Annotation"
    # Expansions are quoted so paths with spaces or glob characters stay intact.
    "$scriptsdir/annotate_variation.pl" --filter --buildver "$buildver" -dbtype cg69 annovarinput "$humandb" 2>&1

    annovarout="annovarinput.${buildver}_cg69_dropped"
    # Insert a header row before line 1. ${cg69_colheader} is now quoted so a
    # column name containing whitespace cannot split the sed script into
    # several arguments.
    # NOTE(review): the literal double quotes around $vcfheader end up in the
    # header text itself; kept as in the original -- confirm this is intended.
    sed -i '1i\db\t'"${cg69_colheader}"'\tchromosome\tstart\tend\treference\talleleSeq"'"$vcfheader"'"' "$annovarout"
    # joinresults is defined elsewhere in this script; presumably 3-7 are the
    # key columns and B.<colheader> the column to append -- confirm.
    joinresults originalfile "$annovarout" 3 4 5 6 7 "B.${cg69_colheader}"

fi
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
1463
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
1464
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
1465
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
#########################
# Rewrite a tab-separated variant table with adjusted coordinates.
#   $1 - input file  (first line is a header and is copied unchanged)
#   $2 - output file
# Reads the globals chrcol, startcol, refcol, obscol and vartypecol, which are
# used as awk field numbers. For every non-header row:
#   - "chr" is prepended to the chromosome field
#   - snp / sub : start is decremented by 1
#   - ins       : the reference field is blanked
#   - del       : start is decremented by 1 and the observed field is blanked
# The column numbers are handed to awk with -v rather than being spliced into
# the program text, so the awk source is a plain single-quoted string.
#########################
function restore_variant_coords(){
    awk -v chrcol="$chrcol" \
        -v startcol="$startcol" \
        -v refcol="$refcol" \
        -v obscol="$obscol" \
        -v vartypecol="$vartypecol" '
    BEGIN{
        FS="\t";
        OFS="\t";
    }
    FNR==1 {
        print $0
        next
    }
    {
        $chrcol = "chr" $chrcol
        if( $vartypecol == "snp" ){ $startcol -= 1 };
        if( $vartypecol == "ins" ){ $refcol = "" };
        if( $vartypecol == "del" ){ $startcol -= 1; $obscol = "" };
        if( $vartypecol == "sub" ){ $startcol -= 1 };
        print $0
    }' "$1" > "$2"
}

# Produce originalfile_coords from originalfile: converted when
# $convertcoords == "Y", otherwise simply renamed.
# [[ ]] is used (as elsewhere in this script) so an empty or unset
# $convertcoords falls through to the else branch instead of raising
# "unary operator expected".
if [[ $convertcoords == "Y" ]]
then
    echo "converting back coordinates"
    restore_variant_coords originalfile originalfile_coords
else
    mv originalfile originalfile_coords
fi
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
1490
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
#restore "chr" prefix?

#move to outputfile
# If ANNOVAR's invalid-input report is missing or empty (-s is false), write a
# placeholder message so the "invalid lines" output is never empty.
if [[ ! -s annovarinput.invalid_input ]]
then
    echo "Congrats, your input file contained no invalid lines!" > annovarinput.invalid_input
fi

# Copy the results to the caller-supplied output paths. The destinations are
# quoted so paths containing spaces or glob characters are treated as one
# argument each.
cp originalfile_coords "$outfile_all"
cp annovarinput.invalid_input "$outfile_invalid" 2>&1

# Collapse any doubled "chrchr" prefix back to a single "chr" in both outputs.
sed -i 's/chrchr/chr/g' "$outfile_all"
sed -i 's/chrchr/chr/g' "$outfile_invalid"
4600be69b96f Added databases 1000g2015aug, SPIDEX, avsnp138, avsnp142, exac03
saskia-hiltemann
parents: 3
diff changeset
1504
0
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
1505 fi #if $dorunannovar
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
1506
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
1507
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
1508
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
1509
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
1510
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
1511
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
1512
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
1513
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
1514
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
1515
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
1516
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
1517
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
1518
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
1519
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
1520
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
1521
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
1522
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
1523
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
1524
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
1525
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
1526
d3a72e55deca Uploaded
saskia-hiltemann
parents:
diff changeset
1527
2
565c0e690238 Added support for LJB2, COSMIC67, CLINVAR and NCI60.
saskia-hiltemann
parents: 0
diff changeset
1528