comparison report_clonality/r_wrapper.sh @ 5:bcec7bb4e089 draft

Uploaded
author davidvanzessen
date Mon, 12 Dec 2016 05:22:57 -0500
parents
children 8cbc1a8d27ae
comparison
equal deleted inserted replaced
4:5ffd52fc35c4 5:bcec7bb4e089
1 #!/bin/bash
2
3 inputFile=$1
4 outputDir=$3
5 outputFile=$3/index.html #$2
6 clonalType=$4
7 species=$5
8 locus=$6
9 filterproductive=$7
10 clonality_method=$8
11
12 dir="$(cd "$(dirname "$0")" && pwd)"
13 useD="false"
14 if grep -q "$species.*${locus}D" "$dir/genes.txt" ; then
15 echo "species D region in reference db"
16 useD="true"
17 fi
18 echo "$species"
19 if [[ "$species" == *"custom"* ]] ; then
20 loci=(${locus//;/ })
21 useD="true"
22 echo "${loci[@]}"
23 if [[ "${#loci[@]}" -eq "2" ]] ; then
24 useD="false"
25 fi
26 fi
27 mkdir $3
28 cp $dir/genes.txt $outputDir
29 Rscript --verbose $dir/RScript.r $inputFile $outputDir $outputDir $clonalType "$species" "$locus" $filterproductive ${clonality_method} 2>&1
30 cp $dir/tabber.js $outputDir
31 cp $dir/style.css $outputDir
32 cp $dir/script.js $outputDir
33 cp $dir/jquery-1.11.0.min.js $outputDir
34 cp $dir/pure-min.css $outputDir
35 samples=`cat $outputDir/samples.txt`
36
37 echo "<html><center><h1><a href='index.html'>Click here for the results</a></h1>Tip: Open it in a new tab (middle mouse button or right mouse button -> 'open in new tab' on the link above)<br />" > $2
38 echo "<table border = 1>" >> $2
39 echo "<thead><tr><th>Sample/Replicate</th><th>All</th><th>Productive</th><th>Unique Productive</th><th>Unproductive</th><th>Unique Unproductive</th></tr></thead>" >> $2
40 while IFS=, read sample all productive perc_prod productive_unique perc_prod_un unproductive perc_unprod unproductive_unique perc_unprod_un
41 do
42 echo "<tr><td>$sample</td>" >> $2
43 echo "<td>$all</td>" >> $2
44 echo "<td>$productive (${perc_prod}%)</td>" >> $2
45 echo "<td>$productive_unique (${perc_prod_un}%)</td>" >> $2
46 echo "<td>$unproductive (${perc_unprod}%)</td>" >> $2
47 echo "<td>$unproductive_unique (${perc_unprod_un}%)</td></tr>" >> $2
48 done < $outputDir/productive_counting.txt
49 echo "</table border></center></html>" >> $2
50
51 echo "<html><head><title>Report on:" >> $outputFile
52
53 mkdir $outputDir/circos
54 cp $dir/circos/* $outputDir/circos/
55 #CIRCOSTOOLS="/data/galaxy/galaxy-dist/toolsheddependencies/circos/0.64/saskia-hiltemann/cg_circos_plots/bbfdd52d64fd/circos-tools-0.21/tools"
56 #CIRCOSDIR="/data/galaxy/galaxy-dist/toolsheddependencies/circos/0.64/saskia-hiltemann/cg_circos_plots/bbfdd52d64fd/bin/"
57
58 #CIRCOSTOOLS="/home/galaxy/circos/circos-tools-0.22/tools"
59 #CIRCOSDIR="/home/galaxy/Anaconda3/bin"
60
61 USECIRCOS="no"
62 if [ -d "$CIRCOSDIR" ]; then
63 USECIRCOS="yes"
64 else
65 if [ -d "/home/galaxy/Anaconda3/bin" ]; then #hopefully temporary fix
66 USECIRCOS="yes"
67 CIRCOSTOOLS="/data/galaxy/galaxy-dist/toolsheddependencies/circos/0.64/saskia-hiltemann/cg_circos_plots/bbfdd52d64fd/circos-tools-0.21/tools"
68 CIRCOSDIR="/data/galaxy/galaxy-dist/toolsheddependencies/circos/0.64/saskia-hiltemann/cg_circos_plots/bbfdd52d64fd/bin/"
69 fi
70 fi
71 echo "Using Circos: $USECIRCOS"
72 sed -i "s%DATA_DIR%$outputDir/circos%" $outputDir/circos/circos.conf
73 for sample in $samples; do #output the samples to a file and create the circos plots with the R script output
74 echo " $sample" >> $outputFile
75
76 if [[ "$USECIRCOS" != "yes" ]]; then
77 continue
78 fi
79
80 circos_file="$outputDir/${sample}_VJ_circos.txt"
81 echo -e -n "labels$(cat ${circos_file})" > ${circos_file}
82 cat "${circos_file}" | $CIRCOSTOOLS/tableviewer/bin/parse-table -configfile $dir/circos/parse-table.conf 2>&1 | $CIRCOSTOOLS/tableviewer/bin/make-conf -dir $outputDir/circos/
83 $CIRCOSDIR/circos -conf $outputDir/circos/circos.conf 2>&1
84 mv $outputDir/circos/circos.png $outputDir/circosVJ_${sample}.png
85
86
87 if [[ "$useD" == "true" ]] ; then
88 circos_file="$outputDir/${sample}_VD_circos.txt"
89 echo -e -n "labels$(cat ${circos_file})" > ${circos_file}
90 cat "${circos_file}" | $CIRCOSTOOLS/tableviewer/bin/parse-table -configfile $dir/circos/parse-table.conf 2>&1 | $CIRCOSTOOLS/tableviewer/bin/make-conf -dir $outputDir/circos/
91 $CIRCOSDIR/circos -conf $outputDir/circos/circos.conf 2>&1
92 mv $outputDir/circos/circos.png $outputDir/circosVD_${sample}.png
93
94 circos_file="$outputDir/${sample}_DJ_circos.txt"
95 echo -e -n "labels$(cat ${circos_file})" > ${circos_file}
96 cat "${circos_file}" | $CIRCOSTOOLS/tableviewer/bin/parse-table -configfile $dir/circos/parse-table.conf 2>&1 | $CIRCOSTOOLS/tableviewer/bin/make-conf -dir $outputDir/circos/
97 $CIRCOSDIR/circos -conf $outputDir/circos/circos.conf 2>&1
98 mv $outputDir/circos/circos.png $outputDir/circosDJ_${sample}.png
99
100 fi
101 done
102 echo "</title><script type='text/javascript' src='jquery-1.11.0.min.js'></script>" >> $outputFile
103 echo "<link rel='stylesheet' type='text/css' href='pure-min.css'>" >> $outputFile
104 echo "<script type='text/javascript' src='tabber.js'></script>" >> $outputFile
105 echo "<script type='text/javascript' src='script.js'></script>" >> $outputFile
106 echo "<link rel='stylesheet' type='text/css' href='style.css'></head>" >> $outputFile
107 echo "<div class='tabber'><div class='tabbertab' title='Gene frequencies'>" >> $outputFile
108
109 echo "<img src='CDR3LengthPlot.png'/><br />" >> $outputFile
110 echo "<img src='VFPlot.png'/>" >> $outputFile
111 if [[ "$useD" == "true" ]] ; then
112 echo "<img src='DFPlot.png'/>" >> $outputFile
113 fi
114 echo "<img src='VPlot.png'/>" >> $outputFile
115 if [[ "$useD" == "true" ]] ; then
116 echo "<img src='DPlot.png'/>" >> $outputFile
117 fi
118 echo "<img src='JPlot.png'/>" >> $outputFile
119 echo "<img src='AAComposition.png'/>" >> $outputFile
120 echo "<img src='DReadingFrame.png'/>" >> $outputFile
121 echo "</div>" >> $outputFile
122
123 #Heatmaps
124
125 count=1
126 echo "<div class='tabbertab' title='Heatmaps'><div class='tabber'>" >> $outputFile
127 for sample in $samples; do
128 echo "<div class='tabbertab' title='$sample'><table border='1'><tr>" >> $outputFile
129 if [[ "$useD" == "true" ]] ; then
130 echo "<td><img src='HeatmapVD_$sample.png'/></td>" >> $outputFile
131 fi
132 echo "<td><img src='HeatmapVJ_$sample.png'/></td>" >> $outputFile
133 if [[ "$useD" == "true" ]] ; then
134 echo "<td><img src='HeatmapDJ_$sample.png'/></td>" >> $outputFile
135 fi
136 echo "</tr></table></div>" >> $outputFile
137 count=$((count+1))
138 done
139 echo "</div></div>" >> $outputFile
140
141 #circos
142
143 if [[ "$USECIRCOS" == "yes" ]]; then
144
145 echo "<div class='tabbertab' title='Circos'><div class='tabber'>" >> $outputFile
146 for sample in $samples; do
147 echo "<div class='tabbertab' title='$sample'><table border='1'><center>" >> $outputFile
148 if [[ "$useD" == "true" ]] ; then
149 echo "<tr><td>V-D</td><td><img src='circosVD_${sample}.png' width='700' height='700'/></td></tr>" >> $outputFile
150 fi
151 echo "<tr><td>V-J</td><td><img src='circosVJ_${sample}.png' width='700' height='700'/></td></tr>" >> $outputFile
152 if [[ "$useD" == "true" ]] ; then
153 echo "<tr><td>D-J</td><td><img src='circosDJ_${sample}.png' width='700' height='700'/></td></tr>" >> $outputFile
154 fi
155 echo "<center></table></div>" >> $outputFile
156 count=$((count+1))
157 done
158 echo "</div></div>" >> $outputFile
159 fi
160 #echo "<div class='tabbertab' title='Interactive'><svg class='chart'></svg><script src='http://d3js.org/d3.v3.min.js'></script></div>" >> $outputFile
161
162 hasReplicateColumn="$(if head -n 1 $inputFile | grep -q 'Replicate'; then echo 'Yes'; else echo 'No'; fi)"
163 echo "$hasReplicateColumn"
164 #if its a 'new' merged file with replicate info
165 if [[ "$hasReplicateColumn" == "Yes" ]] ; then
166 echo "<div class='tabbertab' title='Clonality'><div class='tabber'>" >> $outputFile
167 for sample in $samples; do
168 echo "${clonality_method}"
169 if [[ "${clonality_method}" == "old" ]] ; then
170 echo "in old"
171 clonalityScore="$(cat $outputDir/ClonalityScore_$sample.csv)"
172 echo "<div class='tabbertab' title='$sample'><table class='pure-table pure-table-striped'>" >> $outputFile
173 echo "<thead><tr><th colspan='4'>Clonality Score: $clonalityScore</th></tr></thead>" >> $outputFile
174
175 #replicate,reads,squared
176 echo "<tr><td>Replicate ID</td><td>Number of Reads</td><td>Reads Squared</td><td></td></tr>" >> $outputFile
177 while IFS=, read replicate reads squared
178 do
179 echo "<tr><td>$replicate</td><td>$reads</td><td>$squared</td><td></td></tr>" >> $outputFile
180 done < $outputDir/ReplicateReads_$sample.csv
181
182 #sum of reads and reads squared
183 while IFS=, read readsSum squaredSum
184 do
185 echo "<tr><td>Sum</td><td>$readsSum</td><td>$squaredSum</td></tr>" >> $outputFile
186 done < $outputDir/ReplicateSumReads_$sample.csv
187
188 #overview
189 echo "<tr><td>Coincidence Type</td><td>Raw Coincidence Freq</td><td>Coincidence Weight</td><td>Coincidences, Weighted</td></tr>" >> $outputFile
190 while IFS=, read type count weight weightedCount
191 do
192 if [[ "$type" -eq "1" ]]; then
193 echo "<tr><td>$type</td><td>$count</td><td>$weight</td><td>$weightedCount</td></tr>" >> $outputFile
194 else
195 echo "<tr><td><a href='coincidences_${sample}_${type}.txt'>$type</a></td><td>$count</td><td>$weight</td><td>$weightedCount</td></tr>" >> $outputFile
196 fi
197
198 done < $outputDir/ClonalityOverView_$sample.csv
199 echo "</table></div>" >> $outputFile
200 else
201 echo "in new"
202 clonalityScore="$(cat $outputDir/lymphclon_clonality_${sample}.csv)"
203 echo "<div class='tabbertab' title='$sample'>" >> $outputFile
204 echo "Lymphclon clonality score: <br />$clonalityScore<br /><br />" >> $outputFile
205 echo "<table border = 1>" >> $outputFile
206 while IFS=, read type count
207 do
208 echo "<tr><td>$type</td><td>$count</td></tr>" >> $outputFile
209 done < $outputDir/lymphclon_coincidences_$sample.csv
210 echo "</table></div>" >> $outputFile
211 fi
212 done
213 echo "</div></div>" >> $outputFile
214 fi
215
216 #hasJunctionData="$(if head -n 1 $inputFile | grep -qE '3V.REGION.trimmed.nt.nb'; then echo 'Yes'; else echo 'No'; fi)"
217
218 #if [[ "$hasJunctionData" == "Yes" ]] ; then
219 if [ -a "$outputDir/junctionAnalysisProd_mean.csv" ] ; then
220 echo "<div class='tabbertab' title='Junction Analysis'>" >> $outputFile
221 echo "<table class='pure-table pure-table-striped' id='junction_table'> <caption>Productive mean</caption><thead><tr><th>Sample</th><th>count</th><th>V.DEL</th><th>P1</th><th>N1</th><th>P2</th><th>DEL.D</th><th>D.DEL</th><th>P3</th><th>N2</th><th>P4</th><th>DEL.J</th><th>Total.Del</th><th>Total.N</th><th>Total.P</th><th>Median.CDR3</th><thead></tr><tbody>" >> $outputFile
222 while IFS=, read Sample unique VDEL P1 N1 P2 DELD DDEL P3 N2 P4 DELJ TotalDel TotalN TotalP median
223 do
224 echo "<tr><td>$Sample</td><td>$unique</td><td>$VDEL</td><td>$P1</td><td>$N1</td><td>$P2</td><td>$DELD</td><td>$DDEL</td><td>$P3</td><td>$N2</td><td>$P4</td><td>$DELJ</td><td>$TotalDel</td><td>$TotalN</td><td>$TotalP</td><td>$median</td></tr>" >> $outputFile
225 done < $outputDir/junctionAnalysisProd_mean.csv
226 echo "</tbody></table>" >> $outputFile
227
228 echo "<table class='pure-table pure-table-striped' id='junction_table'> <caption>Unproductive mean</caption><thead><tr><th>Sample</th><th>count</th><th>V.DEL</th><th>P1</th><th>N1</th><th>P2</th><th>DEL.D</th><th>D.DEL</th><th>P3</th><th>N2</th><th>P4</th><th>DEL.J</th><th>Total.Del</th><th>Total.N</th><th>Total.P</th><th>Median.CDR3</th><thead></tr><tbody>" >> $outputFile
229 while IFS=, read Sample unique VDEL P1 N1 P2 DELD DDEL P3 N2 P4 DELJ TotalDel TotalN TotalP median
230 do
231 echo "<tr><td>$Sample</td><td>$unique</td><td>$VDEL</td><td>$P1</td><td>$N1</td><td>$P2</td><td>$DELD</td><td>$DDEL</td><td>$P3</td><td>$N2</td><td>$P4</td><td>$DELJ</td><td>$TotalDel</td><td>$TotalN</td><td>$TotalP</td><td>$median</td></tr>" >> $outputFile
232 done < $outputDir/junctionAnalysisUnProd_mean.csv
233 echo "</tbody></table>" >> $outputFile
234
235 echo "<table class='pure-table pure-table-striped' id='junction_table'> <caption>Productive median</caption><thead><tr><th>Sample</th><th>count</th><th>V.DEL</th><th>P1</th><th>N1</th><th>P2</th><th>DEL.D</th><th>D.DEL</th><th>P3</th><th>N2</th><th>P4</th><th>DEL.J</th><th>Total.Del</th><th>Total.N</th><th>Total.P</th><th>Median.CDR3</th><thead></tr><tbody>" >> $outputFile
236 while IFS=, read Sample unique VDEL P1 N1 P2 DELD DDEL P3 N2 P4 DELJ TotalDel TotalN TotalP median
237 do
238 echo "<tr><td>$Sample</td><td>$unique</td><td>$VDEL</td><td>$P1</td><td>$N1</td><td>$P2</td><td>$DELD</td><td>$DDEL</td><td>$P3</td><td>$N2</td><td>$P4</td><td>$DELJ</td><td>$TotalDel</td><td>$TotalN</td><td>$TotalP</td><td>$median</td></tr>" >> $outputFile
239 done < $outputDir/junctionAnalysisProd_median.csv
240 echo "</tbody></table>" >> $outputFile
241
242 echo "<table class='pure-table pure-table-striped' id='junction_table'> <caption>Unproductive median</caption><thead><tr><th>Sample</th><th>count</th><th>V.DEL</th><th>P1</th><th>N1</th><th>P2</th><th>DEL.D</th><th>D.DEL</th><th>P3</th><th>N2</th><th>P4</th><th>DEL.J</th><th>Total.Del</th><th>Total.N</th><th>Total.P</th><th>Median.CDR3</th><thead></tr><tbody>" >> $outputFile
243 while IFS=, read Sample unique VDEL P1 N1 P2 DELD DDEL P3 N2 P4 DELJ TotalDel TotalN TotalP median
244 do
245 echo "<tr><td>$Sample</td><td>$unique</td><td>$VDEL</td><td>$P1</td><td>$N1</td><td>$P2</td><td>$DELD</td><td>$DDEL</td><td>$P3</td><td>$N2</td><td>$P4</td><td>$DELJ</td><td>$TotalDel</td><td>$TotalN</td><td>$TotalP</td><td>$median</td></tr>" >> $outputFile
246 done < $outputDir/junctionAnalysisUnProd_median.csv
247 echo "</tbody></table>" >> $outputFile
248
249 echo "</div>" >> $outputFile
250 fi
251
252 echo "<div class='tabbertab' title='Comparison'><table class='pure-table pure-table-striped'><thead><tr><th>ID</th><th>Include</th></tr></thead>" >> $outputFile
253 for sample in $samples; do
254 echo "<tr><td>$sample</td><td><input type='checkbox' onchange=\"javascript:compareAdd('$sample')\" id='compare_checkbox_$sample'/></td></tr>" >> $outputFile
255 done
256 echo "</table><div name='comparisonarea'>" >> $outputFile
257 echo "<table><tr id='comparison_table_vd'></tr></table>" >> $outputFile
258 echo "<table><tr id='comparison_table_vj'></tr></table>" >> $outputFile
259 echo "<table><tr id='comparison_table_dj'></tr></table>" >> $outputFile
260 echo "</div></div>" >> $outputFile
261
262 echo "<div class='tabbertab' title='Downloads'>" >> $outputFile
263 echo "<table class='pure-table pure-table-striped'>" >> $outputFile
264 echo "<thead><tr><th>Description</th><th>Link</th></tr></thead>" >> $outputFile
265 echo "<tr><td>The dataset used to generate the frequency graphs and the heatmaps (Unique based on clonaltype, $clonalType)</td><td><a href='allUnique.csv'>Download</a></td></tr>" >> $outputFile
266 echo "<tr><td>The dataset used to calculate clonality score (Unique based on clonaltype, $clonalType)</td><td><a href='clonalityComplete.csv'>Download</a></td></tr>" >> $outputFile
267
268 echo "<tr><td>The dataset used to generate the CDR3 length frequency graph</td><td><a href='CDR3LengthPlot.csv'>Download</a></td></tr>" >> $outputFile
269
270 echo "<tr><td>The dataset used to generate the V gene family frequency graph</td><td><a href='VFFrequency.csv'>Download</a></td></tr>" >> $outputFile
271 if [[ "$useD" == "true" ]] ; then
272 echo "<tr><td>The dataset used to generate the D gene family frequency graph</td><td><a href='DFFrequency.csv'>Download</a></td></tr>" >> $outputFile
273 fi
274
275 echo "<tr><td>The dataset used to generate the V gene frequency graph</td><td><a href='VFrequency.csv'>Download</a></td></tr>" >> $outputFile
276 if [[ "$useD" == "true" ]] ; then
277 echo "<tr><td>The dataset used to generate the D gene frequency graph</td><td><a href='DFrequency.csv'>Download</a></td></tr>" >> $outputFile
278 fi
279 echo "<tr><td>The dataset used to generate the J gene frequency graph</td><td><a href='JFrequency.csv'>Download</a></td></tr>" >> $outputFile
280 echo "<tr><td>The dataset used to generate the AA composition graph</td><td><a href='AAComposition.csv'>Download</a></td></tr>" >> $outputFile
281
282 for sample in $samples; do
283 if [[ "$useD" == "true" ]] ; then
284 echo "<tr><td>The data used to generate the VD heatmap for $sample.</td><td><a href='HeatmapVD_$sample.csv'>Download</a></td></tr>" >> $outputFile
285 fi
286 echo "<tr><td>The data used to generate the VJ heatmap for $sample.</td><td><a href='HeatmapVJ_$sample.csv'>Download</a></td></tr>" >> $outputFile
287 if [[ "$useD" == "true" ]] ; then
288 echo "<tr><td>The data used to generate the DJ heatmap for $sample.</td><td><a href='HeatmapDJ_$sample.csv'>Download</a></td></tr>" >> $outputFile
289 fi
290 done
291
292 echo "<tr><td>A frequency count of V Gene + J Gene + CDR3</td><td><a href='VJCDR3_count.txt'>Download</a></td></tr>" >> $outputFile
293
294 echo "</table>" >> $outputFile
295 echo "</div></html>" >> $outputFile