Mercurial > repos > davidvanzessen > argalaxy_tools
comparison report_clonality/r_wrapper.sh.old @ 20:9185c3dfc679 draft
Uploaded
author | davidvanzessen |
---|---|
date | Fri, 27 Jan 2017 03:44:18 -0500 |
parents | |
children |
comparison
equal
deleted
inserted
replaced
19:3ef457aa5df6 | 20:9185c3dfc679 |
---|---|
1 #!/bin/bash | |
2 | |
3 inputFile=$1 | |
4 outputDir=$3 | |
5 outputFile=$3/index.html #$2 | |
6 clonalType=$4 | |
7 species=$5 | |
8 locus=$6 | |
9 filterproductive=$7 | |
10 clonality_method=$8 | |
11 | |
12 dir="$(cd "$(dirname "$0")" && pwd)" | |
13 useD="false" | |
14 if grep -q "$species.*${locus}D" "$dir/genes.txt" ; then | |
15 echo "species D region in reference db" | |
16 useD="true" | |
17 fi | |
18 echo "$species" | |
19 if [[ "$species" == *"custom"* ]] ; then | |
20 loci=(${locus//;/ }) | |
21 useD="true" | |
22 echo "${loci[@]}" | |
23 if [[ "${#loci[@]}" -eq "2" ]] ; then | |
24 useD="false" | |
25 fi | |
26 fi | |
27 mkdir $3 | |
28 cp $dir/genes.txt $outputDir | |
29 Rscript --verbose $dir/RScript.r $inputFile $outputDir $outputDir $clonalType "$species" "$locus" $filterproductive ${clonality_method} 2>&1 | |
30 cp $dir/tabber.js $outputDir | |
31 cp $dir/style.css $outputDir | |
32 cp $dir/script.js $outputDir | |
33 cp $dir/jquery-1.11.0.min.js $outputDir | |
34 cp $dir/pure-min.css $outputDir | |
35 samples=`cat $outputDir/samples.txt` | |
36 | |
37 echo "<html><center><h1><a href='index.html'>Click here for the results</a></h1>Tip: Open it in a new tab (middle mouse button or right mouse button -> 'open in new tab' on the link above)<br />" > $2 | |
38 echo "<table border = 1>" >> $2 | |
39 echo "<thead><tr><th>Sample/Replicate</th><th>All</th><th>Productive</th><th>Unique Productive</th><th>Unproductive</th><th>Unique Unproductive</th></tr></thead>" >> $2 | |
40 while IFS=, read sample all productive perc_prod productive_unique perc_prod_un unproductive perc_unprod unproductive_unique perc_unprod_un | |
41 do | |
42 echo "<tr><td>$sample</td>" >> $2 | |
43 echo "<td>$all</td>" >> $2 | |
44 echo "<td>$productive (${perc_prod}%)</td>" >> $2 | |
45 echo "<td>$productive_unique (${perc_prod_un}%)</td>" >> $2 | |
46 echo "<td>$unproductive (${perc_unprod}%)</td>" >> $2 | |
47 echo "<td>$unproductive_unique (${perc_unprod_un}%)</td></tr>" >> $2 | |
48 done < $outputDir/productive_counting.txt | |
49 echo "</table border></center></html>" >> $2 | |
50 | |
51 echo "<html><head><title>Report on:" >> $outputFile | |
52 | |
53 mkdir $outputDir/circos | |
54 cp $dir/circos/* $outputDir/circos/ | |
55 #CIRCOSTOOLS="/data/galaxy/galaxy-dist/toolsheddependencies/circos/0.64/saskia-hiltemann/cg_circos_plots/bbfdd52d64fd/circos-tools-0.21/tools" | |
56 #CIRCOSDIR="/data/galaxy/galaxy-dist/toolsheddependencies/circos/0.64/saskia-hiltemann/cg_circos_plots/bbfdd52d64fd/bin/" | |
57 | |
58 #CIRCOSTOOLS="/home/galaxy/circos/circos-tools-0.22/tools" | |
59 #CIRCOSDIR="/home/galaxy/Anaconda3/bin" | |
60 | |
61 USECIRCOS="no" | |
62 if [ -d "$CIRCOSDIR" ]; then | |
63 USECIRCOS="yes" | |
64 else | |
65 if [ -d "/data/galaxy/galaxy-dist/toolsheddependencies/circos/0.64/saskia-hiltemann/cg_circos_plots/bbfdd52d64fd/bin/" ]; then #hopefully temporary fix | |
66 USECIRCOS="yes" | |
67 CIRCOSTOOLS="/data/galaxy/galaxy-dist/toolsheddependencies/circos/0.64/saskia-hiltemann/cg_circos_plots/bbfdd52d64fd/circos-tools-0.21/tools" | |
68 CIRCOSDIR="/data/galaxy/galaxy-dist/toolsheddependencies/circos/0.64/saskia-hiltemann/cg_circos_plots/bbfdd52d64fd/bin/" | |
69 fi | |
70 | |
71 if [ -d "/home/galaxy/Anaconda3/bin" ]; then #hopefully temporary fix | |
72 USECIRCOS="yes" | |
73 CIRCOSTOOLS="/home/galaxy/circos/circos-tools-0.22/tools" | |
74 CIRCOSDIR="/home/galaxy/Anaconda3/bin" | |
75 fi | |
76 fi | |
77 | |
78 echo "Using Circos: $USECIRCOS" | |
79 sed -i "s%DATA_DIR%$outputDir/circos%" $outputDir/circos/circos.conf | |
80 for sample in $samples; do #output the samples to a file and create the circos plots with the R script output | |
81 echo " $sample" >> $outputFile | |
82 | |
83 if [[ "$USECIRCOS" != "yes" ]]; then | |
84 continue | |
85 fi | |
86 | |
87 circos_file="$outputDir/${sample}_VJ_circos.txt" | |
88 echo -e -n "labels$(cat ${circos_file})" > ${circos_file} | |
89 cat "${circos_file}" | $CIRCOSTOOLS/tableviewer/bin/parse-table -configfile $dir/circos/parse-table.conf 2>&1 | $CIRCOSTOOLS/tableviewer/bin/make-conf -dir $outputDir/circos/ | |
90 $CIRCOSDIR/circos -conf $outputDir/circos/circos.conf 2>&1 | |
91 mv $outputDir/circos/circos.png $outputDir/circosVJ_${sample}.png | |
92 | |
93 | |
94 if [[ "$useD" == "true" ]] ; then | |
95 circos_file="$outputDir/${sample}_VD_circos.txt" | |
96 echo -e -n "labels$(cat ${circos_file})" > ${circos_file} | |
97 cat "${circos_file}" | $CIRCOSTOOLS/tableviewer/bin/parse-table -configfile $dir/circos/parse-table.conf 2>&1 | $CIRCOSTOOLS/tableviewer/bin/make-conf -dir $outputDir/circos/ | |
98 $CIRCOSDIR/circos -conf $outputDir/circos/circos.conf 2>&1 | |
99 mv $outputDir/circos/circos.png $outputDir/circosVD_${sample}.png | |
100 | |
101 circos_file="$outputDir/${sample}_DJ_circos.txt" | |
102 echo -e -n "labels$(cat ${circos_file})" > ${circos_file} | |
103 cat "${circos_file}" | $CIRCOSTOOLS/tableviewer/bin/parse-table -configfile $dir/circos/parse-table.conf 2>&1 | $CIRCOSTOOLS/tableviewer/bin/make-conf -dir $outputDir/circos/ | |
104 $CIRCOSDIR/circos -conf $outputDir/circos/circos.conf 2>&1 | |
105 mv $outputDir/circos/circos.png $outputDir/circosDJ_${sample}.png | |
106 | |
107 fi | |
108 done | |
109 echo "</title><script type='text/javascript' src='jquery-1.11.0.min.js'></script>" >> $outputFile | |
110 echo "<link rel='stylesheet' type='text/css' href='pure-min.css'>" >> $outputFile | |
111 echo "<script type='text/javascript' src='tabber.js'></script>" >> $outputFile | |
112 echo "<script type='text/javascript' src='script.js'></script>" >> $outputFile | |
113 echo "<link rel='stylesheet' type='text/css' href='style.css'></head>" >> $outputFile | |
114 echo "<div class='tabber'><div class='tabbertab' title='Gene frequencies'>" >> $outputFile | |
115 | |
116 | |
117 echo "<img src='VFPlot.png'/>" >> $outputFile | |
118 if [[ "$useD" == "true" ]] ; then | |
119 echo "<img src='DFPlot.png'/>" >> $outputFile | |
120 fi | |
121 echo "<img src='VPlot.png'/>" >> $outputFile | |
122 if [[ "$useD" == "true" ]] ; then | |
123 echo "<img src='DPlot.png'/>" >> $outputFile | |
124 fi | |
125 echo "<img src='JPlot.png'/>" >> $outputFile | |
126 echo "</div>" >> $outputFile | |
127 | |
128 echo "<div class='tabbertab' title='CDR3 Characteristics'>" >> $outputFile | |
129 echo "<img src='CDR3LengthPlot.png'/><br />" >> $outputFile | |
130 echo "<img src='AAComposition.png'/>" >> $outputFile | |
131 echo "<img src='DReadingFrame.png'/>" >> $outputFile | |
132 | |
133 echo "<table class='pure-table pure-table-striped'>" >> $outputFile | |
134 echo "<thead><tr><th>Sample</th><th>Median CDR3 Length</th></tr></thead>" >> $outputFile | |
135 while IFS=, read Sample median | |
136 do | |
137 echo "<tr><td>$Sample</td><td>$median</td></tr>" >> $outputFile | |
138 done < $outputDir/AAMedianBySample.csv | |
139 echo "</table>" >> $outputFile | |
140 | |
141 echo "</div>" >> $outputFile | |
142 | |
143 #Heatmaps | |
144 | |
145 count=1 | |
146 echo "<div class='tabbertab' title='Heatmaps'><div class='tabber'>" >> $outputFile | |
147 for sample in $samples; do | |
148 echo "<div class='tabbertab' title='$sample'><table border='1'><tr>" >> $outputFile | |
149 if [[ "$useD" == "true" ]] ; then | |
150 echo "<td><img src='HeatmapVD_$sample.png'/></td>" >> $outputFile | |
151 fi | |
152 echo "<td><img src='HeatmapVJ_$sample.png'/></td>" >> $outputFile | |
153 if [[ "$useD" == "true" ]] ; then | |
154 echo "<td><img src='HeatmapDJ_$sample.png'/></td>" >> $outputFile | |
155 fi | |
156 echo "</tr></table></div>" >> $outputFile | |
157 count=$((count+1)) | |
158 done | |
159 echo "</div></div>" >> $outputFile | |
160 | |
161 #circos | |
162 | |
163 if [[ "$USECIRCOS" == "yes" ]]; then | |
164 | |
165 echo "<div class='tabbertab' title='Circos'><div class='tabber'>" >> $outputFile | |
166 for sample in $samples; do | |
167 echo "<div class='tabbertab' title='$sample'><table border='1'><center>" >> $outputFile | |
168 if [[ "$useD" == "true" ]] ; then | |
169 echo "<tr><td>V-D</td><td><img src='circosVD_${sample}.png' width='700' height='700'/></td></tr>" >> $outputFile | |
170 fi | |
171 echo "<tr><td>V-J</td><td><img src='circosVJ_${sample}.png' width='700' height='700'/></td></tr>" >> $outputFile | |
172 if [[ "$useD" == "true" ]] ; then | |
173 echo "<tr><td>D-J</td><td><img src='circosDJ_${sample}.png' width='700' height='700'/></td></tr>" >> $outputFile | |
174 fi | |
175 echo "<center></table></div>" >> $outputFile | |
176 count=$((count+1)) | |
177 done | |
178 echo "</div></div>" >> $outputFile | |
179 fi | |
180 #echo "<div class='tabbertab' title='Interactive'><svg class='chart'></svg><script src='http://d3js.org/d3.v3.min.js'></script></div>" >> $outputFile | |
181 | |
182 hasReplicateColumn="$(if head -n 1 $inputFile | grep -q 'Replicate'; then echo 'Yes'; else echo 'No'; fi)" | |
183 echo "$hasReplicateColumn" | |
184 #if its a 'new' merged file with replicate info | |
185 if [[ "$hasReplicateColumn" == "Yes" ]] ; then | |
186 echo "<div class='tabbertab' title='Clonality'><div class='tabber'>" >> $outputFile | |
187 for sample in $samples; do | |
188 echo "${clonality_method}" | |
189 if [[ "${clonality_method}" == "old" ]] ; then | |
190 echo "in old" | |
191 clonalityScore="$(cat $outputDir/ClonalityScore_$sample.csv)" | |
192 echo "<div class='tabbertab' title='$sample'><table class='pure-table pure-table-striped'>" >> $outputFile | |
193 echo "<thead><tr><th colspan='4'>Clonality Score: $clonalityScore</th></tr></thead>" >> $outputFile | |
194 | |
195 #replicate,reads,squared | |
196 echo "<tr><td>Replicate ID</td><td>Number of Reads</td></tr>" >> $outputFile | |
197 while IFS=, read replicate reads squared | |
198 do | |
199 echo "<tr><td>$replicate</td><td>$reads</td></tr>" >> $outputFile | |
200 done < $outputDir/ReplicateReads_$sample.csv | |
201 | |
202 #sum of reads and reads squared | |
203 while IFS=, read readsSum squaredSum | |
204 do | |
205 echo "<tr><td>Sum</td><td>$readsSum</td></tr>" >> $outputFile | |
206 done < $outputDir/ReplicateSumReads_$sample.csv | |
207 | |
208 #overview | |
209 echo "<tr><td>Coincidence Type</td><td>Raw Coincidence Freq</td></tr>" >> $outputFile | |
210 while IFS=, read type count weight weightedCount | |
211 do | |
212 if [[ "$type" -eq "1" ]]; then | |
213 echo "<tr><td>$type</td><td>$count</td></tr>" >> $outputFile | |
214 else | |
215 echo "<tr><td><a href='coincidences_${sample}_${type}.txt'>$type</a></td><td>$count</td></tr>" >> $outputFile | |
216 fi | |
217 | |
218 done < $outputDir/ClonalityOverView_$sample.csv | |
219 echo "</table></div>" >> $outputFile | |
220 else | |
221 echo "in new" | |
222 clonalityScore="$(cat $outputDir/lymphclon_clonality_${sample}.csv)" | |
223 echo "<div class='tabbertab' title='$sample'>" >> $outputFile | |
224 echo "Lymphclon clonality score: <br />$clonalityScore<br /><br />" >> $outputFile | |
225 echo "<table border = 1>" >> $outputFile | |
226 while IFS=, read type count | |
227 do | |
228 echo "<tr><td>$type</td><td>$count</td></tr>" >> $outputFile | |
229 done < $outputDir/lymphclon_coincidences_$sample.csv | |
230 echo "</table></div>" >> $outputFile | |
231 fi | |
232 done | |
233 echo "</div></div>" >> $outputFile | |
234 fi | |
235 | |
236 #hasJunctionData="$(if head -n 1 $inputFile | grep -qE '3V.REGION.trimmed.nt.nb'; then echo 'Yes'; else echo 'No'; fi)" | |
237 | |
238 #if [[ "$hasJunctionData" == "Yes" ]] ; then | |
239 if [ -a "$outputDir/junctionAnalysisProd_mean.csv" ] ; then | |
240 echo "<div class='tabbertab' title='Junction Analysis'>" >> $outputFile | |
241 echo "<table class='pure-table pure-table-striped' id='junction_table'> <caption>Productive mean</caption><thead><tr><th>Sample</th><th>count</th><th>V.DEL</th><th>P1</th><th>N1</th><th>P2</th><th>DEL.D</th><th>D.DEL</th><th>P3</th><th>N2</th><th>P4</th><th>DEL.J</th><th>Total.Del</th><th>Total.N</th><th>Total.P</th><th>Median.CDR3</th><thead></tr><tbody>" >> $outputFile | |
242 while IFS=, read Sample unique VDEL P1 N1 P2 DELD DDEL P3 N2 P4 DELJ TotalDel TotalN TotalP median | |
243 do | |
244 echo "<tr><td>$Sample</td><td>$unique</td><td>$VDEL</td><td>$P1</td><td>$N1</td><td>$P2</td><td>$DELD</td><td>$DDEL</td><td>$P3</td><td>$N2</td><td>$P4</td><td>$DELJ</td><td>$TotalDel</td><td>$TotalN</td><td>$TotalP</td><td>$median</td></tr>" >> $outputFile | |
245 done < $outputDir/junctionAnalysisProd_mean.csv | |
246 echo "</tbody></table>" >> $outputFile | |
247 | |
248 echo "<table class='pure-table pure-table-striped' id='junction_table'> <caption>Unproductive mean</caption><thead><tr><th>Sample</th><th>count</th><th>V.DEL</th><th>P1</th><th>N1</th><th>P2</th><th>DEL.D</th><th>D.DEL</th><th>P3</th><th>N2</th><th>P4</th><th>DEL.J</th><th>Total.Del</th><th>Total.N</th><th>Total.P</th><th>Median.CDR3</th><thead></tr><tbody>" >> $outputFile | |
249 while IFS=, read Sample unique VDEL P1 N1 P2 DELD DDEL P3 N2 P4 DELJ TotalDel TotalN TotalP median | |
250 do | |
251 echo "<tr><td>$Sample</td><td>$unique</td><td>$VDEL</td><td>$P1</td><td>$N1</td><td>$P2</td><td>$DELD</td><td>$DDEL</td><td>$P3</td><td>$N2</td><td>$P4</td><td>$DELJ</td><td>$TotalDel</td><td>$TotalN</td><td>$TotalP</td><td>$median</td></tr>" >> $outputFile | |
252 done < $outputDir/junctionAnalysisUnProd_mean.csv | |
253 echo "</tbody></table>" >> $outputFile | |
254 | |
255 echo "<table class='pure-table pure-table-striped' id='junction_table'> <caption>Productive median</caption><thead><tr><th>Sample</th><th>count</th><th>V.DEL</th><th>P1</th><th>N1</th><th>P2</th><th>DEL.D</th><th>D.DEL</th><th>P3</th><th>N2</th><th>P4</th><th>DEL.J</th><th>Total.Del</th><th>Total.N</th><th>Total.P</th><th>Median.CDR3</th><thead></tr><tbody>" >> $outputFile | |
256 while IFS=, read Sample unique VDEL P1 N1 P2 DELD DDEL P3 N2 P4 DELJ TotalDel TotalN TotalP median | |
257 do | |
258 echo "<tr><td>$Sample</td><td>$unique</td><td>$VDEL</td><td>$P1</td><td>$N1</td><td>$P2</td><td>$DELD</td><td>$DDEL</td><td>$P3</td><td>$N2</td><td>$P4</td><td>$DELJ</td><td>$TotalDel</td><td>$TotalN</td><td>$TotalP</td><td>$median</td></tr>" >> $outputFile | |
259 done < $outputDir/junctionAnalysisProd_median.csv | |
260 echo "</tbody></table>" >> $outputFile | |
261 | |
262 echo "<table class='pure-table pure-table-striped' id='junction_table'> <caption>Unproductive median</caption><thead><tr><th>Sample</th><th>count</th><th>V.DEL</th><th>P1</th><th>N1</th><th>P2</th><th>DEL.D</th><th>D.DEL</th><th>P3</th><th>N2</th><th>P4</th><th>DEL.J</th><th>Total.Del</th><th>Total.N</th><th>Total.P</th><th>Median.CDR3</th><thead></tr><tbody>" >> $outputFile | |
263 while IFS=, read Sample unique VDEL P1 N1 P2 DELD DDEL P3 N2 P4 DELJ TotalDel TotalN TotalP median | |
264 do | |
265 echo "<tr><td>$Sample</td><td>$unique</td><td>$VDEL</td><td>$P1</td><td>$N1</td><td>$P2</td><td>$DELD</td><td>$DDEL</td><td>$P3</td><td>$N2</td><td>$P4</td><td>$DELJ</td><td>$TotalDel</td><td>$TotalN</td><td>$TotalP</td><td>$median</td></tr>" >> $outputFile | |
266 done < $outputDir/junctionAnalysisUnProd_median.csv | |
267 echo "</tbody></table>" >> $outputFile | |
268 | |
269 echo "</div>" >> $outputFile | |
270 fi | |
271 | |
272 echo "<div class='tabbertab' title='Comparison'><table class='pure-table pure-table-striped'><thead><tr><th>ID</th><th>Include</th></tr></thead>" >> $outputFile | |
273 for sample in $samples; do | |
274 echo "<tr><td>$sample</td><td><input type='checkbox' onchange=\"javascript:compareAdd('$sample')\" id='compare_checkbox_$sample'/></td></tr>" >> $outputFile | |
275 done | |
276 echo "</table><div name='comparisonarea'>" >> $outputFile | |
277 echo "<table><tr id='comparison_table_vd'></tr></table>" >> $outputFile | |
278 echo "<table><tr id='comparison_table_vj'></tr></table>" >> $outputFile | |
279 echo "<table><tr id='comparison_table_dj'></tr></table>" >> $outputFile | |
280 echo "</div></div>" >> $outputFile | |
281 | |
282 echo "<div class='tabbertab' title='Downloads'>" >> $outputFile | |
283 echo "<table class='pure-table pure-table-striped'>" >> $outputFile | |
284 echo "<thead><tr><th>Description</th><th>Link</th></tr></thead>" >> $outputFile | |
285 echo "<tr><td>The dataset used to generate the frequency graphs and the heatmaps (Unique based on clonaltype, $clonalType)</td><td><a href='allUnique.csv'>Download</a></td></tr>" >> $outputFile | |
286 echo "<tr><td>The dataset used to calculate clonality score (Unique based on clonaltype, $clonalType)</td><td><a href='clonalityComplete.csv'>Download</a></td></tr>" >> $outputFile | |
287 | |
288 echo "<tr><td>The dataset used to generate the CDR3 length frequency graph</td><td><a href='CDR3LengthPlot.csv'>Download</a></td></tr>" >> $outputFile | |
289 | |
290 echo "<tr><td>The dataset used to generate the V gene family frequency graph</td><td><a href='VFFrequency.csv'>Download</a></td></tr>" >> $outputFile | |
291 if [[ "$useD" == "true" ]] ; then | |
292 echo "<tr><td>The dataset used to generate the D gene family frequency graph</td><td><a href='DFFrequency.csv'>Download</a></td></tr>" >> $outputFile | |
293 fi | |
294 | |
295 echo "<tr><td>The dataset used to generate the V gene frequency graph</td><td><a href='VFrequency.csv'>Download</a></td></tr>" >> $outputFile | |
296 if [[ "$useD" == "true" ]] ; then | |
297 echo "<tr><td>The dataset used to generate the D gene frequency graph</td><td><a href='DFrequency.csv'>Download</a></td></tr>" >> $outputFile | |
298 fi | |
299 echo "<tr><td>The dataset used to generate the J gene frequency graph</td><td><a href='JFrequency.csv'>Download</a></td></tr>" >> $outputFile | |
300 echo "<tr><td>The dataset used to generate the AA composition graph</td><td><a href='AAComposition.csv'>Download</a></td></tr>" >> $outputFile | |
301 | |
302 for sample in $samples; do | |
303 if [[ "$useD" == "true" ]] ; then | |
304 echo "<tr><td>The data used to generate the VD heatmap for $sample.</td><td><a href='HeatmapVD_$sample.csv'>Download</a></td></tr>" >> $outputFile | |
305 fi | |
306 echo "<tr><td>The data used to generate the VJ heatmap for $sample.</td><td><a href='HeatmapVJ_$sample.csv'>Download</a></td></tr>" >> $outputFile | |
307 if [[ "$useD" == "true" ]] ; then | |
308 echo "<tr><td>The data used to generate the DJ heatmap for $sample.</td><td><a href='HeatmapDJ_$sample.csv'>Download</a></td></tr>" >> $outputFile | |
309 fi | |
310 done | |
311 | |
312 echo "<tr><td>A frequency count of V Gene + J Gene + CDR3</td><td><a href='VJCDR3_count.txt'>Download</a></td></tr>" >> $outputFile | |
313 | |
314 echo "</table>" >> $outputFile | |
315 echo "</div></html>" >> $outputFile |