annotate MACARON-GenMed-LabEx/MACARON_validate.sh @ 0:c9636a827049 draft default tip

Uploaded
author waqas
date Wed, 12 Sep 2018 08:45:03 -0400
parents
children
Ignore whitespace changes - Everywhere: Within whitespace: At end of lines:
rev   line source
0
c9636a827049 Uploaded
waqas
parents:
diff changeset
#!/bin/bash
#
# MACARON_validate.sh - tally the read sub-sequences seen over a region.
#
# Usage:
#   MACARON_validate.sh <name>.<chr>_<beg>-<end>.<sample>.bam
#
# Example file name:
#   sub1.chr22_21349676-21349677.sample02.bam
#
# The region and sample are taken from the BAM file name (directory part
# ignored). A header line "<name> <chr>:<beg>-<end> <sample>" is printed to
# stdout and appended to MACARON_validate.txt in the current directory,
# followed by one "<count> <bases>" line per distinct sub-sequence, sorted
# by ascending count.
#
# Requires: samtools in PATH.
#
# NOTE(review): offsets into SEQ are derived from POS alone; CIGAR is not
# consulted, so reads with indels or clipping ahead of the region are
# presumably sliced at the wrong offset - confirm this is acceptable.

set -euo pipefail

readonly REPORT="MACARON_validate.txt"

# Print an error message to stderr and abort.
die() {
  printf '%s: %s\n' "${0##*/}" "$*" >&2
  exit 1
}

# Parse the BAM file name, write the header, and append the tally.
# Arguments: $1 - path to the BAM file, named as described above.
main() {
  (( $# == 1 )) \
    || die "usage: ${0##*/} <name>.<chr>_<beg>-<end>.<sample>.bam"
  command -v samtools >/dev/null || die "samtools not found in PATH"

  local bam=$1
  # Parse the base name only, so dots or underscores in the directory part
  # cannot shift the fields.
  local base=${bam##*/}
  local name region sample _
  IFS=. read -r name region sample _ <<<"$base"

  # Split the region on its LAST underscore so contig names that themselves
  # contain underscores stay intact.
  [[ "$region" =~ ^(.+)_([0-9]+)-([0-9]+)$ ]] \
    || die "cannot parse region '<chr>_<beg>-<end>' from '$base'"
  local chr=${BASH_REMATCH[1]}
  local beg=${BASH_REMATCH[2]}
  local end=${BASH_REMATCH[3]}
  # 10# forces base 10 so zero-padded coordinates are not read as octal.
  (( 10#$beg <= 10#$end )) || die "region start $beg is after end $end"

  local header="$name $chr:$beg-$end $sample"
  printf '%s\n' "$header"
  printf '%s\n' "$header" >> "$REPORT"

  # For every read that starts before the region (SAM column 4, POS), cut
  # the bases of SEQ (column 10) lying over beg..end. Slicing inside awk
  # avoids a scratch file and keeps a SEQ of "*" or one containing "."
  # from being mangled by the shell. Reads that do not reach the region
  # yield an empty string and are still counted.
  # NOTE(review): reads whose POS equals beg are not counted (strict "<");
  # confirm this is intended.
  samtools view "$bam" \
    | awk -F '\t' -v start="$beg" -v stop="$end" '
        BEGIN { start += 0; stop += 0 }
        ($4 + 0) < start {
          offset = start - $4 + 1
          print substr($10, offset, stop - start + 1)
        }' \
    | sort | uniq -c | sort -n >> "$REPORT"
}

main "$@"
c9636a827049 Uploaded
waqas
parents:
diff changeset
49