annotate imgt_loader/imgt_loader.sh @ 52:124b7fd92a3e draft

Uploaded
author davidvanzessen
date Thu, 25 Feb 2021 13:36:15 +0000
parents 106275b54470
children 0ef7f80ea061
Ignore whitespace changes - Everywhere: Within whitespace: At end of lines:
rev   line source
52
124b7fd92a3e Uploaded
davidvanzessen
parents: 40
diff changeset
#!/bin/bash
#
# Unpack an uploaded archive, concatenate its numbered tables by filename
# prefix, and pass the resulting files to imgt_loader.r.
#
# Usage: imgt_loader.sh <input-archive> <output-file> <name>
#
#   input-archive  archive to unpack; its type is detected with file(1)
#   output-file    passed through as the last argument of imgt_loader.r
#   name           sub-directory of the current working directory that
#                  receives the extracted files and the merged tables
#
# Supported archive types: 7-zip, tar, bzip2, gzip, zip, RAR, xz.
# The exit status is that of the final Rscript call.

if [[ $# -lt 3 ]]; then
  echo "Usage: ${0##*/} <input-archive> <output-file> <name>" >&2
  exit 2
fi

input=$1
output=$2
name=$3

# Directory holding this script; imgt_loader.r is expected next to it.
dir="$(cd "$(dirname "$0")" && pwd)"

work_dir="$PWD/$name"
files_dir="$work_dir/files"
mkdir -p "$files_dir"

# -b drops the "<path>: " prefix so that a path which happens to contain one
# of the type strings below cannot select the wrong extractor.
f=$(file -b "$input")

readonly zip7Type="7-zip archive"
readonly tarType="tar archive"
readonly bzip2Type="bzip2 compressed"
readonly gzipType="gzip compressed"
readonly zipType="Zip archive"
readonly rarType="RAR archive"
readonly zxType="XZ compressed data"

# The first matching type wins; the order mirrors the original chain of checks.
case "$f" in
  *"$zip7Type"*)
    echo "7-zip"
    echo "Trying: 7za e $input -o$files_dir"
    7za e "$input" "-o$files_dir"
    ;;
  *"$tarType"*)
    echo "tar archive"
    echo "Trying: tar xvf $input -C $files_dir"
    tar -xvf "$input" -C "$files_dir"
    ;;
  *"$bzip2Type"*)
    echo "bzip2 compressed data"
    echo "Trying: tar jxf $input -C $files_dir"
    tar -jxf "$input" -C "$files_dir"
    ;;
  *"$gzipType"*)
    echo "gzip compressed data"
    echo "Trying: tar xvzf $input -C $files_dir"
    tar -xvzf "$input" -C "$files_dir"
    ;;
  *"$zipType"*)
    echo "Zip archive"
    echo "Trying: unzip $input -d $files_dir"
    unzip "$input" -d "$files_dir" > "$PWD/unziplog.log"
    ;;
  *"$rarType"*)
    echo "RAR archive"
    echo "Trying: unrar e $input $files_dir"
    unrar e "$input" "$files_dir"
    ;;
  *"$zxType"*)
    echo "xz compressed data"
    echo "Trying: tar -xJf $input -C $files_dir"
    tar xJf "$input" -C "$files_dir"
    ;;
  *)
    # Reported on stdout on purpose: the script otherwise keeps stderr quiet
    # (see the 2>&1 on the Rscript call), and processing continues as before.
    echo "Unrecognised archive type, nothing extracted: $f"
    ;;
esac

# Concatenate every extracted regular file whose name matches pattern $1
# (case-insensitive) into $work_dir/$2. -type f keeps directories with a
# matching name from being handed to cat.
collect() {
  find "$files_dir" -type f -iname "$1" -exec cat {} + > "$work_dir/$2"
}

collect "1_*" summ.txt
collect "3_*" sequences.txt
collect "4_*" gapped_aa.txt
collect "5_*" aa.txt
collect "6_*" junction.txt

echo "summ.txt $(wc -l < "$work_dir/summ.txt")"
echo "aa.txt $(wc -l < "$work_dir/aa.txt")"

# Superseded Python loader, kept for reference:
#python $dir/imgt_loader.py --summ $PWD/$name/summ.txt --aa $PWD/$name/aa.txt --junction $PWD/$name/junction.txt --output $output

Rscript --verbose "$dir/imgt_loader.r" \
  "$work_dir/summ.txt" \
  "$work_dir/sequences.txt" \
  "$work_dir/aa.txt" \
  "$work_dir/junction.txt" \
  "$work_dir/gapped_aa.txt" \
  "$output" 2>&1