annotate wrapper.sh @ 116:4984c2a06c43 draft

Uploaded
author davidvanzessen
date Wed, 10 Aug 2016 08:20:17 -0400
parents e7b550d52eb7
children a8f91c52411c
Ignore whitespace changes - Everywhere: Within whitespace: At end of lines:
rev   line source
0
74d2bc479bee Uploaded
davidvanzessen
parents:
diff changeset
1 #!/bin/bash
110
ade5cf6fd2dc Uploaded
davidvanzessen
parents: 108
diff changeset
2 #set -e
0
74d2bc479bee Uploaded
davidvanzessen
parents:
diff changeset
3 dir="$(cd "$(dirname "$0")" && pwd)"
74d2bc479bee Uploaded
davidvanzessen
parents:
diff changeset
4 input=$1
19
c518cf0d4adb Uploaded
davidvanzessen
parents: 16
diff changeset
5 method=$2
102
e6bc976760d4 Uploaded
davidvanzessen
parents: 101
diff changeset
6 log=$3 #becomes the main html page at the end
19
c518cf0d4adb Uploaded
davidvanzessen
parents: 16
diff changeset
7 outdir=$4
102
e6bc976760d4 Uploaded
davidvanzessen
parents: 101
diff changeset
8 output="$outdir/index.html" #copied to $log location at the end
19
c518cf0d4adb Uploaded
davidvanzessen
parents: 16
diff changeset
9 title=$5
22
d84c9791d8c4 Uploaded
davidvanzessen
parents: 21
diff changeset
10 include_fr1=$6
34
d436daae9d68 Uploaded
davidvanzessen
parents: 32
diff changeset
11 functionality=$7
d436daae9d68 Uploaded
davidvanzessen
parents: 32
diff changeset
12 unique=$8
69
7acdcd5c52ef Uploaded
davidvanzessen
parents: 66
diff changeset
13 naive_output_ca=$9
7acdcd5c52ef Uploaded
davidvanzessen
parents: 66
diff changeset
14 naive_output_cg=${10}
7acdcd5c52ef Uploaded
davidvanzessen
parents: 66
diff changeset
15 naive_output_cm=${11}
7acdcd5c52ef Uploaded
davidvanzessen
parents: 66
diff changeset
16 filter_unique=${12}
7acdcd5c52ef Uploaded
davidvanzessen
parents: 66
diff changeset
17 class_filter=${13}
114
e7b550d52eb7 Uploaded
davidvanzessen
parents: 110
diff changeset
18 empty_region_filter=${14}
0
74d2bc479bee Uploaded
davidvanzessen
parents:
diff changeset
19 mkdir $outdir
74d2bc479bee Uploaded
davidvanzessen
parents:
diff changeset
20
110
ade5cf6fd2dc Uploaded
davidvanzessen
parents: 108
diff changeset
21 tar -xzf $dir/style.tar.gz -C $outdir
ade5cf6fd2dc Uploaded
davidvanzessen
parents: 108
diff changeset
22
55
0d5add1a9800 Uploaded
davidvanzessen
parents: 54
diff changeset
23 echo "---------------- read parameters ----------------"
102
e6bc976760d4 Uploaded
davidvanzessen
parents: 101
diff changeset
24 echo "---------------- read parameters ----------------<br />" > $log
55
0d5add1a9800 Uploaded
davidvanzessen
parents: 54
diff changeset
25
0d5add1a9800 Uploaded
davidvanzessen
parents: 54
diff changeset
26 echo "unpacking IMGT file"
0d5add1a9800 Uploaded
davidvanzessen
parents: 54
diff changeset
27
35
8dba36531e6e Uploaded
davidvanzessen
parents: 34
diff changeset
28 type="`file $input`"
8dba36531e6e Uploaded
davidvanzessen
parents: 34
diff changeset
29 if [[ "$type" == *"Zip archive"* ]] ; then
8dba36531e6e Uploaded
davidvanzessen
parents: 34
diff changeset
30 echo "Zip archive"
8dba36531e6e Uploaded
davidvanzessen
parents: 34
diff changeset
31 echo "unzip $input -d $PWD/files/"
8dba36531e6e Uploaded
davidvanzessen
parents: 34
diff changeset
32 unzip $input -d $PWD/files/
8dba36531e6e Uploaded
davidvanzessen
parents: 34
diff changeset
33 elif [[ "$type" == *"XZ compressed data"* ]] ; then
8dba36531e6e Uploaded
davidvanzessen
parents: 34
diff changeset
34 echo "XZ archive" #label for the branch that matched "XZ compressed data" in the file type
8dba36531e6e Uploaded
davidvanzessen
parents: 34
diff changeset
35 echo "tar -xJf $input -C $PWD/files/$title" #log the extraction command with the same target directory that is created and used just below
8dba36531e6e Uploaded
davidvanzessen
parents: 34
diff changeset
36 mkdir -p $PWD/files/$title
8dba36531e6e Uploaded
davidvanzessen
parents: 34
diff changeset
37 tar -xJf $input -C $PWD/files/$title
8dba36531e6e Uploaded
davidvanzessen
parents: 34
diff changeset
38 fi
8dba36531e6e Uploaded
davidvanzessen
parents: 34
diff changeset
39
64
0fdd90f7c654 Uploaded
davidvanzessen
parents: 63
diff changeset
40 cat `find $PWD/files/ -name "1_*"` > $PWD/summary.txt
0fdd90f7c654 Uploaded
davidvanzessen
parents: 63
diff changeset
41 cat `find $PWD/files/ -name "3_*"` > $PWD/sequences.txt
0fdd90f7c654 Uploaded
davidvanzessen
parents: 63
diff changeset
42 cat `find $PWD/files/ -name "5_*"` > $PWD/aa.txt
0fdd90f7c654 Uploaded
davidvanzessen
parents: 63
diff changeset
43 cat `find $PWD/files/ -name "6_*"` > $PWD/junction.txt
0fdd90f7c654 Uploaded
davidvanzessen
parents: 63
diff changeset
44 cat `find $PWD/files/ -name "7_*"` > $PWD/mutationanalysis.txt
0fdd90f7c654 Uploaded
davidvanzessen
parents: 63
diff changeset
45 cat `find $PWD/files/ -name "8_*"` > $PWD/mutationstats.txt
0fdd90f7c654 Uploaded
davidvanzessen
parents: 63
diff changeset
46 cat `find $PWD/files/ -name "10_*"` > $PWD/hotspots.txt
0fdd90f7c654 Uploaded
davidvanzessen
parents: 63
diff changeset
47
0fdd90f7c654 Uploaded
davidvanzessen
parents: 63
diff changeset
48 #cat $PWD/files/*/1_* > $PWD/summary.txt
0fdd90f7c654 Uploaded
davidvanzessen
parents: 63
diff changeset
49 #cat $PWD/files/*/3_* > $PWD/sequences.txt
0fdd90f7c654 Uploaded
davidvanzessen
parents: 63
diff changeset
50 #cat $PWD/files/*/5_* > $PWD/aa.txt
0fdd90f7c654 Uploaded
davidvanzessen
parents: 63
diff changeset
51 #cat $PWD/files/*/6_* > $PWD/junction.txt
0fdd90f7c654 Uploaded
davidvanzessen
parents: 63
diff changeset
52 #cat $PWD/files/*/7_* > $PWD/mutationanalysis.txt
0fdd90f7c654 Uploaded
davidvanzessen
parents: 63
diff changeset
53 #cat $PWD/files/*/8_* > $PWD/mutationstats.txt
0fdd90f7c654 Uploaded
davidvanzessen
parents: 63
diff changeset
54 #cat $PWD/files/*/10_* > $PWD/hotspots.txt
3
a0b27058dcac Uploaded
davidvanzessen
parents: 2
diff changeset
55
26
2433a1e110e1 Uploaded
davidvanzessen
parents: 25
diff changeset
56 #BLASTN_DIR="/home/galaxy/tmp/blast/ncbi-blast-2.2.30+/bin"
19
c518cf0d4adb Uploaded
davidvanzessen
parents: 16
diff changeset
57
c518cf0d4adb Uploaded
davidvanzessen
parents: 16
diff changeset
58 echo "${BLASTN_DIR}"
c518cf0d4adb Uploaded
davidvanzessen
parents: 16
diff changeset
59
89
480fdd383fdb Uploaded
davidvanzessen
parents: 85
diff changeset
60 echo "---------------- identification ($method) ----------------"
102
e6bc976760d4 Uploaded
davidvanzessen
parents: 101
diff changeset
61 echo "---------------- identification ($method) ----------------<br />" >> $log
55
0d5add1a9800 Uploaded
davidvanzessen
parents: 54
diff changeset
62
19
c518cf0d4adb Uploaded
davidvanzessen
parents: 16
diff changeset
63 if [[ "${method}" == "custom" ]] ; then
c518cf0d4adb Uploaded
davidvanzessen
parents: 16
diff changeset
64 python $dir/gene_identification.py --input $PWD/summary.txt --output $outdir/identified_genes.txt
c518cf0d4adb Uploaded
davidvanzessen
parents: 16
diff changeset
65 else
c518cf0d4adb Uploaded
davidvanzessen
parents: 16
diff changeset
66 ID_index=$(cat $PWD/summary.txt | grep -o -P ".+Sequence ID" | grep -o -P "\t" | wc -l)
c518cf0d4adb Uploaded
davidvanzessen
parents: 16
diff changeset
67 ID_index=$((ID_index+1))
c518cf0d4adb Uploaded
davidvanzessen
parents: 16
diff changeset
68 sequence_index=$(cat $PWD/summary.txt | grep -o -P ".+\tSequence" | grep -o -P "\t" | wc -l)
c518cf0d4adb Uploaded
davidvanzessen
parents: 16
diff changeset
69 sequence_index=$((sequence_index+1))
c518cf0d4adb Uploaded
davidvanzessen
parents: 16
diff changeset
70
110
ade5cf6fd2dc Uploaded
davidvanzessen
parents: 108
diff changeset
71 cat $PWD/summary.txt | tail -n+2 | cut -f ${ID_index},${sequence_index} | awk '{print ">" $1 "\n" $2}' > $PWD/sequences.tmp
ade5cf6fd2dc Uploaded
davidvanzessen
parents: 108
diff changeset
72
ade5cf6fd2dc Uploaded
davidvanzessen
parents: 108
diff changeset
73 awk 'NR % 2 == 1 { header = $0; next } $0 != "" { print header; print }' "$PWD/sequences.tmp" > "$PWD/sequences.fasta" #filter out empty sequences: sequences.tmp alternates ">ID" and sequence lines, a pair is kept only when its sequence line is non-empty
ade5cf6fd2dc Uploaded
davidvanzessen
parents: 108
diff changeset
74
ade5cf6fd2dc Uploaded
davidvanzessen
parents: 108
diff changeset
75 rm $PWD/sequences.tmp
19
c518cf0d4adb Uploaded
davidvanzessen
parents: 16
diff changeset
76
c518cf0d4adb Uploaded
davidvanzessen
parents: 16
diff changeset
77 echo -e "qseqid\tsseqid\tpident\tlength\tmismatch\tgapopen\tqstart\tqend\tsstart\tsend\tevalue\tbitscore" > $outdir/identified_genes.txt
c518cf0d4adb Uploaded
davidvanzessen
parents: 16
diff changeset
78 ${BLASTN_DIR}/blastn -task blastn -db $dir/subclass_definition.db -query $PWD/sequences.fasta -outfmt 6 >> $outdir/identified_genes.txt
c518cf0d4adb Uploaded
davidvanzessen
parents: 16
diff changeset
79 fi
c518cf0d4adb Uploaded
davidvanzessen
parents: 16
diff changeset
80
55
0d5add1a9800 Uploaded
davidvanzessen
parents: 54
diff changeset
81 echo "---------------- merge_and_filter.r ----------------"
102
e6bc976760d4 Uploaded
davidvanzessen
parents: 101
diff changeset
82 echo "---------------- merge_and_filter.r ----------------<br />" >> $log
19
c518cf0d4adb Uploaded
davidvanzessen
parents: 16
diff changeset
83
114
e7b550d52eb7 Uploaded
davidvanzessen
parents: 110
diff changeset
84 Rscript $dir/merge_and_filter.r $PWD/summary.txt $PWD/sequences.txt $PWD/mutationanalysis.txt $PWD/mutationstats.txt $PWD/hotspots.txt $outdir/identified_genes.txt $outdir/merged.txt $outdir/before_unique_filter.txt $outdir/unmatched.txt $method $functionality $unique ${filter_unique} ${class_filter} ${empty_region_filter} 2>&1
0
74d2bc479bee Uploaded
davidvanzessen
parents:
diff changeset
85
98
5ffbf40cdd4b Uploaded
davidvanzessen
parents: 95
diff changeset
86 echo "---------------- creating new IMGT zip ----------------"
102
e6bc976760d4 Uploaded
davidvanzessen
parents: 101
diff changeset
87 echo "---------------- creating new IMGT zip ----------------<br />" >> $log
95
a66eb1c5374c Uploaded
davidvanzessen
parents: 94
diff changeset
88
a66eb1c5374c Uploaded
davidvanzessen
parents: 94
diff changeset
89 mkdir $outdir/new_IMGT
a66eb1c5374c Uploaded
davidvanzessen
parents: 94
diff changeset
90
a66eb1c5374c Uploaded
davidvanzessen
parents: 94
diff changeset
91 cat `find $PWD/files/ -name "1_*"` > "$outdir/new_IMGT/1_Summary.txt"
a66eb1c5374c Uploaded
davidvanzessen
parents: 94
diff changeset
92 cat `find $PWD/files/ -name "2_*"` > "$outdir/new_IMGT/2_IMGT-gapped-nt-sequences.txt"
a66eb1c5374c Uploaded
davidvanzessen
parents: 94
diff changeset
93 cat `find $PWD/files/ -name "3_*"` > "$outdir/new_IMGT/3_Nt-sequences.txt"
a66eb1c5374c Uploaded
davidvanzessen
parents: 94
diff changeset
94 cat `find $PWD/files/ -name "4_*"` > "$outdir/new_IMGT/4_IMGT-gapped-AA-sequences.txt"
a66eb1c5374c Uploaded
davidvanzessen
parents: 94
diff changeset
95 cat `find $PWD/files/ -name "5_*"` > "$outdir/new_IMGT/5_AA-sequences.txt"
a66eb1c5374c Uploaded
davidvanzessen
parents: 94
diff changeset
96 cat `find $PWD/files/ -name "6_*"` > "$outdir/new_IMGT/6_Junction.txt"
a66eb1c5374c Uploaded
davidvanzessen
parents: 94
diff changeset
97 cat `find $PWD/files/ -name "7_*"` > "$outdir/new_IMGT/7_V-REGION-mutation-and-AA-change-table.txt"
a66eb1c5374c Uploaded
davidvanzessen
parents: 94
diff changeset
98 cat `find $PWD/files/ -name "8_*"` > "$outdir/new_IMGT/8_V-REGION-nt-mutation-statistics.txt"
a66eb1c5374c Uploaded
davidvanzessen
parents: 94
diff changeset
99 cat `find $PWD/files/ -name "9_*"` > "$outdir/new_IMGT/9_V-REGION-AA-change-statistics.txt"
a66eb1c5374c Uploaded
davidvanzessen
parents: 94
diff changeset
100 cat `find $PWD/files/ -name "10_*"` > "$outdir/new_IMGT/10_V-REGION-mutation-hotspots.txt"
a66eb1c5374c Uploaded
davidvanzessen
parents: 94
diff changeset
101
99
86206431cbb0 Uploaded
davidvanzessen
parents: 98
diff changeset
102 mkdir $outdir/new_IMGT_ca
86206431cbb0 Uploaded
davidvanzessen
parents: 98
diff changeset
103 cp $outdir/new_IMGT/* $outdir/new_IMGT_ca
86206431cbb0 Uploaded
davidvanzessen
parents: 98
diff changeset
104
116
4984c2a06c43 Uploaded
davidvanzessen
parents: 114
diff changeset
105 mkdir $outdir/new_IMGT_ca1
4984c2a06c43 Uploaded
davidvanzessen
parents: 114
diff changeset
106 cp $outdir/new_IMGT/* $outdir/new_IMGT_ca1
4984c2a06c43 Uploaded
davidvanzessen
parents: 114
diff changeset
107
4984c2a06c43 Uploaded
davidvanzessen
parents: 114
diff changeset
108 mkdir $outdir/new_IMGT_ca2
4984c2a06c43 Uploaded
davidvanzessen
parents: 114
diff changeset
109 cp $outdir/new_IMGT/* $outdir/new_IMGT_ca2
4984c2a06c43 Uploaded
davidvanzessen
parents: 114
diff changeset
110
99
86206431cbb0 Uploaded
davidvanzessen
parents: 98
diff changeset
111 mkdir $outdir/new_IMGT_cg
86206431cbb0 Uploaded
davidvanzessen
parents: 98
diff changeset
112 cp $outdir/new_IMGT/* $outdir/new_IMGT_cg
86206431cbb0 Uploaded
davidvanzessen
parents: 98
diff changeset
113
116
4984c2a06c43 Uploaded
davidvanzessen
parents: 114
diff changeset
114 mkdir $outdir/new_IMGT_cg1
4984c2a06c43 Uploaded
davidvanzessen
parents: 114
diff changeset
115 cp $outdir/new_IMGT/* $outdir/new_IMGT_cg1
4984c2a06c43 Uploaded
davidvanzessen
parents: 114
diff changeset
116
4984c2a06c43 Uploaded
davidvanzessen
parents: 114
diff changeset
117 mkdir $outdir/new_IMGT_cg2
4984c2a06c43 Uploaded
davidvanzessen
parents: 114
diff changeset
118 cp $outdir/new_IMGT/* $outdir/new_IMGT_cg2
4984c2a06c43 Uploaded
davidvanzessen
parents: 114
diff changeset
119
4984c2a06c43 Uploaded
davidvanzessen
parents: 114
diff changeset
120 mkdir $outdir/new_IMGT_cg3
4984c2a06c43 Uploaded
davidvanzessen
parents: 114
diff changeset
121 cp $outdir/new_IMGT/* $outdir/new_IMGT_cg3
4984c2a06c43 Uploaded
davidvanzessen
parents: 114
diff changeset
122
4984c2a06c43 Uploaded
davidvanzessen
parents: 114
diff changeset
123 mkdir $outdir/new_IMGT_cg4
4984c2a06c43 Uploaded
davidvanzessen
parents: 114
diff changeset
124 cp $outdir/new_IMGT/* $outdir/new_IMGT_cg4
4984c2a06c43 Uploaded
davidvanzessen
parents: 114
diff changeset
125
99
86206431cbb0 Uploaded
davidvanzessen
parents: 98
diff changeset
126 mkdir $outdir/new_IMGT_cm
86206431cbb0 Uploaded
davidvanzessen
parents: 98
diff changeset
127 cp $outdir/new_IMGT/* $outdir/new_IMGT_cm
86206431cbb0 Uploaded
davidvanzessen
parents: 98
diff changeset
128
114
e7b550d52eb7 Uploaded
davidvanzessen
parents: 110
diff changeset
129 Rscript $dir/new_imgt.r $outdir/new_IMGT/ $outdir/merged.txt "-" 2>&1
116
4984c2a06c43 Uploaded
davidvanzessen
parents: 114
diff changeset
130
114
e7b550d52eb7 Uploaded
davidvanzessen
parents: 110
diff changeset
131 Rscript $dir/new_imgt.r $outdir/new_IMGT_ca/ $outdir/merged.txt "ca" 2>&1
116
4984c2a06c43 Uploaded
davidvanzessen
parents: 114
diff changeset
132 Rscript $dir/new_imgt.r $outdir/new_IMGT_ca1/ $outdir/merged.txt "ca1" 2>&1
4984c2a06c43 Uploaded
davidvanzessen
parents: 114
diff changeset
133 Rscript $dir/new_imgt.r $outdir/new_IMGT_ca2/ $outdir/merged.txt "ca2" 2>&1
4984c2a06c43 Uploaded
davidvanzessen
parents: 114
diff changeset
134
114
e7b550d52eb7 Uploaded
davidvanzessen
parents: 110
diff changeset
135 Rscript $dir/new_imgt.r $outdir/new_IMGT_cg/ $outdir/merged.txt "cg" 2>&1
116
4984c2a06c43 Uploaded
davidvanzessen
parents: 114
diff changeset
136 Rscript $dir/new_imgt.r $outdir/new_IMGT_cg1/ $outdir/merged.txt "cg1" 2>&1
4984c2a06c43 Uploaded
davidvanzessen
parents: 114
diff changeset
137 Rscript $dir/new_imgt.r $outdir/new_IMGT_cg2/ $outdir/merged.txt "cg2" 2>&1
4984c2a06c43 Uploaded
davidvanzessen
parents: 114
diff changeset
138 Rscript $dir/new_imgt.r $outdir/new_IMGT_cg3/ $outdir/merged.txt "cg3" 2>&1
4984c2a06c43 Uploaded
davidvanzessen
parents: 114
diff changeset
139 Rscript $dir/new_imgt.r $outdir/new_IMGT_cg4/ $outdir/merged.txt "cg4" 2>&1
4984c2a06c43 Uploaded
davidvanzessen
parents: 114
diff changeset
140
114
e7b550d52eb7 Uploaded
davidvanzessen
parents: 110
diff changeset
141 Rscript $dir/new_imgt.r $outdir/new_IMGT_cm/ $outdir/merged.txt "cm" 2>&1
95
a66eb1c5374c Uploaded
davidvanzessen
parents: 94
diff changeset
142
a66eb1c5374c Uploaded
davidvanzessen
parents: 94
diff changeset
143
a66eb1c5374c Uploaded
davidvanzessen
parents: 94
diff changeset
144 tmp="$PWD"
a66eb1c5374c Uploaded
davidvanzessen
parents: 94
diff changeset
145 cd $outdir/new_IMGT/ #tar weirdness...
a66eb1c5374c Uploaded
davidvanzessen
parents: 94
diff changeset
146 tar -cJf ../new_IMGT.txz *
a66eb1c5374c Uploaded
davidvanzessen
parents: 94
diff changeset
147
99
86206431cbb0 Uploaded
davidvanzessen
parents: 98
diff changeset
148 cd $outdir/new_IMGT_ca/
86206431cbb0 Uploaded
davidvanzessen
parents: 98
diff changeset
149 tar -cJf ../new_IMGT_ca.txz *
86206431cbb0 Uploaded
davidvanzessen
parents: 98
diff changeset
150
86206431cbb0 Uploaded
davidvanzessen
parents: 98
diff changeset
151 cd $outdir/new_IMGT_cg/
86206431cbb0 Uploaded
davidvanzessen
parents: 98
diff changeset
152 tar -cJf ../new_IMGT_cg.txz *
86206431cbb0 Uploaded
davidvanzessen
parents: 98
diff changeset
153
86206431cbb0 Uploaded
davidvanzessen
parents: 98
diff changeset
154 cd $outdir/new_IMGT_cm/
86206431cbb0 Uploaded
davidvanzessen
parents: 98
diff changeset
155 tar -cJf ../new_IMGT_cm.txz *
86206431cbb0 Uploaded
davidvanzessen
parents: 98
diff changeset
156
95
a66eb1c5374c Uploaded
davidvanzessen
parents: 94
diff changeset
157 cd $tmp
a66eb1c5374c Uploaded
davidvanzessen
parents: 94
diff changeset
158
55
0d5add1a9800 Uploaded
davidvanzessen
parents: 54
diff changeset
159 echo "---------------- mutation_analysis.r ----------------"
102
e6bc976760d4 Uploaded
davidvanzessen
parents: 101
diff changeset
160 echo "---------------- mutation_analysis.r ----------------<br />" >> $log
55
0d5add1a9800 Uploaded
davidvanzessen
parents: 54
diff changeset
161
82
564c4f6da203 Uploaded
davidvanzessen
parents: 81
diff changeset
162 classes="ca,ca1,ca2,cg,cg1,cg2,cg3,cg4,cm,unmatched"
4
069419cccba4 Uploaded
davidvanzessen
parents: 3
diff changeset
163 echo "R mutation analysis"
82
564c4f6da203 Uploaded
davidvanzessen
parents: 81
diff changeset
164 Rscript $dir/mutation_analysis.r $outdir/merged.txt $classes $outdir ${include_fr1} 2>&1
53
7290a88ea202 Uploaded
davidvanzessen
parents: 52
diff changeset
165
55
0d5add1a9800 Uploaded
davidvanzessen
parents: 54
diff changeset
166
0d5add1a9800 Uploaded
davidvanzessen
parents: 54
diff changeset
167 echo "---------------- mutation_analysis.py ----------------"
102
e6bc976760d4 Uploaded
davidvanzessen
parents: 101
diff changeset
168 echo "---------------- mutation_analysis.py ----------------<br />" >> $log
55
0d5add1a9800 Uploaded
davidvanzessen
parents: 54
diff changeset
169
82
564c4f6da203 Uploaded
davidvanzessen
parents: 81
diff changeset
170 python $dir/mutation_analysis.py --input $outdir/merged.txt --genes $classes --includefr1 "${include_fr1}" --output $outdir/hotspot_analysis.txt
55
0d5add1a9800 Uploaded
davidvanzessen
parents: 54
diff changeset
171
0d5add1a9800 Uploaded
davidvanzessen
parents: 54
diff changeset
172 echo "---------------- aa_histogram.r ----------------"
105
e4957ad476a2 Uploaded
davidvanzessen
parents: 104
diff changeset
173 echo "---------------- aa_histogram.r ----------------<br />" >> $log
55
0d5add1a9800 Uploaded
davidvanzessen
parents: 54
diff changeset
174
107
01c9993865af Uploaded
davidvanzessen
parents: 105
diff changeset
175 Rscript $dir/aa_histogram.r $outdir/aa_id_mutations.txt $outdir/absent_aa_id.txt "ca,cg,cm" $outdir/ 2>&1
110
ade5cf6fd2dc Uploaded
davidvanzessen
parents: 108
diff changeset
176 if [ -e "$outdir/aa_histogram_.png" ]; then
ade5cf6fd2dc Uploaded
davidvanzessen
parents: 108
diff changeset
177 mv $outdir/aa_histogram_.png $outdir/aa_histogram.png
ade5cf6fd2dc Uploaded
davidvanzessen
parents: 108
diff changeset
178 mv $outdir/aa_histogram_.txt $outdir/aa_histogram.txt
ade5cf6fd2dc Uploaded
davidvanzessen
parents: 108
diff changeset
179 fi
4
069419cccba4 Uploaded
davidvanzessen
parents: 3
diff changeset
180
0
74d2bc479bee Uploaded
davidvanzessen
parents:
diff changeset
181 genes=(ca ca1 ca2 cg cg1 cg2 cg3 cg4 cm)
74d2bc479bee Uploaded
davidvanzessen
parents:
diff changeset
182
53
7290a88ea202 Uploaded
davidvanzessen
parents: 52
diff changeset
183 funcs=(sum mean median)
110
ade5cf6fd2dc Uploaded
davidvanzessen
parents: 108
diff changeset
184 funcs=(sum)
0
74d2bc479bee Uploaded
davidvanzessen
parents:
diff changeset
185
82
564c4f6da203 Uploaded
davidvanzessen
parents: 81
diff changeset
186 echo "---------------- sequence_overview.r ----------------"
102
e6bc976760d4 Uploaded
davidvanzessen
parents: 101
diff changeset
187 echo "---------------- sequence_overview.r ----------------<br />" >> $log
82
564c4f6da203 Uploaded
davidvanzessen
parents: 81
diff changeset
188
564c4f6da203 Uploaded
davidvanzessen
parents: 81
diff changeset
189 mkdir $outdir/sequence_overview
564c4f6da203 Uploaded
davidvanzessen
parents: 81
diff changeset
190
90
f0e8dac22c6e Uploaded
davidvanzessen
parents: 89
diff changeset
191 #Rscript $dir/sequence_overview.r $outdir/identified_genes.txt $PWD/sequences.txt $outdir/merged.txt $outdir/sequence_overview $classes $outdir/hotspot_analysis_sum.txt 2>&1
100
ff5be711382b Uploaded
davidvanzessen
parents: 99
diff changeset
192 Rscript $dir/sequence_overview.r $outdir/before_unique_filter.txt $outdir/merged.txt $outdir/sequence_overview $classes $outdir/hotspot_analysis_sum.txt 2>&1
82
564c4f6da203 Uploaded
davidvanzessen
parents: 81
diff changeset
193
564c4f6da203 Uploaded
davidvanzessen
parents: 81
diff changeset
194 echo "<table border='1'>" > $outdir/base_overview.html
564c4f6da203 Uploaded
davidvanzessen
parents: 81
diff changeset
195
92
b869a126e2c4 Uploaded
davidvanzessen
parents: 90
diff changeset
196 while IFS=$'\t' read ID class seq A C G T
82
564c4f6da203 Uploaded
davidvanzessen
parents: 81
diff changeset
197 do
85
07f7da724a77 Uploaded
davidvanzessen
parents: 84
diff changeset
198 echo "<tr><td>$ID</td><td>$seq</td><td>$class</td><td>$A</td><td>$C</td><td>$G</td><td>$T</td></tr>" >> $outdir/base_overview.html
82
564c4f6da203 Uploaded
davidvanzessen
parents: 81
diff changeset
199 done < $outdir/sequence_overview/ntoverview.txt
564c4f6da203 Uploaded
davidvanzessen
parents: 81
diff changeset
200
62
4262e880472d Uploaded
davidvanzessen
parents: 58
diff changeset
201 echo "<html><center><h1>$title</h1></center>" > $output
110
ade5cf6fd2dc Uploaded
davidvanzessen
parents: 108
diff changeset
202 echo "<script type='text/javascript' src='jquery-1.11.0.min.js'></script>" >> $output
ade5cf6fd2dc Uploaded
davidvanzessen
parents: 108
diff changeset
203 echo "<script type='text/javascript' src='tabber.js'></script>" >> $output
ade5cf6fd2dc Uploaded
davidvanzessen
parents: 108
diff changeset
204 echo "<script type='text/javascript' src='script.js'></script>" >> $output
ade5cf6fd2dc Uploaded
davidvanzessen
parents: 108
diff changeset
205 echo "<link rel='stylesheet' type='text/css' href='style.css'>" >> $output
62
4262e880472d Uploaded
davidvanzessen
parents: 58
diff changeset
206
4262e880472d Uploaded
davidvanzessen
parents: 58
diff changeset
207 #display the matched/unmatched for clarity
4262e880472d Uploaded
davidvanzessen
parents: 58
diff changeset
208
98
5ffbf40cdd4b Uploaded
davidvanzessen
parents: 95
diff changeset
209 matched_count="`cat $outdir/merged.txt | grep -v 'unmatched' | tail -n +2 | wc -l`"
62
4262e880472d Uploaded
davidvanzessen
parents: 58
diff changeset
210 unmatched_count="`cat $outdir/unmatched.txt | tail -n +2 | wc -l`"
4262e880472d Uploaded
davidvanzessen
parents: 58
diff changeset
211 total_count=$((matched_count + unmatched_count))
4262e880472d Uploaded
davidvanzessen
parents: 58
diff changeset
212 perc_count=$((unmatched_count / total_count * 100))
4262e880472d Uploaded
davidvanzessen
parents: 58
diff changeset
213 perc_count=`bc -l <<< "scale=2; ${unmatched_count} / ${total_count} * 100"`
4262e880472d Uploaded
davidvanzessen
parents: 58
diff changeset
214 perc_count=`bc -l <<< "scale=2; (${unmatched_count} / ${total_count} * 100 ) / 1"`
4262e880472d Uploaded
davidvanzessen
parents: 58
diff changeset
215
4262e880472d Uploaded
davidvanzessen
parents: 58
diff changeset
216 echo "<center><h2>Total: ${total_count}</h2></center>" >> $output
4262e880472d Uploaded
davidvanzessen
parents: 58
diff changeset
217 echo "<center><h2>Matched: ${matched_count} Unmatched: ${unmatched_count}</h2></center>" >> $output
4262e880472d Uploaded
davidvanzessen
parents: 58
diff changeset
218 echo "<center><h2>Percentage unmatched: ${perc_count}</h2></center>" >> $output
4262e880472d Uploaded
davidvanzessen
parents: 58
diff changeset
219
55
0d5add1a9800 Uploaded
davidvanzessen
parents: 54
diff changeset
220 echo "---------------- main tables ----------------"
102
e6bc976760d4 Uploaded
davidvanzessen
parents: 101
diff changeset
221 echo "---------------- main tables ----------------<br />" >> $log
110
ade5cf6fd2dc Uploaded
davidvanzessen
parents: 108
diff changeset
222
ade5cf6fd2dc Uploaded
davidvanzessen
parents: 108
diff changeset
223 echo "<div class='tabber'>" >> $output
ade5cf6fd2dc Uploaded
davidvanzessen
parents: 108
diff changeset
224 echo "<div class='tabbertab' title='SHM Overview'>" >> $output
ade5cf6fd2dc Uploaded
davidvanzessen
parents: 108
diff changeset
225
53
7290a88ea202 Uploaded
davidvanzessen
parents: 52
diff changeset
226 for func in ${funcs[@]}
4
069419cccba4 Uploaded
davidvanzessen
parents: 3
diff changeset
227 do
55
0d5add1a9800 Uploaded
davidvanzessen
parents: 54
diff changeset
228
0d5add1a9800 Uploaded
davidvanzessen
parents: 54
diff changeset
229 echo "---------------- $func table ----------------"
102
e6bc976760d4 Uploaded
davidvanzessen
parents: 101
diff changeset
230 echo "---------------- $func table ----------------<br />" >> $log
55
0d5add1a9800 Uploaded
davidvanzessen
parents: 54
diff changeset
231
94
e39176ccddc8 Uploaded
davidvanzessen
parents: 92
diff changeset
232 cat $outdir/mutations_${func}.txt $outdir/hotspot_analysis_${func}.txt > $outdir/data_${func}.txt
53
7290a88ea202 Uploaded
davidvanzessen
parents: 52
diff changeset
233
98
5ffbf40cdd4b Uploaded
davidvanzessen
parents: 95
diff changeset
234 echo "<table border='1' width='100%'><caption><h3><a href='data_${func}.txt'>${func} table</a></h3></caption>" >> $output
58
8bb4d6009e08 Uploaded
davidvanzessen
parents: 55
diff changeset
235 echo "<tr><th>info</th>" >> $output
53
7290a88ea202 Uploaded
davidvanzessen
parents: 52
diff changeset
236 for gene in ${genes[@]}
7290a88ea202 Uploaded
davidvanzessen
parents: 52
diff changeset
237 do
7290a88ea202 Uploaded
davidvanzessen
parents: 52
diff changeset
238 tmp=`cat $outdir/${gene}_${func}_n.txt`
7290a88ea202 Uploaded
davidvanzessen
parents: 52
diff changeset
239 echo "<th><a href='matched_${gene}_${func}.txt'>${gene} (N = $tmp)</a></th>" >> $output
7290a88ea202 Uploaded
davidvanzessen
parents: 52
diff changeset
240 done
78
b523ce95d857 Uploaded
davidvanzessen
parents: 77
diff changeset
241
114
e7b550d52eb7 Uploaded
davidvanzessen
parents: 110
diff changeset
242 tmp=`cat $outdir/all_${func}_n.txt`
e7b550d52eb7 Uploaded
davidvanzessen
parents: 110
diff changeset
243 echo "<th><a href='matched_all_${func}.txt'>all (N = $tmp)</a></th>" >> $output
78
b523ce95d857 Uploaded
davidvanzessen
parents: 77
diff changeset
244 tmp=`cat $outdir/unmatched_${func}_n.txt`
79
0513b46178c4 Uploaded
davidvanzessen
parents: 78
diff changeset
245 echo "<th><a href='unmatched.txt'>unmatched (N = ${unmatched_count})</a></th>" >> $output
4
069419cccba4 Uploaded
davidvanzessen
parents: 3
diff changeset
246
78
b523ce95d857 Uploaded
davidvanzessen
parents: 77
diff changeset
247 while IFS=, read name cax cay caz ca1x ca1y ca1z ca2x ca2y ca2z cgx cgy cgz cg1x cg1y cg1z cg2x cg2y cg2z cg3x cg3y cg3z cg4x cg4y cg4z cmx cmy cmz unx uny unz allx ally allz
53
7290a88ea202 Uploaded
davidvanzessen
parents: 52
diff changeset
248 do
7290a88ea202 Uploaded
davidvanzessen
parents: 52
diff changeset
249 if [ "$name" == "FR S/R (ratio)" ] || [ "$name" == "CDR S/R (ratio)" ] ; then #meh
7290a88ea202 Uploaded
davidvanzessen
parents: 52
diff changeset
250 echo "<tr><td>$name</td><td>${cax}/${cay} (${caz})</td><td>${ca1x}/${ca1y} (${ca1z})</td><td>${ca2x}/${ca2y} (${ca2z})</td><td>${cgx}/${cgy} (${cgz})</td><td>${cg1x}/${cg1y} (${cg1z})</td><td>${cg2x}/${cg2y} (${cg2z})</td><td>${cg3x}/${cg3y} (${cg3z})</td><td>${cg4x}/${cg4y} (${cg4z})</td><td>${cmx}/${cmy} (${cmz})</td><td>${allx}/${ally} (${allz})</td></tr>" >> $output
7290a88ea202 Uploaded
davidvanzessen
parents: 52
diff changeset
251 else
114
e7b550d52eb7 Uploaded
davidvanzessen
parents: 110
diff changeset
252 echo "<tr><td>$name</td><td>${cax}/${cay} (${caz}%)</td><td>${ca1x}/${ca1y} (${ca1z}%)</td><td>${ca2x}/${ca2y} (${ca2z}%)</td><td>${cgx}/${cgy} (${cgz}%)</td><td>${cg1x}/${cg1y} (${cg1z}%)</td><td>${cg2x}/${cg2y} (${cg2z}%)</td><td>${cg3x}/${cg3y} (${cg3z}%)</td><td>${cg4x}/${cg4y} (${cg4z}%)</td><td>${cmx}/${cmy} (${cmz}%)</td><td>${allx}/${ally} (${allz}%)</td><td>${unx}/${uny} (${unz}%)</td></tr>" >> $output
53
7290a88ea202 Uploaded
davidvanzessen
parents: 52
diff changeset
253 fi
94
e39176ccddc8 Uploaded
davidvanzessen
parents: 92
diff changeset
254 done < $outdir/data_${func}.txt
e39176ccddc8 Uploaded
davidvanzessen
parents: 92
diff changeset
255 echo "</table>" >> $output
e39176ccddc8 Uploaded
davidvanzessen
parents: 92
diff changeset
256 #echo "<a href='data_${func}.txt'>Download data</a>" >> $output
53
7290a88ea202 Uploaded
davidvanzessen
parents: 52
diff changeset
257 done
7290a88ea202 Uploaded
davidvanzessen
parents: 52
diff changeset
258
110
ade5cf6fd2dc Uploaded
davidvanzessen
parents: 108
diff changeset
259 echo "</div>" >> $output #SHM overview tab end
ade5cf6fd2dc Uploaded
davidvanzessen
parents: 108
diff changeset
260
ade5cf6fd2dc Uploaded
davidvanzessen
parents: 108
diff changeset
261 echo "---------------- images ----------------"
ade5cf6fd2dc Uploaded
davidvanzessen
parents: 108
diff changeset
262 echo "---------------- images ----------------<br />" >> $log
ade5cf6fd2dc Uploaded
davidvanzessen
parents: 108
diff changeset
263
ade5cf6fd2dc Uploaded
davidvanzessen
parents: 108
diff changeset
264 echo "<div class='tabbertab' title='SHM Frequency'>" >> $output
ade5cf6fd2dc Uploaded
davidvanzessen
parents: 108
diff changeset
265
ade5cf6fd2dc Uploaded
davidvanzessen
parents: 108
diff changeset
266 if [ -a $outdir/scatter.png ]
ade5cf6fd2dc Uploaded
davidvanzessen
parents: 108
diff changeset
267 then
ade5cf6fd2dc Uploaded
davidvanzessen
parents: 108
diff changeset
268 echo "<img src='scatter.png'/><br />" >> $output
ade5cf6fd2dc Uploaded
davidvanzessen
parents: 108
diff changeset
269 echo "<a href='scatter.txt'>download data</a><br />" >> $output
ade5cf6fd2dc Uploaded
davidvanzessen
parents: 108
diff changeset
270 fi
ade5cf6fd2dc Uploaded
davidvanzessen
parents: 108
diff changeset
271 if [ -a $outdir/frequency_ranges.png ]
ade5cf6fd2dc Uploaded
davidvanzessen
parents: 108
diff changeset
272 then
ade5cf6fd2dc Uploaded
davidvanzessen
parents: 108
diff changeset
273 echo "<img src='frequency_ranges.png'/><br />" >> $output
ade5cf6fd2dc Uploaded
davidvanzessen
parents: 108
diff changeset
274 echo "<a href='frequency_ranges_classes.txt'>download class data</a><br />" >> $output
ade5cf6fd2dc Uploaded
davidvanzessen
parents: 108
diff changeset
275 echo "<a href='frequency_ranges_subclasses.txt'>download subclass data</a><br />" >> $output
ade5cf6fd2dc Uploaded
davidvanzessen
parents: 108
diff changeset
276 fi
ade5cf6fd2dc Uploaded
davidvanzessen
parents: 108
diff changeset
277
ade5cf6fd2dc Uploaded
davidvanzessen
parents: 108
diff changeset
278 echo "</div>" >> $output #SHM frequency tab end
ade5cf6fd2dc Uploaded
davidvanzessen
parents: 108
diff changeset
279
ade5cf6fd2dc Uploaded
davidvanzessen
parents: 108
diff changeset
# ---- "Transition tables" tab ----
# Layout: an outer borderless table with one row per entry of `genes`,
# followed by a final "All" row.

#######################################
# Append one outer-table row to $output: heading, heatmap image, stacked
# image, and the comma-separated sum file rendered as a nested HTML table.
# Globals:   outdir (read), output (appended to)
# Arguments: $1 - heading text shown in the first cell
#            $2 - key used in the file names transitions_heatmap_<key>.png,
#                 transitions_stacked_<key>.png and transitions_<key>_sum.txt
#######################################
write_transition_row() {
	local heading=$1 key=$2
	local from a c g t
	{
		echo "<tr>"
		echo "<td><h1>${heading}</h1></td>"
		echo "<td><img src='transitions_heatmap_${key}.png' /></td>"
		echo "<td><img src='transitions_stacked_${key}.png' /></td>"
		echo "<td><table border='1'>"
		# Five comma-separated columns per line; -r keeps backslashes literal.
		while IFS=, read -r from a c g t; do
			echo "<tr><td>$from</td><td>$a</td><td>$c</td><td>$g</td><td>$t</td></tr>"
		done < "$outdir/transitions_${key}_sum.txt"
		echo "</table></td>"
		echo "</tr>"
	} >> "$output"
}

echo "<div class='tabbertab' title='Transition tables'>" >> "$output"

echo "<table border='0'>" >> "$output"

# `genes` is defined earlier in the script, outside this section. The
# expansion is left unquoted on purpose so iteration behaves exactly as
# before regardless of how that variable was populated.
# shellcheck disable=SC2068
for gene in ${genes[@]}; do
	write_transition_row "${gene}" "${gene}"
done

# Combined row: same layout, fixed heading and the "all" file-name key.
write_transition_row "All" "all"

echo "</table>" >> "$output"

echo "</div>" >> "$output" #transition tables tab end
ade5cf6fd2dc Uploaded
davidvanzessen
parents: 108
diff changeset
316
ade5cf6fd2dc Uploaded
davidvanzessen
parents: 108
diff changeset
# ---- "Antigen Selection" tab ----
echo "<div class='tabbertab' title='Antigen Selection'>" >> "$output"

# The presence of the overall histogram gates all four histogram/link pairs
# (overall, ca, cg, cm), exactly as before; the per-class images are not
# checked individually.
if [[ -e "$outdir/aa_histogram.png" ]]; then
	for aa_suffix in "" _ca _cg _cm; do
		echo "<img src='aa_histogram${aa_suffix}.png'/><br />"
		echo "<a href='aa_histogram${aa_suffix}.txt'>download data</a><br />"
	done >> "$output"
fi

# The baseline PDFs are embedded unconditionally.
for bl_class in ca cg cm; do
	echo "<embed src='baseline_${bl_class}.pdf' width='700px' height='1000px'>"
done >> "$output"

echo "</div>" >> "$output" #antigen selection tab end
ade5cf6fd2dc Uploaded
davidvanzessen
parents: 108
diff changeset
336
ade5cf6fd2dc Uploaded
davidvanzessen
parents: 108
diff changeset
# ---- "CSR" tab ----
echo "<div class='tabbertab' title='CSR'>" >> "$output"

# For ca and cg: show the plot and its data link only when the image exists
# in $outdir. [[ -e ]] replaces the ambiguous unary `[ -a ]`.
for csr_class in ca cg; do
	if [[ -e "$outdir/${csr_class}.png" ]]; then
		echo "<img src='${csr_class}.png'/><br />"
		echo "<a href='${csr_class}.txt'>download data</a><br />"
	fi
done >> "$output"

echo "</div>" >> "$output" #CSR tab end
ade5cf6fd2dc Uploaded
davidvanzessen
parents: 108
diff changeset
351
ade5cf6fd2dc Uploaded
davidvanzessen
parents: 108
diff changeset
# ---- "Downloads" tab ----
# A two-column table: description on the left, "Download" link on the right.

#######################################
# Print one row of the downloads table to stdout.
# Arguments: $1 - description cell content (may contain HTML)
#            $2 - link target, relative to the report page
#######################################
download_row() {
	echo "<tr><td>$1</td><td><a href='$2'>Download</a></td></tr>"
}

echo "<div class='tabbertab' title='Downloads'>" >> "$output"

{
	echo "<table border='1' width='700px'>"
	download_row "The complete dataset" "merged.txt"
	download_row "The alignment info on the unmatched sequences" "unmatched.txt"
	download_row "Motif data per sequence ID" "motif_per_seq.txt"
	download_row "Mutation data per sequence ID" "mutation_by_id.txt"
	download_row "AA mutation data per sequence ID" "aa_id_mutations.txt"
	download_row "Absent AA location data per sequence ID" "absent_aa_id.txt"
	download_row "CDR1+FR2+CDR2+FR3+CDR3 sequences that show up more than once" "sequence_overview/index.html"
	download_row "Base count for every sequence" "base_overview.html"
	# Fixed: the anchor used to be written as <href a='...'>, which is not a
	# valid element, so the URL never rendered as a link.
	download_row "Baseline PDF (<a href='http://selection.med.yale.edu/baseline/'>http://selection.med.yale.edu/baseline/</a>)" "baseline.pdf"
	download_row "Baseline data" "baseline.txt"
	for dl_class in ca cg cm; do
		download_row "Baseline ${dl_class} PDF" "baseline_${dl_class}.pdf"
		download_row "Baseline ${dl_class} data" "baseline_${dl_class}.txt"
	done
	#echo "<tr><td></td><td><a href='IgAT.zip'>IgAT zip</a></td></tr>" >> $output
	#echo "<tr><td></td><td><a href='IgAT_ca.zip'>IgAT ca zip</a></td></tr>" >> $output
	#echo "<tr><td></td><td><a href='IgAT_cg.zip'>IgAT cg zip</a></td></tr>" >> $output
	#echo "<tr><td></td><td><a href='IgAT_cm.zip'>IgAT cm zip</a></td></tr>" >> $output
	# The empty first entry is the combined archive (new_IMGT.txz); every
	# other entry maps to new_IMGT_<class>.txz.
	for dl_class in "" ca ca1 ca2 cg cg1 cg2 cg3 cg4 cm; do
		download_row "An IMGT archive with just the matched and filtered ${dl_class:+${dl_class} }sequences" "new_IMGT${dl_class:+_${dl_class}}.txz"
	done
	echo "</table>"
} >> "$output"

echo "</div>" >> "$output" #downloads tab end
55
0d5add1a9800 Uploaded
davidvanzessen
parents: 54
diff changeset
388
110
ade5cf6fd2dc Uploaded
davidvanzessen
parents: 108
diff changeset
# Close the tab container and the document. The redirect target is quoted so
# a report path containing whitespace is not split.
echo "</div>" >> "$output" #tabs end

echo "</html>" >> "$output"
2
2f4298673519 Uploaded
davidvanzessen
parents: 1
diff changeset
392
95
a66eb1c5374c Uploaded
davidvanzessen
parents: 94
diff changeset
# ---- baseline ----
# Runs $dir/baseline/wrapper.sh once for the combined data set and once each
# for ca, cg and cm. Each run gets its own directory under $outdir/baseline
# and executes from inside it.
echo "---------------- baseline ----------------"
echo "---------------- baseline ----------------<br />" >> "$log"

mkdir -p "$outdir/baseline"

#######################################
# Run the baseline wrapper for one data set, or write a placeholder text
# file when the data set's summary has no more than one line.
# Globals:   outdir, dir (read)
# Arguments: $1 - run id; names the work directory and is passed to the wrapper
#            $2 - file-name suffix ("" for the combined set, else "_<class>")
#            $3 - text written to baseline<suffix>.txt when nothing is run
#######################################
run_baseline() {
	local id=$1 suffix=$2 empty_msg=$3
	local workdir="$outdir/baseline/$id"

	mkdir -p "$workdir"
	# A missing summary file makes wc print nothing, which compares as 0 and
	# therefore takes the placeholder branch.
	if [[ $(wc -l < "$outdir/new_IMGT${suffix}/1_Summary.txt") -gt 1 ]]; then
		# Subshell: the directory change cannot leak into later steps, and a
		# failed cd skips the run instead of executing it somewhere else.
		(
			cd "$workdir" || { echo "cannot cd to $workdir" >&2; exit 1; }
			bash "$dir/baseline/wrapper.sh" 1 1 1 1 0 0 "25:26:38:55:65:104:-" "$outdir/new_IMGT${suffix}.txz" "$id" "$dir/baseline/IMGT-reference-seqs-IGHV-2015-11-05.fa" "$outdir/baseline${suffix}.pdf" "Sequence.ID" "$outdir/baseline${suffix}.txt"
		)
	else
		echo "$empty_msg" > "$outdir/baseline${suffix}.txt"
	fi
}

run_baseline "ca_cg_cm" "" "No sequences"
run_baseline "ca" "_ca" "No ca sequences"
run_baseline "cg" "_cg" "No cg sequences"
run_baseline "cm" "_cm" "No cm sequences"
3cffb8a38bb1 Uploaded
davidvanzessen
parents: 100
diff changeset
433
82
564c4f6da203 Uploaded
davidvanzessen
parents: 81
diff changeset
# ---- naive output ----
# Copies the per-class IMGT archives to the destinations given by
# naive_output_ca / naive_output_cg / naive_output_cm.
echo "---------------- naive_output.r ----------------"
echo "---------------- naive_output.r ----------------<br />" >> "$log"

#######################################
# Copy one archive unless its destination is empty or the literal "None".
# Arguments: $1 - source archive
#            $2 - destination path
#######################################
copy_naive_archive() {
	local src=$1 dest=$2
	[[ -n "$dest" && "$dest" != "None" ]] || return 0
	cp -- "$src" "$dest"
}

# NOTE(review): `naive_output` is not among the positional arguments assigned
# at the top of the script. If it is never set, this guard is always true, so
# each destination is also checked individually in copy_naive_archive —
# confirm whether the outer guard is still needed.
if [[ "$naive_output" != "None" ]]; then
	#echo "---------------- imgt_loader.r ----------------"
	#echo "---------------- imgt_loader.r ----------------<br />" >> $log
	#python $dir/imgt_loader.py --summ $PWD/summary.txt --aa $PWD/aa.txt --junction $PWD/junction.txt --output $naive_output
	#Rscript --verbose $dir/imgt_loader.r $PWD/summary.txt $PWD/aa.txt $PWD/junction.txt $outdir/loader_output.txt 2>&1

	#echo "---------------- naive_output.r ----------------"
	#echo "---------------- naive_output.r ----------------<br />" >> $log
	#Rscript $dir/naive_output.r $outdir/loader_output.txt $outdir/merged.txt ${naive_output_ca} ${naive_output_cg} ${naive_output_cm} $outdir/ntoverview.txt $outdir/ntsum.txt 2>&1

	copy_naive_archive "$outdir/new_IMGT_ca.txz" "${naive_output_ca}"
	copy_naive_archive "$outdir/new_IMGT_cg.txz" "${naive_output_cg}"
	copy_naive_archive "$outdir/new_IMGT_cm.txz" "${naive_output_cm}"
fi
099cc1254f74 Uploaded
davidvanzessen
parents: 43
diff changeset
452
81
a778156dad3d Uploaded
davidvanzessen
parents: 80
diff changeset
# ---- finalize ----
# Close the table in the base overview page.
echo "</table>" >> "$outdir/base_overview.html"

# Keep the running log as log.html inside the report directory; $log is then
# rewritten below as the landing page.
mv "$log" "$outdir/log.html"

# Landing page: a link to index.html plus a table built from the
# tab-separated filtering_steps.txt (three columns: step, sequence count,
# percentage).
{
	echo "<html><center><h1><a href='index.html'>Click here for the results</a></h1>Tip: Open it in a new tab (middle mouse button or right mouse button -> 'open in new tab' on the link above)<br />"
	echo "<table border = 1>"
	echo "<thead><tr><th>Info</th><th>Sequences</th><th>Percentage</th></tr></thead>"
	# IFS is set only for `read`, so the shell-wide IFS is never modified.
	# The previous save/restore stored $TMP instead of $IFS and so clobbered
	# IFS after the loop.
	while IFS=$'\t' read -r step seq perc; do
		echo "<tr>"
		echo "<td>$step</td>"
		echo "<td>$seq</td>"
		echo "<td>${perc}%</td>"
		echo "</tr>"
	done < "$outdir/filtering_steps.txt"
	# Fixed: the end tag was written as </table border>; end tags take no
	# attributes.
	echo "</table></center></html>"
} > "$log"

echo "---------------- Done! ----------------"
echo "---------------- Done! ----------------<br />" >> "$outdir/log.html"
47
099cc1254f74 Uploaded
davidvanzessen
parents: 43
diff changeset
477
110
ade5cf6fd2dc Uploaded
davidvanzessen
parents: 108
diff changeset
478
ade5cf6fd2dc Uploaded
davidvanzessen
parents: 108
diff changeset
479
ade5cf6fd2dc Uploaded
davidvanzessen
parents: 108
diff changeset
480
ade5cf6fd2dc Uploaded
davidvanzessen
parents: 108
diff changeset
481
ade5cf6fd2dc Uploaded
davidvanzessen
parents: 108
diff changeset
482
ade5cf6fd2dc Uploaded
davidvanzessen
parents: 108
diff changeset
483
ade5cf6fd2dc Uploaded
davidvanzessen
parents: 108
diff changeset
484
ade5cf6fd2dc Uploaded
davidvanzessen
parents: 108
diff changeset
485
ade5cf6fd2dc Uploaded
davidvanzessen
parents: 108
diff changeset
486
ade5cf6fd2dc Uploaded
davidvanzessen
parents: 108
diff changeset
487
ade5cf6fd2dc Uploaded
davidvanzessen
parents: 108
diff changeset
488
ade5cf6fd2dc Uploaded
davidvanzessen
parents: 108
diff changeset
489
ade5cf6fd2dc Uploaded
davidvanzessen
parents: 108
diff changeset
490
ade5cf6fd2dc Uploaded
davidvanzessen
parents: 108
diff changeset
491
ade5cf6fd2dc Uploaded
davidvanzessen
parents: 108
diff changeset
492
ade5cf6fd2dc Uploaded
davidvanzessen
parents: 108
diff changeset
493
ade5cf6fd2dc Uploaded
davidvanzessen
parents: 108
diff changeset
494
ade5cf6fd2dc Uploaded
davidvanzessen
parents: 108
diff changeset
495
ade5cf6fd2dc Uploaded
davidvanzessen
parents: 108
diff changeset
496
ade5cf6fd2dc Uploaded
davidvanzessen
parents: 108
diff changeset
497