annotate wrapper.sh @ 115:ede6c4ee5196 draft

Uploaded
author davidvanzessen
date Tue, 09 Aug 2016 08:26:15 -0400
parents e7b550d52eb7
children 4984c2a06c43
Ignore whitespace changes - Everywhere: Within whitespace: At end of lines:
rev   line source
0
74d2bc479bee Uploaded
davidvanzessen
parents:
diff changeset
1 #!/bin/bash
110
ade5cf6fd2dc Uploaded
davidvanzessen
parents: 108
diff changeset
2 #set -e
0
74d2bc479bee Uploaded
davidvanzessen
parents:
diff changeset
3 dir="$(cd "$(dirname "$0")" && pwd)"
74d2bc479bee Uploaded
davidvanzessen
parents:
diff changeset
4 input=$1
19
c518cf0d4adb Uploaded
davidvanzessen
parents: 16
diff changeset
5 method=$2
102
e6bc976760d4 Uploaded
davidvanzessen
parents: 101
diff changeset
6 log=$3 #becomes the main html page at the end
19
c518cf0d4adb Uploaded
davidvanzessen
parents: 16
diff changeset
7 outdir=$4
102
e6bc976760d4 Uploaded
davidvanzessen
parents: 101
diff changeset
8 output="$outdir/index.html" #copied to $log location at the end
19
c518cf0d4adb Uploaded
davidvanzessen
parents: 16
diff changeset
9 title=$5
22
d84c9791d8c4 Uploaded
davidvanzessen
parents: 21
diff changeset
10 include_fr1=$6
34
d436daae9d68 Uploaded
davidvanzessen
parents: 32
diff changeset
11 functionality=$7
d436daae9d68 Uploaded
davidvanzessen
parents: 32
diff changeset
12 unique=$8
69
7acdcd5c52ef Uploaded
davidvanzessen
parents: 66
diff changeset
13 naive_output_ca=$9
7acdcd5c52ef Uploaded
davidvanzessen
parents: 66
diff changeset
14 naive_output_cg=${10}
7acdcd5c52ef Uploaded
davidvanzessen
parents: 66
diff changeset
15 naive_output_cm=${11}
7acdcd5c52ef Uploaded
davidvanzessen
parents: 66
diff changeset
16 filter_unique=${12}
7acdcd5c52ef Uploaded
davidvanzessen
parents: 66
diff changeset
17 class_filter=${13}
114
e7b550d52eb7 Uploaded
davidvanzessen
parents: 110
diff changeset
18 empty_region_filter=${14}
0
74d2bc479bee Uploaded
davidvanzessen
parents:
diff changeset
19 mkdir $outdir
74d2bc479bee Uploaded
davidvanzessen
parents:
diff changeset
20
110
ade5cf6fd2dc Uploaded
davidvanzessen
parents: 108
diff changeset
21 tar -xzf $dir/style.tar.gz -C $outdir
ade5cf6fd2dc Uploaded
davidvanzessen
parents: 108
diff changeset
22
55
0d5add1a9800 Uploaded
davidvanzessen
parents: 54
diff changeset
23 echo "---------------- read parameters ----------------"
102
e6bc976760d4 Uploaded
davidvanzessen
parents: 101
diff changeset
24 echo "---------------- read parameters ----------------<br />" > $log
55
0d5add1a9800 Uploaded
davidvanzessen
parents: 54
diff changeset
25
0d5add1a9800 Uploaded
davidvanzessen
parents: 54
diff changeset
26 echo "unpacking IMGT file"
0d5add1a9800 Uploaded
davidvanzessen
parents: 54
diff changeset
27
35
8dba36531e6e Uploaded
davidvanzessen
parents: 34
diff changeset
28 type="`file $input`"
8dba36531e6e Uploaded
davidvanzessen
parents: 34
diff changeset
29 if [[ "$type" == *"Zip archive"* ]] ; then
8dba36531e6e Uploaded
davidvanzessen
parents: 34
diff changeset
30 echo "Zip archive"
8dba36531e6e Uploaded
davidvanzessen
parents: 34
diff changeset
31 echo "unzip $input -d $PWD/files/"
8dba36531e6e Uploaded
davidvanzessen
parents: 34
diff changeset
32 unzip $input -d $PWD/files/
8dba36531e6e Uploaded
davidvanzessen
parents: 34
diff changeset
33 elif [[ "$type" == *"XZ compressed data"* ]] ; then
8dba36531e6e Uploaded
davidvanzessen
parents: 34
diff changeset
34 echo "ZX archive"
8dba36531e6e Uploaded
davidvanzessen
parents: 34
diff changeset
35 echo "tar -xJf $input -C $PWD/files/"
8dba36531e6e Uploaded
davidvanzessen
parents: 34
diff changeset
36 mkdir -p $PWD/files/$title
8dba36531e6e Uploaded
davidvanzessen
parents: 34
diff changeset
37 tar -xJf $input -C $PWD/files/$title
8dba36531e6e Uploaded
davidvanzessen
parents: 34
diff changeset
38 fi
8dba36531e6e Uploaded
davidvanzessen
parents: 34
diff changeset
39
64
0fdd90f7c654 Uploaded
davidvanzessen
parents: 63
diff changeset
40 cat `find $PWD/files/ -name "1_*"` > $PWD/summary.txt
0fdd90f7c654 Uploaded
davidvanzessen
parents: 63
diff changeset
41 cat `find $PWD/files/ -name "3_*"` > $PWD/sequences.txt
0fdd90f7c654 Uploaded
davidvanzessen
parents: 63
diff changeset
42 cat `find $PWD/files/ -name "5_*"` > $PWD/aa.txt
0fdd90f7c654 Uploaded
davidvanzessen
parents: 63
diff changeset
43 cat `find $PWD/files/ -name "6_*"` > $PWD/junction.txt
0fdd90f7c654 Uploaded
davidvanzessen
parents: 63
diff changeset
44 cat `find $PWD/files/ -name "7_*"` > $PWD/mutationanalysis.txt
0fdd90f7c654 Uploaded
davidvanzessen
parents: 63
diff changeset
45 cat `find $PWD/files/ -name "8_*"` > $PWD/mutationstats.txt
0fdd90f7c654 Uploaded
davidvanzessen
parents: 63
diff changeset
46 cat `find $PWD/files/ -name "10_*"` > $PWD/hotspots.txt
0fdd90f7c654 Uploaded
davidvanzessen
parents: 63
diff changeset
47
0fdd90f7c654 Uploaded
davidvanzessen
parents: 63
diff changeset
48 #cat $PWD/files/*/1_* > $PWD/summary.txt
0fdd90f7c654 Uploaded
davidvanzessen
parents: 63
diff changeset
49 #cat $PWD/files/*/3_* > $PWD/sequences.txt
0fdd90f7c654 Uploaded
davidvanzessen
parents: 63
diff changeset
50 #cat $PWD/files/*/5_* > $PWD/aa.txt
0fdd90f7c654 Uploaded
davidvanzessen
parents: 63
diff changeset
51 #cat $PWD/files/*/6_* > $PWD/junction.txt
0fdd90f7c654 Uploaded
davidvanzessen
parents: 63
diff changeset
52 #cat $PWD/files/*/7_* > $PWD/mutationanalysis.txt
0fdd90f7c654 Uploaded
davidvanzessen
parents: 63
diff changeset
53 #cat $PWD/files/*/8_* > $PWD/mutationstats.txt
0fdd90f7c654 Uploaded
davidvanzessen
parents: 63
diff changeset
54 #cat $PWD/files/*/10_* > $PWD/hotspots.txt
3
a0b27058dcac Uploaded
davidvanzessen
parents: 2
diff changeset
55
26
2433a1e110e1 Uploaded
davidvanzessen
parents: 25
diff changeset
56 #BLASTN_DIR="/home/galaxy/tmp/blast/ncbi-blast-2.2.30+/bin"
19
c518cf0d4adb Uploaded
davidvanzessen
parents: 16
diff changeset
57
c518cf0d4adb Uploaded
davidvanzessen
parents: 16
diff changeset
58 echo "${BLASTN_DIR}"
c518cf0d4adb Uploaded
davidvanzessen
parents: 16
diff changeset
59
89
480fdd383fdb Uploaded
davidvanzessen
parents: 85
diff changeset
60 echo "---------------- identification ($method) ----------------"
102
e6bc976760d4 Uploaded
davidvanzessen
parents: 101
diff changeset
61 echo "---------------- identification ($method) ----------------<br />" >> $log
55
0d5add1a9800 Uploaded
davidvanzessen
parents: 54
diff changeset
62
19
c518cf0d4adb Uploaded
davidvanzessen
parents: 16
diff changeset
63 if [[ "${method}" == "custom" ]] ; then
c518cf0d4adb Uploaded
davidvanzessen
parents: 16
diff changeset
64 python $dir/gene_identification.py --input $PWD/summary.txt --output $outdir/identified_genes.txt
c518cf0d4adb Uploaded
davidvanzessen
parents: 16
diff changeset
65 else
c518cf0d4adb Uploaded
davidvanzessen
parents: 16
diff changeset
66 ID_index=$(cat $PWD/summary.txt | grep -o -P ".+Sequence ID" | grep -o -P "\t" | wc -l)
c518cf0d4adb Uploaded
davidvanzessen
parents: 16
diff changeset
67 ID_index=$((ID_index+1))
c518cf0d4adb Uploaded
davidvanzessen
parents: 16
diff changeset
68 sequence_index=$(cat $PWD/summary.txt | grep -o -P ".+\tSequence" | grep -o -P "\t" | wc -l)
c518cf0d4adb Uploaded
davidvanzessen
parents: 16
diff changeset
69 sequence_index=$((sequence_index+1))
c518cf0d4adb Uploaded
davidvanzessen
parents: 16
diff changeset
70
110
ade5cf6fd2dc Uploaded
davidvanzessen
parents: 108
diff changeset
71 cat $PWD/summary.txt | tail -n+2 | cut -f ${ID_index},${sequence_index} | awk '{print ">" $1 "\n" $2}' > $PWD/sequences.tmp
ade5cf6fd2dc Uploaded
davidvanzessen
parents: 108
diff changeset
72
ade5cf6fd2dc Uploaded
davidvanzessen
parents: 108
diff changeset
73 cat $PWD/sequences.tmp | grep -B1 -vE "^$" sequences.fasta #filter out empty sequences
ade5cf6fd2dc Uploaded
davidvanzessen
parents: 108
diff changeset
74
ade5cf6fd2dc Uploaded
davidvanzessen
parents: 108
diff changeset
75 rm $PWD/sequences.tmp
19
c518cf0d4adb Uploaded
davidvanzessen
parents: 16
diff changeset
76
c518cf0d4adb Uploaded
davidvanzessen
parents: 16
diff changeset
77 echo -e "qseqid\tsseqid\tpident\tlength\tmismatch\tgapopen\tqstart\tqend\tsstart\tsend\tevalue\tbitscore" > $outdir/identified_genes.txt
c518cf0d4adb Uploaded
davidvanzessen
parents: 16
diff changeset
78 ${BLASTN_DIR}/blastn -task blastn -db $dir/subclass_definition.db -query $PWD/sequences.fasta -outfmt 6 >> $outdir/identified_genes.txt
c518cf0d4adb Uploaded
davidvanzessen
parents: 16
diff changeset
79 fi
c518cf0d4adb Uploaded
davidvanzessen
parents: 16
diff changeset
80
55
0d5add1a9800 Uploaded
davidvanzessen
parents: 54
diff changeset
81 echo "---------------- merge_and_filter.r ----------------"
102
e6bc976760d4 Uploaded
davidvanzessen
parents: 101
diff changeset
82 echo "---------------- merge_and_filter.r ----------------<br />" >> $log
19
c518cf0d4adb Uploaded
davidvanzessen
parents: 16
diff changeset
83
114
e7b550d52eb7 Uploaded
davidvanzessen
parents: 110
diff changeset
84 Rscript $dir/merge_and_filter.r $PWD/summary.txt $PWD/sequences.txt $PWD/mutationanalysis.txt $PWD/mutationstats.txt $PWD/hotspots.txt $outdir/identified_genes.txt $outdir/merged.txt $outdir/before_unique_filter.txt $outdir/unmatched.txt $method $functionality $unique ${filter_unique} ${class_filter} ${empty_region_filter} 2>&1
0
74d2bc479bee Uploaded
davidvanzessen
parents:
diff changeset
85
98
5ffbf40cdd4b Uploaded
davidvanzessen
parents: 95
diff changeset
86 echo "---------------- creating new IMGT zip ----------------"
102
e6bc976760d4 Uploaded
davidvanzessen
parents: 101
diff changeset
87 echo "---------------- creating new IMGT zip ----------------<br />" >> $log
95
a66eb1c5374c Uploaded
davidvanzessen
parents: 94
diff changeset
88
a66eb1c5374c Uploaded
davidvanzessen
parents: 94
diff changeset
89 mkdir $outdir/new_IMGT
a66eb1c5374c Uploaded
davidvanzessen
parents: 94
diff changeset
90
a66eb1c5374c Uploaded
davidvanzessen
parents: 94
diff changeset
91 cat `find $PWD/files/ -name "1_*"` > "$outdir/new_IMGT/1_Summary.txt"
a66eb1c5374c Uploaded
davidvanzessen
parents: 94
diff changeset
92 cat `find $PWD/files/ -name "2_*"` > "$outdir/new_IMGT/2_IMGT-gapped-nt-sequences.txt"
a66eb1c5374c Uploaded
davidvanzessen
parents: 94
diff changeset
93 cat `find $PWD/files/ -name "3_*"` > "$outdir/new_IMGT/3_Nt-sequences.txt"
a66eb1c5374c Uploaded
davidvanzessen
parents: 94
diff changeset
94 cat `find $PWD/files/ -name "4_*"` > "$outdir/new_IMGT/4_IMGT-gapped-AA-sequences.txt"
a66eb1c5374c Uploaded
davidvanzessen
parents: 94
diff changeset
95 cat `find $PWD/files/ -name "5_*"` > "$outdir/new_IMGT/5_AA-sequences.txt"
a66eb1c5374c Uploaded
davidvanzessen
parents: 94
diff changeset
96 cat `find $PWD/files/ -name "6_*"` > "$outdir/new_IMGT/6_Junction.txt"
a66eb1c5374c Uploaded
davidvanzessen
parents: 94
diff changeset
97 cat `find $PWD/files/ -name "7_*"` > "$outdir/new_IMGT/7_V-REGION-mutation-and-AA-change-table.txt"
a66eb1c5374c Uploaded
davidvanzessen
parents: 94
diff changeset
98 cat `find $PWD/files/ -name "8_*"` > "$outdir/new_IMGT/8_V-REGION-nt-mutation-statistics.txt"
a66eb1c5374c Uploaded
davidvanzessen
parents: 94
diff changeset
99 cat `find $PWD/files/ -name "9_*"` > "$outdir/new_IMGT/9_V-REGION-AA-change-statistics.txt"
a66eb1c5374c Uploaded
davidvanzessen
parents: 94
diff changeset
100 cat `find $PWD/files/ -name "10_*"` > "$outdir/new_IMGT/10_V-REGION-mutation-hotspots.txt"
a66eb1c5374c Uploaded
davidvanzessen
parents: 94
diff changeset
101
99
86206431cbb0 Uploaded
davidvanzessen
parents: 98
diff changeset
102 mkdir $outdir/new_IMGT_ca
86206431cbb0 Uploaded
davidvanzessen
parents: 98
diff changeset
103 cp $outdir/new_IMGT/* $outdir/new_IMGT_ca
86206431cbb0 Uploaded
davidvanzessen
parents: 98
diff changeset
104
86206431cbb0 Uploaded
davidvanzessen
parents: 98
diff changeset
105 mkdir $outdir/new_IMGT_cg
86206431cbb0 Uploaded
davidvanzessen
parents: 98
diff changeset
106 cp $outdir/new_IMGT/* $outdir/new_IMGT_cg
86206431cbb0 Uploaded
davidvanzessen
parents: 98
diff changeset
107
86206431cbb0 Uploaded
davidvanzessen
parents: 98
diff changeset
108 mkdir $outdir/new_IMGT_cm
86206431cbb0 Uploaded
davidvanzessen
parents: 98
diff changeset
109 cp $outdir/new_IMGT/* $outdir/new_IMGT_cm
86206431cbb0 Uploaded
davidvanzessen
parents: 98
diff changeset
110
114
e7b550d52eb7 Uploaded
davidvanzessen
parents: 110
diff changeset
111 Rscript $dir/new_imgt.r $outdir/new_IMGT/ $outdir/merged.txt "-" 2>&1
e7b550d52eb7 Uploaded
davidvanzessen
parents: 110
diff changeset
112 Rscript $dir/new_imgt.r $outdir/new_IMGT_ca/ $outdir/merged.txt "ca" 2>&1
e7b550d52eb7 Uploaded
davidvanzessen
parents: 110
diff changeset
113 Rscript $dir/new_imgt.r $outdir/new_IMGT_cg/ $outdir/merged.txt "cg" 2>&1
e7b550d52eb7 Uploaded
davidvanzessen
parents: 110
diff changeset
114 Rscript $dir/new_imgt.r $outdir/new_IMGT_cm/ $outdir/merged.txt "cm" 2>&1
95
a66eb1c5374c Uploaded
davidvanzessen
parents: 94
diff changeset
115
a66eb1c5374c Uploaded
davidvanzessen
parents: 94
diff changeset
116
a66eb1c5374c Uploaded
davidvanzessen
parents: 94
diff changeset
117 tmp="$PWD"
a66eb1c5374c Uploaded
davidvanzessen
parents: 94
diff changeset
118 cd $outdir/new_IMGT/ #run tar from inside the directory so the archive members are stored as bare file names
a66eb1c5374c Uploaded
davidvanzessen
parents: 94
diff changeset
119 tar -cJf ../new_IMGT.txz *
a66eb1c5374c Uploaded
davidvanzessen
parents: 94
diff changeset
120
99
86206431cbb0 Uploaded
davidvanzessen
parents: 98
diff changeset
121 cd $outdir/new_IMGT_ca/
86206431cbb0 Uploaded
davidvanzessen
parents: 98
diff changeset
122 tar -cJf ../new_IMGT_ca.txz *
86206431cbb0 Uploaded
davidvanzessen
parents: 98
diff changeset
123
86206431cbb0 Uploaded
davidvanzessen
parents: 98
diff changeset
124 cd $outdir/new_IMGT_cg/
86206431cbb0 Uploaded
davidvanzessen
parents: 98
diff changeset
125 tar -cJf ../new_IMGT_cg.txz *
86206431cbb0 Uploaded
davidvanzessen
parents: 98
diff changeset
126
86206431cbb0 Uploaded
davidvanzessen
parents: 98
diff changeset
127 cd $outdir/new_IMGT_cm/
86206431cbb0 Uploaded
davidvanzessen
parents: 98
diff changeset
128 tar -cJf ../new_IMGT_cm.txz *
86206431cbb0 Uploaded
davidvanzessen
parents: 98
diff changeset
129
95
a66eb1c5374c Uploaded
davidvanzessen
parents: 94
diff changeset
130 cd $tmp
a66eb1c5374c Uploaded
davidvanzessen
parents: 94
diff changeset
131
55
0d5add1a9800 Uploaded
davidvanzessen
parents: 54
diff changeset
132 echo "---------------- mutation_analysis.r ----------------"
102
e6bc976760d4 Uploaded
davidvanzessen
parents: 101
diff changeset
133 echo "---------------- mutation_analysis.r ----------------<br />" >> $log
55
0d5add1a9800 Uploaded
davidvanzessen
parents: 54
diff changeset
134
82
564c4f6da203 Uploaded
davidvanzessen
parents: 81
diff changeset
135 classes="ca,ca1,ca2,cg,cg1,cg2,cg3,cg4,cm,unmatched"
4
069419cccba4 Uploaded
davidvanzessen
parents: 3
diff changeset
136 echo "R mutation analysis"
82
564c4f6da203 Uploaded
davidvanzessen
parents: 81
diff changeset
137 Rscript $dir/mutation_analysis.r $outdir/merged.txt $classes $outdir ${include_fr1} 2>&1
53
7290a88ea202 Uploaded
davidvanzessen
parents: 52
diff changeset
138
55
0d5add1a9800 Uploaded
davidvanzessen
parents: 54
diff changeset
139
0d5add1a9800 Uploaded
davidvanzessen
parents: 54
diff changeset
140 echo "---------------- mutation_analysis.py ----------------"
102
e6bc976760d4 Uploaded
davidvanzessen
parents: 101
diff changeset
141 echo "---------------- mutation_analysis.py ----------------<br />" >> $log
55
0d5add1a9800 Uploaded
davidvanzessen
parents: 54
diff changeset
142
82
564c4f6da203 Uploaded
davidvanzessen
parents: 81
diff changeset
143 python $dir/mutation_analysis.py --input $outdir/merged.txt --genes $classes --includefr1 "${include_fr1}" --output $outdir/hotspot_analysis.txt
55
0d5add1a9800 Uploaded
davidvanzessen
parents: 54
diff changeset
144
0d5add1a9800 Uploaded
davidvanzessen
parents: 54
diff changeset
145 echo "---------------- aa_histogram.r ----------------"
105
e4957ad476a2 Uploaded
davidvanzessen
parents: 104
diff changeset
146 echo "---------------- aa_histogram.r ----------------<br />" >> $log
55
0d5add1a9800 Uploaded
davidvanzessen
parents: 54
diff changeset
147
107
01c9993865af Uploaded
davidvanzessen
parents: 105
diff changeset
148 Rscript $dir/aa_histogram.r $outdir/aa_id_mutations.txt $outdir/absent_aa_id.txt "ca,cg,cm" $outdir/ 2>&1
110
ade5cf6fd2dc Uploaded
davidvanzessen
parents: 108
diff changeset
149 if [ -e "$outdir/aa_histogram_.png" ]; then
ade5cf6fd2dc Uploaded
davidvanzessen
parents: 108
diff changeset
150 mv $outdir/aa_histogram_.png $outdir/aa_histogram.png
ade5cf6fd2dc Uploaded
davidvanzessen
parents: 108
diff changeset
151 mv $outdir/aa_histogram_.txt $outdir/aa_histogram.txt
ade5cf6fd2dc Uploaded
davidvanzessen
parents: 108
diff changeset
152 fi
4
069419cccba4 Uploaded
davidvanzessen
parents: 3
diff changeset
153
0
74d2bc479bee Uploaded
davidvanzessen
parents:
diff changeset
154 genes=(ca ca1 ca2 cg cg1 cg2 cg3 cg4 cm)
74d2bc479bee Uploaded
davidvanzessen
parents:
diff changeset
155
53
7290a88ea202 Uploaded
davidvanzessen
parents: 52
diff changeset
156 funcs=(sum mean median)
110
ade5cf6fd2dc Uploaded
davidvanzessen
parents: 108
diff changeset
157 funcs=(sum)
0
74d2bc479bee Uploaded
davidvanzessen
parents:
diff changeset
158
82
564c4f6da203 Uploaded
davidvanzessen
parents: 81
diff changeset
159 echo "---------------- sequence_overview.r ----------------"
102
e6bc976760d4 Uploaded
davidvanzessen
parents: 101
diff changeset
160 echo "---------------- sequence_overview.r ----------------<br />" >> $log
82
564c4f6da203 Uploaded
davidvanzessen
parents: 81
diff changeset
161
564c4f6da203 Uploaded
davidvanzessen
parents: 81
diff changeset
162 mkdir $outdir/sequence_overview
564c4f6da203 Uploaded
davidvanzessen
parents: 81
diff changeset
163
90
f0e8dac22c6e Uploaded
davidvanzessen
parents: 89
diff changeset
164 #Rscript $dir/sequence_overview.r $outdir/identified_genes.txt $PWD/sequences.txt $outdir/merged.txt $outdir/sequence_overview $classes $outdir/hotspot_analysis_sum.txt 2>&1
100
ff5be711382b Uploaded
davidvanzessen
parents: 99
diff changeset
165 Rscript $dir/sequence_overview.r $outdir/before_unique_filter.txt $outdir/merged.txt $outdir/sequence_overview $classes $outdir/hotspot_analysis_sum.txt 2>&1
82
564c4f6da203 Uploaded
davidvanzessen
parents: 81
diff changeset
166
564c4f6da203 Uploaded
davidvanzessen
parents: 81
diff changeset
167 echo "<table border='1'>" > $outdir/base_overview.html
564c4f6da203 Uploaded
davidvanzessen
parents: 81
diff changeset
168
92
b869a126e2c4 Uploaded
davidvanzessen
parents: 90
diff changeset
169 while IFS=$'\t' read ID class seq A C G T
82
564c4f6da203 Uploaded
davidvanzessen
parents: 81
diff changeset
170 do
85
07f7da724a77 Uploaded
davidvanzessen
parents: 84
diff changeset
171 echo "<tr><td>$ID</td><td>$seq</td><td>$class</td><td>$A</td><td>$C</td><td>$G</td><td>$T</td></tr>" >> $outdir/base_overview.html
82
564c4f6da203 Uploaded
davidvanzessen
parents: 81
diff changeset
172 done < $outdir/sequence_overview/ntoverview.txt
564c4f6da203 Uploaded
davidvanzessen
parents: 81
diff changeset
173
62
4262e880472d Uploaded
davidvanzessen
parents: 58
diff changeset
174 echo "<html><center><h1>$title</h1></center>" > $output
110
ade5cf6fd2dc Uploaded
davidvanzessen
parents: 108
diff changeset
175 echo "<script type='text/javascript' src='jquery-1.11.0.min.js'></script>" >> $output
ade5cf6fd2dc Uploaded
davidvanzessen
parents: 108
diff changeset
176 echo "<script type='text/javascript' src='tabber.js'></script>" >> $output
ade5cf6fd2dc Uploaded
davidvanzessen
parents: 108
diff changeset
177 echo "<script type='text/javascript' src='script.js'></script>" >> $output
ade5cf6fd2dc Uploaded
davidvanzessen
parents: 108
diff changeset
178 echo "<link rel='stylesheet' type='text/css' href='style.css'>" >> $output
62
4262e880472d Uploaded
davidvanzessen
parents: 58
diff changeset
179
4262e880472d Uploaded
davidvanzessen
parents: 58
diff changeset
180 #display the matched/unmatched for clarity
4262e880472d Uploaded
davidvanzessen
parents: 58
diff changeset
181
98
5ffbf40cdd4b Uploaded
davidvanzessen
parents: 95
diff changeset
182 matched_count="`cat $outdir/merged.txt | grep -v 'unmatched' | tail -n +2 | wc -l`"
62
4262e880472d Uploaded
davidvanzessen
parents: 58
diff changeset
183 unmatched_count="`cat $outdir/unmatched.txt | tail -n +2 | wc -l`"
4262e880472d Uploaded
davidvanzessen
parents: 58
diff changeset
184 total_count=$((matched_count + unmatched_count))
4262e880472d Uploaded
davidvanzessen
parents: 58
diff changeset
185 perc_count=$((unmatched_count / total_count * 100))
4262e880472d Uploaded
davidvanzessen
parents: 58
diff changeset
186 perc_count=`bc -l <<< "scale=2; ${unmatched_count} / ${total_count} * 100"`
4262e880472d Uploaded
davidvanzessen
parents: 58
diff changeset
187 perc_count=`bc -l <<< "scale=2; (${unmatched_count} / ${total_count} * 100 ) / 1"`
4262e880472d Uploaded
davidvanzessen
parents: 58
diff changeset
188
4262e880472d Uploaded
davidvanzessen
parents: 58
diff changeset
189 echo "<center><h2>Total: ${total_count}</h2></center>" >> $output
4262e880472d Uploaded
davidvanzessen
parents: 58
diff changeset
190 echo "<center><h2>Matched: ${matched_count} Unmatched: ${unmatched_count}</h2></center>" >> $output
4262e880472d Uploaded
davidvanzessen
parents: 58
diff changeset
191 echo "<center><h2>Percentage unmatched: ${perc_count}</h2></center>" >> $output
4262e880472d Uploaded
davidvanzessen
parents: 58
diff changeset
192
55
0d5add1a9800 Uploaded
davidvanzessen
parents: 54
diff changeset
193 echo "---------------- main tables ----------------"
102
e6bc976760d4 Uploaded
davidvanzessen
parents: 101
diff changeset
194 echo "---------------- main tables ----------------<br />" >> $log
110
ade5cf6fd2dc Uploaded
davidvanzessen
parents: 108
diff changeset
195
ade5cf6fd2dc Uploaded
davidvanzessen
parents: 108
diff changeset
196 echo "<div class='tabber'>" >> $output
ade5cf6fd2dc Uploaded
davidvanzessen
parents: 108
diff changeset
197 echo "<div class='tabbertab' title='SHM Overview'>" >> $output
ade5cf6fd2dc Uploaded
davidvanzessen
parents: 108
diff changeset
198
53
7290a88ea202 Uploaded
davidvanzessen
parents: 52
diff changeset
199 for func in ${funcs[@]}
4
069419cccba4 Uploaded
davidvanzessen
parents: 3
diff changeset
200 do
55
0d5add1a9800 Uploaded
davidvanzessen
parents: 54
diff changeset
201
0d5add1a9800 Uploaded
davidvanzessen
parents: 54
diff changeset
202 echo "---------------- $func table ----------------"
102
e6bc976760d4 Uploaded
davidvanzessen
parents: 101
diff changeset
203 echo "---------------- $func table ----------------<br />" >> $log
55
0d5add1a9800 Uploaded
davidvanzessen
parents: 54
diff changeset
204
94
e39176ccddc8 Uploaded
davidvanzessen
parents: 92
diff changeset
205 cat $outdir/mutations_${func}.txt $outdir/hotspot_analysis_${func}.txt > $outdir/data_${func}.txt
53
7290a88ea202 Uploaded
davidvanzessen
parents: 52
diff changeset
206
98
5ffbf40cdd4b Uploaded
davidvanzessen
parents: 95
diff changeset
207 echo "<table border='1' width='100%'><caption><h3><a href='data_${func}.txt'>${func} table</a></h3></caption>" >> $output
58
8bb4d6009e08 Uploaded
davidvanzessen
parents: 55
diff changeset
208 echo "<tr><th>info</th>" >> $output
53
7290a88ea202 Uploaded
davidvanzessen
parents: 52
diff changeset
209 for gene in ${genes[@]}
7290a88ea202 Uploaded
davidvanzessen
parents: 52
diff changeset
210 do
7290a88ea202 Uploaded
davidvanzessen
parents: 52
diff changeset
211 tmp=`cat $outdir/${gene}_${func}_n.txt`
7290a88ea202 Uploaded
davidvanzessen
parents: 52
diff changeset
212 echo "<th><a href='matched_${gene}_${func}.txt'>${gene} (N = $tmp)</a></th>" >> $output
7290a88ea202 Uploaded
davidvanzessen
parents: 52
diff changeset
213 done
78
b523ce95d857 Uploaded
davidvanzessen
parents: 77
diff changeset
214
114
e7b550d52eb7 Uploaded
davidvanzessen
parents: 110
diff changeset
215 tmp=`cat $outdir/all_${func}_n.txt`
e7b550d52eb7 Uploaded
davidvanzessen
parents: 110
diff changeset
216 echo "<th><a href='matched_all_${func}.txt'>all (N = $tmp)</a></th>" >> $output
78
b523ce95d857 Uploaded
davidvanzessen
parents: 77
diff changeset
217 tmp=`cat $outdir/unmatched_${func}_n.txt`
79
0513b46178c4 Uploaded
davidvanzessen
parents: 78
diff changeset
218 echo "<th><a href='unmatched.txt'>unmatched (N = ${unmatched_count})</a></th>" >> $output
4
069419cccba4 Uploaded
davidvanzessen
parents: 3
diff changeset
219
78
b523ce95d857 Uploaded
davidvanzessen
parents: 77
diff changeset
220 while IFS=, read name cax cay caz ca1x ca1y ca1z ca2x ca2y ca2z cgx cgy cgz cg1x cg1y cg1z cg2x cg2y cg2z cg3x cg3y cg3z cg4x cg4y cg4z cmx cmy cmz unx uny unz allx ally allz
53
7290a88ea202 Uploaded
davidvanzessen
parents: 52
diff changeset
221 do
7290a88ea202 Uploaded
davidvanzessen
parents: 52
diff changeset
222 if [ "$name" == "FR S/R (ratio)" ] || [ "$name" == "CDR S/R (ratio)" ] ; then #ratio rows: print the third value without a % sign and omit the unmatched cell
7290a88ea202 Uploaded
davidvanzessen
parents: 52
diff changeset
223 echo "<tr><td>$name</td><td>${cax}/${cay} (${caz})</td><td>${ca1x}/${ca1y} (${ca1z})</td><td>${ca2x}/${ca2y} (${ca2z})</td><td>${cgx}/${cgy} (${cgz})</td><td>${cg1x}/${cg1y} (${cg1z})</td><td>${cg2x}/${cg2y} (${cg2z})</td><td>${cg3x}/${cg3y} (${cg3z})</td><td>${cg4x}/${cg4y} (${cg4z})</td><td>${cmx}/${cmy} (${cmz})</td><td>${allx}/${ally} (${allz})</td></tr>" >> $output
7290a88ea202 Uploaded
davidvanzessen
parents: 52
diff changeset
224 else
114
e7b550d52eb7 Uploaded
davidvanzessen
parents: 110
diff changeset
225 echo "<tr><td>$name</td><td>${cax}/${cay} (${caz}%)</td><td>${ca1x}/${ca1y} (${ca1z}%)</td><td>${ca2x}/${ca2y} (${ca2z}%)</td><td>${cgx}/${cgy} (${cgz}%)</td><td>${cg1x}/${cg1y} (${cg1z}%)</td><td>${cg2x}/${cg2y} (${cg2z}%)</td><td>${cg3x}/${cg3y} (${cg3z}%)</td><td>${cg4x}/${cg4y} (${cg4z}%)</td><td>${cmx}/${cmy} (${cmz}%)</td><td>${allx}/${ally} (${allz}%)</td><td>${unx}/${uny} (${unz}%)</td></tr>" >> $output
53
7290a88ea202 Uploaded
davidvanzessen
parents: 52
diff changeset
226 fi
94
e39176ccddc8 Uploaded
davidvanzessen
parents: 92
diff changeset
227 done < $outdir/data_${func}.txt
e39176ccddc8 Uploaded
davidvanzessen
parents: 92
diff changeset
228 echo "</table>" >> $output
e39176ccddc8 Uploaded
davidvanzessen
parents: 92
diff changeset
229 #echo "<a href='data_${func}.txt'>Download data</a>" >> $output
53
7290a88ea202 Uploaded
davidvanzessen
parents: 52
diff changeset
230 done
7290a88ea202 Uploaded
davidvanzessen
parents: 52
diff changeset
231
110
ade5cf6fd2dc Uploaded
davidvanzessen
parents: 108
diff changeset
232 echo "</div>" >> $output #SHM overview tab end
ade5cf6fd2dc Uploaded
davidvanzessen
parents: 108
diff changeset
233
ade5cf6fd2dc Uploaded
davidvanzessen
parents: 108
diff changeset
234 echo "---------------- images ----------------"
ade5cf6fd2dc Uploaded
davidvanzessen
parents: 108
diff changeset
235 echo "---------------- images ----------------<br />" >> $log
ade5cf6fd2dc Uploaded
davidvanzessen
parents: 108
diff changeset
236
ade5cf6fd2dc Uploaded
davidvanzessen
parents: 108
diff changeset
237 echo "<div class='tabbertab' title='SHM Frequency'>" >> $output
ade5cf6fd2dc Uploaded
davidvanzessen
parents: 108
diff changeset
238
ade5cf6fd2dc Uploaded
davidvanzessen
parents: 108
diff changeset
239 if [ -a $outdir/scatter.png ]
ade5cf6fd2dc Uploaded
davidvanzessen
parents: 108
diff changeset
240 then
ade5cf6fd2dc Uploaded
davidvanzessen
parents: 108
diff changeset
241 echo "<img src='scatter.png'/><br />" >> $output
ade5cf6fd2dc Uploaded
davidvanzessen
parents: 108
diff changeset
242 echo "<a href='scatter.txt'>download data</a><br />" >> $output
ade5cf6fd2dc Uploaded
davidvanzessen
parents: 108
diff changeset
243 fi
ade5cf6fd2dc Uploaded
davidvanzessen
parents: 108
diff changeset
244 if [ -a $outdir/frequency_ranges.png ]
ade5cf6fd2dc Uploaded
davidvanzessen
parents: 108
diff changeset
245 then
ade5cf6fd2dc Uploaded
davidvanzessen
parents: 108
diff changeset
246 echo "<img src='frequency_ranges.png'/><br />" >> $output
ade5cf6fd2dc Uploaded
davidvanzessen
parents: 108
diff changeset
247 echo "<a href='frequency_ranges_classes.txt'>download class data</a><br />" >> $output
ade5cf6fd2dc Uploaded
davidvanzessen
parents: 108
diff changeset
248 echo "<a href='frequency_ranges_subclasses.txt'>download subclass data</a><br />" >> $output
ade5cf6fd2dc Uploaded
davidvanzessen
parents: 108
diff changeset
249 fi
ade5cf6fd2dc Uploaded
davidvanzessen
parents: 108
diff changeset
250
ade5cf6fd2dc Uploaded
davidvanzessen
parents: 108
diff changeset
251 echo "</div>" >> $output #SHM frequency tab end
ade5cf6fd2dc Uploaded
davidvanzessen
parents: 108
diff changeset
252
ade5cf6fd2dc Uploaded
davidvanzessen
parents: 108
diff changeset
253 echo "<div class='tabbertab' title='Transition tables'>" >> $output
ade5cf6fd2dc Uploaded
davidvanzessen
parents: 108
diff changeset
254
114
e7b550d52eb7 Uploaded
davidvanzessen
parents: 110
diff changeset
255 echo "<table border='0'>" >> $output
e7b550d52eb7 Uploaded
davidvanzessen
parents: 110
diff changeset
256
110
ade5cf6fd2dc Uploaded
davidvanzessen
parents: 108
diff changeset
257 for gene in ${genes[@]}
ade5cf6fd2dc Uploaded
davidvanzessen
parents: 108
diff changeset
258 do
114
e7b550d52eb7 Uploaded
davidvanzessen
parents: 110
diff changeset
259 echo "<tr>" >> $output
e7b550d52eb7 Uploaded
davidvanzessen
parents: 110
diff changeset
260 echo "<td><h1>${gene}</h1></td>" >> $output
e7b550d52eb7 Uploaded
davidvanzessen
parents: 110
diff changeset
261 echo "<td><img src='transitions_heatmap_${gene}.png' /></td>" >> $output
e7b550d52eb7 Uploaded
davidvanzessen
parents: 110
diff changeset
262 echo "<td><img src='transitions_stacked_${gene}.png' /></td>" >> $output
e7b550d52eb7 Uploaded
davidvanzessen
parents: 110
diff changeset
263 echo "<td><table border='1'>" >> $output
110
ade5cf6fd2dc Uploaded
davidvanzessen
parents: 108
diff changeset
264 while IFS=, read from a c g t
ade5cf6fd2dc Uploaded
davidvanzessen
parents: 108
diff changeset
265 do
ade5cf6fd2dc Uploaded
davidvanzessen
parents: 108
diff changeset
266 echo "<tr><td>$from</td><td>$a</td><td>$c</td><td>$g</td><td>$t</td></tr>" >> $output
ade5cf6fd2dc Uploaded
davidvanzessen
parents: 108
diff changeset
267 done < $outdir/transitions_${gene}_sum.txt
114
e7b550d52eb7 Uploaded
davidvanzessen
parents: 110
diff changeset
268 echo "</table></td>" >> $output
e7b550d52eb7 Uploaded
davidvanzessen
parents: 110
diff changeset
269
e7b550d52eb7 Uploaded
davidvanzessen
parents: 110
diff changeset
270 echo "</tr>" >> $output
110
ade5cf6fd2dc Uploaded
davidvanzessen
parents: 108
diff changeset
271 done
55
0d5add1a9800 Uploaded
davidvanzessen
parents: 54
diff changeset
272
114
e7b550d52eb7 Uploaded
davidvanzessen
parents: 110
diff changeset
273 echo "<tr>" >> $output
e7b550d52eb7 Uploaded
davidvanzessen
parents: 110
diff changeset
274 echo "<td><h1>All</h1></td>" >> $output
e7b550d52eb7 Uploaded
davidvanzessen
parents: 110
diff changeset
275 echo "<td><img src='transitions_heatmap_all.png' /></td>" >> $output
e7b550d52eb7 Uploaded
davidvanzessen
parents: 110
diff changeset
276 echo "<td><img src='transitions_stacked_all.png' /></td>" >> $output
e7b550d52eb7 Uploaded
davidvanzessen
parents: 110
diff changeset
277 echo "<td><table border='1'>" >> $output
110
ade5cf6fd2dc Uploaded
davidvanzessen
parents: 108
diff changeset
278 while IFS=, read from a c g t
ade5cf6fd2dc Uploaded
davidvanzessen
parents: 108
diff changeset
279 do
ade5cf6fd2dc Uploaded
davidvanzessen
parents: 108
diff changeset
280 echo "<tr><td>$from</td><td>$a</td><td>$c</td><td>$g</td><td>$t</td></tr>" >> $output
ade5cf6fd2dc Uploaded
davidvanzessen
parents: 108
diff changeset
281 done < $outdir/transitions_all_sum.txt
114
e7b550d52eb7 Uploaded
davidvanzessen
parents: 110
diff changeset
282 echo "</table></td>" >> $output
e7b550d52eb7 Uploaded
davidvanzessen
parents: 110
diff changeset
283
e7b550d52eb7 Uploaded
davidvanzessen
parents: 110
diff changeset
284 echo "</tr>" >> $output
e7b550d52eb7 Uploaded
davidvanzessen
parents: 110
diff changeset
285
110
ade5cf6fd2dc Uploaded
davidvanzessen
parents: 108
diff changeset
286 echo "</table>" >> $output
ade5cf6fd2dc Uploaded
davidvanzessen
parents: 108
diff changeset
287
ade5cf6fd2dc Uploaded
davidvanzessen
parents: 108
diff changeset
288 echo "</div>" >> $output #transition tables tab end
ade5cf6fd2dc Uploaded
davidvanzessen
parents: 108
diff changeset
289
ade5cf6fd2dc Uploaded
davidvanzessen
parents: 108
diff changeset
290 echo "<div class='tabbertab' title='Antigen Selection'>" >> $output
ade5cf6fd2dc Uploaded
davidvanzessen
parents: 108
diff changeset
291
ade5cf6fd2dc Uploaded
davidvanzessen
parents: 108
diff changeset
292 if [ -a $outdir/aa_histogram.png ]
ade5cf6fd2dc Uploaded
davidvanzessen
parents: 108
diff changeset
293 then
ade5cf6fd2dc Uploaded
davidvanzessen
parents: 108
diff changeset
294 echo "<img src='aa_histogram.png'/><br />" >> $output
ade5cf6fd2dc Uploaded
davidvanzessen
parents: 108
diff changeset
295 echo "<a href='aa_histogram.txt'>download data</a><br />" >> $output
ade5cf6fd2dc Uploaded
davidvanzessen
parents: 108
diff changeset
296 echo "<img src='aa_histogram_ca.png'/><br />" >> $output
ade5cf6fd2dc Uploaded
davidvanzessen
parents: 108
diff changeset
297 echo "<a href='aa_histogram_ca.txt'>download data</a><br />" >> $output
ade5cf6fd2dc Uploaded
davidvanzessen
parents: 108
diff changeset
298 echo "<img src='aa_histogram_cg.png'/><br />" >> $output
ade5cf6fd2dc Uploaded
davidvanzessen
parents: 108
diff changeset
299 echo "<a href='aa_histogram_cg.txt'>download data</a><br />" >> $output
ade5cf6fd2dc Uploaded
davidvanzessen
parents: 108
diff changeset
300 echo "<img src='aa_histogram_cm.png'/><br />" >> $output
ade5cf6fd2dc Uploaded
davidvanzessen
parents: 108
diff changeset
301 echo "<a href='aa_histogram_cm.txt'>download data</a><br />" >> $output
ade5cf6fd2dc Uploaded
davidvanzessen
parents: 108
diff changeset
302 fi
ade5cf6fd2dc Uploaded
davidvanzessen
parents: 108
diff changeset
303
ade5cf6fd2dc Uploaded
davidvanzessen
parents: 108
diff changeset
304 echo "<embed src='baseline_ca.pdf' width='700px' height='1000px'>" >> $output
ade5cf6fd2dc Uploaded
davidvanzessen
parents: 108
diff changeset
305 echo "<embed src='baseline_cg.pdf' width='700px' height='1000px'>" >> $output
ade5cf6fd2dc Uploaded
davidvanzessen
parents: 108
diff changeset
306 echo "<embed src='baseline_cm.pdf' width='700px' height='1000px'>" >> $output
ade5cf6fd2dc Uploaded
davidvanzessen
parents: 108
diff changeset
307
ade5cf6fd2dc Uploaded
davidvanzessen
parents: 108
diff changeset
308 echo "</div>" >> $output #antigen selection tab end
ade5cf6fd2dc Uploaded
davidvanzessen
parents: 108
diff changeset
309
ade5cf6fd2dc Uploaded
davidvanzessen
parents: 108
diff changeset
310 echo "<div class='tabbertab' title='CSR'>" >> $output
ade5cf6fd2dc Uploaded
davidvanzessen
parents: 108
diff changeset
311
ade5cf6fd2dc Uploaded
davidvanzessen
parents: 108
diff changeset
312 if [ -a $outdir/ca.png ]
ade5cf6fd2dc Uploaded
davidvanzessen
parents: 108
diff changeset
313 then
ade5cf6fd2dc Uploaded
davidvanzessen
parents: 108
diff changeset
314 echo "<img src='ca.png'/><br />" >> $output
ade5cf6fd2dc Uploaded
davidvanzessen
parents: 108
diff changeset
315 echo "<a href='ca.txt'>download data</a><br />" >> $output
ade5cf6fd2dc Uploaded
davidvanzessen
parents: 108
diff changeset
316 fi
ade5cf6fd2dc Uploaded
davidvanzessen
parents: 108
diff changeset
317 if [ -a $outdir/cg.png ]
ade5cf6fd2dc Uploaded
davidvanzessen
parents: 108
diff changeset
318 then
ade5cf6fd2dc Uploaded
davidvanzessen
parents: 108
diff changeset
319 echo "<img src='cg.png'/><br />" >> $output
ade5cf6fd2dc Uploaded
davidvanzessen
parents: 108
diff changeset
320 echo "<a href='cg.txt'>download data</a><br />" >> $output
ade5cf6fd2dc Uploaded
davidvanzessen
parents: 108
diff changeset
321 fi
ade5cf6fd2dc Uploaded
davidvanzessen
parents: 108
diff changeset
322
ade5cf6fd2dc Uploaded
davidvanzessen
parents: 108
diff changeset
323 echo "</div>" >> $output #CSR tab end
ade5cf6fd2dc Uploaded
davidvanzessen
parents: 108
diff changeset
324
ade5cf6fd2dc Uploaded
davidvanzessen
parents: 108
diff changeset
325 echo "<div class='tabbertab' title='Downloads'>" >> $output
94
e39176ccddc8 Uploaded
davidvanzessen
parents: 92
diff changeset
326
114
e7b550d52eb7 Uploaded
davidvanzessen
parents: 110
diff changeset
327 echo "<table border='1' width='700px'>" >> $output
e7b550d52eb7 Uploaded
davidvanzessen
parents: 110
diff changeset
328 echo "<tr><td>The complete dataset</td><td><a href='merged.txt'>Download</a></td></tr>" >> $output
e7b550d52eb7 Uploaded
davidvanzessen
parents: 110
diff changeset
329 echo "<tr><td>The alignment info on the unmatched sequences</td><td><a href='unmatched.txt'>Download</a></td></tr>" >> $output
e7b550d52eb7 Uploaded
davidvanzessen
parents: 110
diff changeset
330 echo "<tr><td>Motif data per sequence ID</td><td><a href='motif_per_seq.txt'>Download</a></td></tr>" >> $output
e7b550d52eb7 Uploaded
davidvanzessen
parents: 110
diff changeset
331 echo "<tr><td>Mutation data per sequence ID</td><td><a href='mutation_by_id.txt'>Download</a></td></tr>" >> $output
e7b550d52eb7 Uploaded
davidvanzessen
parents: 110
diff changeset
332 echo "<tr><td>AA mutation data per sequence ID</td><td><a href='aa_id_mutations.txt'>Download</a></td></tr>" >> $output
e7b550d52eb7 Uploaded
davidvanzessen
parents: 110
diff changeset
333 echo "<tr><td>Absent AA location data per sequence ID</td><td><a href='absent_aa_id.txt'>Download</a></td></tr>" >> $output
e7b550d52eb7 Uploaded
davidvanzessen
parents: 110
diff changeset
334 echo "<tr><td>CDR1+FR2+CDR2+FR3+CDR3 sequences that show up more than once</td><td><a href='sequence_overview/index.html'>Download</a></td></tr>" >> $output
e7b550d52eb7 Uploaded
davidvanzessen
parents: 110
diff changeset
335 echo "<tr><td>Base count for every sequence</td><td><a href='base_overview.html'>Download</a></td></tr>" >> $output
e7b550d52eb7 Uploaded
davidvanzessen
parents: 110
diff changeset
336 echo "<tr><td>Baseline PDF (<a href='http://selection.med.yale.edu/baseline/'>http://selection.med.yale.edu/baseline/</a>)</td><td><a href='baseline.pdf'>Download</a></td></tr>" >> $output
e7b550d52eb7 Uploaded
davidvanzessen
parents: 110
diff changeset
337 echo "<tr><td>Baseline data</td><td><a href='baseline.txt'>Download</a></td></tr>" >> $output
e7b550d52eb7 Uploaded
davidvanzessen
parents: 110
diff changeset
338 echo "<tr><td>Baseline ca PDF</td><td><a href='baseline_ca.pdf'>Download</a></td></tr>" >> $output
e7b550d52eb7 Uploaded
davidvanzessen
parents: 110
diff changeset
339 echo "<tr><td>Baseline ca data</td><td><a href='baseline_ca.txt'>Download</a></td></tr>" >> $output
e7b550d52eb7 Uploaded
davidvanzessen
parents: 110
diff changeset
340 echo "<tr><td>Baseline cg PDF</td><td><a href='baseline_cg.pdf'>Download</a></td></tr>" >> $output
e7b550d52eb7 Uploaded
davidvanzessen
parents: 110
diff changeset
341 echo "<tr><td>Baseline cg data</td><td><a href='baseline_cg.txt'>Download</a></td></tr>" >> $output
e7b550d52eb7 Uploaded
davidvanzessen
parents: 110
diff changeset
342 echo "<tr><td>Baseline cm PDF</td><td><a href='baseline_cm.pdf'>Download</a></td></tr>" >> $output
e7b550d52eb7 Uploaded
davidvanzessen
parents: 110
diff changeset
343 echo "<tr><td>Baseline cm data</td><td><a href='baseline_cm.txt'>Download</a></td></tr>" >> $output
e7b550d52eb7 Uploaded
davidvanzessen
parents: 110
diff changeset
344 #echo "<tr><td></td><td><a href='IgAT.zip'>IgAT zip</a></td></tr>" >> $output
e7b550d52eb7 Uploaded
davidvanzessen
parents: 110
diff changeset
345 #echo "<tr><td></td><td><a href='IgAT_ca.zip'>IgAT ca zip</a></td></tr>" >> $output
e7b550d52eb7 Uploaded
davidvanzessen
parents: 110
diff changeset
346 #echo "<tr><td></td><td><a href='IgAT_cg.zip'>IgAT cg zip</a></td></tr>" >> $output
e7b550d52eb7 Uploaded
davidvanzessen
parents: 110
diff changeset
347 #echo "<tr><td></td><td><a href='IgAT_cm.zip'>IgAT cm zip</a></td></tr>" >> $output
e7b550d52eb7 Uploaded
davidvanzessen
parents: 110
diff changeset
348 echo "<tr><td>An IMGT archive with just the matched and filtered sequences</td><td><a href='new_IMGT.txz'>Download</a></td></tr>" >> $output
e7b550d52eb7 Uploaded
davidvanzessen
parents: 110
diff changeset
349 echo "<tr><td>An IMGT archive with just the matched and filtered ca sequences</td><td><a href='new_IMGT_ca.txz'>Download</a></td></tr>" >> $output
e7b550d52eb7 Uploaded
davidvanzessen
parents: 110
diff changeset
350 echo "<tr><td>An IMGT archive with just the matched and filtered cg sequences</td><td><a href='new_IMGT_cg.txz'>Download</a></td></tr>" >> $output
e7b550d52eb7 Uploaded
davidvanzessen
parents: 110
diff changeset
351 echo "<tr><td>An IMGT archive with just the matched and filtered cm sequences</td><td><a href='new_IMGT_cm.txz'>Download</a></td></tr>" >> $output
e7b550d52eb7 Uploaded
davidvanzessen
parents: 110
diff changeset
352 echo "</table>" >> $output
99
86206431cbb0 Uploaded
davidvanzessen
parents: 98
diff changeset
353
110
ade5cf6fd2dc Uploaded
davidvanzessen
parents: 108
diff changeset
354 echo "</div>" >> $output #downloads tab end
55
0d5add1a9800 Uploaded
davidvanzessen
parents: 54
diff changeset
355
110
ade5cf6fd2dc Uploaded
davidvanzessen
parents: 108
diff changeset
356 echo "</div>" >> $output #tabs end
0
74d2bc479bee Uploaded
davidvanzessen
parents:
diff changeset
357
74d2bc479bee Uploaded
davidvanzessen
parents:
diff changeset
358 echo "</html>" >> $output
2
2f4298673519 Uploaded
davidvanzessen
parents: 1
diff changeset
359
95
a66eb1c5374c Uploaded
davidvanzessen
parents: 94
diff changeset
360 echo "---------------- baseline ----------------"
102
e6bc976760d4 Uploaded
davidvanzessen
parents: 101
diff changeset
361 echo "---------------- baseline ----------------<br />" >> $log
101
3cffb8a38bb1 Uploaded
davidvanzessen
parents: 100
diff changeset
362 tmp="$PWD"
3cffb8a38bb1 Uploaded
davidvanzessen
parents: 100
diff changeset
363
3cffb8a38bb1 Uploaded
davidvanzessen
parents: 100
diff changeset
364 mkdir $outdir/baseline
3cffb8a38bb1 Uploaded
davidvanzessen
parents: 100
diff changeset
365
3cffb8a38bb1 Uploaded
davidvanzessen
parents: 100
diff changeset
366
3cffb8a38bb1 Uploaded
davidvanzessen
parents: 100
diff changeset
367 mkdir $outdir/baseline/ca_cg_cm
102
e6bc976760d4 Uploaded
davidvanzessen
parents: 101
diff changeset
368 if [[ $(wc -l < $outdir/new_IMGT/1_Summary.txt) -gt "1" ]]; then
e6bc976760d4 Uploaded
davidvanzessen
parents: 101
diff changeset
369 cd $outdir/baseline/ca_cg_cm
114
e7b550d52eb7 Uploaded
davidvanzessen
parents: 110
diff changeset
370 bash $dir/baseline/wrapper.sh 1 1 1 1 0 0 "25:26:38:55:65:104:-" $outdir/new_IMGT.txz "ca_cg_cm" "$dir/baseline/IMGT-reference-seqs-IGHV-2015-11-05.fa" "$outdir/baseline.pdf" "Sequence.ID" "$outdir/baseline.txt"
102
e6bc976760d4 Uploaded
davidvanzessen
parents: 101
diff changeset
371 else
e6bc976760d4 Uploaded
davidvanzessen
parents: 101
diff changeset
372 echo "No sequences" > "$outdir/baseline.txt"
e6bc976760d4 Uploaded
davidvanzessen
parents: 101
diff changeset
373 fi
101
3cffb8a38bb1 Uploaded
davidvanzessen
parents: 100
diff changeset
374
3cffb8a38bb1 Uploaded
davidvanzessen
parents: 100
diff changeset
375 mkdir $outdir/baseline/ca
102
e6bc976760d4 Uploaded
davidvanzessen
parents: 101
diff changeset
376 if [[ $(wc -l < $outdir/new_IMGT_ca/1_Summary.txt) -gt "1" ]]; then
e6bc976760d4 Uploaded
davidvanzessen
parents: 101
diff changeset
377 cd $outdir/baseline/ca
114
e7b550d52eb7 Uploaded
davidvanzessen
parents: 110
diff changeset
378 bash $dir/baseline/wrapper.sh 1 1 1 1 0 0 "25:26:38:55:65:104:-" $outdir/new_IMGT_ca.txz "ca" "$dir/baseline/IMGT-reference-seqs-IGHV-2015-11-05.fa" "$outdir/baseline_ca.pdf" "Sequence.ID" "$outdir/baseline_ca.txt"
102
e6bc976760d4 Uploaded
davidvanzessen
parents: 101
diff changeset
379 else
e6bc976760d4 Uploaded
davidvanzessen
parents: 101
diff changeset
380 echo "No ca sequences" > "$outdir/baseline_ca.txt"
e6bc976760d4 Uploaded
davidvanzessen
parents: 101
diff changeset
381 fi
101
3cffb8a38bb1 Uploaded
davidvanzessen
parents: 100
diff changeset
382
3cffb8a38bb1 Uploaded
davidvanzessen
parents: 100
diff changeset
383 mkdir $outdir/baseline/cg
102
e6bc976760d4 Uploaded
davidvanzessen
parents: 101
diff changeset
384 if [[ $(wc -l < $outdir/new_IMGT_cg/1_Summary.txt) -gt "1" ]]; then
e6bc976760d4 Uploaded
davidvanzessen
parents: 101
diff changeset
385 cd $outdir/baseline/cg
114
e7b550d52eb7 Uploaded
davidvanzessen
parents: 110
diff changeset
386 bash $dir/baseline/wrapper.sh 1 1 1 1 0 0 "25:26:38:55:65:104:-" $outdir/new_IMGT_cg.txz "cg" "$dir/baseline/IMGT-reference-seqs-IGHV-2015-11-05.fa" "$outdir/baseline_cg.pdf" "Sequence.ID" "$outdir/baseline_cg.txt"
102
e6bc976760d4 Uploaded
davidvanzessen
parents: 101
diff changeset
387 else
e6bc976760d4 Uploaded
davidvanzessen
parents: 101
diff changeset
388 echo "No cg sequences" > "$outdir/baseline_cg.txt"
e6bc976760d4 Uploaded
davidvanzessen
parents: 101
diff changeset
389 fi
101
3cffb8a38bb1 Uploaded
davidvanzessen
parents: 100
diff changeset
390
3cffb8a38bb1 Uploaded
davidvanzessen
parents: 100
diff changeset
391 mkdir $outdir/baseline/cm
102
e6bc976760d4 Uploaded
davidvanzessen
parents: 101
diff changeset
392 if [[ $(wc -l < $outdir/new_IMGT_cm/1_Summary.txt) -gt "1" ]]; then
e6bc976760d4 Uploaded
davidvanzessen
parents: 101
diff changeset
393 cd $outdir/baseline/cm
114
e7b550d52eb7 Uploaded
davidvanzessen
parents: 110
diff changeset
394 bash $dir/baseline/wrapper.sh 1 1 1 1 0 0 "25:26:38:55:65:104:-" $outdir/new_IMGT_cm.txz "cm" "$dir/baseline/IMGT-reference-seqs-IGHV-2015-11-05.fa" "$outdir/baseline_cm.pdf" "Sequence.ID" "$outdir/baseline_cm.txt"
102
e6bc976760d4 Uploaded
davidvanzessen
parents: 101
diff changeset
395 else
e6bc976760d4 Uploaded
davidvanzessen
parents: 101
diff changeset
396 echo "No cm sequences" > "$outdir/baseline_cm.txt"
e6bc976760d4 Uploaded
davidvanzessen
parents: 101
diff changeset
397 fi
47
099cc1254f74 Uploaded
davidvanzessen
parents: 43
diff changeset
398
101
3cffb8a38bb1 Uploaded
davidvanzessen
parents: 100
diff changeset
399 cd $tmp
3cffb8a38bb1 Uploaded
davidvanzessen
parents: 100
diff changeset
400
82
564c4f6da203 Uploaded
davidvanzessen
parents: 81
diff changeset
401 echo "---------------- naive_output.r ----------------"
102
e6bc976760d4 Uploaded
davidvanzessen
parents: 101
diff changeset
402 echo "---------------- naive_output.r ----------------<br />" >> $log
55
0d5add1a9800 Uploaded
davidvanzessen
parents: 54
diff changeset
403
47
099cc1254f74 Uploaded
davidvanzessen
parents: 43
diff changeset
404 if [[ "$naive_output_ca" != "None" ]]
099cc1254f74 Uploaded
davidvanzessen
parents: 43
diff changeset
405 then
114
e7b550d52eb7 Uploaded
davidvanzessen
parents: 110
diff changeset
406 #echo "---------------- imgt_loader.r ----------------"
e7b550d52eb7 Uploaded
davidvanzessen
parents: 110
diff changeset
407 #echo "---------------- imgt_loader.r ----------------<br />" >> $log
50
8ba6afa1247a Uploaded
davidvanzessen
parents: 49
diff changeset
408 #python $dir/imgt_loader.py --summ $PWD/summary.txt --aa $PWD/aa.txt --junction $PWD/junction.txt --output $naive_output
114
e7b550d52eb7 Uploaded
davidvanzessen
parents: 110
diff changeset
409 #Rscript --verbose $dir/imgt_loader.r $PWD/summary.txt $PWD/aa.txt $PWD/junction.txt $outdir/loader_output.txt 2>&1
95
a66eb1c5374c Uploaded
davidvanzessen
parents: 94
diff changeset
410
114
e7b550d52eb7 Uploaded
davidvanzessen
parents: 110
diff changeset
411 #echo "---------------- naive_output.r ----------------"
e7b550d52eb7 Uploaded
davidvanzessen
parents: 110
diff changeset
412 #echo "---------------- naive_output.r ----------------<br />" >> $log
e7b550d52eb7 Uploaded
davidvanzessen
parents: 110
diff changeset
413 #Rscript $dir/naive_output.r $outdir/loader_output.txt $outdir/merged.txt ${naive_output_ca} ${naive_output_cg} ${naive_output_cm} $outdir/ntoverview.txt $outdir/ntsum.txt 2>&1
e7b550d52eb7 Uploaded
davidvanzessen
parents: 110
diff changeset
414
e7b550d52eb7 Uploaded
davidvanzessen
parents: 110
diff changeset
415 cp $outdir/new_IMGT_ca.txz ${naive_output_ca}
e7b550d52eb7 Uploaded
davidvanzessen
parents: 110
diff changeset
416 cp $outdir/new_IMGT_cg.txz ${naive_output_cg}
e7b550d52eb7 Uploaded
davidvanzessen
parents: 110
diff changeset
417 cp $outdir/new_IMGT_cm.txz ${naive_output_cm}
47
099cc1254f74 Uploaded
davidvanzessen
parents: 43
diff changeset
418 fi
099cc1254f74 Uploaded
davidvanzessen
parents: 43
diff changeset
419
81
a778156dad3d Uploaded
davidvanzessen
parents: 80
diff changeset
420 echo "</table>" >> $outdir/base_overview.html
a778156dad3d Uploaded
davidvanzessen
parents: 80
diff changeset
421
105
e4957ad476a2 Uploaded
davidvanzessen
parents: 104
diff changeset
422 mv $log $outdir/log.html
e4957ad476a2 Uploaded
davidvanzessen
parents: 104
diff changeset
423
110
ade5cf6fd2dc Uploaded
davidvanzessen
parents: 108
diff changeset
424 echo "<html><center><h1><a href='index.html'>Click here for the results</a></h1>Tip: Open it in a new tab (middle mouse button or right mouse button -> 'open in new tab' on the link above)<br />" > $log
ade5cf6fd2dc Uploaded
davidvanzessen
parents: 108
diff changeset
425 echo "<table border = 1>" >> $log
ade5cf6fd2dc Uploaded
davidvanzessen
parents: 108
diff changeset
426 echo "<thead><tr><th>Info</th><th>Sequences</th><th>Percentage</th></tr></thead>" >> $log
ade5cf6fd2dc Uploaded
davidvanzessen
parents: 108
diff changeset
427 tIFS="$IFS"
ade5cf6fd2dc Uploaded
davidvanzessen
parents: 108
diff changeset
428 IFS=$'\t'
ade5cf6fd2dc Uploaded
davidvanzessen
parents: 108
diff changeset
429 while read step seq perc
ade5cf6fd2dc Uploaded
davidvanzessen
parents: 108
diff changeset
430 do
ade5cf6fd2dc Uploaded
davidvanzessen
parents: 108
diff changeset
431 echo "<tr>" >> $log
ade5cf6fd2dc Uploaded
davidvanzessen
parents: 108
diff changeset
432 echo "<td>$step</td>" >> $log
ade5cf6fd2dc Uploaded
davidvanzessen
parents: 108
diff changeset
433 echo "<td>$seq</td>" >> $log
ade5cf6fd2dc Uploaded
davidvanzessen
parents: 108
diff changeset
434 echo "<td>${perc}%</td>" >> $log
ade5cf6fd2dc Uploaded
davidvanzessen
parents: 108
diff changeset
435 echo "</tr>" >> $log
ade5cf6fd2dc Uploaded
davidvanzessen
parents: 108
diff changeset
436 done < $outdir/filtering_steps.txt
ade5cf6fd2dc Uploaded
davidvanzessen
parents: 108
diff changeset
437 echo "</table></center></html>" >> $log
ade5cf6fd2dc Uploaded
davidvanzessen
parents: 108
diff changeset
438
ade5cf6fd2dc Uploaded
davidvanzessen
parents: 108
diff changeset
439 IFS="$tIFS"
ade5cf6fd2dc Uploaded
davidvanzessen
parents: 108
diff changeset
440
105
e4957ad476a2 Uploaded
davidvanzessen
parents: 104
diff changeset
441
81
a778156dad3d Uploaded
davidvanzessen
parents: 80
diff changeset
442 echo "---------------- Done! ----------------"
107
01c9993865af Uploaded
davidvanzessen
parents: 105
diff changeset
443 echo "---------------- Done! ----------------<br />" >> $outdir/log.html
47
099cc1254f74 Uploaded
davidvanzessen
parents: 43
diff changeset
444
110
ade5cf6fd2dc Uploaded
davidvanzessen
parents: 108
diff changeset
445
ade5cf6fd2dc Uploaded
davidvanzessen
parents: 108
diff changeset
446
ade5cf6fd2dc Uploaded
davidvanzessen
parents: 108
diff changeset
447
ade5cf6fd2dc Uploaded
davidvanzessen
parents: 108
diff changeset
448
ade5cf6fd2dc Uploaded
davidvanzessen
parents: 108
diff changeset
449
ade5cf6fd2dc Uploaded
davidvanzessen
parents: 108
diff changeset
450
ade5cf6fd2dc Uploaded
davidvanzessen
parents: 108
diff changeset
451
ade5cf6fd2dc Uploaded
davidvanzessen
parents: 108
diff changeset
452
ade5cf6fd2dc Uploaded
davidvanzessen
parents: 108
diff changeset
453
ade5cf6fd2dc Uploaded
davidvanzessen
parents: 108
diff changeset
454
ade5cf6fd2dc Uploaded
davidvanzessen
parents: 108
diff changeset
455
ade5cf6fd2dc Uploaded
davidvanzessen
parents: 108
diff changeset
456
ade5cf6fd2dc Uploaded
davidvanzessen
parents: 108
diff changeset
457
ade5cf6fd2dc Uploaded
davidvanzessen
parents: 108
diff changeset
458
ade5cf6fd2dc Uploaded
davidvanzessen
parents: 108
diff changeset
459
ade5cf6fd2dc Uploaded
davidvanzessen
parents: 108
diff changeset
460
ade5cf6fd2dc Uploaded
davidvanzessen
parents: 108
diff changeset
461
ade5cf6fd2dc Uploaded
davidvanzessen
parents: 108
diff changeset
462
ade5cf6fd2dc Uploaded
davidvanzessen
parents: 108
diff changeset
463
ade5cf6fd2dc Uploaded
davidvanzessen
parents: 108
diff changeset
464