annotate wrapper.sh @ 110:ade5cf6fd2dc draft

Uploaded
author davidvanzessen
date Tue, 02 Aug 2016 08:30:23 -0400
parents 6add3e66f4fa
children e7b550d52eb7
Ignore whitespace changes - Everywhere: Within whitespace: At end of lines:
rev   line source
0
74d2bc479bee Uploaded
davidvanzessen
parents:
diff changeset
1 #!/bin/bash
110
ade5cf6fd2dc Uploaded
davidvanzessen
parents: 108
diff changeset
2 #set -e
0
74d2bc479bee Uploaded
davidvanzessen
parents:
diff changeset
3 dir="$(cd "$(dirname "$0")" && pwd)"
74d2bc479bee Uploaded
davidvanzessen
parents:
diff changeset
4 input=$1
19
c518cf0d4adb Uploaded
davidvanzessen
parents: 16
diff changeset
5 method=$2
102
e6bc976760d4 Uploaded
davidvanzessen
parents: 101
diff changeset
6 log=$3 #becomes the main html page at the end
19
c518cf0d4adb Uploaded
davidvanzessen
parents: 16
diff changeset
7 outdir=$4
102
e6bc976760d4 Uploaded
davidvanzessen
parents: 101
diff changeset
8 output="$outdir/index.html" #copied to $log location at the end
19
c518cf0d4adb Uploaded
davidvanzessen
parents: 16
diff changeset
9 title=$5
22
d84c9791d8c4 Uploaded
davidvanzessen
parents: 21
diff changeset
10 include_fr1=$6
34
d436daae9d68 Uploaded
davidvanzessen
parents: 32
diff changeset
11 functionality=$7
d436daae9d68 Uploaded
davidvanzessen
parents: 32
diff changeset
12 unique=$8
69
7acdcd5c52ef Uploaded
davidvanzessen
parents: 66
diff changeset
13 naive_output_ca=$9
7acdcd5c52ef Uploaded
davidvanzessen
parents: 66
diff changeset
14 naive_output_cg=${10}
7acdcd5c52ef Uploaded
davidvanzessen
parents: 66
diff changeset
15 naive_output_cm=${11}
7acdcd5c52ef Uploaded
davidvanzessen
parents: 66
diff changeset
16 filter_unique=${12}
7acdcd5c52ef Uploaded
davidvanzessen
parents: 66
diff changeset
17 class_filter=${13}
0
74d2bc479bee Uploaded
davidvanzessen
parents:
diff changeset
18 mkdir $outdir
74d2bc479bee Uploaded
davidvanzessen
parents:
diff changeset
19
110
ade5cf6fd2dc Uploaded
davidvanzessen
parents: 108
diff changeset
20 tar -xzf $dir/style.tar.gz -C $outdir
ade5cf6fd2dc Uploaded
davidvanzessen
parents: 108
diff changeset
21
55
0d5add1a9800 Uploaded
davidvanzessen
parents: 54
diff changeset
22 echo "---------------- read parameters ----------------"
102
e6bc976760d4 Uploaded
davidvanzessen
parents: 101
diff changeset
23 echo "---------------- read parameters ----------------<br />" > $log
55
0d5add1a9800 Uploaded
davidvanzessen
parents: 54
diff changeset
24
0d5add1a9800 Uploaded
davidvanzessen
parents: 54
diff changeset
25 echo "unpacking IMGT file"
0d5add1a9800 Uploaded
davidvanzessen
parents: 54
diff changeset
26
35
8dba36531e6e Uploaded
davidvanzessen
parents: 34
diff changeset
27 type="`file $input`"
8dba36531e6e Uploaded
davidvanzessen
parents: 34
diff changeset
28 if [[ "$type" == *"Zip archive"* ]] ; then
8dba36531e6e Uploaded
davidvanzessen
parents: 34
diff changeset
29 echo "Zip archive"
8dba36531e6e Uploaded
davidvanzessen
parents: 34
diff changeset
30 echo "unzip $input -d $PWD/files/"
8dba36531e6e Uploaded
davidvanzessen
parents: 34
diff changeset
31 unzip $input -d $PWD/files/
8dba36531e6e Uploaded
davidvanzessen
parents: 34
diff changeset
32 elif [[ "$type" == *"XZ compressed data"* ]] ; then
8dba36531e6e Uploaded
davidvanzessen
parents: 34
diff changeset
33 echo "XZ archive"
8dba36531e6e Uploaded
davidvanzessen
parents: 34
diff changeset
34 echo "tar -xJf $input -C $PWD/files/$title" #log the exact extraction command that is run below
8dba36531e6e Uploaded
davidvanzessen
parents: 34
diff changeset
35 mkdir -p $PWD/files/$title
8dba36531e6e Uploaded
davidvanzessen
parents: 34
diff changeset
36 tar -xJf $input -C $PWD/files/$title
8dba36531e6e Uploaded
davidvanzessen
parents: 34
diff changeset
37 fi
8dba36531e6e Uploaded
davidvanzessen
parents: 34
diff changeset
38
64
0fdd90f7c654 Uploaded
davidvanzessen
parents: 63
diff changeset
39 cat `find $PWD/files/ -name "1_*"` > $PWD/summary.txt
0fdd90f7c654 Uploaded
davidvanzessen
parents: 63
diff changeset
40 cat `find $PWD/files/ -name "3_*"` > $PWD/sequences.txt
0fdd90f7c654 Uploaded
davidvanzessen
parents: 63
diff changeset
41 cat `find $PWD/files/ -name "5_*"` > $PWD/aa.txt
0fdd90f7c654 Uploaded
davidvanzessen
parents: 63
diff changeset
42 cat `find $PWD/files/ -name "6_*"` > $PWD/junction.txt
0fdd90f7c654 Uploaded
davidvanzessen
parents: 63
diff changeset
43 cat `find $PWD/files/ -name "7_*"` > $PWD/mutationanalysis.txt
0fdd90f7c654 Uploaded
davidvanzessen
parents: 63
diff changeset
44 cat `find $PWD/files/ -name "8_*"` > $PWD/mutationstats.txt
0fdd90f7c654 Uploaded
davidvanzessen
parents: 63
diff changeset
45 cat `find $PWD/files/ -name "10_*"` > $PWD/hotspots.txt
0fdd90f7c654 Uploaded
davidvanzessen
parents: 63
diff changeset
46
0fdd90f7c654 Uploaded
davidvanzessen
parents: 63
diff changeset
47 #cat $PWD/files/*/1_* > $PWD/summary.txt
0fdd90f7c654 Uploaded
davidvanzessen
parents: 63
diff changeset
48 #cat $PWD/files/*/3_* > $PWD/sequences.txt
0fdd90f7c654 Uploaded
davidvanzessen
parents: 63
diff changeset
49 #cat $PWD/files/*/5_* > $PWD/aa.txt
0fdd90f7c654 Uploaded
davidvanzessen
parents: 63
diff changeset
50 #cat $PWD/files/*/6_* > $PWD/junction.txt
0fdd90f7c654 Uploaded
davidvanzessen
parents: 63
diff changeset
51 #cat $PWD/files/*/7_* > $PWD/mutationanalysis.txt
0fdd90f7c654 Uploaded
davidvanzessen
parents: 63
diff changeset
52 #cat $PWD/files/*/8_* > $PWD/mutationstats.txt
0fdd90f7c654 Uploaded
davidvanzessen
parents: 63
diff changeset
53 #cat $PWD/files/*/10_* > $PWD/hotspots.txt
3
a0b27058dcac Uploaded
davidvanzessen
parents: 2
diff changeset
54
26
2433a1e110e1 Uploaded
davidvanzessen
parents: 25
diff changeset
55 #BLASTN_DIR="/home/galaxy/tmp/blast/ncbi-blast-2.2.30+/bin"
19
c518cf0d4adb Uploaded
davidvanzessen
parents: 16
diff changeset
56
c518cf0d4adb Uploaded
davidvanzessen
parents: 16
diff changeset
57 echo "${BLASTN_DIR}"
c518cf0d4adb Uploaded
davidvanzessen
parents: 16
diff changeset
58
89
480fdd383fdb Uploaded
davidvanzessen
parents: 85
diff changeset
59 echo "---------------- identification ($method) ----------------"
102
e6bc976760d4 Uploaded
davidvanzessen
parents: 101
diff changeset
60 echo "---------------- identification ($method) ----------------<br />" >> $log
55
0d5add1a9800 Uploaded
davidvanzessen
parents: 54
diff changeset
61
19
c518cf0d4adb Uploaded
davidvanzessen
parents: 16
diff changeset
62 if [[ "${method}" == "custom" ]] ; then
c518cf0d4adb Uploaded
davidvanzessen
parents: 16
diff changeset
63 python $dir/gene_identification.py --input $PWD/summary.txt --output $outdir/identified_genes.txt
c518cf0d4adb Uploaded
davidvanzessen
parents: 16
diff changeset
64 else
c518cf0d4adb Uploaded
davidvanzessen
parents: 16
diff changeset
65 ID_index=$(cat $PWD/summary.txt | grep -o -P ".+Sequence ID" | grep -o -P "\t" | wc -l)
c518cf0d4adb Uploaded
davidvanzessen
parents: 16
diff changeset
66 ID_index=$((ID_index+1))
c518cf0d4adb Uploaded
davidvanzessen
parents: 16
diff changeset
67 sequence_index=$(cat $PWD/summary.txt | grep -o -P ".+\tSequence" | grep -o -P "\t" | wc -l)
c518cf0d4adb Uploaded
davidvanzessen
parents: 16
diff changeset
68 sequence_index=$((sequence_index+1))
c518cf0d4adb Uploaded
davidvanzessen
parents: 16
diff changeset
69
110
ade5cf6fd2dc Uploaded
davidvanzessen
parents: 108
diff changeset
70 cat $PWD/summary.txt | tail -n+2 | cut -f ${ID_index},${sequence_index} | awk '{print ">" $1 "\n" $2}' > $PWD/sequences.tmp
ade5cf6fd2dc Uploaded
davidvanzessen
parents: 108
diff changeset
71
ade5cf6fd2dc Uploaded
davidvanzessen
parents: 108
diff changeset
72 awk 'NR % 2 { header = $0; next } length($0) { print header; print }' $PWD/sequences.tmp > $PWD/sequences.fasta #filter out empty sequences: sequences.tmp holds header/sequence line pairs, keep only pairs whose sequence line is non-empty
ade5cf6fd2dc Uploaded
davidvanzessen
parents: 108
diff changeset
73
ade5cf6fd2dc Uploaded
davidvanzessen
parents: 108
diff changeset
74 rm $PWD/sequences.tmp
19
c518cf0d4adb Uploaded
davidvanzessen
parents: 16
diff changeset
75
c518cf0d4adb Uploaded
davidvanzessen
parents: 16
diff changeset
76 echo -e "qseqid\tsseqid\tpident\tlength\tmismatch\tgapopen\tqstart\tqend\tsstart\tsend\tevalue\tbitscore" > $outdir/identified_genes.txt
c518cf0d4adb Uploaded
davidvanzessen
parents: 16
diff changeset
77 ${BLASTN_DIR}/blastn -task blastn -db $dir/subclass_definition.db -query $PWD/sequences.fasta -outfmt 6 >> $outdir/identified_genes.txt
c518cf0d4adb Uploaded
davidvanzessen
parents: 16
diff changeset
78 fi
c518cf0d4adb Uploaded
davidvanzessen
parents: 16
diff changeset
79
55
0d5add1a9800 Uploaded
davidvanzessen
parents: 54
diff changeset
80 echo "---------------- merge_and_filter.r ----------------"
102
e6bc976760d4 Uploaded
davidvanzessen
parents: 101
diff changeset
81 echo "---------------- merge_and_filter.r ----------------<br />" >> $log
19
c518cf0d4adb Uploaded
davidvanzessen
parents: 16
diff changeset
82
90
f0e8dac22c6e Uploaded
davidvanzessen
parents: 89
diff changeset
83 Rscript $dir/merge_and_filter.r $PWD/summary.txt $PWD/sequences.txt $PWD/mutationanalysis.txt $PWD/mutationstats.txt $PWD/hotspots.txt $outdir/identified_genes.txt $outdir/merged.txt $outdir/before_unique_filter.txt $outdir/unmatched.txt $method $functionality $unique ${filter_unique} ${class_filter} 2>&1
0
74d2bc479bee Uploaded
davidvanzessen
parents:
diff changeset
84
98
5ffbf40cdd4b Uploaded
davidvanzessen
parents: 95
diff changeset
85 echo "---------------- creating new IMGT zip ----------------"
102
e6bc976760d4 Uploaded
davidvanzessen
parents: 101
diff changeset
86 echo "---------------- creating new IMGT zip ----------------<br />" >> $log
95
a66eb1c5374c Uploaded
davidvanzessen
parents: 94
diff changeset
87
a66eb1c5374c Uploaded
davidvanzessen
parents: 94
diff changeset
88 mkdir $outdir/new_IMGT
a66eb1c5374c Uploaded
davidvanzessen
parents: 94
diff changeset
89
a66eb1c5374c Uploaded
davidvanzessen
parents: 94
diff changeset
90 cat `find $PWD/files/ -name "1_*"` > "$outdir/new_IMGT/1_Summary.txt"
a66eb1c5374c Uploaded
davidvanzessen
parents: 94
diff changeset
91 cat `find $PWD/files/ -name "2_*"` > "$outdir/new_IMGT/2_IMGT-gapped-nt-sequences.txt"
a66eb1c5374c Uploaded
davidvanzessen
parents: 94
diff changeset
92 cat `find $PWD/files/ -name "3_*"` > "$outdir/new_IMGT/3_Nt-sequences.txt"
a66eb1c5374c Uploaded
davidvanzessen
parents: 94
diff changeset
93 cat `find $PWD/files/ -name "4_*"` > "$outdir/new_IMGT/4_IMGT-gapped-AA-sequences.txt"
a66eb1c5374c Uploaded
davidvanzessen
parents: 94
diff changeset
94 cat `find $PWD/files/ -name "5_*"` > "$outdir/new_IMGT/5_AA-sequences.txt"
a66eb1c5374c Uploaded
davidvanzessen
parents: 94
diff changeset
95 cat `find $PWD/files/ -name "6_*"` > "$outdir/new_IMGT/6_Junction.txt"
a66eb1c5374c Uploaded
davidvanzessen
parents: 94
diff changeset
96 cat `find $PWD/files/ -name "7_*"` > "$outdir/new_IMGT/7_V-REGION-mutation-and-AA-change-table.txt"
a66eb1c5374c Uploaded
davidvanzessen
parents: 94
diff changeset
97 cat `find $PWD/files/ -name "8_*"` > "$outdir/new_IMGT/8_V-REGION-nt-mutation-statistics.txt"
a66eb1c5374c Uploaded
davidvanzessen
parents: 94
diff changeset
98 cat `find $PWD/files/ -name "9_*"` > "$outdir/new_IMGT/9_V-REGION-AA-change-statistics.txt"
a66eb1c5374c Uploaded
davidvanzessen
parents: 94
diff changeset
99 cat `find $PWD/files/ -name "10_*"` > "$outdir/new_IMGT/10_V-REGION-mutation-hotspots.txt"
a66eb1c5374c Uploaded
davidvanzessen
parents: 94
diff changeset
100
99
86206431cbb0 Uploaded
davidvanzessen
parents: 98
diff changeset
101 mkdir $outdir/new_IMGT_ca
86206431cbb0 Uploaded
davidvanzessen
parents: 98
diff changeset
102 cp $outdir/new_IMGT/* $outdir/new_IMGT_ca
86206431cbb0 Uploaded
davidvanzessen
parents: 98
diff changeset
103
86206431cbb0 Uploaded
davidvanzessen
parents: 98
diff changeset
104 mkdir $outdir/new_IMGT_cg
86206431cbb0 Uploaded
davidvanzessen
parents: 98
diff changeset
105 cp $outdir/new_IMGT/* $outdir/new_IMGT_cg
86206431cbb0 Uploaded
davidvanzessen
parents: 98
diff changeset
106
86206431cbb0 Uploaded
davidvanzessen
parents: 98
diff changeset
107 mkdir $outdir/new_IMGT_cm
86206431cbb0 Uploaded
davidvanzessen
parents: 98
diff changeset
108 cp $outdir/new_IMGT/* $outdir/new_IMGT_cm
86206431cbb0 Uploaded
davidvanzessen
parents: 98
diff changeset
109
86206431cbb0 Uploaded
davidvanzessen
parents: 98
diff changeset
110 Rscript $dir/tmp/igat.r $outdir/new_IMGT/ $outdir/merged.txt "-" 2>&1
101
3cffb8a38bb1 Uploaded
davidvanzessen
parents: 100
diff changeset
111 Rscript $dir/tmp/igat.r $outdir/new_IMGT_ca/ $outdir/merged.txt "ca" 2>&1
3cffb8a38bb1 Uploaded
davidvanzessen
parents: 100
diff changeset
112 Rscript $dir/tmp/igat.r $outdir/new_IMGT_cg/ $outdir/merged.txt "cg" 2>&1
3cffb8a38bb1 Uploaded
davidvanzessen
parents: 100
diff changeset
113 Rscript $dir/tmp/igat.r $outdir/new_IMGT_cm/ $outdir/merged.txt "cm" 2>&1
95
a66eb1c5374c Uploaded
davidvanzessen
parents: 94
diff changeset
114
a66eb1c5374c Uploaded
davidvanzessen
parents: 94
diff changeset
115
a66eb1c5374c Uploaded
davidvanzessen
parents: 94
diff changeset
116 tmp="$PWD"
a66eb1c5374c Uploaded
davidvanzessen
parents: 94
diff changeset
117 cd $outdir/new_IMGT/ #tar weirdness...
a66eb1c5374c Uploaded
davidvanzessen
parents: 94
diff changeset
118 tar -cJf ../new_IMGT.txz *
a66eb1c5374c Uploaded
davidvanzessen
parents: 94
diff changeset
119 cp $dir/tmp/IgAT.xlsm $outdir/new_IMGT/IgAT.xlsm
a66eb1c5374c Uploaded
davidvanzessen
parents: 94
diff changeset
120 zip -r ../IgAT.zip *
a66eb1c5374c Uploaded
davidvanzessen
parents: 94
diff changeset
121
99
86206431cbb0 Uploaded
davidvanzessen
parents: 98
diff changeset
122 cd $outdir/new_IMGT_ca/
86206431cbb0 Uploaded
davidvanzessen
parents: 98
diff changeset
123 tar -cJf ../new_IMGT_ca.txz *
86206431cbb0 Uploaded
davidvanzessen
parents: 98
diff changeset
124 cp $dir/tmp/IgAT.xlsm $outdir/new_IMGT_ca/IgAT.xlsm
86206431cbb0 Uploaded
davidvanzessen
parents: 98
diff changeset
125 zip -r ../IgAT_ca.zip *
86206431cbb0 Uploaded
davidvanzessen
parents: 98
diff changeset
126
86206431cbb0 Uploaded
davidvanzessen
parents: 98
diff changeset
127 cd $outdir/new_IMGT_cg/
86206431cbb0 Uploaded
davidvanzessen
parents: 98
diff changeset
128 tar -cJf ../new_IMGT_cg.txz *
86206431cbb0 Uploaded
davidvanzessen
parents: 98
diff changeset
129 cp $dir/tmp/IgAT.xlsm $outdir/new_IMGT_cg/IgAT.xlsm
86206431cbb0 Uploaded
davidvanzessen
parents: 98
diff changeset
130 zip -r ../IgAT_cg.zip *
86206431cbb0 Uploaded
davidvanzessen
parents: 98
diff changeset
131
86206431cbb0 Uploaded
davidvanzessen
parents: 98
diff changeset
132 cd $outdir/new_IMGT_cm/
86206431cbb0 Uploaded
davidvanzessen
parents: 98
diff changeset
133 tar -cJf ../new_IMGT_cm.txz *
86206431cbb0 Uploaded
davidvanzessen
parents: 98
diff changeset
134 cp $dir/tmp/IgAT.xlsm $outdir/new_IMGT_cm/IgAT.xlsm
86206431cbb0 Uploaded
davidvanzessen
parents: 98
diff changeset
135 zip -r ../IgAT_cm.zip *
86206431cbb0 Uploaded
davidvanzessen
parents: 98
diff changeset
136
95
a66eb1c5374c Uploaded
davidvanzessen
parents: 94
diff changeset
137 cd $tmp
a66eb1c5374c Uploaded
davidvanzessen
parents: 94
diff changeset
138
55
0d5add1a9800 Uploaded
davidvanzessen
parents: 54
diff changeset
139 echo "---------------- mutation_analysis.r ----------------"
102
e6bc976760d4 Uploaded
davidvanzessen
parents: 101
diff changeset
140 echo "---------------- mutation_analysis.r ----------------<br />" >> $log
55
0d5add1a9800 Uploaded
davidvanzessen
parents: 54
diff changeset
141
82
564c4f6da203 Uploaded
davidvanzessen
parents: 81
diff changeset
142 classes="ca,ca1,ca2,cg,cg1,cg2,cg3,cg4,cm,unmatched"
4
069419cccba4 Uploaded
davidvanzessen
parents: 3
diff changeset
143 echo "R mutation analysis"
82
564c4f6da203 Uploaded
davidvanzessen
parents: 81
diff changeset
144 Rscript $dir/mutation_analysis.r $outdir/merged.txt $classes $outdir ${include_fr1} 2>&1
53
7290a88ea202 Uploaded
davidvanzessen
parents: 52
diff changeset
145
55
0d5add1a9800 Uploaded
davidvanzessen
parents: 54
diff changeset
146
0d5add1a9800 Uploaded
davidvanzessen
parents: 54
diff changeset
147 echo "---------------- mutation_analysis.py ----------------"
102
e6bc976760d4 Uploaded
davidvanzessen
parents: 101
diff changeset
148 echo "---------------- mutation_analysis.py ----------------<br />" >> $log
55
0d5add1a9800 Uploaded
davidvanzessen
parents: 54
diff changeset
149
82
564c4f6da203 Uploaded
davidvanzessen
parents: 81
diff changeset
150 python $dir/mutation_analysis.py --input $outdir/merged.txt --genes $classes --includefr1 "${include_fr1}" --output $outdir/hotspot_analysis.txt
55
0d5add1a9800 Uploaded
davidvanzessen
parents: 54
diff changeset
151
0d5add1a9800 Uploaded
davidvanzessen
parents: 54
diff changeset
152 echo "---------------- aa_histogram.r ----------------"
105
e4957ad476a2 Uploaded
davidvanzessen
parents: 104
diff changeset
153 echo "---------------- aa_histogram.r ----------------<br />" >> $log
55
0d5add1a9800 Uploaded
davidvanzessen
parents: 54
diff changeset
154
107
01c9993865af Uploaded
davidvanzessen
parents: 105
diff changeset
155 Rscript $dir/aa_histogram.r $outdir/aa_id_mutations.txt $outdir/absent_aa_id.txt "ca,cg,cm" $outdir/ 2>&1
110
ade5cf6fd2dc Uploaded
davidvanzessen
parents: 108
diff changeset
156 if [ -e "$outdir/aa_histogram_.png" ]; then
ade5cf6fd2dc Uploaded
davidvanzessen
parents: 108
diff changeset
157 mv $outdir/aa_histogram_.png $outdir/aa_histogram.png
ade5cf6fd2dc Uploaded
davidvanzessen
parents: 108
diff changeset
158 mv $outdir/aa_histogram_.txt $outdir/aa_histogram.txt
ade5cf6fd2dc Uploaded
davidvanzessen
parents: 108
diff changeset
159 fi
4
069419cccba4 Uploaded
davidvanzessen
parents: 3
diff changeset
160
0
74d2bc479bee Uploaded
davidvanzessen
parents:
diff changeset
161 genes=(ca ca1 ca2 cg cg1 cg2 cg3 cg4 cm)
74d2bc479bee Uploaded
davidvanzessen
parents:
diff changeset
162
53
7290a88ea202 Uploaded
davidvanzessen
parents: 52
diff changeset
163 funcs=(sum mean median)
110
ade5cf6fd2dc Uploaded
davidvanzessen
parents: 108
diff changeset
164 funcs=(sum)
0
74d2bc479bee Uploaded
davidvanzessen
parents:
diff changeset
165
82
564c4f6da203 Uploaded
davidvanzessen
parents: 81
diff changeset
166 echo "---------------- sequence_overview.r ----------------"
102
e6bc976760d4 Uploaded
davidvanzessen
parents: 101
diff changeset
167 echo "---------------- sequence_overview.r ----------------<br />" >> $log
82
564c4f6da203 Uploaded
davidvanzessen
parents: 81
diff changeset
168
564c4f6da203 Uploaded
davidvanzessen
parents: 81
diff changeset
169 mkdir $outdir/sequence_overview
564c4f6da203 Uploaded
davidvanzessen
parents: 81
diff changeset
170
90
f0e8dac22c6e Uploaded
davidvanzessen
parents: 89
diff changeset
171 #Rscript $dir/sequence_overview.r $outdir/identified_genes.txt $PWD/sequences.txt $outdir/merged.txt $outdir/sequence_overview $classes $outdir/hotspot_analysis_sum.txt 2>&1
100
ff5be711382b Uploaded
davidvanzessen
parents: 99
diff changeset
172 Rscript $dir/sequence_overview.r $outdir/before_unique_filter.txt $outdir/merged.txt $outdir/sequence_overview $classes $outdir/hotspot_analysis_sum.txt 2>&1
82
564c4f6da203 Uploaded
davidvanzessen
parents: 81
diff changeset
173
564c4f6da203 Uploaded
davidvanzessen
parents: 81
diff changeset
174 echo "<table border='1'>" > $outdir/base_overview.html
564c4f6da203 Uploaded
davidvanzessen
parents: 81
diff changeset
175
92
b869a126e2c4 Uploaded
davidvanzessen
parents: 90
diff changeset
176 while IFS=$'\t' read ID class seq A C G T
82
564c4f6da203 Uploaded
davidvanzessen
parents: 81
diff changeset
177 do
85
07f7da724a77 Uploaded
davidvanzessen
parents: 84
diff changeset
178 echo "<tr><td>$ID</td><td>$seq</td><td>$class</td><td>$A</td><td>$C</td><td>$G</td><td>$T</td></tr>" >> $outdir/base_overview.html
82
564c4f6da203 Uploaded
davidvanzessen
parents: 81
diff changeset
179 done < $outdir/sequence_overview/ntoverview.txt
564c4f6da203 Uploaded
davidvanzessen
parents: 81
diff changeset
180
62
4262e880472d Uploaded
davidvanzessen
parents: 58
diff changeset
181 echo "<html><center><h1>$title</h1></center>" > $output
110
ade5cf6fd2dc Uploaded
davidvanzessen
parents: 108
diff changeset
182 echo "<script type='text/javascript' src='jquery-1.11.0.min.js'></script>" >> $output
ade5cf6fd2dc Uploaded
davidvanzessen
parents: 108
diff changeset
183 echo "<script type='text/javascript' src='tabber.js'></script>" >> $output
ade5cf6fd2dc Uploaded
davidvanzessen
parents: 108
diff changeset
184 echo "<script type='text/javascript' src='script.js'></script>" >> $output
ade5cf6fd2dc Uploaded
davidvanzessen
parents: 108
diff changeset
185 echo "<link rel='stylesheet' type='text/css' href='style.css'>" >> $output
62
4262e880472d Uploaded
davidvanzessen
parents: 58
diff changeset
186
4262e880472d Uploaded
davidvanzessen
parents: 58
diff changeset
187 #display the matched/unmatched counts for clarity
4262e880472d Uploaded
davidvanzessen
parents: 58
diff changeset
188
98
5ffbf40cdd4b Uploaded
davidvanzessen
parents: 95
diff changeset
189 matched_count="`cat $outdir/merged.txt | grep -v 'unmatched' | tail -n +2 | wc -l`"
62
4262e880472d Uploaded
davidvanzessen
parents: 58
diff changeset
190 unmatched_count="`cat $outdir/unmatched.txt | tail -n +2 | wc -l`"
4262e880472d Uploaded
davidvanzessen
parents: 58
diff changeset
191 total_count=$((matched_count + unmatched_count))
4262e880472d Uploaded
davidvanzessen
parents: 58
diff changeset
192 perc_count=$((unmatched_count / total_count * 100))
4262e880472d Uploaded
davidvanzessen
parents: 58
diff changeset
193 perc_count=`bc -l <<< "scale=2; ${unmatched_count} / ${total_count} * 100"`
4262e880472d Uploaded
davidvanzessen
parents: 58
diff changeset
194 perc_count=$(awk -v u="${unmatched_count}" -v t="${total_count}" 'BEGIN { printf "%.2f", (t > 0) ? u * 100 / t : 0 }') #percentage of unmatched sequences with 2 decimals; multiply before dividing to keep precision, 0.00 when there are no sequences at all
4262e880472d Uploaded
davidvanzessen
parents: 58
diff changeset
195
4262e880472d Uploaded
davidvanzessen
parents: 58
diff changeset
196 echo "<center><h2>Total: ${total_count}</h2></center>" >> $output
4262e880472d Uploaded
davidvanzessen
parents: 58
diff changeset
197 echo "<center><h2>Matched: ${matched_count} Unmatched: ${unmatched_count}</h2></center>" >> $output
4262e880472d Uploaded
davidvanzessen
parents: 58
diff changeset
198 echo "<center><h2>Percentage unmatched: ${perc_count}</h2></center>" >> $output
4262e880472d Uploaded
davidvanzessen
parents: 58
diff changeset
199
55
0d5add1a9800 Uploaded
davidvanzessen
parents: 54
diff changeset
200 echo "---------------- main tables ----------------"
102
e6bc976760d4 Uploaded
davidvanzessen
parents: 101
diff changeset
201 echo "---------------- main tables ----------------<br />" >> $log
110
ade5cf6fd2dc Uploaded
davidvanzessen
parents: 108
diff changeset
202
ade5cf6fd2dc Uploaded
davidvanzessen
parents: 108
diff changeset
203 echo "<div class='tabber'>" >> $output
ade5cf6fd2dc Uploaded
davidvanzessen
parents: 108
diff changeset
204 echo "<div class='tabbertab' title='SHM Overview'>" >> $output
ade5cf6fd2dc Uploaded
davidvanzessen
parents: 108
diff changeset
205
53
7290a88ea202 Uploaded
davidvanzessen
parents: 52
diff changeset
206 for func in ${funcs[@]}
4
069419cccba4 Uploaded
davidvanzessen
parents: 3
diff changeset
207 do
55
0d5add1a9800 Uploaded
davidvanzessen
parents: 54
diff changeset
208
0d5add1a9800 Uploaded
davidvanzessen
parents: 54
diff changeset
209 echo "---------------- $func table ----------------"
102
e6bc976760d4 Uploaded
davidvanzessen
parents: 101
diff changeset
210 echo "---------------- $func table ----------------<br />" >> $log
55
0d5add1a9800 Uploaded
davidvanzessen
parents: 54
diff changeset
211
94
e39176ccddc8 Uploaded
davidvanzessen
parents: 92
diff changeset
212 cat $outdir/mutations_${func}.txt $outdir/hotspot_analysis_${func}.txt > $outdir/data_${func}.txt
53
7290a88ea202 Uploaded
davidvanzessen
parents: 52
diff changeset
213
98
5ffbf40cdd4b Uploaded
davidvanzessen
parents: 95
diff changeset
214 echo "<table border='1' width='100%'><caption><h3><a href='data_${func}.txt'>${func} table</a></h3></caption>" >> $output
58
8bb4d6009e08 Uploaded
davidvanzessen
parents: 55
diff changeset
215 echo "<tr><th>info</th>" >> $output
53
7290a88ea202 Uploaded
davidvanzessen
parents: 52
diff changeset
216 for gene in ${genes[@]}
7290a88ea202 Uploaded
davidvanzessen
parents: 52
diff changeset
217 do
7290a88ea202 Uploaded
davidvanzessen
parents: 52
diff changeset
218 tmp=`cat $outdir/${gene}_${func}_n.txt`
7290a88ea202 Uploaded
davidvanzessen
parents: 52
diff changeset
219 echo "<th><a href='matched_${gene}_${func}.txt'>${gene} (N = $tmp)</a></th>" >> $output
7290a88ea202 Uploaded
davidvanzessen
parents: 52
diff changeset
220 done
78
b523ce95d857 Uploaded
davidvanzessen
parents: 77
diff changeset
221
b523ce95d857 Uploaded
davidvanzessen
parents: 77
diff changeset
222 tmp=`cat $outdir/unmatched_${func}_n.txt`
79
0513b46178c4 Uploaded
davidvanzessen
parents: 78
diff changeset
223 echo "<th><a href='unmatched.txt'>unmatched (N = ${unmatched_count})</a></th>" >> $output
53
7290a88ea202 Uploaded
davidvanzessen
parents: 52
diff changeset
224 tmp=`cat $outdir/all_${func}_n.txt`
89
480fdd383fdb Uploaded
davidvanzessen
parents: 85
diff changeset
225 echo "<th><a href='matched_all_${func}.txt'>all (N = $tmp)</a></th>" >> $output
4
069419cccba4 Uploaded
davidvanzessen
parents: 3
diff changeset
226
78
b523ce95d857 Uploaded
davidvanzessen
parents: 77
diff changeset
227 while IFS=, read name cax cay caz ca1x ca1y ca1z ca2x ca2y ca2z cgx cgy cgz cg1x cg1y cg1z cg2x cg2y cg2z cg3x cg3y cg3z cg4x cg4y cg4z cmx cmy cmz unx uny unz allx ally allz
53
7290a88ea202 Uploaded
davidvanzessen
parents: 52
diff changeset
228 do
7290a88ea202 Uploaded
davidvanzessen
parents: 52
diff changeset
229 if [ "$name" == "FR S/R (ratio)" ] || [ "$name" == "CDR S/R (ratio)" ] ; then #meh
7290a88ea202 Uploaded
davidvanzessen
parents: 52
diff changeset
230 echo "<tr><td>$name</td><td>${cax}/${cay} (${caz})</td><td>${ca1x}/${ca1y} (${ca1z})</td><td>${ca2x}/${ca2y} (${ca2z})</td><td>${cgx}/${cgy} (${cgz})</td><td>${cg1x}/${cg1y} (${cg1z})</td><td>${cg2x}/${cg2y} (${cg2z})</td><td>${cg3x}/${cg3y} (${cg3z})</td><td>${cg4x}/${cg4y} (${cg4z})</td><td>${cmx}/${cmy} (${cmz})</td><td>${unx}/${uny} (${unz})</td><td>${allx}/${ally} (${allz})</td></tr>" >> $output #ratio rows carry no % suffix but must emit the same 12 cells as the header (info, 9 genes, unmatched, all)
7290a88ea202 Uploaded
davidvanzessen
parents: 52
diff changeset
231 else
78
b523ce95d857 Uploaded
davidvanzessen
parents: 77
diff changeset
232 echo "<tr><td>$name</td><td>${cax}/${cay} (${caz}%)</td><td>${ca1x}/${ca1y} (${ca1z}%)</td><td>${ca2x}/${ca2y} (${ca2z}%)</td><td>${cgx}/${cgy} (${cgz}%)</td><td>${cg1x}/${cg1y} (${cg1z}%)</td><td>${cg2x}/${cg2y} (${cg2z}%)</td><td>${cg3x}/${cg3y} (${cg3z}%)</td><td>${cg4x}/${cg4y} (${cg4z}%)</td><td>${cmx}/${cmy} (${cmz}%)</td><td>${unx}/${uny} (${unz}%)</td><td>${allx}/${ally} (${allz}%)</td></tr>" >> $output
53
7290a88ea202 Uploaded
davidvanzessen
parents: 52
diff changeset
233 fi
94
e39176ccddc8 Uploaded
davidvanzessen
parents: 92
diff changeset
234 done < $outdir/data_${func}.txt
e39176ccddc8 Uploaded
davidvanzessen
parents: 92
diff changeset
235 echo "</table>" >> $output
e39176ccddc8 Uploaded
davidvanzessen
parents: 92
diff changeset
236 #echo "<a href='data_${func}.txt'>Download data</a>" >> $output
53
7290a88ea202 Uploaded
davidvanzessen
parents: 52
diff changeset
237 done
7290a88ea202 Uploaded
davidvanzessen
parents: 52
diff changeset
238
110
ade5cf6fd2dc Uploaded
davidvanzessen
parents: 108
diff changeset
239 echo "</div>" >> $output #SHM overview tab end
ade5cf6fd2dc Uploaded
davidvanzessen
parents: 108
diff changeset
240
ade5cf6fd2dc Uploaded
davidvanzessen
parents: 108
diff changeset
241 echo "---------------- images ----------------"
ade5cf6fd2dc Uploaded
davidvanzessen
parents: 108
diff changeset
242 echo "---------------- images ----------------<br />" >> $log
ade5cf6fd2dc Uploaded
davidvanzessen
parents: 108
diff changeset
243
ade5cf6fd2dc Uploaded
davidvanzessen
parents: 108
diff changeset
244 echo "<div class='tabbertab' title='SHM Frequency'>" >> $output
ade5cf6fd2dc Uploaded
davidvanzessen
parents: 108
diff changeset
245
ade5cf6fd2dc Uploaded
davidvanzessen
parents: 108
diff changeset
246 if [ -a $outdir/scatter.png ]
ade5cf6fd2dc Uploaded
davidvanzessen
parents: 108
diff changeset
247 then
ade5cf6fd2dc Uploaded
davidvanzessen
parents: 108
diff changeset
248 echo "<img src='scatter.png'/><br />" >> $output
ade5cf6fd2dc Uploaded
davidvanzessen
parents: 108
diff changeset
249 echo "<a href='scatter.txt'>download data</a><br />" >> $output
ade5cf6fd2dc Uploaded
davidvanzessen
parents: 108
diff changeset
250 fi
ade5cf6fd2dc Uploaded
davidvanzessen
parents: 108
diff changeset
251 if [ -a $outdir/frequency_ranges.png ]
ade5cf6fd2dc Uploaded
davidvanzessen
parents: 108
diff changeset
252 then
ade5cf6fd2dc Uploaded
davidvanzessen
parents: 108
diff changeset
253 echo "<img src='frequency_ranges.png'/><br />" >> $output
ade5cf6fd2dc Uploaded
davidvanzessen
parents: 108
diff changeset
254 echo "<a href='frequency_ranges_classes.txt'>download class data</a><br />" >> $output
ade5cf6fd2dc Uploaded
davidvanzessen
parents: 108
diff changeset
255 echo "<a href='frequency_ranges_subclasses.txt'>download subclass data</a><br />" >> $output
ade5cf6fd2dc Uploaded
davidvanzessen
parents: 108
diff changeset
256 fi
ade5cf6fd2dc Uploaded
davidvanzessen
parents: 108
diff changeset
257
ade5cf6fd2dc Uploaded
davidvanzessen
parents: 108
diff changeset
258 echo "</div>" >> $output #SHM frequency tab end
ade5cf6fd2dc Uploaded
davidvanzessen
parents: 108
diff changeset
259
ade5cf6fd2dc Uploaded
davidvanzessen
parents: 108
diff changeset
260 echo "<div class='tabbertab' title='Transition tables'>" >> $output
ade5cf6fd2dc Uploaded
davidvanzessen
parents: 108
diff changeset
261
ade5cf6fd2dc Uploaded
davidvanzessen
parents: 108
diff changeset
262 for gene in ${genes[@]}
ade5cf6fd2dc Uploaded
davidvanzessen
parents: 108
diff changeset
263 do
ade5cf6fd2dc Uploaded
davidvanzessen
parents: 108
diff changeset
264 echo "<table border='1'><caption>$gene transition table</caption>" >> $output
ade5cf6fd2dc Uploaded
davidvanzessen
parents: 108
diff changeset
265 while IFS=, read from a c g t
ade5cf6fd2dc Uploaded
davidvanzessen
parents: 108
diff changeset
266 do
ade5cf6fd2dc Uploaded
davidvanzessen
parents: 108
diff changeset
267 echo "<tr><td>$from</td><td>$a</td><td>$c</td><td>$g</td><td>$t</td></tr>" >> $output
ade5cf6fd2dc Uploaded
davidvanzessen
parents: 108
diff changeset
268 done < $outdir/transitions_${gene}_sum.txt
ade5cf6fd2dc Uploaded
davidvanzessen
parents: 108
diff changeset
269 echo "</table>" >> $output
ade5cf6fd2dc Uploaded
davidvanzessen
parents: 108
diff changeset
270 done
55
0d5add1a9800 Uploaded
davidvanzessen
parents: 54
diff changeset
271
110
ade5cf6fd2dc Uploaded
davidvanzessen
parents: 108
diff changeset
272 echo "<table border='1'><caption>All transition table</caption>" >> $output
ade5cf6fd2dc Uploaded
davidvanzessen
parents: 108
diff changeset
273 while IFS=, read from a c g t
ade5cf6fd2dc Uploaded
davidvanzessen
parents: 108
diff changeset
274 do
ade5cf6fd2dc Uploaded
davidvanzessen
parents: 108
diff changeset
275 echo "<tr><td>$from</td><td>$a</td><td>$c</td><td>$g</td><td>$t</td></tr>" >> $output
ade5cf6fd2dc Uploaded
davidvanzessen
parents: 108
diff changeset
276 done < $outdir/transitions_all_sum.txt
ade5cf6fd2dc Uploaded
davidvanzessen
parents: 108
diff changeset
277 echo "</table>" >> $output
ade5cf6fd2dc Uploaded
davidvanzessen
parents: 108
diff changeset
278
ade5cf6fd2dc Uploaded
davidvanzessen
parents: 108
diff changeset
279 echo "</div>" >> $output #transition tables tab end
ade5cf6fd2dc Uploaded
davidvanzessen
parents: 108
diff changeset
280
ade5cf6fd2dc Uploaded
davidvanzessen
parents: 108
diff changeset
# "Antigen Selection" tab of the report page: the amino-acid histograms
# (when present) followed by the embedded per-class baseline PDFs.
{
  echo "<div class='tabbertab' title='Antigen Selection'>"

  # The presence of the overall histogram gates the whole set, including the
  # ca/cg/cm variants. -e is used instead of the unary -a, which is easily
  # confused with the binary AND operator of test.
  if [[ -e "$outdir/aa_histogram.png" ]]; then
    for hist_suffix in "" _ca _cg _cm; do
      echo "<img src='aa_histogram${hist_suffix}.png'/><br />"
      echo "<a href='aa_histogram${hist_suffix}.txt'>download data</a><br />"
    done
  fi

  # The baseline PDFs are referenced unconditionally.
  for baseline_class in ca cg cm; do
    echo "<embed src='baseline_${baseline_class}.pdf' width='700px' height='1000px'>"
  done

  echo "</div>" #antigen selection tab end
} >> "$output"
ade5cf6fd2dc Uploaded
davidvanzessen
parents: 108
diff changeset
300
ade5cf6fd2dc Uploaded
davidvanzessen
parents: 108
diff changeset
# "CSR" tab of the report page: for each of ca and cg, show the plot and a
# link to its data file, but only when the plot image exists in $outdir.
{
  echo "<div class='tabbertab' title='CSR'>"

  for csr_class in ca cg; do
    # -e instead of the unary -a (ambiguous with test's binary AND).
    if [[ -e "$outdir/${csr_class}.png" ]]; then
      echo "<img src='${csr_class}.png'/><br />"
      echo "<a href='${csr_class}.txt'>download data</a><br />"
    fi
  done

  echo "</div>" #CSR tab end
} >> "$output"
ade5cf6fd2dc Uploaded
davidvanzessen
parents: 108
diff changeset
315
ade5cf6fd2dc Uploaded
davidvanzessen
parents: 108
diff changeset
# "Downloads" tab with links to the generated result files, followed by the
# closing tags of the report page. The three closing lines are, in order:
# end of the downloads tab, end of the tabs container, end of the document.
# The here-doc delimiter is quoted, so the text is appended to $output
# literally (no expansion).
cat >> "$output" <<'EOF'
<div class='tabbertab' title='Downloads'>
<a href='unmatched.txt'>unmatched</a><br />
<a href='motif_per_seq.txt'>motif per sequence</a><br />
<a href='merged.txt'>all data</a><br />
<a href='mutation_by_id.txt'>mutations by id</a><br />
<a href='aa_id_mutations.txt'>AA mutations location by id</a><br />
<a href='absent_aa_id.txt'>Absent AA locations by id</a><br />
<a href='sequence_overview/index.html'>Sequence Overview</a><br />
<a href='base_overview.html'>Base overview</a><br />
<a href='baseline.pdf'>Baseline PDF</a><br />
<a href='baseline.txt'>Baseline Table</a><br />
<a href='baseline_ca.pdf'>Baseline ca PDF</a><br />
<a href='baseline_ca.txt'>Baseline ca Table</a><br />
<a href='baseline_cg.pdf'>Baseline cg PDF</a><br />
<a href='baseline_cg.txt'>Baseline cg Table</a><br />
<a href='baseline_cm.pdf'>Baseline cm PDF</a><br />
<a href='baseline_cm.txt'>Baseline cm Table</a><br />
<a href='IgAT.zip'>IgAT zip</a><br />
<a href='IgAT_ca.zip'>IgAT ca zip</a><br />
<a href='IgAT_cg.zip'>IgAT cg zip</a><br />
<a href='IgAT_cm.zip'>IgAT cm zip</a><br />
<a href='new_IMGT.txz'>Filtered IMGT zip</a><br />
<a href='new_IMGT_ca.txz'>Filtered ca IMGT zip</a><br />
<a href='new_IMGT_cg.txz'>Filtered cg IMGT zip</a><br />
<a href='new_IMGT_cm.txz'>Filtered cm IMGT zip</a><br />
</div>
</div>
</html>
EOF
2
2f4298673519 Uploaded
davidvanzessen
parents: 1
diff changeset
348
95
a66eb1c5374c Uploaded
davidvanzessen
parents: 94
diff changeset
# Run the bundled baseline wrapper once for the combined data set (ca_cg_cm)
# and once per class (ca, cg, cm).
#
# For each data set:
#   - a working directory $outdir/baseline/<name> is created;
#   - if the matching 1_Summary.txt has more than one line, the baseline
#     wrapper is started from inside that working directory and is given
#     $outdir/baseline<suffix>.pdf and .txt as output locations;
#   - otherwise a placeholder message is written to the .txt file.
# The combined data set uses no file suffix; the per-class sets use _<class>.
echo "---------------- baseline ----------------"
echo "---------------- baseline ----------------<br />" >> "$log"

baseline_tool_dir="$dir/tmp/baseline"

for baseline_set in ca_cg_cm ca cg cm; do
  if [[ "$baseline_set" == "ca_cg_cm" ]]; then
    set_suffix=""
    no_seq_msg="No sequences"
  else
    set_suffix="_${baseline_set}"
    no_seq_msg="No ${baseline_set} sequences"
  fi

  mkdir -p "$outdir/baseline/$baseline_set"

  if [[ $(wc -l < "$outdir/new_IMGT${set_suffix}/1_Summary.txt") -gt 1 ]]; then
    # The subshell confines the directory change to this one run, so the
    # caller's working directory never changes and the following iterations
    # are unaffected. If the cd fails the wrapper is not started at all
    # instead of running in the wrong directory.
    (
      cd "$outdir/baseline/$baseline_set" || exit 1
      bash "$baseline_tool_dir/wrapper.sh" 1 1 1 1 0 0 "25:26:38:55:65:104:-" \
        "$outdir/new_IMGT${set_suffix}.txz" "$baseline_set" \
        "$baseline_tool_dir/IMGT-reference-seqs-IGHV-2015-11-05.fa" \
        "$outdir/baseline${set_suffix}.pdf" "Sequence.ID" \
        "$outdir/baseline${set_suffix}.txt"
    )
  else
    echo "$no_seq_msg" > "$outdir/baseline${set_suffix}.txt"
  fi
done
3cffb8a38bb1 Uploaded
davidvanzessen
parents: 100
diff changeset
389
82
564c4f6da203 Uploaded
davidvanzessen
parents: 81
diff changeset
# Load the summary/aa/junction files from the current working directory with
# imgt_loader.r, then pass the loader output and merged.txt to
# naive_output.r together with the three per-class output paths and the
# ntoverview/ntsum files. Progress markers go to stdout and to $log.
echo "---------------- naive_output.r ----------------"
echo "---------------- naive_output.r ----------------<br />" >> "$log"

# NOTE(review): only naive_output_ca/_cg/_cm are assigned from the positional
# parameters at the top of the script; if naive_output is not set anywhere
# else, this comparison is always true and the branch always runs - confirm.
if [[ "$naive_output" != "None" ]]; then
  echo "---------------- imgt_loader.r ----------------"
  echo "---------------- imgt_loader.r ----------------<br />" >> "$log"
  #python $dir/imgt_loader.py --summ $PWD/summary.txt --aa $PWD/aa.txt --junction $PWD/junction.txt --output $naive_output
  Rscript --verbose "$dir/imgt_loader.r" "$PWD/summary.txt" "$PWD/aa.txt" "$PWD/junction.txt" "$outdir/loader_output.txt" 2>&1

  echo "---------------- naive_output.r ----------------"
  echo "---------------- naive_output.r ----------------<br />" >> "$log"
  # Quoting keeps every argument in its position even when one of the
  # naive_output_* values is empty or contains whitespace.
  Rscript "$dir/naive_output.r" "$outdir/loader_output.txt" "$outdir/merged.txt" \
    "${naive_output_ca}" "${naive_output_cg}" "${naive_output_cm}" \
    "$outdir/ntoverview.txt" "$outdir/ntsum.txt" 2>&1
fi
099cc1254f74 Uploaded
davidvanzessen
parents: 43
diff changeset
404
81
a778156dad3d Uploaded
davidvanzessen
parents: 80
diff changeset
# Final step: close the base overview table, keep the accumulated run log as
# $outdir/log.html, and rewrite $log as the landing page: a link to
# index.html plus a table built from filtering_steps.txt.
echo "</table>" >> "$outdir/base_overview.html"

mv "$log" "$outdir/log.html"

{
  echo "<html><center><h1><a href='index.html'>Click here for the results</a></h1>Tip: Open it in a new tab (middle mouse button or right mouse button -> 'open in new tab' on the link above)<br />"
  echo "<table border = 1>"
  echo "<thead><tr><th>Info</th><th>Sequences</th><th>Percentage</th></tr></thead>"
  # filtering_steps.txt is read as three tab-separated fields per line. IFS
  # is set for the read command only, so the shell-wide IFS is never changed
  # and needs no save/restore.
  while IFS=$'\t' read -r step seq perc; do
    echo "<tr>"
    echo "<td>$step</td>"
    echo "<td>$seq</td>"
    echo "<td>${perc}%</td>"
    echo "</tr>"
  done < "$outdir/filtering_steps.txt"
  echo "</table></center></html>"
} > "$log"

echo "---------------- Done! ----------------"
echo "---------------- Done! ----------------<br />" >> "$outdir/log.html"
47
099cc1254f74 Uploaded
davidvanzessen
parents: 43
diff changeset
429
110
ade5cf6fd2dc Uploaded
davidvanzessen
parents: 108
diff changeset
430
ade5cf6fd2dc Uploaded
davidvanzessen
parents: 108
diff changeset
431
ade5cf6fd2dc Uploaded
davidvanzessen
parents: 108
diff changeset
432
ade5cf6fd2dc Uploaded
davidvanzessen
parents: 108
diff changeset
433
ade5cf6fd2dc Uploaded
davidvanzessen
parents: 108
diff changeset
434
ade5cf6fd2dc Uploaded
davidvanzessen
parents: 108
diff changeset
435
ade5cf6fd2dc Uploaded
davidvanzessen
parents: 108
diff changeset
436
ade5cf6fd2dc Uploaded
davidvanzessen
parents: 108
diff changeset
437
ade5cf6fd2dc Uploaded
davidvanzessen
parents: 108
diff changeset
438
ade5cf6fd2dc Uploaded
davidvanzessen
parents: 108
diff changeset
439
ade5cf6fd2dc Uploaded
davidvanzessen
parents: 108
diff changeset
440
ade5cf6fd2dc Uploaded
davidvanzessen
parents: 108
diff changeset
441
ade5cf6fd2dc Uploaded
davidvanzessen
parents: 108
diff changeset
442
ade5cf6fd2dc Uploaded
davidvanzessen
parents: 108
diff changeset
443
ade5cf6fd2dc Uploaded
davidvanzessen
parents: 108
diff changeset
444
ade5cf6fd2dc Uploaded
davidvanzessen
parents: 108
diff changeset
445
ade5cf6fd2dc Uploaded
davidvanzessen
parents: 108
diff changeset
446
ade5cf6fd2dc Uploaded
davidvanzessen
parents: 108
diff changeset
447
ade5cf6fd2dc Uploaded
davidvanzessen
parents: 108
diff changeset
448
ade5cf6fd2dc Uploaded
davidvanzessen
parents: 108
diff changeset
449