annotate wrapper.sh @ 95:a66eb1c5374c draft

Uploaded
author davidvanzessen
date Wed, 08 Jun 2016 03:54:49 -0400
parents e39176ccddc8
children 5ffbf40cdd4b
Ignore whitespace changes - Everywhere: Within whitespace: At end of lines:
rev   line source
0
74d2bc479bee Uploaded
davidvanzessen
parents:
diff changeset
1 #!/bin/bash
4
069419cccba4 Uploaded
davidvanzessen
parents: 3
diff changeset
2 set -e
0
74d2bc479bee Uploaded
davidvanzessen
parents:
diff changeset
3 dir="$(cd "$(dirname "$0")" && pwd)"
74d2bc479bee Uploaded
davidvanzessen
parents:
diff changeset
4 input=$1
19
c518cf0d4adb Uploaded
davidvanzessen
parents: 16
diff changeset
5 method=$2
c518cf0d4adb Uploaded
davidvanzessen
parents: 16
diff changeset
6 output=$3
c518cf0d4adb Uploaded
davidvanzessen
parents: 16
diff changeset
7 outdir=$4
c518cf0d4adb Uploaded
davidvanzessen
parents: 16
diff changeset
8 title=$5
22
d84c9791d8c4 Uploaded
davidvanzessen
parents: 21
diff changeset
9 include_fr1=$6
34
d436daae9d68 Uploaded
davidvanzessen
parents: 32
diff changeset
10 functionality=$7
d436daae9d68 Uploaded
davidvanzessen
parents: 32
diff changeset
11 unique=$8
69
7acdcd5c52ef Uploaded
davidvanzessen
parents: 66
diff changeset
12 naive_output_ca=$9
7acdcd5c52ef Uploaded
davidvanzessen
parents: 66
diff changeset
13 naive_output_cg=${10}
7acdcd5c52ef Uploaded
davidvanzessen
parents: 66
diff changeset
14 naive_output_cm=${11}
7acdcd5c52ef Uploaded
davidvanzessen
parents: 66
diff changeset
15 filter_unique=${12}
7acdcd5c52ef Uploaded
davidvanzessen
parents: 66
diff changeset
16 class_filter=${13}
0
74d2bc479bee Uploaded
davidvanzessen
parents:
diff changeset
17 mkdir $outdir
74d2bc479bee Uploaded
davidvanzessen
parents:
diff changeset
18
55
0d5add1a9800 Uploaded
davidvanzessen
parents: 54
diff changeset
19 echo "---------------- read parameters ----------------"
63
a7381fd96dad Uploaded
davidvanzessen
parents: 62
diff changeset
20 echo "---------------- read parameters ----------------<br />" > $output
55
0d5add1a9800 Uploaded
davidvanzessen
parents: 54
diff changeset
21
0d5add1a9800 Uploaded
davidvanzessen
parents: 54
diff changeset
22 echo "unpacking IMGT file"
0d5add1a9800 Uploaded
davidvanzessen
parents: 54
diff changeset
23
89
480fdd383fdb Uploaded
davidvanzessen
parents: 85
diff changeset
24
480fdd383fdb Uploaded
davidvanzessen
parents: 85
diff changeset
25
35
8dba36531e6e Uploaded
davidvanzessen
parents: 34
diff changeset
26 type="`file $input`"
8dba36531e6e Uploaded
davidvanzessen
parents: 34
diff changeset
27 if [[ "$type" == *"Zip archive"* ]] ; then
8dba36531e6e Uploaded
davidvanzessen
parents: 34
diff changeset
28 echo "Zip archive"
8dba36531e6e Uploaded
davidvanzessen
parents: 34
diff changeset
29 echo "unzip $input -d $PWD/files/"
8dba36531e6e Uploaded
davidvanzessen
parents: 34
diff changeset
30 unzip $input -d $PWD/files/
8dba36531e6e Uploaded
davidvanzessen
parents: 34
diff changeset
31 elif [[ "$type" == *"XZ compressed data"* ]] ; then
8dba36531e6e Uploaded
davidvanzessen
parents: 34
diff changeset
32 echo "ZX archive"
8dba36531e6e Uploaded
davidvanzessen
parents: 34
diff changeset
33 echo "tar -xJf $input -C $PWD/files/"
8dba36531e6e Uploaded
davidvanzessen
parents: 34
diff changeset
34 mkdir -p $PWD/files/$title
8dba36531e6e Uploaded
davidvanzessen
parents: 34
diff changeset
35 tar -xJf $input -C $PWD/files/$title
8dba36531e6e Uploaded
davidvanzessen
parents: 34
diff changeset
36 fi
8dba36531e6e Uploaded
davidvanzessen
parents: 34
diff changeset
37
64
0fdd90f7c654 Uploaded
davidvanzessen
parents: 63
diff changeset
38 cat `find $PWD/files/ -name "1_*"` > $PWD/summary.txt
0fdd90f7c654 Uploaded
davidvanzessen
parents: 63
diff changeset
39 cat `find $PWD/files/ -name "3_*"` > $PWD/sequences.txt
0fdd90f7c654 Uploaded
davidvanzessen
parents: 63
diff changeset
40 cat `find $PWD/files/ -name "5_*"` > $PWD/aa.txt
0fdd90f7c654 Uploaded
davidvanzessen
parents: 63
diff changeset
41 cat `find $PWD/files/ -name "6_*"` > $PWD/junction.txt
0fdd90f7c654 Uploaded
davidvanzessen
parents: 63
diff changeset
42 cat `find $PWD/files/ -name "7_*"` > $PWD/mutationanalysis.txt
0fdd90f7c654 Uploaded
davidvanzessen
parents: 63
diff changeset
43 cat `find $PWD/files/ -name "8_*"` > $PWD/mutationstats.txt
0fdd90f7c654 Uploaded
davidvanzessen
parents: 63
diff changeset
44 cat `find $PWD/files/ -name "10_*"` > $PWD/hotspots.txt
0fdd90f7c654 Uploaded
davidvanzessen
parents: 63
diff changeset
45
0fdd90f7c654 Uploaded
davidvanzessen
parents: 63
diff changeset
46 #cat $PWD/files/*/1_* > $PWD/summary.txt
0fdd90f7c654 Uploaded
davidvanzessen
parents: 63
diff changeset
47 #cat $PWD/files/*/3_* > $PWD/sequences.txt
0fdd90f7c654 Uploaded
davidvanzessen
parents: 63
diff changeset
48 #cat $PWD/files/*/5_* > $PWD/aa.txt
0fdd90f7c654 Uploaded
davidvanzessen
parents: 63
diff changeset
49 #cat $PWD/files/*/6_* > $PWD/junction.txt
0fdd90f7c654 Uploaded
davidvanzessen
parents: 63
diff changeset
50 #cat $PWD/files/*/7_* > $PWD/mutationanalysis.txt
0fdd90f7c654 Uploaded
davidvanzessen
parents: 63
diff changeset
51 #cat $PWD/files/*/8_* > $PWD/mutationstats.txt
0fdd90f7c654 Uploaded
davidvanzessen
parents: 63
diff changeset
52 #cat $PWD/files/*/10_* > $PWD/hotspots.txt
3
a0b27058dcac Uploaded
davidvanzessen
parents: 2
diff changeset
53
26
2433a1e110e1 Uploaded
davidvanzessen
parents: 25
diff changeset
54 #BLASTN_DIR="/home/galaxy/tmp/blast/ncbi-blast-2.2.30+/bin"
19
c518cf0d4adb Uploaded
davidvanzessen
parents: 16
diff changeset
55
c518cf0d4adb Uploaded
davidvanzessen
parents: 16
diff changeset
56 echo "${BLASTN_DIR}"
c518cf0d4adb Uploaded
davidvanzessen
parents: 16
diff changeset
57
89
480fdd383fdb Uploaded
davidvanzessen
parents: 85
diff changeset
58 echo "---------------- identification ($method) ----------------"
480fdd383fdb Uploaded
davidvanzessen
parents: 85
diff changeset
59 echo "---------------- identification ($method) ----------------<br />" >> $output
55
0d5add1a9800 Uploaded
davidvanzessen
parents: 54
diff changeset
60
19
c518cf0d4adb Uploaded
davidvanzessen
parents: 16
diff changeset
61 if [[ "${method}" == "custom" ]] ; then
c518cf0d4adb Uploaded
davidvanzessen
parents: 16
diff changeset
62 python $dir/gene_identification.py --input $PWD/summary.txt --output $outdir/identified_genes.txt
c518cf0d4adb Uploaded
davidvanzessen
parents: 16
diff changeset
63 else
c518cf0d4adb Uploaded
davidvanzessen
parents: 16
diff changeset
64 ID_index=$(cat $PWD/summary.txt | grep -o -P ".+Sequence ID" | grep -o -P "\t" | wc -l)
c518cf0d4adb Uploaded
davidvanzessen
parents: 16
diff changeset
65 ID_index=$((ID_index+1))
c518cf0d4adb Uploaded
davidvanzessen
parents: 16
diff changeset
66 sequence_index=$(cat $PWD/summary.txt | grep -o -P ".+\tSequence" | grep -o -P "\t" | wc -l)
c518cf0d4adb Uploaded
davidvanzessen
parents: 16
diff changeset
67 sequence_index=$((sequence_index+1))
c518cf0d4adb Uploaded
davidvanzessen
parents: 16
diff changeset
68
c518cf0d4adb Uploaded
davidvanzessen
parents: 16
diff changeset
69 cat $PWD/summary.txt | tail -n+2 | cut -f ${ID_index},${sequence_index} | awk '{print ">" $1 "\n" $2}' > $PWD/sequences.fasta
c518cf0d4adb Uploaded
davidvanzessen
parents: 16
diff changeset
70
c518cf0d4adb Uploaded
davidvanzessen
parents: 16
diff changeset
71 echo -e "qseqid\tsseqid\tpident\tlength\tmismatch\tgapopen\tqstart\tqend\tsstart\tsend\tevalue\tbitscore" > $outdir/identified_genes.txt
c518cf0d4adb Uploaded
davidvanzessen
parents: 16
diff changeset
72 ${BLASTN_DIR}/blastn -task blastn -db $dir/subclass_definition.db -query $PWD/sequences.fasta -outfmt 6 >> $outdir/identified_genes.txt
c518cf0d4adb Uploaded
davidvanzessen
parents: 16
diff changeset
73 fi
c518cf0d4adb Uploaded
davidvanzessen
parents: 16
diff changeset
74
55
0d5add1a9800 Uploaded
davidvanzessen
parents: 54
diff changeset
75 echo "---------------- merge_and_filter.r ----------------"
63
a7381fd96dad Uploaded
davidvanzessen
parents: 62
diff changeset
76 echo "---------------- merge_and_filter.r ----------------<br />" >> $output
19
c518cf0d4adb Uploaded
davidvanzessen
parents: 16
diff changeset
77
90
f0e8dac22c6e Uploaded
davidvanzessen
parents: 89
diff changeset
78 Rscript $dir/merge_and_filter.r $PWD/summary.txt $PWD/sequences.txt $PWD/mutationanalysis.txt $PWD/mutationstats.txt $PWD/hotspots.txt $outdir/identified_genes.txt $outdir/merged.txt $outdir/before_unique_filter.txt $outdir/unmatched.txt $method $functionality $unique ${filter_unique} ${class_filter} 2>&1
0
74d2bc479bee Uploaded
davidvanzessen
parents:
diff changeset
79
95
a66eb1c5374c Uploaded
davidvanzessen
parents: 94
diff changeset
80 echo "---------------- creating new IMGT zip ----------------<br />"
a66eb1c5374c Uploaded
davidvanzessen
parents: 94
diff changeset
81 echo "---------------- creating new IMGT zip ----------------<br />" >> $output
a66eb1c5374c Uploaded
davidvanzessen
parents: 94
diff changeset
82
a66eb1c5374c Uploaded
davidvanzessen
parents: 94
diff changeset
83 mkdir $outdir/new_IMGT
a66eb1c5374c Uploaded
davidvanzessen
parents: 94
diff changeset
84
a66eb1c5374c Uploaded
davidvanzessen
parents: 94
diff changeset
85 cat `find $PWD/files/ -name "1_*"` > "$outdir/new_IMGT/1_Summary.txt"
a66eb1c5374c Uploaded
davidvanzessen
parents: 94
diff changeset
86 cat `find $PWD/files/ -name "2_*"` > "$outdir/new_IMGT/2_IMGT-gapped-nt-sequences.txt"
a66eb1c5374c Uploaded
davidvanzessen
parents: 94
diff changeset
87 cat `find $PWD/files/ -name "3_*"` > "$outdir/new_IMGT/3_Nt-sequences.txt"
a66eb1c5374c Uploaded
davidvanzessen
parents: 94
diff changeset
88 cat `find $PWD/files/ -name "4_*"` > "$outdir/new_IMGT/4_IMGT-gapped-AA-sequences.txt"
a66eb1c5374c Uploaded
davidvanzessen
parents: 94
diff changeset
89 cat `find $PWD/files/ -name "5_*"` > "$outdir/new_IMGT/5_AA-sequences.txt"
a66eb1c5374c Uploaded
davidvanzessen
parents: 94
diff changeset
90 cat `find $PWD/files/ -name "6_*"` > "$outdir/new_IMGT/6_Junction.txt"
a66eb1c5374c Uploaded
davidvanzessen
parents: 94
diff changeset
91 cat `find $PWD/files/ -name "7_*"` > "$outdir/new_IMGT/7_V-REGION-mutation-and-AA-change-table.txt"
a66eb1c5374c Uploaded
davidvanzessen
parents: 94
diff changeset
92 cat `find $PWD/files/ -name "8_*"` > "$outdir/new_IMGT/8_V-REGION-nt-mutation-statistics.txt"
a66eb1c5374c Uploaded
davidvanzessen
parents: 94
diff changeset
93 cat `find $PWD/files/ -name "9_*"` > "$outdir/new_IMGT/9_V-REGION-AA-change-statistics.txt"
a66eb1c5374c Uploaded
davidvanzessen
parents: 94
diff changeset
94 cat `find $PWD/files/ -name "10_*"` > "$outdir/new_IMGT/10_V-REGION-mutation-hotspots.txt"
a66eb1c5374c Uploaded
davidvanzessen
parents: 94
diff changeset
95
a66eb1c5374c Uploaded
davidvanzessen
parents: 94
diff changeset
96 Rscript $dir/tmp/igat.r $outdir/new_IMGT/ $outdir/merged.txt 2>&1
a66eb1c5374c Uploaded
davidvanzessen
parents: 94
diff changeset
97
a66eb1c5374c Uploaded
davidvanzessen
parents: 94
diff changeset
98
a66eb1c5374c Uploaded
davidvanzessen
parents: 94
diff changeset
99 tmp="$PWD"
a66eb1c5374c Uploaded
davidvanzessen
parents: 94
diff changeset
100 cd $outdir/new_IMGT/ #tar weirdness...
a66eb1c5374c Uploaded
davidvanzessen
parents: 94
diff changeset
101 tar -cJf ../new_IMGT.txz *
a66eb1c5374c Uploaded
davidvanzessen
parents: 94
diff changeset
102
a66eb1c5374c Uploaded
davidvanzessen
parents: 94
diff changeset
103 cp $dir/tmp/IgAT.xlsm $outdir/new_IMGT/IgAT.xlsm
a66eb1c5374c Uploaded
davidvanzessen
parents: 94
diff changeset
104
a66eb1c5374c Uploaded
davidvanzessen
parents: 94
diff changeset
105 #tar -cJf ../IgAT.txz *
a66eb1c5374c Uploaded
davidvanzessen
parents: 94
diff changeset
106 zip -r ../IgAT.zip *
a66eb1c5374c Uploaded
davidvanzessen
parents: 94
diff changeset
107
a66eb1c5374c Uploaded
davidvanzessen
parents: 94
diff changeset
108 cd $tmp
a66eb1c5374c Uploaded
davidvanzessen
parents: 94
diff changeset
109
a66eb1c5374c Uploaded
davidvanzessen
parents: 94
diff changeset
110
55
0d5add1a9800 Uploaded
davidvanzessen
parents: 54
diff changeset
111 echo "---------------- mutation_analysis.r ----------------"
63
a7381fd96dad Uploaded
davidvanzessen
parents: 62
diff changeset
112 echo "---------------- mutation_analysis.r ----------------<br />" >> $output
55
0d5add1a9800 Uploaded
davidvanzessen
parents: 54
diff changeset
113
82
564c4f6da203 Uploaded
davidvanzessen
parents: 81
diff changeset
114 classes="ca,ca1,ca2,cg,cg1,cg2,cg3,cg4,cm,unmatched"
4
069419cccba4 Uploaded
davidvanzessen
parents: 3
diff changeset
115 echo "R mutation analysis"
82
564c4f6da203 Uploaded
davidvanzessen
parents: 81
diff changeset
116 Rscript $dir/mutation_analysis.r $outdir/merged.txt $classes $outdir ${include_fr1} 2>&1
53
7290a88ea202 Uploaded
davidvanzessen
parents: 52
diff changeset
117
55
0d5add1a9800 Uploaded
davidvanzessen
parents: 54
diff changeset
118
0d5add1a9800 Uploaded
davidvanzessen
parents: 54
diff changeset
119 echo "---------------- mutation_analysis.py ----------------"
63
a7381fd96dad Uploaded
davidvanzessen
parents: 62
diff changeset
120 echo "---------------- mutation_analysis.py ----------------<br />" >> $output
55
0d5add1a9800 Uploaded
davidvanzessen
parents: 54
diff changeset
121
82
564c4f6da203 Uploaded
davidvanzessen
parents: 81
diff changeset
122 python $dir/mutation_analysis.py --input $outdir/merged.txt --genes $classes --includefr1 "${include_fr1}" --output $outdir/hotspot_analysis.txt
55
0d5add1a9800 Uploaded
davidvanzessen
parents: 54
diff changeset
123
0d5add1a9800 Uploaded
davidvanzessen
parents: 54
diff changeset
124 echo "---------------- aa_histogram.r ----------------"
63
a7381fd96dad Uploaded
davidvanzessen
parents: 62
diff changeset
125 echo "---------------- aa_histogram.r ----------------<br />" >> $output
55
0d5add1a9800 Uploaded
davidvanzessen
parents: 54
diff changeset
126
26
2433a1e110e1 Uploaded
davidvanzessen
parents: 25
diff changeset
127 Rscript $dir/aa_histogram.r $outdir/aa_mutations.txt $outdir/aa_histogram.png 2>&1
4
069419cccba4 Uploaded
davidvanzessen
parents: 3
diff changeset
128
0
74d2bc479bee Uploaded
davidvanzessen
parents:
diff changeset
129 genes=(ca ca1 ca2 cg cg1 cg2 cg3 cg4 cm)
74d2bc479bee Uploaded
davidvanzessen
parents:
diff changeset
130
53
7290a88ea202 Uploaded
davidvanzessen
parents: 52
diff changeset
131 funcs=(sum mean median)
0
74d2bc479bee Uploaded
davidvanzessen
parents:
diff changeset
132
82
564c4f6da203 Uploaded
davidvanzessen
parents: 81
diff changeset
133 echo "---------------- sequence_overview.r ----------------"
95
a66eb1c5374c Uploaded
davidvanzessen
parents: 94
diff changeset
134 echo "---------------- sequence_overview.r ----------------" >> $output
82
564c4f6da203 Uploaded
davidvanzessen
parents: 81
diff changeset
135
564c4f6da203 Uploaded
davidvanzessen
parents: 81
diff changeset
136 mkdir $outdir/sequence_overview
564c4f6da203 Uploaded
davidvanzessen
parents: 81
diff changeset
137
90
f0e8dac22c6e Uploaded
davidvanzessen
parents: 89
diff changeset
138 #Rscript $dir/sequence_overview.r $outdir/identified_genes.txt $PWD/sequences.txt $outdir/merged.txt $outdir/sequence_overview $classes $outdir/hotspot_analysis_sum.txt 2>&1
94
e39176ccddc8 Uploaded
davidvanzessen
parents: 92
diff changeset
139 Rscript $dir/sequence_overview.r $outdir/before_unique_filter.txt $outdir/merged.txt $outdir/sequence_overview $classes $outdir/hotspot_analysis_sum.txt 2>&1
82
564c4f6da203 Uploaded
davidvanzessen
parents: 81
diff changeset
140
564c4f6da203 Uploaded
davidvanzessen
parents: 81
diff changeset
141 echo "<table border='1'>" > $outdir/base_overview.html
564c4f6da203 Uploaded
davidvanzessen
parents: 81
diff changeset
142
92
b869a126e2c4 Uploaded
davidvanzessen
parents: 90
diff changeset
143 while IFS=$'\t' read ID class seq A C G T
82
564c4f6da203 Uploaded
davidvanzessen
parents: 81
diff changeset
144 do
85
07f7da724a77 Uploaded
davidvanzessen
parents: 84
diff changeset
145 echo "<tr><td>$ID</td><td>$seq</td><td>$class</td><td>$A</td><td>$C</td><td>$G</td><td>$T</td></tr>" >> $outdir/base_overview.html
82
564c4f6da203 Uploaded
davidvanzessen
parents: 81
diff changeset
146 done < $outdir/sequence_overview/ntoverview.txt
564c4f6da203 Uploaded
davidvanzessen
parents: 81
diff changeset
147
53
7290a88ea202 Uploaded
davidvanzessen
parents: 52
diff changeset
148
62
4262e880472d Uploaded
davidvanzessen
parents: 58
diff changeset
149 echo "<html><center><h1>$title</h1></center>" > $output
4262e880472d Uploaded
davidvanzessen
parents: 58
diff changeset
150
4262e880472d Uploaded
davidvanzessen
parents: 58
diff changeset
151 #display the matched/unmatched for clarity
4262e880472d Uploaded
davidvanzessen
parents: 58
diff changeset
152
4262e880472d Uploaded
davidvanzessen
parents: 58
diff changeset
153 matched_count="`cat $outdir/merged.txt | tail -n +2 | wc -l`"
4262e880472d Uploaded
davidvanzessen
parents: 58
diff changeset
154 unmatched_count="`cat $outdir/unmatched.txt | tail -n +2 | wc -l`"
4262e880472d Uploaded
davidvanzessen
parents: 58
diff changeset
155 total_count=$((matched_count + unmatched_count))
4262e880472d Uploaded
davidvanzessen
parents: 58
diff changeset
156 perc_count=$((unmatched_count / total_count * 100))
4262e880472d Uploaded
davidvanzessen
parents: 58
diff changeset
157 perc_count=`bc -l <<< "scale=2; ${unmatched_count} / ${total_count} * 100"`
4262e880472d Uploaded
davidvanzessen
parents: 58
diff changeset
158 perc_count=`bc -l <<< "scale=2; (${unmatched_count} / ${total_count} * 100 ) / 1"`
4262e880472d Uploaded
davidvanzessen
parents: 58
diff changeset
159
4262e880472d Uploaded
davidvanzessen
parents: 58
diff changeset
160 echo "<center><h2>Total: ${total_count}</h2></center>" >> $output
4262e880472d Uploaded
davidvanzessen
parents: 58
diff changeset
161 echo "<center><h2>Matched: ${matched_count} Unmatched: ${unmatched_count}</h2></center>" >> $output
4262e880472d Uploaded
davidvanzessen
parents: 58
diff changeset
162 echo "<center><h2>Percentage unmatched: ${perc_count}</h2></center>" >> $output
4262e880472d Uploaded
davidvanzessen
parents: 58
diff changeset
163
55
0d5add1a9800 Uploaded
davidvanzessen
parents: 54
diff changeset
164 echo "---------------- main tables ----------------"
53
7290a88ea202 Uploaded
davidvanzessen
parents: 52
diff changeset
165 for func in ${funcs[@]}
4
069419cccba4 Uploaded
davidvanzessen
parents: 3
diff changeset
166 do
55
0d5add1a9800 Uploaded
davidvanzessen
parents: 54
diff changeset
167
0d5add1a9800 Uploaded
davidvanzessen
parents: 54
diff changeset
168 echo "---------------- $func table ----------------"
0d5add1a9800 Uploaded
davidvanzessen
parents: 54
diff changeset
169
94
e39176ccddc8 Uploaded
davidvanzessen
parents: 92
diff changeset
170 cat $outdir/mutations_${func}.txt $outdir/hotspot_analysis_${func}.txt > $outdir/data_${func}.txt
53
7290a88ea202 Uploaded
davidvanzessen
parents: 52
diff changeset
171
7290a88ea202 Uploaded
davidvanzessen
parents: 52
diff changeset
172 echo "<table border='1' width='100%'><caption><h3>${func} table</h3></caption>" >> $output
58
8bb4d6009e08 Uploaded
davidvanzessen
parents: 55
diff changeset
173 echo "<tr><th>info</th>" >> $output
53
7290a88ea202 Uploaded
davidvanzessen
parents: 52
diff changeset
174 for gene in ${genes[@]}
7290a88ea202 Uploaded
davidvanzessen
parents: 52
diff changeset
175 do
7290a88ea202 Uploaded
davidvanzessen
parents: 52
diff changeset
176 tmp=`cat $outdir/${gene}_${func}_n.txt`
7290a88ea202 Uploaded
davidvanzessen
parents: 52
diff changeset
177 echo "<th><a href='matched_${gene}_${func}.txt'>${gene} (N = $tmp)</a></th>" >> $output
7290a88ea202 Uploaded
davidvanzessen
parents: 52
diff changeset
178 done
78
b523ce95d857 Uploaded
davidvanzessen
parents: 77
diff changeset
179
b523ce95d857 Uploaded
davidvanzessen
parents: 77
diff changeset
180 tmp=`cat $outdir/unmatched_${func}_n.txt`
79
0513b46178c4 Uploaded
davidvanzessen
parents: 78
diff changeset
181 echo "<th><a href='unmatched.txt'>unmatched (N = ${unmatched_count})</a></th>" >> $output
53
7290a88ea202 Uploaded
davidvanzessen
parents: 52
diff changeset
182 tmp=`cat $outdir/all_${func}_n.txt`
89
480fdd383fdb Uploaded
davidvanzessen
parents: 85
diff changeset
183 echo "<th><a href='matched_all_${func}.txt'>all (N = $tmp)</a></th>" >> $output
4
069419cccba4 Uploaded
davidvanzessen
parents: 3
diff changeset
184
78
b523ce95d857 Uploaded
davidvanzessen
parents: 77
diff changeset
185 while IFS=, read name cax cay caz ca1x ca1y ca1z ca2x ca2y ca2z cgx cgy cgz cg1x cg1y cg1z cg2x cg2y cg2z cg3x cg3y cg3z cg4x cg4y cg4z cmx cmy cmz unx uny unz allx ally allz
53
7290a88ea202 Uploaded
davidvanzessen
parents: 52
diff changeset
186 do
7290a88ea202 Uploaded
davidvanzessen
parents: 52
diff changeset
187 if [ "$name" == "FR S/R (ratio)" ] || [ "$name" == "CDR S/R (ratio)" ] ; then #meh
7290a88ea202 Uploaded
davidvanzessen
parents: 52
diff changeset
188 echo "<tr><td>$name</td><td>${cax}/${cay} (${caz})</td><td>${ca1x}/${ca1y} (${ca1z})</td><td>${ca2x}/${ca2y} (${ca2z})</td><td>${cgx}/${cgy} (${cgz})</td><td>${cg1x}/${cg1y} (${cg1z})</td><td>${cg2x}/${cg2y} (${cg2z})</td><td>${cg3x}/${cg3y} (${cg3z})</td><td>${cg4x}/${cg4y} (${cg4z})</td><td>${cmx}/${cmy} (${cmz})</td><td>${allx}/${ally} (${allz})</td></tr>" >> $output
7290a88ea202 Uploaded
davidvanzessen
parents: 52
diff changeset
189 else
78
b523ce95d857 Uploaded
davidvanzessen
parents: 77
diff changeset
190 echo "<tr><td>$name</td><td>${cax}/${cay} (${caz}%)</td><td>${ca1x}/${ca1y} (${ca1z}%)</td><td>${ca2x}/${ca2y} (${ca2z}%)</td><td>${cgx}/${cgy} (${cgz}%)</td><td>${cg1x}/${cg1y} (${cg1z}%)</td><td>${cg2x}/${cg2y} (${cg2z}%)</td><td>${cg3x}/${cg3y} (${cg3z}%)</td><td>${cg4x}/${cg4y} (${cg4z}%)</td><td>${cmx}/${cmy} (${cmz}%)</td><td>${unx}/${uny} (${unz}%)</td><td>${allx}/${ally} (${allz}%)</td></tr>" >> $output
53
7290a88ea202 Uploaded
davidvanzessen
parents: 52
diff changeset
191 fi
94
e39176ccddc8 Uploaded
davidvanzessen
parents: 92
diff changeset
192 done < $outdir/data_${func}.txt
e39176ccddc8 Uploaded
davidvanzessen
parents: 92
diff changeset
193 echo "</table>" >> $output
e39176ccddc8 Uploaded
davidvanzessen
parents: 92
diff changeset
194 #echo "<a href='data_${func}.txt'>Download data</a>" >> $output
53
7290a88ea202 Uploaded
davidvanzessen
parents: 52
diff changeset
195 done
7290a88ea202 Uploaded
davidvanzessen
parents: 52
diff changeset
196
55
0d5add1a9800 Uploaded
davidvanzessen
parents: 54
diff changeset
197 echo "---------------- download links ----------------"
0d5add1a9800 Uploaded
davidvanzessen
parents: 54
diff changeset
198
94
e39176ccddc8 Uploaded
davidvanzessen
parents: 92
diff changeset
199
53
7290a88ea202 Uploaded
davidvanzessen
parents: 52
diff changeset
200 echo "<a href='unmatched.txt'>unmatched</a><br />" >> $output
7290a88ea202 Uploaded
davidvanzessen
parents: 52
diff changeset
201 echo "<a href='motif_per_seq.txt'>motif per sequence</a><br />" >> $output
7290a88ea202 Uploaded
davidvanzessen
parents: 52
diff changeset
202 echo "<a href='merged.txt'>all data</a><br />" >> $output
7290a88ea202 Uploaded
davidvanzessen
parents: 52
diff changeset
203 echo "<a href='mutation_by_id.txt'>mutations by id</a><br />" >> $output
7290a88ea202 Uploaded
davidvanzessen
parents: 52
diff changeset
204 echo "<a href='aa_id_mutations.txt'>AA mutations location by id</a><br />" >> $output
7290a88ea202 Uploaded
davidvanzessen
parents: 52
diff changeset
205 echo "<a href='absent_aa_id.txt'>Absant AA locations by id</a><br />" >> $output
77
c5c86d15cb94 Uploaded
davidvanzessen
parents: 76
diff changeset
206 echo "<a href='sequence_overview/index.html'>Sequence Overview</a><br />" >> $output
81
a778156dad3d Uploaded
davidvanzessen
parents: 80
diff changeset
207 echo "<a href='base_overview.html'>Base overview</a><br />" >> $output
95
a66eb1c5374c Uploaded
davidvanzessen
parents: 94
diff changeset
208 echo "<a href='baseline.pdf'>Baseline PDF</a><br />" >> $output
a66eb1c5374c Uploaded
davidvanzessen
parents: 94
diff changeset
209 echo "<a href='baseline.txt'>Baseline Table</a><br />" >> $output
a66eb1c5374c Uploaded
davidvanzessen
parents: 94
diff changeset
210 echo "<a href='IgAT.zip'>IgAT zip</a><br />" >> $output
2
2f4298673519 Uploaded
davidvanzessen
parents: 1
diff changeset
211
55
0d5add1a9800 Uploaded
davidvanzessen
parents: 54
diff changeset
212 echo "---------------- images ----------------"
0d5add1a9800 Uploaded
davidvanzessen
parents: 54
diff changeset
213
4
069419cccba4 Uploaded
davidvanzessen
parents: 3
diff changeset
214 echo "<img src='all.png'/><br />" >> $output
26
2433a1e110e1 Uploaded
davidvanzessen
parents: 25
diff changeset
215 echo "<a href='all.txt'>download data</a><br />" >> $output
4
069419cccba4 Uploaded
davidvanzessen
parents: 3
diff changeset
216 if [ -a $outdir/ca.png ]
069419cccba4 Uploaded
davidvanzessen
parents: 3
diff changeset
217 then
069419cccba4 Uploaded
davidvanzessen
parents: 3
diff changeset
218 echo "<img src='ca.png'/><br />" >> $output
26
2433a1e110e1 Uploaded
davidvanzessen
parents: 25
diff changeset
219 echo "<a href='ca.txt'>download data</a><br />" >> $output
4
069419cccba4 Uploaded
davidvanzessen
parents: 3
diff changeset
220 fi
069419cccba4 Uploaded
davidvanzessen
parents: 3
diff changeset
221 if [ -a $outdir/cg.png ]
069419cccba4 Uploaded
davidvanzessen
parents: 3
diff changeset
222 then
069419cccba4 Uploaded
davidvanzessen
parents: 3
diff changeset
223 echo "<img src='cg.png'/><br />" >> $output
26
2433a1e110e1 Uploaded
davidvanzessen
parents: 25
diff changeset
224 echo "<a href='cg.txt'>download data</a><br />" >> $output
4
069419cccba4 Uploaded
davidvanzessen
parents: 3
diff changeset
225 fi
22
d84c9791d8c4 Uploaded
davidvanzessen
parents: 21
diff changeset
226 if [ -a $outdir/scatter.png ]
d84c9791d8c4 Uploaded
davidvanzessen
parents: 21
diff changeset
227 then
d84c9791d8c4 Uploaded
davidvanzessen
parents: 21
diff changeset
228 echo "<img src='scatter.png'/><br />" >> $output
26
2433a1e110e1 Uploaded
davidvanzessen
parents: 25
diff changeset
229 echo "<a href='scatter.txt'>download data</a><br />" >> $output
2433a1e110e1 Uploaded
davidvanzessen
parents: 25
diff changeset
230 fi
49
5c6b9e99d576 Uploaded
davidvanzessen
parents: 47
diff changeset
231 if [ -a $outdir/frequency_ranges.png ]
5c6b9e99d576 Uploaded
davidvanzessen
parents: 47
diff changeset
232 then
5c6b9e99d576 Uploaded
davidvanzessen
parents: 47
diff changeset
233 echo "<img src='frequency_ranges.png'/><br />" >> $output
5c6b9e99d576 Uploaded
davidvanzessen
parents: 47
diff changeset
234 echo "<a href='frequency_ranges_classes.txt'>download class data</a><br />" >> $output
5c6b9e99d576 Uploaded
davidvanzessen
parents: 47
diff changeset
235 echo "<a href='frequency_ranges_subclasses.txt'>download subclass data</a><br />" >> $output
5c6b9e99d576 Uploaded
davidvanzessen
parents: 47
diff changeset
236 fi
26
2433a1e110e1 Uploaded
davidvanzessen
parents: 25
diff changeset
237 if [ -a $outdir/aa_histogram.png ]
2433a1e110e1 Uploaded
davidvanzessen
parents: 25
diff changeset
238 then
2433a1e110e1 Uploaded
davidvanzessen
parents: 25
diff changeset
239 echo "<img src='aa_histogram.png'/><br />" >> $output
2433a1e110e1 Uploaded
davidvanzessen
parents: 25
diff changeset
240 echo "<a href='aa_histogram.txt'>download data</a><br />" >> $output
22
d84c9791d8c4 Uploaded
davidvanzessen
parents: 21
diff changeset
241 fi
2
2f4298673519 Uploaded
davidvanzessen
parents: 1
diff changeset
242
0
74d2bc479bee Uploaded
davidvanzessen
parents:
diff changeset
243 for gene in ${genes[@]}
74d2bc479bee Uploaded
davidvanzessen
parents:
diff changeset
244 do
74d2bc479bee Uploaded
davidvanzessen
parents:
diff changeset
245 echo "<table border='1'><caption>$gene transition table</caption>" >> $output
74d2bc479bee Uploaded
davidvanzessen
parents:
diff changeset
246 while IFS=, read from a c g t
74d2bc479bee Uploaded
davidvanzessen
parents:
diff changeset
247 do
74d2bc479bee Uploaded
davidvanzessen
parents:
diff changeset
248 echo "<tr><td>$from</td><td>$a</td><td>$c</td><td>$g</td><td>$t</td></tr>" >> $output
53
7290a88ea202 Uploaded
davidvanzessen
parents: 52
diff changeset
249 done < $outdir/transitions_${gene}_sum.txt
0
74d2bc479bee Uploaded
davidvanzessen
parents:
diff changeset
250 echo "</table>" >> $output
74d2bc479bee Uploaded
davidvanzessen
parents:
diff changeset
251 done
74d2bc479bee Uploaded
davidvanzessen
parents:
diff changeset
252
74d2bc479bee Uploaded
davidvanzessen
parents:
diff changeset
253 echo "<table border='1'><caption>All transition table</caption>" >> $output
74d2bc479bee Uploaded
davidvanzessen
parents:
diff changeset
254 while IFS=, read from a c g t
74d2bc479bee Uploaded
davidvanzessen
parents:
diff changeset
255 do
74d2bc479bee Uploaded
davidvanzessen
parents:
diff changeset
256 echo "<tr><td>$from</td><td>$a</td><td>$c</td><td>$g</td><td>$t</td></tr>" >> $output
53
7290a88ea202 Uploaded
davidvanzessen
parents: 52
diff changeset
257 done < $outdir/transitions_all_sum.txt
0
74d2bc479bee Uploaded
davidvanzessen
parents:
diff changeset
258 echo "</table>" >> $output
74d2bc479bee Uploaded
davidvanzessen
parents:
diff changeset
259
74d2bc479bee Uploaded
davidvanzessen
parents:
diff changeset
260 echo "</html>" >> $output
2
2f4298673519 Uploaded
davidvanzessen
parents: 1
diff changeset
261
95
a66eb1c5374c Uploaded
davidvanzessen
parents: 94
diff changeset
262 echo "---------------- baseline ----------------"
a66eb1c5374c Uploaded
davidvanzessen
parents: 94
diff changeset
263 bash $dir/tmp/baseline/wrapper.sh 1 1 1 1 0 0 "25:26:38:55:65:104:-" $outdir/new_IMGT.txz "sample name" "$dir/tmp/baseline/IMGT-reference-seqs-IGHV-2015-11-05.fa" "$outdir/baseline.pdf" "Sequence.ID" "$outdir/baseline.txt"
47
099cc1254f74 Uploaded
davidvanzessen
parents: 43
diff changeset
264
099cc1254f74 Uploaded
davidvanzessen
parents: 43
diff changeset
265 #optional output for naive
099cc1254f74 Uploaded
davidvanzessen
parents: 43
diff changeset
266
82
564c4f6da203 Uploaded
davidvanzessen
parents: 81
diff changeset
267 echo "---------------- naive_output.r ----------------"
55
0d5add1a9800 Uploaded
davidvanzessen
parents: 54
diff changeset
268
47
099cc1254f74 Uploaded
davidvanzessen
parents: 43
diff changeset
269 if [[ "$naive_output" != "None" ]]
099cc1254f74 Uploaded
davidvanzessen
parents: 43
diff changeset
270 then
55
0d5add1a9800 Uploaded
davidvanzessen
parents: 54
diff changeset
271 echo "---------------- imgt_loader.r ----------------"
50
8ba6afa1247a Uploaded
davidvanzessen
parents: 49
diff changeset
272 #python $dir/imgt_loader.py --summ $PWD/summary.txt --aa $PWD/aa.txt --junction $PWD/junction.txt --output $naive_output
80
a4c2ddeadec0 Uploaded
davidvanzessen
parents: 79
diff changeset
273 Rscript --verbose $dir/imgt_loader.r $PWD/summary.txt $PWD/aa.txt $PWD/junction.txt $outdir/loader_output.txt 2>&1
95
a66eb1c5374c Uploaded
davidvanzessen
parents: 94
diff changeset
274
55
0d5add1a9800 Uploaded
davidvanzessen
parents: 54
diff changeset
275 echo "---------------- naive_output.r ----------------"
81
a778156dad3d Uploaded
davidvanzessen
parents: 80
diff changeset
276 Rscript $dir/naive_output.r $outdir/loader_output.txt $outdir/merged.txt ${naive_output_ca} ${naive_output_cg} ${naive_output_cm} $outdir/ntoverview.txt $outdir/ntsum.txt 2>&1
47
099cc1254f74 Uploaded
davidvanzessen
parents: 43
diff changeset
277 fi
099cc1254f74 Uploaded
davidvanzessen
parents: 43
diff changeset
278
81
a778156dad3d Uploaded
davidvanzessen
parents: 80
diff changeset
279 echo "</table>" >> $outdir/base_overview.html
a778156dad3d Uploaded
davidvanzessen
parents: 80
diff changeset
280
a778156dad3d Uploaded
davidvanzessen
parents: 80
diff changeset
281 echo "---------------- Done! ----------------"
47
099cc1254f74 Uploaded
davidvanzessen
parents: 43
diff changeset
282
099cc1254f74 Uploaded
davidvanzessen
parents: 43
diff changeset
283
099cc1254f74 Uploaded
davidvanzessen
parents: 43
diff changeset
284
099cc1254f74 Uploaded
davidvanzessen
parents: 43
diff changeset
285
099cc1254f74 Uploaded
davidvanzessen
parents: 43
diff changeset
286
099cc1254f74 Uploaded
davidvanzessen
parents: 43
diff changeset
287
099cc1254f74 Uploaded
davidvanzessen
parents: 43
diff changeset
288
2
2f4298673519 Uploaded
davidvanzessen
parents: 1
diff changeset
289 #rm $outdir/HS12RSS.txt
2f4298673519 Uploaded
davidvanzessen
parents: 1
diff changeset
290 #rm $outdir/HS23RSS.txt