annotate wrapper.sh @ 107:01c9993865af draft

Uploaded
author davidvanzessen
date Wed, 13 Jul 2016 08:04:13 -0400
parents e4957ad476a2
children 6add3e66f4fa
Ignore whitespace changes - Everywhere: Within whitespace: At end of lines:
rev   line source
0
74d2bc479bee Uploaded
davidvanzessen
parents:
diff changeset
1 #!/bin/bash
4
069419cccba4 Uploaded
davidvanzessen
parents: 3
diff changeset
2 set -e
0
74d2bc479bee Uploaded
davidvanzessen
parents:
diff changeset
3 dir="$(cd "$(dirname "$0")" && pwd)"
74d2bc479bee Uploaded
davidvanzessen
parents:
diff changeset
4 input=$1
19
c518cf0d4adb Uploaded
davidvanzessen
parents: 16
diff changeset
5 method=$2
102
e6bc976760d4 Uploaded
davidvanzessen
parents: 101
diff changeset
6 log=$3 #becomes the main html page at the end
19
c518cf0d4adb Uploaded
davidvanzessen
parents: 16
diff changeset
7 outdir=$4
102
e6bc976760d4 Uploaded
davidvanzessen
parents: 101
diff changeset
8 output="$outdir/index.html" #copied to $log location at the end
19
c518cf0d4adb Uploaded
davidvanzessen
parents: 16
diff changeset
9 title=$5
22
d84c9791d8c4 Uploaded
davidvanzessen
parents: 21
diff changeset
10 include_fr1=$6
34
d436daae9d68 Uploaded
davidvanzessen
parents: 32
diff changeset
11 functionality=$7
d436daae9d68 Uploaded
davidvanzessen
parents: 32
diff changeset
12 unique=$8
69
7acdcd5c52ef Uploaded
davidvanzessen
parents: 66
diff changeset
13 naive_output_ca=$9
7acdcd5c52ef Uploaded
davidvanzessen
parents: 66
diff changeset
14 naive_output_cg=${10}
7acdcd5c52ef Uploaded
davidvanzessen
parents: 66
diff changeset
15 naive_output_cm=${11}
7acdcd5c52ef Uploaded
davidvanzessen
parents: 66
diff changeset
16 filter_unique=${12}
7acdcd5c52ef Uploaded
davidvanzessen
parents: 66
diff changeset
17 class_filter=${13}
0
74d2bc479bee Uploaded
davidvanzessen
parents:
diff changeset
18 mkdir -p "$outdir" #quoted so a path with spaces stays one argument; -p keeps set -e from aborting when the directory already exists
74d2bc479bee Uploaded
davidvanzessen
parents:
diff changeset
19
55
0d5add1a9800 Uploaded
davidvanzessen
parents: 54
diff changeset
20 echo "---------------- read parameters ----------------"
102
e6bc976760d4 Uploaded
davidvanzessen
parents: 101
diff changeset
21 echo "---------------- read parameters ----------------<br />" > $log
55
0d5add1a9800 Uploaded
davidvanzessen
parents: 54
diff changeset
22
0d5add1a9800 Uploaded
davidvanzessen
parents: 54
diff changeset
23 echo "unpacking IMGT file"
0d5add1a9800 Uploaded
davidvanzessen
parents: 54
diff changeset
24
89
480fdd383fdb Uploaded
davidvanzessen
parents: 85
diff changeset
25
480fdd383fdb Uploaded
davidvanzessen
parents: 85
diff changeset
26
35
8dba36531e6e Uploaded
davidvanzessen
parents: 34
diff changeset
27 type="$(file "$input")" #file(1) description of the upload, matched below to pick the unpacker; input quoted so it is passed as one argument
8dba36531e6e Uploaded
davidvanzessen
parents: 34
diff changeset
28 if [[ "$type" == *"Zip archive"* ]] ; then
8dba36531e6e Uploaded
davidvanzessen
parents: 34
diff changeset
29 echo "Zip archive"
8dba36531e6e Uploaded
davidvanzessen
parents: 34
diff changeset
30 echo "unzip $input -d $PWD/files/"
8dba36531e6e Uploaded
davidvanzessen
parents: 34
diff changeset
31 unzip "$input" -d "$PWD/files/" #quoted so archive and target paths containing spaces are not split
8dba36531e6e Uploaded
davidvanzessen
parents: 34
diff changeset
32 elif [[ "$type" == *"XZ compressed data"* ]] ; then
8dba36531e6e Uploaded
davidvanzessen
parents: 34
diff changeset
33 echo "XZ archive" #label now matches the "XZ compressed data" branch it is printed from
8dba36531e6e Uploaded
davidvanzessen
parents: 34
diff changeset
34 echo "tar -xJf $input -C $PWD/files/$title" #log the command exactly as it is executed below
8dba36531e6e Uploaded
davidvanzessen
parents: 34
diff changeset
35 mkdir -p "$PWD/files/$title" #title is quoted: unquoted, a title with spaces would create several directories
8dba36531e6e Uploaded
davidvanzessen
parents: 34
diff changeset
36 tar -xJf "$input" -C "$PWD/files/$title"
8dba36531e6e Uploaded
davidvanzessen
parents: 34
diff changeset
37 fi
8dba36531e6e Uploaded
davidvanzessen
parents: 34
diff changeset
38
64
0fdd90f7c654 Uploaded
davidvanzessen
parents: 63
diff changeset
39 find "$PWD/files/" -name "1_*" -exec cat {} + > "$PWD/summary.txt" #-exec hands paths to cat unsplit and, unlike cat `find ...`, never falls back to reading stdin when nothing matches
0fdd90f7c654 Uploaded
davidvanzessen
parents: 63
diff changeset
40 find "$PWD/files/" -name "3_*" -exec cat {} + > "$PWD/sequences.txt"
0fdd90f7c654 Uploaded
davidvanzessen
parents: 63
diff changeset
41 find "$PWD/files/" -name "5_*" -exec cat {} + > "$PWD/aa.txt"
0fdd90f7c654 Uploaded
davidvanzessen
parents: 63
diff changeset
42 find "$PWD/files/" -name "6_*" -exec cat {} + > "$PWD/junction.txt"
0fdd90f7c654 Uploaded
davidvanzessen
parents: 63
diff changeset
43 find "$PWD/files/" -name "7_*" -exec cat {} + > "$PWD/mutationanalysis.txt"
0fdd90f7c654 Uploaded
davidvanzessen
parents: 63
diff changeset
44 find "$PWD/files/" -name "8_*" -exec cat {} + > "$PWD/mutationstats.txt"
0fdd90f7c654 Uploaded
davidvanzessen
parents: 63
diff changeset
45 find "$PWD/files/" -name "10_*" -exec cat {} + > "$PWD/hotspots.txt"
0fdd90f7c654 Uploaded
davidvanzessen
parents: 63
diff changeset
46
0fdd90f7c654 Uploaded
davidvanzessen
parents: 63
diff changeset
47 #cat $PWD/files/*/1_* > $PWD/summary.txt
0fdd90f7c654 Uploaded
davidvanzessen
parents: 63
diff changeset
48 #cat $PWD/files/*/3_* > $PWD/sequences.txt
0fdd90f7c654 Uploaded
davidvanzessen
parents: 63
diff changeset
49 #cat $PWD/files/*/5_* > $PWD/aa.txt
0fdd90f7c654 Uploaded
davidvanzessen
parents: 63
diff changeset
50 #cat $PWD/files/*/6_* > $PWD/junction.txt
0fdd90f7c654 Uploaded
davidvanzessen
parents: 63
diff changeset
51 #cat $PWD/files/*/7_* > $PWD/mutationanalysis.txt
0fdd90f7c654 Uploaded
davidvanzessen
parents: 63
diff changeset
52 #cat $PWD/files/*/8_* > $PWD/mutationstats.txt
0fdd90f7c654 Uploaded
davidvanzessen
parents: 63
diff changeset
53 #cat $PWD/files/*/10_* > $PWD/hotspots.txt
3
a0b27058dcac Uploaded
davidvanzessen
parents: 2
diff changeset
54
26
2433a1e110e1 Uploaded
davidvanzessen
parents: 25
diff changeset
55 #BLASTN_DIR="/home/galaxy/tmp/blast/ncbi-blast-2.2.30+/bin"
19
c518cf0d4adb Uploaded
davidvanzessen
parents: 16
diff changeset
56
c518cf0d4adb Uploaded
davidvanzessen
parents: 16
diff changeset
57 echo "${BLASTN_DIR}"
c518cf0d4adb Uploaded
davidvanzessen
parents: 16
diff changeset
58
89
480fdd383fdb Uploaded
davidvanzessen
parents: 85
diff changeset
59 echo "---------------- identification ($method) ----------------"
102
e6bc976760d4 Uploaded
davidvanzessen
parents: 101
diff changeset
60 echo "---------------- identification ($method) ----------------<br />" >> $log
55
0d5add1a9800 Uploaded
davidvanzessen
parents: 54
diff changeset
61
19
c518cf0d4adb Uploaded
davidvanzessen
parents: 16
diff changeset
62 if [[ "${method}" == "custom" ]] ; then
c518cf0d4adb Uploaded
davidvanzessen
parents: 16
diff changeset
63 python $dir/gene_identification.py --input $PWD/summary.txt --output $outdir/identified_genes.txt
c518cf0d4adb Uploaded
davidvanzessen
parents: 16
diff changeset
64 else
c518cf0d4adb Uploaded
davidvanzessen
parents: 16
diff changeset
65 ID_index=$(cat $PWD/summary.txt | grep -o -P ".+Sequence ID" | grep -o -P "\t" | wc -l)
c518cf0d4adb Uploaded
davidvanzessen
parents: 16
diff changeset
66 ID_index=$((ID_index+1))
c518cf0d4adb Uploaded
davidvanzessen
parents: 16
diff changeset
67 sequence_index=$(cat $PWD/summary.txt | grep -o -P ".+\tSequence" | grep -o -P "\t" | wc -l)
c518cf0d4adb Uploaded
davidvanzessen
parents: 16
diff changeset
68 sequence_index=$((sequence_index+1))
c518cf0d4adb Uploaded
davidvanzessen
parents: 16
diff changeset
69
c518cf0d4adb Uploaded
davidvanzessen
parents: 16
diff changeset
70 cat $PWD/summary.txt | tail -n+2 | cut -f ${ID_index},${sequence_index} | awk '{print ">" $1 "\n" $2}' > $PWD/sequences.fasta
c518cf0d4adb Uploaded
davidvanzessen
parents: 16
diff changeset
71
c518cf0d4adb Uploaded
davidvanzessen
parents: 16
diff changeset
72 echo -e "qseqid\tsseqid\tpident\tlength\tmismatch\tgapopen\tqstart\tqend\tsstart\tsend\tevalue\tbitscore" > $outdir/identified_genes.txt
c518cf0d4adb Uploaded
davidvanzessen
parents: 16
diff changeset
73 ${BLASTN_DIR}/blastn -task blastn -db $dir/subclass_definition.db -query $PWD/sequences.fasta -outfmt 6 >> $outdir/identified_genes.txt
c518cf0d4adb Uploaded
davidvanzessen
parents: 16
diff changeset
74 fi
c518cf0d4adb Uploaded
davidvanzessen
parents: 16
diff changeset
75
55
0d5add1a9800 Uploaded
davidvanzessen
parents: 54
diff changeset
76 echo "---------------- merge_and_filter.r ----------------"
102
e6bc976760d4 Uploaded
davidvanzessen
parents: 101
diff changeset
77 echo "---------------- merge_and_filter.r ----------------<br />" >> $log
19
c518cf0d4adb Uploaded
davidvanzessen
parents: 16
diff changeset
78
90
f0e8dac22c6e Uploaded
davidvanzessen
parents: 89
diff changeset
79 Rscript $dir/merge_and_filter.r $PWD/summary.txt $PWD/sequences.txt $PWD/mutationanalysis.txt $PWD/mutationstats.txt $PWD/hotspots.txt $outdir/identified_genes.txt $outdir/merged.txt $outdir/before_unique_filter.txt $outdir/unmatched.txt $method $functionality $unique ${filter_unique} ${class_filter} 2>&1
0
74d2bc479bee Uploaded
davidvanzessen
parents:
diff changeset
80
98
5ffbf40cdd4b Uploaded
davidvanzessen
parents: 95
diff changeset
81 echo "---------------- creating new IMGT zip ----------------"
102
e6bc976760d4 Uploaded
davidvanzessen
parents: 101
diff changeset
82 echo "---------------- creating new IMGT zip ----------------<br />" >> $log
95
a66eb1c5374c Uploaded
davidvanzessen
parents: 94
diff changeset
83
a66eb1c5374c Uploaded
davidvanzessen
parents: 94
diff changeset
84 mkdir $outdir/new_IMGT
a66eb1c5374c Uploaded
davidvanzessen
parents: 94
diff changeset
85
a66eb1c5374c Uploaded
davidvanzessen
parents: 94
diff changeset
86 find "$PWD/files/" -name "1_*" -exec cat {} + > "$outdir/new_IMGT/1_Summary.txt" #-exec hands paths to cat unsplit and, unlike cat `find ...`, never falls back to reading stdin when nothing matches
a66eb1c5374c Uploaded
davidvanzessen
parents: 94
diff changeset
87 find "$PWD/files/" -name "2_*" -exec cat {} + > "$outdir/new_IMGT/2_IMGT-gapped-nt-sequences.txt"
a66eb1c5374c Uploaded
davidvanzessen
parents: 94
diff changeset
88 find "$PWD/files/" -name "3_*" -exec cat {} + > "$outdir/new_IMGT/3_Nt-sequences.txt"
a66eb1c5374c Uploaded
davidvanzessen
parents: 94
diff changeset
89 find "$PWD/files/" -name "4_*" -exec cat {} + > "$outdir/new_IMGT/4_IMGT-gapped-AA-sequences.txt"
a66eb1c5374c Uploaded
davidvanzessen
parents: 94
diff changeset
90 find "$PWD/files/" -name "5_*" -exec cat {} + > "$outdir/new_IMGT/5_AA-sequences.txt"
a66eb1c5374c Uploaded
davidvanzessen
parents: 94
diff changeset
91 find "$PWD/files/" -name "6_*" -exec cat {} + > "$outdir/new_IMGT/6_Junction.txt"
a66eb1c5374c Uploaded
davidvanzessen
parents: 94
diff changeset
92 find "$PWD/files/" -name "7_*" -exec cat {} + > "$outdir/new_IMGT/7_V-REGION-mutation-and-AA-change-table.txt"
a66eb1c5374c Uploaded
davidvanzessen
parents: 94
diff changeset
93 find "$PWD/files/" -name "8_*" -exec cat {} + > "$outdir/new_IMGT/8_V-REGION-nt-mutation-statistics.txt"
a66eb1c5374c Uploaded
davidvanzessen
parents: 94
diff changeset
94 find "$PWD/files/" -name "9_*" -exec cat {} + > "$outdir/new_IMGT/9_V-REGION-AA-change-statistics.txt"
a66eb1c5374c Uploaded
davidvanzessen
parents: 94
diff changeset
95 find "$PWD/files/" -name "10_*" -exec cat {} + > "$outdir/new_IMGT/10_V-REGION-mutation-hotspots.txt"
a66eb1c5374c Uploaded
davidvanzessen
parents: 94
diff changeset
96
99
86206431cbb0 Uploaded
davidvanzessen
parents: 98
diff changeset
97 mkdir $outdir/new_IMGT_ca
86206431cbb0 Uploaded
davidvanzessen
parents: 98
diff changeset
98 cp $outdir/new_IMGT/* $outdir/new_IMGT_ca
86206431cbb0 Uploaded
davidvanzessen
parents: 98
diff changeset
99
86206431cbb0 Uploaded
davidvanzessen
parents: 98
diff changeset
100 mkdir $outdir/new_IMGT_cg
86206431cbb0 Uploaded
davidvanzessen
parents: 98
diff changeset
101 cp $outdir/new_IMGT/* $outdir/new_IMGT_cg
86206431cbb0 Uploaded
davidvanzessen
parents: 98
diff changeset
102
86206431cbb0 Uploaded
davidvanzessen
parents: 98
diff changeset
103 mkdir $outdir/new_IMGT_cm
86206431cbb0 Uploaded
davidvanzessen
parents: 98
diff changeset
104 cp $outdir/new_IMGT/* $outdir/new_IMGT_cm
86206431cbb0 Uploaded
davidvanzessen
parents: 98
diff changeset
105
86206431cbb0 Uploaded
davidvanzessen
parents: 98
diff changeset
106 Rscript $dir/tmp/igat.r $outdir/new_IMGT/ $outdir/merged.txt "-" 2>&1
101
3cffb8a38bb1 Uploaded
davidvanzessen
parents: 100
diff changeset
107 Rscript $dir/tmp/igat.r $outdir/new_IMGT_ca/ $outdir/merged.txt "ca" 2>&1
3cffb8a38bb1 Uploaded
davidvanzessen
parents: 100
diff changeset
108 Rscript $dir/tmp/igat.r $outdir/new_IMGT_cg/ $outdir/merged.txt "cg" 2>&1
3cffb8a38bb1 Uploaded
davidvanzessen
parents: 100
diff changeset
109 Rscript $dir/tmp/igat.r $outdir/new_IMGT_cm/ $outdir/merged.txt "cm" 2>&1
95
a66eb1c5374c Uploaded
davidvanzessen
parents: 94
diff changeset
110
a66eb1c5374c Uploaded
davidvanzessen
parents: 94
diff changeset
111
a66eb1c5374c Uploaded
davidvanzessen
parents: 94
diff changeset
112 tmp="$PWD"
a66eb1c5374c Uploaded
davidvanzessen
parents: 94
diff changeset
113 cd $outdir/new_IMGT/ #tar weirdness...
a66eb1c5374c Uploaded
davidvanzessen
parents: 94
diff changeset
114 tar -cJf ../new_IMGT.txz *
a66eb1c5374c Uploaded
davidvanzessen
parents: 94
diff changeset
115 cp $dir/tmp/IgAT.xlsm $outdir/new_IMGT/IgAT.xlsm
a66eb1c5374c Uploaded
davidvanzessen
parents: 94
diff changeset
116 zip -r ../IgAT.zip *
a66eb1c5374c Uploaded
davidvanzessen
parents: 94
diff changeset
117
99
86206431cbb0 Uploaded
davidvanzessen
parents: 98
diff changeset
118 cd $outdir/new_IMGT_ca/
86206431cbb0 Uploaded
davidvanzessen
parents: 98
diff changeset
119 tar -cJf ../new_IMGT_ca.txz *
86206431cbb0 Uploaded
davidvanzessen
parents: 98
diff changeset
120 cp $dir/tmp/IgAT.xlsm $outdir/new_IMGT_ca/IgAT.xlsm
86206431cbb0 Uploaded
davidvanzessen
parents: 98
diff changeset
121 zip -r ../IgAT_ca.zip *
86206431cbb0 Uploaded
davidvanzessen
parents: 98
diff changeset
122
86206431cbb0 Uploaded
davidvanzessen
parents: 98
diff changeset
123 cd $outdir/new_IMGT_cg/
86206431cbb0 Uploaded
davidvanzessen
parents: 98
diff changeset
124 tar -cJf ../new_IMGT_cg.txz *
86206431cbb0 Uploaded
davidvanzessen
parents: 98
diff changeset
125 cp $dir/tmp/IgAT.xlsm $outdir/new_IMGT_cg/IgAT.xlsm
86206431cbb0 Uploaded
davidvanzessen
parents: 98
diff changeset
126 zip -r ../IgAT_cg.zip *
86206431cbb0 Uploaded
davidvanzessen
parents: 98
diff changeset
127
86206431cbb0 Uploaded
davidvanzessen
parents: 98
diff changeset
128 cd $outdir/new_IMGT_cm/
86206431cbb0 Uploaded
davidvanzessen
parents: 98
diff changeset
129 tar -cJf ../new_IMGT_cm.txz *
86206431cbb0 Uploaded
davidvanzessen
parents: 98
diff changeset
130 cp $dir/tmp/IgAT.xlsm $outdir/new_IMGT_cm/IgAT.xlsm
86206431cbb0 Uploaded
davidvanzessen
parents: 98
diff changeset
131 zip -r ../IgAT_cm.zip *
86206431cbb0 Uploaded
davidvanzessen
parents: 98
diff changeset
132
95
a66eb1c5374c Uploaded
davidvanzessen
parents: 94
diff changeset
133 cd $tmp
a66eb1c5374c Uploaded
davidvanzessen
parents: 94
diff changeset
134
55
0d5add1a9800 Uploaded
davidvanzessen
parents: 54
diff changeset
135 echo "---------------- mutation_analysis.r ----------------"
102
e6bc976760d4 Uploaded
davidvanzessen
parents: 101
diff changeset
136 echo "---------------- mutation_analysis.r ----------------<br />" >> $log
55
0d5add1a9800 Uploaded
davidvanzessen
parents: 54
diff changeset
137
82
564c4f6da203 Uploaded
davidvanzessen
parents: 81
diff changeset
138 classes="ca,ca1,ca2,cg,cg1,cg2,cg3,cg4,cm,unmatched"
4
069419cccba4 Uploaded
davidvanzessen
parents: 3
diff changeset
139 echo "R mutation analysis"
82
564c4f6da203 Uploaded
davidvanzessen
parents: 81
diff changeset
140 Rscript $dir/mutation_analysis.r $outdir/merged.txt $classes $outdir ${include_fr1} 2>&1
53
7290a88ea202 Uploaded
davidvanzessen
parents: 52
diff changeset
141
55
0d5add1a9800 Uploaded
davidvanzessen
parents: 54
diff changeset
142
0d5add1a9800 Uploaded
davidvanzessen
parents: 54
diff changeset
143 echo "---------------- mutation_analysis.py ----------------"
102
e6bc976760d4 Uploaded
davidvanzessen
parents: 101
diff changeset
144 echo "---------------- mutation_analysis.py ----------------<br />" >> $log
55
0d5add1a9800 Uploaded
davidvanzessen
parents: 54
diff changeset
145
82
564c4f6da203 Uploaded
davidvanzessen
parents: 81
diff changeset
146 python $dir/mutation_analysis.py --input $outdir/merged.txt --genes $classes --includefr1 "${include_fr1}" --output $outdir/hotspot_analysis.txt
55
0d5add1a9800 Uploaded
davidvanzessen
parents: 54
diff changeset
147
0d5add1a9800 Uploaded
davidvanzessen
parents: 54
diff changeset
148 echo "---------------- aa_histogram.r ----------------"
105
e4957ad476a2 Uploaded
davidvanzessen
parents: 104
diff changeset
149 echo "---------------- aa_histogram.r ----------------<br />" >> $log
55
0d5add1a9800 Uploaded
davidvanzessen
parents: 54
diff changeset
150
107
01c9993865af Uploaded
davidvanzessen
parents: 105
diff changeset
151 cp $outdir/aa_mutations.txt $outdir/aa_mutations_count.txt
01c9993865af Uploaded
davidvanzessen
parents: 105
diff changeset
152 Rscript $dir/aa_histogram.r $outdir/aa_id_mutations.txt $outdir/absent_aa_id.txt "ca,cg,cm" $outdir/ 2>&1
01c9993865af Uploaded
davidvanzessen
parents: 105
diff changeset
153 mv $outdir/aa_histogram_.png $outdir/aa_histogram.png
4
069419cccba4 Uploaded
davidvanzessen
parents: 3
diff changeset
154
0
74d2bc479bee Uploaded
davidvanzessen
parents:
diff changeset
155 genes=(ca ca1 ca2 cg cg1 cg2 cg3 cg4 cm)
74d2bc479bee Uploaded
davidvanzessen
parents:
diff changeset
156
53
7290a88ea202 Uploaded
davidvanzessen
parents: 52
diff changeset
157 funcs=(sum mean median)
0
74d2bc479bee Uploaded
davidvanzessen
parents:
diff changeset
158
82
564c4f6da203 Uploaded
davidvanzessen
parents: 81
diff changeset
159 echo "---------------- sequence_overview.r ----------------"
102
e6bc976760d4 Uploaded
davidvanzessen
parents: 101
diff changeset
160 echo "---------------- sequence_overview.r ----------------<br />" >> $log
82
564c4f6da203 Uploaded
davidvanzessen
parents: 81
diff changeset
161
564c4f6da203 Uploaded
davidvanzessen
parents: 81
diff changeset
162 mkdir $outdir/sequence_overview
564c4f6da203 Uploaded
davidvanzessen
parents: 81
diff changeset
163
90
f0e8dac22c6e Uploaded
davidvanzessen
parents: 89
diff changeset
164 #Rscript $dir/sequence_overview.r $outdir/identified_genes.txt $PWD/sequences.txt $outdir/merged.txt $outdir/sequence_overview $classes $outdir/hotspot_analysis_sum.txt 2>&1
100
ff5be711382b Uploaded
davidvanzessen
parents: 99
diff changeset
165 Rscript $dir/sequence_overview.r $outdir/before_unique_filter.txt $outdir/merged.txt $outdir/sequence_overview $classes $outdir/hotspot_analysis_sum.txt 2>&1
82
564c4f6da203 Uploaded
davidvanzessen
parents: 81
diff changeset
166
564c4f6da203 Uploaded
davidvanzessen
parents: 81
diff changeset
167 echo "<table border='1'>" > $outdir/base_overview.html
564c4f6da203 Uploaded
davidvanzessen
parents: 81
diff changeset
168
92
b869a126e2c4 Uploaded
davidvanzessen
parents: 90
diff changeset
169 while IFS=$'\t' read ID class seq A C G T
82
564c4f6da203 Uploaded
davidvanzessen
parents: 81
diff changeset
170 do
85
07f7da724a77 Uploaded
davidvanzessen
parents: 84
diff changeset
171 echo "<tr><td>$ID</td><td>$seq</td><td>$class</td><td>$A</td><td>$C</td><td>$G</td><td>$T</td></tr>" >> $outdir/base_overview.html
82
564c4f6da203 Uploaded
davidvanzessen
parents: 81
diff changeset
172 done < $outdir/sequence_overview/ntoverview.txt
564c4f6da203 Uploaded
davidvanzessen
parents: 81
diff changeset
173
62
4262e880472d Uploaded
davidvanzessen
parents: 58
diff changeset
174 echo "<html><center><h1>$title</h1></center>" > $output
4262e880472d Uploaded
davidvanzessen
parents: 58
diff changeset
175
4262e880472d Uploaded
davidvanzessen
parents: 58
diff changeset
176 #display the matched/unmatched counts for clarity
4262e880472d Uploaded
davidvanzessen
parents: 58
diff changeset
177
98
5ffbf40cdd4b Uploaded
davidvanzessen
parents: 95
diff changeset
178 matched_count="`cat $outdir/merged.txt | grep -v 'unmatched' | tail -n +2 | wc -l`"
62
4262e880472d Uploaded
davidvanzessen
parents: 58
diff changeset
179 unmatched_count="`cat $outdir/unmatched.txt | tail -n +2 | wc -l`"
4262e880472d Uploaded
davidvanzessen
parents: 58
diff changeset
180 total_count=$((matched_count + unmatched_count))
4262e880472d Uploaded
davidvanzessen
parents: 58
diff changeset
181 perc_count="0" #fallback when there are no sequences at all; the old integer division failed on total_count=0 and its result was overwritten anyway
4262e880472d Uploaded
davidvanzessen
parents: 58
diff changeset
182 #multiply before dividing: with scale=2 the old (unmatched / total * 100) truncated the ratio to two decimals first, so the percentage always ended in .00
4262e880472d Uploaded
davidvanzessen
parents: 58
diff changeset
183 [ "${total_count}" -eq 0 ] || perc_count=$(bc -l <<< "scale=2; ${unmatched_count} * 100 / ${total_count}")
4262e880472d Uploaded
davidvanzessen
parents: 58
diff changeset
184
4262e880472d Uploaded
davidvanzessen
parents: 58
diff changeset
185 echo "<center><h2>Total: ${total_count}</h2></center>" >> $output
4262e880472d Uploaded
davidvanzessen
parents: 58
diff changeset
186 echo "<center><h2>Matched: ${matched_count} Unmatched: ${unmatched_count}</h2></center>" >> $output
4262e880472d Uploaded
davidvanzessen
parents: 58
diff changeset
187 echo "<center><h2>Percentage unmatched: ${perc_count}</h2></center>" >> $output
4262e880472d Uploaded
davidvanzessen
parents: 58
diff changeset
188
55
0d5add1a9800 Uploaded
davidvanzessen
parents: 54
diff changeset
189 echo "---------------- main tables ----------------"
102
e6bc976760d4 Uploaded
davidvanzessen
parents: 101
diff changeset
190 echo "---------------- main tables ----------------<br />" >> $log
53
7290a88ea202 Uploaded
davidvanzessen
parents: 52
diff changeset
191 for func in ${funcs[@]}
4
069419cccba4 Uploaded
davidvanzessen
parents: 3
diff changeset
192 do
55
0d5add1a9800 Uploaded
davidvanzessen
parents: 54
diff changeset
193
0d5add1a9800 Uploaded
davidvanzessen
parents: 54
diff changeset
194 echo "---------------- $func table ----------------"
102
e6bc976760d4 Uploaded
davidvanzessen
parents: 101
diff changeset
195 echo "---------------- $func table ----------------<br />" >> $log
55
0d5add1a9800 Uploaded
davidvanzessen
parents: 54
diff changeset
196
94
e39176ccddc8 Uploaded
davidvanzessen
parents: 92
diff changeset
197 cat $outdir/mutations_${func}.txt $outdir/hotspot_analysis_${func}.txt > $outdir/data_${func}.txt
53
7290a88ea202 Uploaded
davidvanzessen
parents: 52
diff changeset
198
98
5ffbf40cdd4b Uploaded
davidvanzessen
parents: 95
diff changeset
199 echo "<table border='1' width='100%'><caption><h3><a href='data_${func}.txt'>${func} table</a></h3></caption>" >> $output
58
8bb4d6009e08 Uploaded
davidvanzessen
parents: 55
diff changeset
200 echo "<tr><th>info</th>" >> $output
53
7290a88ea202 Uploaded
davidvanzessen
parents: 52
diff changeset
201 for gene in ${genes[@]}
7290a88ea202 Uploaded
davidvanzessen
parents: 52
diff changeset
202 do
7290a88ea202 Uploaded
davidvanzessen
parents: 52
diff changeset
203 tmp=`cat $outdir/${gene}_${func}_n.txt`
7290a88ea202 Uploaded
davidvanzessen
parents: 52
diff changeset
204 echo "<th><a href='matched_${gene}_${func}.txt'>${gene} (N = $tmp)</a></th>" >> $output
7290a88ea202 Uploaded
davidvanzessen
parents: 52
diff changeset
205 done
78
b523ce95d857 Uploaded
davidvanzessen
parents: 77
diff changeset
206
b523ce95d857 Uploaded
davidvanzessen
parents: 77
diff changeset
207 tmp=`cat $outdir/unmatched_${func}_n.txt`
79
0513b46178c4 Uploaded
davidvanzessen
parents: 78
diff changeset
208 echo "<th><a href='unmatched.txt'>unmatched (N = ${unmatched_count})</a></th>" >> $output
53
7290a88ea202 Uploaded
davidvanzessen
parents: 52
diff changeset
209 tmp=`cat $outdir/all_${func}_n.txt`
89
480fdd383fdb Uploaded
davidvanzessen
parents: 85
diff changeset
210 echo "<th><a href='matched_all_${func}.txt'>all (N = $tmp)</a></th></tr>" >> $output #last header cell; closes the row opened by "<tr><th>info</th>"
4
069419cccba4 Uploaded
davidvanzessen
parents: 3
diff changeset
211
78
b523ce95d857 Uploaded
davidvanzessen
parents: 77
diff changeset
212 while IFS=, read name cax cay caz ca1x ca1y ca1z ca2x ca2y ca2z cgx cgy cgz cg1x cg1y cg1z cg2x cg2y cg2z cg3x cg3y cg3z cg4x cg4y cg4z cmx cmy cmz unx uny unz allx ally allz
53
7290a88ea202 Uploaded
davidvanzessen
parents: 52
diff changeset
213 do
7290a88ea202 Uploaded
davidvanzessen
parents: 52
diff changeset
214 if [ "$name" == "FR S/R (ratio)" ] || [ "$name" == "CDR S/R (ratio)" ] ; then #meh
7290a88ea202 Uploaded
davidvanzessen
parents: 52
diff changeset
215 echo "<tr><td>$name</td><td>${cax}/${cay} (${caz})</td><td>${ca1x}/${ca1y} (${ca1z})</td><td>${ca2x}/${ca2y} (${ca2z})</td><td>${cgx}/${cgy} (${cgz})</td><td>${cg1x}/${cg1y} (${cg1z})</td><td>${cg2x}/${cg2y} (${cg2z})</td><td>${cg3x}/${cg3y} (${cg3z})</td><td>${cg4x}/${cg4y} (${cg4z})</td><td>${cmx}/${cmy} (${cmz})</td><td>${unx}/${uny} (${unz})</td><td>${allx}/${ally} (${allz})</td></tr>" >> $output #ratio rows print no % sign; the unmatched cell is included so the row lines up with the header and the percentage rows
7290a88ea202 Uploaded
davidvanzessen
parents: 52
diff changeset
216 else
78
b523ce95d857 Uploaded
davidvanzessen
parents: 77
diff changeset
217 echo "<tr><td>$name</td><td>${cax}/${cay} (${caz}%)</td><td>${ca1x}/${ca1y} (${ca1z}%)</td><td>${ca2x}/${ca2y} (${ca2z}%)</td><td>${cgx}/${cgy} (${cgz}%)</td><td>${cg1x}/${cg1y} (${cg1z}%)</td><td>${cg2x}/${cg2y} (${cg2z}%)</td><td>${cg3x}/${cg3y} (${cg3z}%)</td><td>${cg4x}/${cg4y} (${cg4z}%)</td><td>${cmx}/${cmy} (${cmz}%)</td><td>${unx}/${uny} (${unz}%)</td><td>${allx}/${ally} (${allz}%)</td></tr>" >> $output
53
7290a88ea202 Uploaded
davidvanzessen
parents: 52
diff changeset
218 fi
94
e39176ccddc8 Uploaded
davidvanzessen
parents: 92
diff changeset
219 done < $outdir/data_${func}.txt
e39176ccddc8 Uploaded
davidvanzessen
parents: 92
diff changeset
220 echo "</table>" >> $output
e39176ccddc8 Uploaded
davidvanzessen
parents: 92
diff changeset
221 #echo "<a href='data_${func}.txt'>Download data</a>" >> $output
53
7290a88ea202 Uploaded
davidvanzessen
parents: 52
diff changeset
222 done
7290a88ea202 Uploaded
davidvanzessen
parents: 52
diff changeset
223
55
0d5add1a9800 Uploaded
davidvanzessen
parents: 54
diff changeset
224 echo "---------------- download links ----------------"
102
e6bc976760d4 Uploaded
davidvanzessen
parents: 101
diff changeset
225 echo "---------------- download links ----------------<br />" >> $log
55
0d5add1a9800 Uploaded
davidvanzessen
parents: 54
diff changeset
226
94
e39176ccddc8 Uploaded
davidvanzessen
parents: 92
diff changeset
227
53
7290a88ea202 Uploaded
davidvanzessen
parents: 52
diff changeset
228 echo "<a href='unmatched.txt'>unmatched</a><br />" >> $output
7290a88ea202 Uploaded
davidvanzessen
parents: 52
diff changeset
229 echo "<a href='motif_per_seq.txt'>motif per sequence</a><br />" >> $output
7290a88ea202 Uploaded
davidvanzessen
parents: 52
diff changeset
230 echo "<a href='merged.txt'>all data</a><br />" >> $output
7290a88ea202 Uploaded
davidvanzessen
parents: 52
diff changeset
231 echo "<a href='mutation_by_id.txt'>mutations by id</a><br />" >> $output
7290a88ea202 Uploaded
davidvanzessen
parents: 52
diff changeset
232 echo "<a href='aa_id_mutations.txt'>AA mutations location by id</a><br />" >> $output
7290a88ea202 Uploaded
davidvanzessen
parents: 52
diff changeset
233 echo "<a href='absent_aa_id.txt'>Absent AA locations by id</a><br />" >> $output #link text spelling corrected (was "Absant")
77
c5c86d15cb94 Uploaded
davidvanzessen
parents: 76
diff changeset
234 echo "<a href='sequence_overview/index.html'>Sequence Overview</a><br />" >> $output
81
a778156dad3d Uploaded
davidvanzessen
parents: 80
diff changeset
235 echo "<a href='base_overview.html'>Base overview</a><br />" >> $output
95
a66eb1c5374c Uploaded
davidvanzessen
parents: 94
diff changeset
236 echo "<a href='baseline.pdf'>Baseline PDF</a><br />" >> $output
a66eb1c5374c Uploaded
davidvanzessen
parents: 94
diff changeset
237 echo "<a href='baseline.txt'>Baseline Table</a><br />" >> $output
99
86206431cbb0 Uploaded
davidvanzessen
parents: 98
diff changeset
238 echo "<a href='baseline_ca.pdf'>Baseline ca PDF</a><br />" >> $output
86206431cbb0 Uploaded
davidvanzessen
parents: 98
diff changeset
239 echo "<a href='baseline_ca.txt'>Baseline ca Table</a><br />" >> $output
86206431cbb0 Uploaded
davidvanzessen
parents: 98
diff changeset
240 echo "<a href='baseline_cg.pdf'>Baseline cg PDF</a><br />" >> $output
86206431cbb0 Uploaded
davidvanzessen
parents: 98
diff changeset
241 echo "<a href='baseline_cg.txt'>Baseline cg Table</a><br />" >> $output
86206431cbb0 Uploaded
davidvanzessen
parents: 98
diff changeset
242 echo "<a href='baseline_cm.pdf'>Baseline cm PDF</a><br />" >> $output
86206431cbb0 Uploaded
davidvanzessen
parents: 98
diff changeset
243 echo "<a href='baseline_cm.txt'>Baseline cm Table</a><br />" >> $output
95
a66eb1c5374c Uploaded
davidvanzessen
parents: 94
diff changeset
244 echo "<a href='IgAT.zip'>IgAT zip</a><br />" >> $output
99
86206431cbb0 Uploaded
davidvanzessen
parents: 98
diff changeset
245 echo "<a href='IgAT_ca.zip'>IgAT ca zip</a><br />" >> $output
86206431cbb0 Uploaded
davidvanzessen
parents: 98
diff changeset
246 echo "<a href='IgAT_cg.zip'>IgAT cg zip</a><br />" >> $output
86206431cbb0 Uploaded
davidvanzessen
parents: 98
diff changeset
247 echo "<a href='IgAT_cm.zip'>IgAT cm zip</a><br />" >> $output
86206431cbb0 Uploaded
davidvanzessen
parents: 98
diff changeset
248 echo "<a href='new_IMGT.txz'>Filtered IMGT zip</a><br />" >> $output
86206431cbb0 Uploaded
davidvanzessen
parents: 98
diff changeset
249 echo "<a href='new_IMGT_ca.txz'>Filtered ca IMGT zip</a><br />" >> $output
86206431cbb0 Uploaded
davidvanzessen
parents: 98
diff changeset
250 echo "<a href='new_IMGT_cg.txz'>Filtered cg IMGT zip</a><br />" >> $output
86206431cbb0 Uploaded
davidvanzessen
parents: 98
diff changeset
251 echo "<a href='new_IMGT_cm.txz'>Filtered cm IMGT zip</a><br />" >> $output
86206431cbb0 Uploaded
davidvanzessen
parents: 98
diff changeset
252
2
2f4298673519 Uploaded
davidvanzessen
parents: 1
diff changeset
253
55
0d5add1a9800 Uploaded
davidvanzessen
parents: 54
diff changeset
254 echo "---------------- images ----------------"
102
e6bc976760d4 Uploaded
davidvanzessen
parents: 101
diff changeset
255 echo "---------------- images ----------------<br />" >> $log
55
0d5add1a9800 Uploaded
davidvanzessen
parents: 54
diff changeset
256
4
069419cccba4 Uploaded
davidvanzessen
parents: 3
diff changeset
257 echo "<img src='all.png'/><br />" >> $output
26
2433a1e110e1 Uploaded
davidvanzessen
parents: 25
diff changeset
258 echo "<a href='all.txt'>download data</a><br />" >> $output
4
069419cccba4 Uploaded
davidvanzessen
parents: 3
diff changeset
259 if [ -e "$outdir/ca.png" ] #-e is the unambiguous existence test (-a doubles as the AND operator); quoted so a path with spaces stays one word
069419cccba4 Uploaded
davidvanzessen
parents: 3
diff changeset
260 then
069419cccba4 Uploaded
davidvanzessen
parents: 3
diff changeset
261 echo "<img src='ca.png'/><br />" >> $output
26
2433a1e110e1 Uploaded
davidvanzessen
parents: 25
diff changeset
262 echo "<a href='ca.txt'>download data</a><br />" >> $output
4
069419cccba4 Uploaded
davidvanzessen
parents: 3
diff changeset
263 fi
069419cccba4 Uploaded
davidvanzessen
parents: 3
diff changeset
264 if [ -e "$outdir/cg.png" ] #-e is the unambiguous existence test (-a doubles as the AND operator); quoted so a path with spaces stays one word
069419cccba4 Uploaded
davidvanzessen
parents: 3
diff changeset
265 then
069419cccba4 Uploaded
davidvanzessen
parents: 3
diff changeset
266 echo "<img src='cg.png'/><br />" >> $output
26
2433a1e110e1 Uploaded
davidvanzessen
parents: 25
diff changeset
267 echo "<a href='cg.txt'>download data</a><br />" >> $output
4
069419cccba4 Uploaded
davidvanzessen
parents: 3
diff changeset
268 fi
22
d84c9791d8c4 Uploaded
davidvanzessen
parents: 21
diff changeset
269 if [ -e "$outdir/scatter.png" ] #-e is the unambiguous existence test (-a doubles as the AND operator); quoted so a path with spaces stays one word
d84c9791d8c4 Uploaded
davidvanzessen
parents: 21
diff changeset
270 then
d84c9791d8c4 Uploaded
davidvanzessen
parents: 21
diff changeset
271 echo "<img src='scatter.png'/><br />" >> $output
26
2433a1e110e1 Uploaded
davidvanzessen
parents: 25
diff changeset
272 echo "<a href='scatter.txt'>download data</a><br />" >> $output
2433a1e110e1 Uploaded
davidvanzessen
parents: 25
diff changeset
273 fi
49
5c6b9e99d576 Uploaded
davidvanzessen
parents: 47
diff changeset
274 if [ -e "$outdir/frequency_ranges.png" ] #-e is the unambiguous existence test (-a doubles as the AND operator); quoted so a path with spaces stays one word
5c6b9e99d576 Uploaded
davidvanzessen
parents: 47
diff changeset
275 then
5c6b9e99d576 Uploaded
davidvanzessen
parents: 47
diff changeset
276 echo "<img src='frequency_ranges.png'/><br />" >> $output
5c6b9e99d576 Uploaded
davidvanzessen
parents: 47
diff changeset
277 echo "<a href='frequency_ranges_classes.txt'>download class data</a><br />" >> $output
5c6b9e99d576 Uploaded
davidvanzessen
parents: 47
diff changeset
278 echo "<a href='frequency_ranges_subclasses.txt'>download subclass data</a><br />" >> $output
5c6b9e99d576 Uploaded
davidvanzessen
parents: 47
diff changeset
279 fi
26
2433a1e110e1 Uploaded
davidvanzessen
parents: 25
diff changeset
280 if [ -e "$outdir/aa_histogram.png" ] #-e is the unambiguous existence test (-a doubles as the AND operator); quoted so a path with spaces stays one word
2433a1e110e1 Uploaded
davidvanzessen
parents: 25
diff changeset
281 then
2433a1e110e1 Uploaded
davidvanzessen
parents: 25
diff changeset
282 echo "<img src='aa_histogram.png'/><br />" >> $output
2433a1e110e1 Uploaded
davidvanzessen
parents: 25
diff changeset
283 echo "<a href='aa_histogram.txt'>download data</a><br />" >> $output
104
603a10976e9c Uploaded
davidvanzessen
parents: 102
diff changeset
284 echo "<img src='aa_histogram_ca.png'/><br />" >> $output
603a10976e9c Uploaded
davidvanzessen
parents: 102
diff changeset
285 echo "<a href='aa_histogram_ca.txt'>download data</a><br />" >> $output
603a10976e9c Uploaded
davidvanzessen
parents: 102
diff changeset
286 echo "<img src='aa_histogram_cg.png'/><br />" >> $output
603a10976e9c Uploaded
davidvanzessen
parents: 102
diff changeset
287 echo "<a href='aa_histogram_cg.txt'>download data</a><br />" >> $output
603a10976e9c Uploaded
davidvanzessen
parents: 102
diff changeset
288 echo "<img src='aa_histogram_cm.png'/><br />" >> $output
603a10976e9c Uploaded
davidvanzessen
parents: 102
diff changeset
289 echo "<a href='aa_histogram_cm.txt'>download data</a><br />" >> $output
22
d84c9791d8c4 Uploaded
davidvanzessen
parents: 21
diff changeset
290 fi
#######################################
# Append one HTML transition table to the report page.
# Globals:   output (read) - path of the HTML page being built
# Arguments: $1 - table caption
#            $2 - comma-separated file; each row is written as five cells
#                 (from, a, c, g, t), with any extra fields kept in the
#                 last cell
# Outputs:   appends <table>...</table> markup to $output
# Returns:   non-zero if the input file cannot be read
#######################################
write_transition_table() {
  local caption=$1 csv_file=$2
  local from a c g t
  {
    echo "<table border='1'><caption>$caption</caption>"
    # -r keeps backslashes literal; the extra test keeps a final row that
    # has no trailing newline instead of silently dropping it.
    while IFS=, read -r from a c g t || [[ -n "$from" ]]; do
      echo "<tr><td>$from</td><td>$a</td><td>$c</td><td>$g</td><td>$t</td></tr>"
    done < "$csv_file"
    echo "</table>"
  } >> "$output"
}

# One table per gene, then the table over all genes.
# Assumes genes is a bash array defined earlier in the script.
for gene in "${genes[@]}"; do
  write_transition_table "$gene transition table" "$outdir/transitions_${gene}_sum.txt"
done

write_transition_table "All transition table" "$outdir/transitions_all_sum.txt"

echo "</html>" >> "$output"
echo "---------------- baseline ----------------"
echo "---------------- baseline ----------------<br />" >> "$log"

#######################################
# Run the bundled baseline wrapper for one set of sequences, or write a
# placeholder result when that set has no sequences.
# Globals:   outdir (read), dir (read)
# Arguments: $1 - label: name of the working directory under
#                 $outdir/baseline, also passed on to the baseline wrapper
#            $2 - file suffix: "" for the combined set, otherwise "_<class>";
#                 selects new_IMGT<suffix>/, new_IMGT<suffix>.txz and the
#                 baseline<suffix>.pdf/.txt outputs
# Outputs:   $outdir/baseline<suffix>.txt (and .pdf when the wrapper runs)
# Returns:   non-zero if the working directory cannot be created or entered,
#            or if the baseline wrapper fails
#######################################
run_baseline() {
  local label=$1 suffix=$2
  local workdir="$outdir/baseline/$label"
  local summary="$outdir/new_IMGT${suffix}/1_Summary.txt"
  local report="$outdir/baseline${suffix}.txt"
  local empty_note="No sequences"
  if [[ -n "$suffix" ]]; then
    empty_note="No $label sequences"
  fi

  mkdir "$workdir"
  # More than one line in the summary means there is more than a single
  # (presumably header) line, i.e. there is data to analyse.
  if [[ $(wc -l < "$summary") -gt 1 ]]; then
    # The wrapper is run from inside its working directory. A subshell keeps
    # that directory change from leaking into the rest of this script, so
    # there is nothing to restore afterwards.
    (
      cd "$workdir" || exit 1
      bash "$dir/tmp/baseline/wrapper.sh" 1 1 1 1 0 0 "25:26:38:55:65:104:-" \
        "$outdir/new_IMGT${suffix}.txz" "$label" \
        "$dir/tmp/baseline/IMGT-reference-seqs-IGHV-2015-11-05.fa" \
        "$outdir/baseline${suffix}.pdf" "Sequence.ID" "$report"
    )
  else
    echo "$empty_note" > "$report"
  fi
}

mkdir "$outdir/baseline"

run_baseline "ca_cg_cm" ""
run_baseline "ca" "_ca"
run_baseline "cg" "_cg"
run_baseline "cm" "_cm"
echo "---------------- naive_output.r ----------------"
echo "---------------- naive_output.r ----------------<br />" >> "$log"

# Build the loader output from the summary/aa/junction files in the current
# directory, then let naive_output.r produce the per-class output files.
# NOTE(review): the parameter list at the top of this script assigns
# naive_output_ca/_cg/_cm but no plain naive_output. If it is not set
# elsewhere, this comparison is always true and the section always runs.
# Confirm which variable was intended.
if [[ "$naive_output" != "None" ]]; then
  echo "---------------- imgt_loader.r ----------------"
  echo "---------------- imgt_loader.r ----------------<br />" >> "$log"
  #python $dir/imgt_loader.py --summ $PWD/summary.txt --aa $PWD/aa.txt --junction $PWD/junction.txt --output $naive_output
  Rscript --verbose "$dir/imgt_loader.r" "$PWD/summary.txt" "$PWD/aa.txt" \
    "$PWD/junction.txt" "$outdir/loader_output.txt" 2>&1

  echo "---------------- naive_output.r ----------------"
  echo "---------------- naive_output.r ----------------<br />" >> "$log"
  Rscript "$dir/naive_output.r" "$outdir/loader_output.txt" "$outdir/merged.txt" \
    "${naive_output_ca}" "${naive_output_cg}" "${naive_output_cm}" \
    "$outdir/ntoverview.txt" "$outdir/ntsum.txt" 2>&1
fi
# Close the table in the base overview page (presumably opened earlier in
# the script; the opening tag is not in this part of the file).
echo "</table>" >> "$outdir/base_overview.html"

# Swap the outputs: the progress log written so far moves into the output
# directory as log.html, and the generated index page takes its place at the
# $log location, so $log ends up being the main HTML page.
mv -- "$log" "$outdir/log.html"

cp -- "$outdir/index.html" "$log"

echo "---------------- Done! ----------------"
# $log now holds the index page, so the final marker goes to the moved log.
echo "---------------- Done! ----------------<br />" >> "$outdir/log.html"