annotate wrapper.sh @ 105:e4957ad476a2 draft

Uploaded
author davidvanzessen
date Thu, 23 Jun 2016 03:58:03 -0400
parents 603a10976e9c
children 01c9993865af
Ignore whitespace changes - Everywhere: Within whitespace: At end of lines:
rev   line source
0
74d2bc479bee Uploaded
davidvanzessen
parents:
diff changeset
1 #!/bin/bash
4
069419cccba4 Uploaded
davidvanzessen
parents: 3
diff changeset
2 set -e
0
74d2bc479bee Uploaded
davidvanzessen
parents:
diff changeset
3 dir="$(cd "$(dirname "$0")" && pwd)"
74d2bc479bee Uploaded
davidvanzessen
parents:
diff changeset
4 input=$1
19
c518cf0d4adb Uploaded
davidvanzessen
parents: 16
diff changeset
5 method=$2
102
e6bc976760d4 Uploaded
davidvanzessen
parents: 101
diff changeset
6 log=$3 #becomes the main html page at the end
19
c518cf0d4adb Uploaded
davidvanzessen
parents: 16
diff changeset
7 outdir=$4
102
e6bc976760d4 Uploaded
davidvanzessen
parents: 101
diff changeset
8 output="$outdir/index.html" #copied to $log location at the end
19
c518cf0d4adb Uploaded
davidvanzessen
parents: 16
diff changeset
9 title=$5
22
d84c9791d8c4 Uploaded
davidvanzessen
parents: 21
diff changeset
10 include_fr1=$6
34
d436daae9d68 Uploaded
davidvanzessen
parents: 32
diff changeset
11 functionality=$7
d436daae9d68 Uploaded
davidvanzessen
parents: 32
diff changeset
12 unique=$8
69
7acdcd5c52ef Uploaded
davidvanzessen
parents: 66
diff changeset
13 naive_output_ca=$9
7acdcd5c52ef Uploaded
davidvanzessen
parents: 66
diff changeset
14 naive_output_cg=${10}
7acdcd5c52ef Uploaded
davidvanzessen
parents: 66
diff changeset
15 naive_output_cm=${11}
7acdcd5c52ef Uploaded
davidvanzessen
parents: 66
diff changeset
16 filter_unique=${12}
7acdcd5c52ef Uploaded
davidvanzessen
parents: 66
diff changeset
17 class_filter=${13}
0
74d2bc479bee Uploaded
davidvanzessen
parents:
diff changeset
18 mkdir $outdir
74d2bc479bee Uploaded
davidvanzessen
parents:
diff changeset
19
55
0d5add1a9800 Uploaded
davidvanzessen
parents: 54
diff changeset
20 echo "---------------- read parameters ----------------"
102
e6bc976760d4 Uploaded
davidvanzessen
parents: 101
diff changeset
21 echo "---------------- read parameters ----------------<br />" > $log
55
0d5add1a9800 Uploaded
davidvanzessen
parents: 54
diff changeset
22
0d5add1a9800 Uploaded
davidvanzessen
parents: 54
diff changeset
23 echo "unpacking IMGT file"
0d5add1a9800 Uploaded
davidvanzessen
parents: 54
diff changeset
24
89
480fdd383fdb Uploaded
davidvanzessen
parents: 85
diff changeset
25
480fdd383fdb Uploaded
davidvanzessen
parents: 85
diff changeset
26
35
8dba36531e6e Uploaded
davidvanzessen
parents: 34
diff changeset
27 type="`file $input`"
8dba36531e6e Uploaded
davidvanzessen
parents: 34
diff changeset
28 if [[ "$type" == *"Zip archive"* ]] ; then
8dba36531e6e Uploaded
davidvanzessen
parents: 34
diff changeset
29 echo "Zip archive"
8dba36531e6e Uploaded
davidvanzessen
parents: 34
diff changeset
30 echo "unzip $input -d $PWD/files/"
8dba36531e6e Uploaded
davidvanzessen
parents: 34
diff changeset
31 unzip $input -d $PWD/files/
8dba36531e6e Uploaded
davidvanzessen
parents: 34
diff changeset
32 elif [[ "$type" == *"XZ compressed data"* ]] ; then
8dba36531e6e Uploaded
davidvanzessen
parents: 34
diff changeset
33 echo "ZX archive"
8dba36531e6e Uploaded
davidvanzessen
parents: 34
diff changeset
34 echo "tar -xJf $input -C $PWD/files/"
8dba36531e6e Uploaded
davidvanzessen
parents: 34
diff changeset
35 mkdir -p $PWD/files/$title
8dba36531e6e Uploaded
davidvanzessen
parents: 34
diff changeset
36 tar -xJf $input -C $PWD/files/$title
8dba36531e6e Uploaded
davidvanzessen
parents: 34
diff changeset
37 fi
8dba36531e6e Uploaded
davidvanzessen
parents: 34
diff changeset
38
64
0fdd90f7c654 Uploaded
davidvanzessen
parents: 63
diff changeset
39 cat `find $PWD/files/ -name "1_*"` > $PWD/summary.txt
0fdd90f7c654 Uploaded
davidvanzessen
parents: 63
diff changeset
40 cat `find $PWD/files/ -name "3_*"` > $PWD/sequences.txt
0fdd90f7c654 Uploaded
davidvanzessen
parents: 63
diff changeset
41 cat `find $PWD/files/ -name "5_*"` > $PWD/aa.txt
0fdd90f7c654 Uploaded
davidvanzessen
parents: 63
diff changeset
42 cat `find $PWD/files/ -name "6_*"` > $PWD/junction.txt
0fdd90f7c654 Uploaded
davidvanzessen
parents: 63
diff changeset
43 cat `find $PWD/files/ -name "7_*"` > $PWD/mutationanalysis.txt
0fdd90f7c654 Uploaded
davidvanzessen
parents: 63
diff changeset
44 cat `find $PWD/files/ -name "8_*"` > $PWD/mutationstats.txt
0fdd90f7c654 Uploaded
davidvanzessen
parents: 63
diff changeset
45 cat `find $PWD/files/ -name "10_*"` > $PWD/hotspots.txt
0fdd90f7c654 Uploaded
davidvanzessen
parents: 63
diff changeset
46
0fdd90f7c654 Uploaded
davidvanzessen
parents: 63
diff changeset
47 #cat $PWD/files/*/1_* > $PWD/summary.txt
0fdd90f7c654 Uploaded
davidvanzessen
parents: 63
diff changeset
48 #cat $PWD/files/*/3_* > $PWD/sequences.txt
0fdd90f7c654 Uploaded
davidvanzessen
parents: 63
diff changeset
49 #cat $PWD/files/*/5_* > $PWD/aa.txt
0fdd90f7c654 Uploaded
davidvanzessen
parents: 63
diff changeset
50 #cat $PWD/files/*/6_* > $PWD/junction.txt
0fdd90f7c654 Uploaded
davidvanzessen
parents: 63
diff changeset
51 #cat $PWD/files/*/7_* > $PWD/mutationanalysis.txt
0fdd90f7c654 Uploaded
davidvanzessen
parents: 63
diff changeset
52 #cat $PWD/files/*/8_* > $PWD/mutationstats.txt
0fdd90f7c654 Uploaded
davidvanzessen
parents: 63
diff changeset
53 #cat $PWD/files/*/10_* > $PWD/hotspots.txt
3
a0b27058dcac Uploaded
davidvanzessen
parents: 2
diff changeset
54
26
2433a1e110e1 Uploaded
davidvanzessen
parents: 25
diff changeset
55 #BLASTN_DIR="/home/galaxy/tmp/blast/ncbi-blast-2.2.30+/bin"
19
c518cf0d4adb Uploaded
davidvanzessen
parents: 16
diff changeset
56
c518cf0d4adb Uploaded
davidvanzessen
parents: 16
diff changeset
57 echo "${BLASTN_DIR}"
c518cf0d4adb Uploaded
davidvanzessen
parents: 16
diff changeset
58
89
480fdd383fdb Uploaded
davidvanzessen
parents: 85
diff changeset
59 echo "---------------- identification ($method) ----------------"
102
e6bc976760d4 Uploaded
davidvanzessen
parents: 101
diff changeset
60 echo "---------------- identification ($method) ----------------<br />" >> $log
55
0d5add1a9800 Uploaded
davidvanzessen
parents: 54
diff changeset
61
19
c518cf0d4adb Uploaded
davidvanzessen
parents: 16
diff changeset
62 if [[ "${method}" == "custom" ]] ; then
c518cf0d4adb Uploaded
davidvanzessen
parents: 16
diff changeset
63 python $dir/gene_identification.py --input $PWD/summary.txt --output $outdir/identified_genes.txt
c518cf0d4adb Uploaded
davidvanzessen
parents: 16
diff changeset
64 else
c518cf0d4adb Uploaded
davidvanzessen
parents: 16
diff changeset
65 ID_index=$(cat $PWD/summary.txt | grep -o -P ".+Sequence ID" | grep -o -P "\t" | wc -l)
c518cf0d4adb Uploaded
davidvanzessen
parents: 16
diff changeset
66 ID_index=$((ID_index+1))
c518cf0d4adb Uploaded
davidvanzessen
parents: 16
diff changeset
67 sequence_index=$(cat $PWD/summary.txt | grep -o -P ".+\tSequence" | grep -o -P "\t" | wc -l)
c518cf0d4adb Uploaded
davidvanzessen
parents: 16
diff changeset
68 sequence_index=$((sequence_index+1))
c518cf0d4adb Uploaded
davidvanzessen
parents: 16
diff changeset
69
c518cf0d4adb Uploaded
davidvanzessen
parents: 16
diff changeset
70 cat $PWD/summary.txt | tail -n+2 | cut -f ${ID_index},${sequence_index} | awk '{print ">" $1 "\n" $2}' > $PWD/sequences.fasta
c518cf0d4adb Uploaded
davidvanzessen
parents: 16
diff changeset
71
c518cf0d4adb Uploaded
davidvanzessen
parents: 16
diff changeset
72 echo -e "qseqid\tsseqid\tpident\tlength\tmismatch\tgapopen\tqstart\tqend\tsstart\tsend\tevalue\tbitscore" > $outdir/identified_genes.txt
c518cf0d4adb Uploaded
davidvanzessen
parents: 16
diff changeset
73 ${BLASTN_DIR}/blastn -task blastn -db $dir/subclass_definition.db -query $PWD/sequences.fasta -outfmt 6 >> $outdir/identified_genes.txt
c518cf0d4adb Uploaded
davidvanzessen
parents: 16
diff changeset
74 fi
c518cf0d4adb Uploaded
davidvanzessen
parents: 16
diff changeset
75
55
0d5add1a9800 Uploaded
davidvanzessen
parents: 54
diff changeset
76 echo "---------------- merge_and_filter.r ----------------"
102
e6bc976760d4 Uploaded
davidvanzessen
parents: 101
diff changeset
77 echo "---------------- merge_and_filter.r ----------------<br />" >> $log
19
c518cf0d4adb Uploaded
davidvanzessen
parents: 16
diff changeset
78
90
f0e8dac22c6e Uploaded
davidvanzessen
parents: 89
diff changeset
79 Rscript $dir/merge_and_filter.r $PWD/summary.txt $PWD/sequences.txt $PWD/mutationanalysis.txt $PWD/mutationstats.txt $PWD/hotspots.txt $outdir/identified_genes.txt $outdir/merged.txt $outdir/before_unique_filter.txt $outdir/unmatched.txt $method $functionality $unique ${filter_unique} ${class_filter} 2>&1
0
74d2bc479bee Uploaded
davidvanzessen
parents:
diff changeset
80
98
5ffbf40cdd4b Uploaded
davidvanzessen
parents: 95
diff changeset
81 echo "---------------- creating new IMGT zip ----------------"
102
e6bc976760d4 Uploaded
davidvanzessen
parents: 101
diff changeset
82 echo "---------------- creating new IMGT zip ----------------<br />" >> $log
95
a66eb1c5374c Uploaded
davidvanzessen
parents: 94
diff changeset
83
a66eb1c5374c Uploaded
davidvanzessen
parents: 94
diff changeset
84 mkdir $outdir/new_IMGT
a66eb1c5374c Uploaded
davidvanzessen
parents: 94
diff changeset
85
a66eb1c5374c Uploaded
davidvanzessen
parents: 94
diff changeset
86 cat `find $PWD/files/ -name "1_*"` > "$outdir/new_IMGT/1_Summary.txt"
a66eb1c5374c Uploaded
davidvanzessen
parents: 94
diff changeset
87 cat `find $PWD/files/ -name "2_*"` > "$outdir/new_IMGT/2_IMGT-gapped-nt-sequences.txt"
a66eb1c5374c Uploaded
davidvanzessen
parents: 94
diff changeset
88 cat `find $PWD/files/ -name "3_*"` > "$outdir/new_IMGT/3_Nt-sequences.txt"
a66eb1c5374c Uploaded
davidvanzessen
parents: 94
diff changeset
89 cat `find $PWD/files/ -name "4_*"` > "$outdir/new_IMGT/4_IMGT-gapped-AA-sequences.txt"
a66eb1c5374c Uploaded
davidvanzessen
parents: 94
diff changeset
90 cat `find $PWD/files/ -name "5_*"` > "$outdir/new_IMGT/5_AA-sequences.txt"
a66eb1c5374c Uploaded
davidvanzessen
parents: 94
diff changeset
91 cat `find $PWD/files/ -name "6_*"` > "$outdir/new_IMGT/6_Junction.txt"
a66eb1c5374c Uploaded
davidvanzessen
parents: 94
diff changeset
92 cat `find $PWD/files/ -name "7_*"` > "$outdir/new_IMGT/7_V-REGION-mutation-and-AA-change-table.txt"
a66eb1c5374c Uploaded
davidvanzessen
parents: 94
diff changeset
93 cat `find $PWD/files/ -name "8_*"` > "$outdir/new_IMGT/8_V-REGION-nt-mutation-statistics.txt"
a66eb1c5374c Uploaded
davidvanzessen
parents: 94
diff changeset
94 cat `find $PWD/files/ -name "9_*"` > "$outdir/new_IMGT/9_V-REGION-AA-change-statistics.txt"
a66eb1c5374c Uploaded
davidvanzessen
parents: 94
diff changeset
95 cat `find $PWD/files/ -name "10_*"` > "$outdir/new_IMGT/10_V-REGION-mutation-hotspots.txt"
a66eb1c5374c Uploaded
davidvanzessen
parents: 94
diff changeset
96
99
86206431cbb0 Uploaded
davidvanzessen
parents: 98
diff changeset
97 mkdir $outdir/new_IMGT_ca
86206431cbb0 Uploaded
davidvanzessen
parents: 98
diff changeset
98 cp $outdir/new_IMGT/* $outdir/new_IMGT_ca
86206431cbb0 Uploaded
davidvanzessen
parents: 98
diff changeset
99
86206431cbb0 Uploaded
davidvanzessen
parents: 98
diff changeset
100 mkdir $outdir/new_IMGT_cg
86206431cbb0 Uploaded
davidvanzessen
parents: 98
diff changeset
101 cp $outdir/new_IMGT/* $outdir/new_IMGT_cg
86206431cbb0 Uploaded
davidvanzessen
parents: 98
diff changeset
102
86206431cbb0 Uploaded
davidvanzessen
parents: 98
diff changeset
103 mkdir $outdir/new_IMGT_cm
86206431cbb0 Uploaded
davidvanzessen
parents: 98
diff changeset
104 cp $outdir/new_IMGT/* $outdir/new_IMGT_cm
86206431cbb0 Uploaded
davidvanzessen
parents: 98
diff changeset
105
86206431cbb0 Uploaded
davidvanzessen
parents: 98
diff changeset
106 Rscript $dir/tmp/igat.r $outdir/new_IMGT/ $outdir/merged.txt "-" 2>&1
101
3cffb8a38bb1 Uploaded
davidvanzessen
parents: 100
diff changeset
107 Rscript $dir/tmp/igat.r $outdir/new_IMGT_ca/ $outdir/merged.txt "ca" 2>&1
3cffb8a38bb1 Uploaded
davidvanzessen
parents: 100
diff changeset
108 Rscript $dir/tmp/igat.r $outdir/new_IMGT_cg/ $outdir/merged.txt "cg" 2>&1
3cffb8a38bb1 Uploaded
davidvanzessen
parents: 100
diff changeset
109 Rscript $dir/tmp/igat.r $outdir/new_IMGT_cm/ $outdir/merged.txt "cm" 2>&1
95
a66eb1c5374c Uploaded
davidvanzessen
parents: 94
diff changeset
110
a66eb1c5374c Uploaded
davidvanzessen
parents: 94
diff changeset
111
a66eb1c5374c Uploaded
davidvanzessen
parents: 94
diff changeset
112 tmp="$PWD"
a66eb1c5374c Uploaded
davidvanzessen
parents: 94
diff changeset
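113 cd $outdir/new_IMGT/ #tar weirdness: archive from inside the dir so members are stored as bare file names (presumably the reason for the cd)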
a66eb1c5374c Uploaded
davidvanzessen
parents: 94
diff changeset
114 tar -cJf ../new_IMGT.txz *
a66eb1c5374c Uploaded
davidvanzessen
parents: 94
diff changeset
115 cp $dir/tmp/IgAT.xlsm $outdir/new_IMGT/IgAT.xlsm
a66eb1c5374c Uploaded
davidvanzessen
parents: 94
diff changeset
116 zip -r ../IgAT.zip *
a66eb1c5374c Uploaded
davidvanzessen
parents: 94
diff changeset
117
99
86206431cbb0 Uploaded
davidvanzessen
parents: 98
diff changeset
118 cd $outdir/new_IMGT_ca/
86206431cbb0 Uploaded
davidvanzessen
parents: 98
diff changeset
119 tar -cJf ../new_IMGT_ca.txz *
86206431cbb0 Uploaded
davidvanzessen
parents: 98
diff changeset
120 cp $dir/tmp/IgAT.xlsm $outdir/new_IMGT_ca/IgAT.xlsm
86206431cbb0 Uploaded
davidvanzessen
parents: 98
diff changeset
121 zip -r ../IgAT_ca.zip *
86206431cbb0 Uploaded
davidvanzessen
parents: 98
diff changeset
122
86206431cbb0 Uploaded
davidvanzessen
parents: 98
diff changeset
123 cd $outdir/new_IMGT_cg/
86206431cbb0 Uploaded
davidvanzessen
parents: 98
diff changeset
124 tar -cJf ../new_IMGT_cg.txz *
86206431cbb0 Uploaded
davidvanzessen
parents: 98
diff changeset
125 cp $dir/tmp/IgAT.xlsm $outdir/new_IMGT_cg/IgAT.xlsm
86206431cbb0 Uploaded
davidvanzessen
parents: 98
diff changeset
126 zip -r ../IgAT_cg.zip *
86206431cbb0 Uploaded
davidvanzessen
parents: 98
diff changeset
127
86206431cbb0 Uploaded
davidvanzessen
parents: 98
diff changeset
128 cd $outdir/new_IMGT_cm/
86206431cbb0 Uploaded
davidvanzessen
parents: 98
diff changeset
129 tar -cJf ../new_IMGT_cm.txz *
86206431cbb0 Uploaded
davidvanzessen
parents: 98
diff changeset
130 cp $dir/tmp/IgAT.xlsm $outdir/new_IMGT_cm/IgAT.xlsm
86206431cbb0 Uploaded
davidvanzessen
parents: 98
diff changeset
131 zip -r ../IgAT_cm.zip *
86206431cbb0 Uploaded
davidvanzessen
parents: 98
diff changeset
132
95
a66eb1c5374c Uploaded
davidvanzessen
parents: 94
diff changeset
133 cd $tmp
a66eb1c5374c Uploaded
davidvanzessen
parents: 94
diff changeset
134
55
0d5add1a9800 Uploaded
davidvanzessen
parents: 54
diff changeset
135 echo "---------------- mutation_analysis.r ----------------"
102
e6bc976760d4 Uploaded
davidvanzessen
parents: 101
diff changeset
136 echo "---------------- mutation_analysis.r ----------------<br />" >> $log
55
0d5add1a9800 Uploaded
davidvanzessen
parents: 54
diff changeset
137
82
564c4f6da203 Uploaded
davidvanzessen
parents: 81
diff changeset
138 classes="ca,ca1,ca2,cg,cg1,cg2,cg3,cg4,cm,unmatched"
4
069419cccba4 Uploaded
davidvanzessen
parents: 3
diff changeset
139 echo "R mutation analysis"
82
564c4f6da203 Uploaded
davidvanzessen
parents: 81
diff changeset
140 Rscript $dir/mutation_analysis.r $outdir/merged.txt $classes $outdir ${include_fr1} 2>&1
53
7290a88ea202 Uploaded
davidvanzessen
parents: 52
diff changeset
141
55
0d5add1a9800 Uploaded
davidvanzessen
parents: 54
diff changeset
142
0d5add1a9800 Uploaded
davidvanzessen
parents: 54
diff changeset
143 echo "---------------- mutation_analysis.py ----------------"
102
e6bc976760d4 Uploaded
davidvanzessen
parents: 101
diff changeset
144 echo "---------------- mutation_analysis.py ----------------<br />" >> $log
55
0d5add1a9800 Uploaded
davidvanzessen
parents: 54
diff changeset
145
82
564c4f6da203 Uploaded
davidvanzessen
parents: 81
diff changeset
146 python $dir/mutation_analysis.py --input $outdir/merged.txt --genes $classes --includefr1 "${include_fr1}" --output $outdir/hotspot_analysis.txt
55
0d5add1a9800 Uploaded
davidvanzessen
parents: 54
diff changeset
147
0d5add1a9800 Uploaded
davidvanzessen
parents: 54
diff changeset
148 echo "---------------- aa_histogram.r ----------------"
105
e4957ad476a2 Uploaded
davidvanzessen
parents: 104
diff changeset
149 echo "---------------- aa_histogram.r ----------------<br />" >> $log
55
0d5add1a9800 Uploaded
davidvanzessen
parents: 54
diff changeset
150
104
603a10976e9c Uploaded
davidvanzessen
parents: 102
diff changeset
151 Rscript $dir/aa_histogram.r $outdir/aa_mutations.txt $outdir/aa_histogram.png "" 2>&1
105
e4957ad476a2 Uploaded
davidvanzessen
parents: 104
diff changeset
152
e4957ad476a2 Uploaded
davidvanzessen
parents: 104
diff changeset
153 echo "---------------- aa_histogram.r ca ----------------"
e4957ad476a2 Uploaded
davidvanzessen
parents: 104
diff changeset
154 echo "---------------- aa_histogram.r ca ----------------<br />" >> $log
e4957ad476a2 Uploaded
davidvanzessen
parents: 104
diff changeset
155
104
603a10976e9c Uploaded
davidvanzessen
parents: 102
diff changeset
156 Rscript $dir/aa_histogram.r $outdir/aa_mutations_ca.txt $outdir/aa_histogram_ca.png "ca" 2>&1
105
e4957ad476a2 Uploaded
davidvanzessen
parents: 104
diff changeset
157
e4957ad476a2 Uploaded
davidvanzessen
parents: 104
diff changeset
158 echo "---------------- aa_histogram.r cg ----------------"
e4957ad476a2 Uploaded
davidvanzessen
parents: 104
diff changeset
159 echo "---------------- aa_histogram.r cg ----------------<br />" >> $log
e4957ad476a2 Uploaded
davidvanzessen
parents: 104
diff changeset
160
104
603a10976e9c Uploaded
davidvanzessen
parents: 102
diff changeset
161 Rscript $dir/aa_histogram.r $outdir/aa_mutations_cg.txt $outdir/aa_histogram_cg.png "cg" 2>&1
105
e4957ad476a2 Uploaded
davidvanzessen
parents: 104
diff changeset
162
e4957ad476a2 Uploaded
davidvanzessen
parents: 104
diff changeset
163 echo "---------------- aa_histogram.r cm ----------------"
e4957ad476a2 Uploaded
davidvanzessen
parents: 104
diff changeset
164 echo "---------------- aa_histogram.r cm ----------------<br />" >> $log
e4957ad476a2 Uploaded
davidvanzessen
parents: 104
diff changeset
165
104
603a10976e9c Uploaded
davidvanzessen
parents: 102
diff changeset
166 Rscript $dir/aa_histogram.r $outdir/aa_mutations_cm.txt $outdir/aa_histogram_cm.png "cm" 2>&1
4
069419cccba4 Uploaded
davidvanzessen
parents: 3
diff changeset
167
0
74d2bc479bee Uploaded
davidvanzessen
parents:
diff changeset
168 genes=(ca ca1 ca2 cg cg1 cg2 cg3 cg4 cm)
74d2bc479bee Uploaded
davidvanzessen
parents:
diff changeset
169
53
7290a88ea202 Uploaded
davidvanzessen
parents: 52
diff changeset
170 funcs=(sum mean median)
0
74d2bc479bee Uploaded
davidvanzessen
parents:
diff changeset
171
82
564c4f6da203 Uploaded
davidvanzessen
parents: 81
diff changeset
172 echo "---------------- sequence_overview.r ----------------"
102
e6bc976760d4 Uploaded
davidvanzessen
parents: 101
diff changeset
173 echo "---------------- sequence_overview.r ----------------<br />" >> $log
82
564c4f6da203 Uploaded
davidvanzessen
parents: 81
diff changeset
174
564c4f6da203 Uploaded
davidvanzessen
parents: 81
diff changeset
175 mkdir $outdir/sequence_overview
564c4f6da203 Uploaded
davidvanzessen
parents: 81
diff changeset
176
90
f0e8dac22c6e Uploaded
davidvanzessen
parents: 89
diff changeset
177 #Rscript $dir/sequence_overview.r $outdir/identified_genes.txt $PWD/sequences.txt $outdir/merged.txt $outdir/sequence_overview $classes $outdir/hotspot_analysis_sum.txt 2>&1
100
ff5be711382b Uploaded
davidvanzessen
parents: 99
diff changeset
178 Rscript $dir/sequence_overview.r $outdir/before_unique_filter.txt $outdir/merged.txt $outdir/sequence_overview $classes $outdir/hotspot_analysis_sum.txt 2>&1
82
564c4f6da203 Uploaded
davidvanzessen
parents: 81
diff changeset
179
564c4f6da203 Uploaded
davidvanzessen
parents: 81
diff changeset
180 echo "<table border='1'>" > $outdir/base_overview.html
564c4f6da203 Uploaded
davidvanzessen
parents: 81
diff changeset
181
92
b869a126e2c4 Uploaded
davidvanzessen
parents: 90
diff changeset
182 while IFS=$'\t' read ID class seq A C G T
82
564c4f6da203 Uploaded
davidvanzessen
parents: 81
diff changeset
183 do
85
07f7da724a77 Uploaded
davidvanzessen
parents: 84
diff changeset
184 echo "<tr><td>$ID</td><td>$seq</td><td>$class</td><td>$A</td><td>$C</td><td>$G</td><td>$T</td></tr>" >> $outdir/base_overview.html
82
564c4f6da203 Uploaded
davidvanzessen
parents: 81
diff changeset
185 done < $outdir/sequence_overview/ntoverview.txt
564c4f6da203 Uploaded
davidvanzessen
parents: 81
diff changeset
186
62
4262e880472d Uploaded
davidvanzessen
parents: 58
diff changeset
187 echo "<html><center><h1>$title</h1></center>" > $output
4262e880472d Uploaded
davidvanzessen
parents: 58
diff changeset
188
4262e880472d Uploaded
davidvanzessen
parents: 58
diff changeset
189 #display the matched/unmatched counts for clarity
4262e880472d Uploaded
davidvanzessen
parents: 58
diff changeset
190
98
5ffbf40cdd4b Uploaded
davidvanzessen
parents: 95
diff changeset
191 matched_count="`cat $outdir/merged.txt | grep -v 'unmatched' | tail -n +2 | wc -l`"
62
4262e880472d Uploaded
davidvanzessen
parents: 58
diff changeset
192 unmatched_count="`cat $outdir/unmatched.txt | tail -n +2 | wc -l`"
4262e880472d Uploaded
davidvanzessen
parents: 58
diff changeset
193 total_count=$((matched_count + unmatched_count))
4262e880472d Uploaded
davidvanzessen
parents: 58
diff changeset
194 perc_count=$((unmatched_count / total_count * 100))
4262e880472d Uploaded
davidvanzessen
parents: 58
diff changeset
195 perc_count=`bc -l <<< "scale=2; ${unmatched_count} / ${total_count} * 100"`
4262e880472d Uploaded
davidvanzessen
parents: 58
diff changeset
196 perc_count=`bc -l <<< "scale=2; (${unmatched_count} / ${total_count} * 100 ) / 1"`
4262e880472d Uploaded
davidvanzessen
parents: 58
diff changeset
197
4262e880472d Uploaded
davidvanzessen
parents: 58
diff changeset
198 echo "<center><h2>Total: ${total_count}</h2></center>" >> $output
4262e880472d Uploaded
davidvanzessen
parents: 58
diff changeset
199 echo "<center><h2>Matched: ${matched_count} Unmatched: ${unmatched_count}</h2></center>" >> $output
4262e880472d Uploaded
davidvanzessen
parents: 58
diff changeset
200 echo "<center><h2>Percentage unmatched: ${perc_count}</h2></center>" >> $output
4262e880472d Uploaded
davidvanzessen
parents: 58
diff changeset
201
55
0d5add1a9800 Uploaded
davidvanzessen
parents: 54
diff changeset
202 echo "---------------- main tables ----------------"
102
e6bc976760d4 Uploaded
davidvanzessen
parents: 101
diff changeset
203 echo "---------------- main tables ----------------<br />" >> $log
53
7290a88ea202 Uploaded
davidvanzessen
parents: 52
diff changeset
204 for func in ${funcs[@]}
4
069419cccba4 Uploaded
davidvanzessen
parents: 3
diff changeset
205 do
55
0d5add1a9800 Uploaded
davidvanzessen
parents: 54
diff changeset
206
0d5add1a9800 Uploaded
davidvanzessen
parents: 54
diff changeset
207 echo "---------------- $func table ----------------"
102
e6bc976760d4 Uploaded
davidvanzessen
parents: 101
diff changeset
208 echo "---------------- $func table ----------------<br />" >> $log
55
0d5add1a9800 Uploaded
davidvanzessen
parents: 54
diff changeset
209
94
e39176ccddc8 Uploaded
davidvanzessen
parents: 92
diff changeset
210 cat $outdir/mutations_${func}.txt $outdir/hotspot_analysis_${func}.txt > $outdir/data_${func}.txt
53
7290a88ea202 Uploaded
davidvanzessen
parents: 52
diff changeset
211
98
5ffbf40cdd4b Uploaded
davidvanzessen
parents: 95
diff changeset
212 echo "<table border='1' width='100%'><caption><h3><a href='data_${func}.txt'>${func} table</a></h3></caption>" >> $output
58
8bb4d6009e08 Uploaded
davidvanzessen
parents: 55
diff changeset
213 echo "<tr><th>info</th>" >> $output
53
7290a88ea202 Uploaded
davidvanzessen
parents: 52
diff changeset
214 for gene in ${genes[@]}
7290a88ea202 Uploaded
davidvanzessen
parents: 52
diff changeset
215 do
7290a88ea202 Uploaded
davidvanzessen
parents: 52
diff changeset
216 tmp=`cat $outdir/${gene}_${func}_n.txt`
7290a88ea202 Uploaded
davidvanzessen
parents: 52
diff changeset
217 echo "<th><a href='matched_${gene}_${func}.txt'>${gene} (N = $tmp)</a></th>" >> $output
7290a88ea202 Uploaded
davidvanzessen
parents: 52
diff changeset
218 done
78
b523ce95d857 Uploaded
davidvanzessen
parents: 77
diff changeset
219
b523ce95d857 Uploaded
davidvanzessen
parents: 77
diff changeset
220 tmp=`cat $outdir/unmatched_${func}_n.txt`
79
0513b46178c4 Uploaded
davidvanzessen
parents: 78
diff changeset
221 echo "<th><a href='unmatched.txt'>unmatched (N = ${unmatched_count})</a></th>" >> $output
53
7290a88ea202 Uploaded
davidvanzessen
parents: 52
diff changeset
222 tmp=`cat $outdir/all_${func}_n.txt`
89
480fdd383fdb Uploaded
davidvanzessen
parents: 85
diff changeset
223 echo "<th><a href='matched_all_${func}.txt'>all (N = $tmp)</a></th>" >> $output
4
069419cccba4 Uploaded
davidvanzessen
parents: 3
diff changeset
224
78
b523ce95d857 Uploaded
davidvanzessen
parents: 77
diff changeset
225 while IFS=, read name cax cay caz ca1x ca1y ca1z ca2x ca2y ca2z cgx cgy cgz cg1x cg1y cg1z cg2x cg2y cg2z cg3x cg3y cg3z cg4x cg4y cg4z cmx cmy cmz unx uny unz allx ally allz
53
7290a88ea202 Uploaded
davidvanzessen
parents: 52
diff changeset
226 do
7290a88ea202 Uploaded
davidvanzessen
parents: 52
diff changeset
227 if [ "$name" == "FR S/R (ratio)" ] || [ "$name" == "CDR S/R (ratio)" ] ; then #ratio rows: printed without the % sign and without the unmatched column
7290a88ea202 Uploaded
davidvanzessen
parents: 52
diff changeset
228 echo "<tr><td>$name</td><td>${cax}/${cay} (${caz})</td><td>${ca1x}/${ca1y} (${ca1z})</td><td>${ca2x}/${ca2y} (${ca2z})</td><td>${cgx}/${cgy} (${cgz})</td><td>${cg1x}/${cg1y} (${cg1z})</td><td>${cg2x}/${cg2y} (${cg2z})</td><td>${cg3x}/${cg3y} (${cg3z})</td><td>${cg4x}/${cg4y} (${cg4z})</td><td>${cmx}/${cmy} (${cmz})</td><td>${allx}/${ally} (${allz})</td></tr>" >> $output
7290a88ea202 Uploaded
davidvanzessen
parents: 52
diff changeset
229 else
78
b523ce95d857 Uploaded
davidvanzessen
parents: 77
diff changeset
230 echo "<tr><td>$name</td><td>${cax}/${cay} (${caz}%)</td><td>${ca1x}/${ca1y} (${ca1z}%)</td><td>${ca2x}/${ca2y} (${ca2z}%)</td><td>${cgx}/${cgy} (${cgz}%)</td><td>${cg1x}/${cg1y} (${cg1z}%)</td><td>${cg2x}/${cg2y} (${cg2z}%)</td><td>${cg3x}/${cg3y} (${cg3z}%)</td><td>${cg4x}/${cg4y} (${cg4z}%)</td><td>${cmx}/${cmy} (${cmz}%)</td><td>${unx}/${uny} (${unz}%)</td><td>${allx}/${ally} (${allz}%)</td></tr>" >> $output
53
7290a88ea202 Uploaded
davidvanzessen
parents: 52
diff changeset
231 fi
94
e39176ccddc8 Uploaded
davidvanzessen
parents: 92
diff changeset
232 done < $outdir/data_${func}.txt
e39176ccddc8 Uploaded
davidvanzessen
parents: 92
diff changeset
233 echo "</table>" >> $output
e39176ccddc8 Uploaded
davidvanzessen
parents: 92
diff changeset
234 #echo "<a href='data_${func}.txt'>Download data</a>" >> $output
53
7290a88ea202 Uploaded
davidvanzessen
parents: 52
diff changeset
235 done
7290a88ea202 Uploaded
davidvanzessen
parents: 52
diff changeset
236
55
0d5add1a9800 Uploaded
davidvanzessen
parents: 54
diff changeset
237 echo "---------------- download links ----------------"
102
e6bc976760d4 Uploaded
davidvanzessen
parents: 101
diff changeset
238 echo "---------------- download links ----------------<br />" >> $log
55
0d5add1a9800 Uploaded
davidvanzessen
parents: 54
diff changeset
239
94
e39176ccddc8 Uploaded
davidvanzessen
parents: 92
diff changeset
240
53
7290a88ea202 Uploaded
davidvanzessen
parents: 52
diff changeset
241 echo "<a href='unmatched.txt'>unmatched</a><br />" >> $output
7290a88ea202 Uploaded
davidvanzessen
parents: 52
diff changeset
242 echo "<a href='motif_per_seq.txt'>motif per sequence</a><br />" >> $output
7290a88ea202 Uploaded
davidvanzessen
parents: 52
diff changeset
243 echo "<a href='merged.txt'>all data</a><br />" >> $output
7290a88ea202 Uploaded
davidvanzessen
parents: 52
diff changeset
244 echo "<a href='mutation_by_id.txt'>mutations by id</a><br />" >> $output
7290a88ea202 Uploaded
davidvanzessen
parents: 52
diff changeset
245 echo "<a href='aa_id_mutations.txt'>AA mutations location by id</a><br />" >> $output
7290a88ea202 Uploaded
davidvanzessen
parents: 52
diff changeset
246 echo "<a href='absent_aa_id.txt'>Absant AA locations by id</a><br />" >> $output
77
c5c86d15cb94 Uploaded
davidvanzessen
parents: 76
diff changeset
247 echo "<a href='sequence_overview/index.html'>Sequence Overview</a><br />" >> $output
81
a778156dad3d Uploaded
davidvanzessen
parents: 80
diff changeset
248 echo "<a href='base_overview.html'>Base overview</a><br />" >> $output
95
a66eb1c5374c Uploaded
davidvanzessen
parents: 94
diff changeset
249 echo "<a href='baseline.pdf'>Baseline PDF</a><br />" >> $output
a66eb1c5374c Uploaded
davidvanzessen
parents: 94
diff changeset
250 echo "<a href='baseline.txt'>Baseline Table</a><br />" >> $output
99
86206431cbb0 Uploaded
davidvanzessen
parents: 98
diff changeset
251 echo "<a href='baseline_ca.pdf'>Baseline ca PDF</a><br />" >> $output
86206431cbb0 Uploaded
davidvanzessen
parents: 98
diff changeset
252 echo "<a href='baseline_ca.txt'>Baseline ca Table</a><br />" >> $output
86206431cbb0 Uploaded
davidvanzessen
parents: 98
diff changeset
253 echo "<a href='baseline_cg.pdf'>Baseline cg PDF</a><br />" >> $output
86206431cbb0 Uploaded
davidvanzessen
parents: 98
diff changeset
254 echo "<a href='baseline_cg.txt'>Baseline cg Table</a><br />" >> $output
86206431cbb0 Uploaded
davidvanzessen
parents: 98
diff changeset
255 echo "<a href='baseline_cm.pdf'>Baseline cm PDF</a><br />" >> $output
86206431cbb0 Uploaded
davidvanzessen
parents: 98
diff changeset
256 echo "<a href='baseline_cm.txt'>Baseline cm Table</a><br />" >> $output
95
a66eb1c5374c Uploaded
davidvanzessen
parents: 94
diff changeset
257 echo "<a href='IgAT.zip'>IgAT zip</a><br />" >> $output
99
86206431cbb0 Uploaded
davidvanzessen
parents: 98
diff changeset
258 echo "<a href='IgAT_ca.zip'>IgAT ca zip</a><br />" >> $output
86206431cbb0 Uploaded
davidvanzessen
parents: 98
diff changeset
259 echo "<a href='IgAT_cg.zip'>IgAT cg zip</a><br />" >> $output
86206431cbb0 Uploaded
davidvanzessen
parents: 98
diff changeset
260 echo "<a href='IgAT_cm.zip'>IgAT cm zip</a><br />" >> $output
86206431cbb0 Uploaded
davidvanzessen
parents: 98
diff changeset
261 echo "<a href='new_IMGT.txz'>Filtered IMGT zip</a><br />" >> $output
86206431cbb0 Uploaded
davidvanzessen
parents: 98
diff changeset
262 echo "<a href='new_IMGT_ca.txz'>Filtered ca IMGT zip</a><br />" >> $output
86206431cbb0 Uploaded
davidvanzessen
parents: 98
diff changeset
263 echo "<a href='new_IMGT_cg.txz'>Filtered cg IMGT zip</a><br />" >> $output
86206431cbb0 Uploaded
davidvanzessen
parents: 98
diff changeset
264 echo "<a href='new_IMGT_cm.txz'>Filtered cm IMGT zip</a><br />" >> $output
86206431cbb0 Uploaded
davidvanzessen
parents: 98
diff changeset
265
2
2f4298673519 Uploaded
davidvanzessen
parents: 1
diff changeset
266
55
0d5add1a9800 Uploaded
davidvanzessen
parents: 54
diff changeset
267 echo "---------------- images ----------------"
102
e6bc976760d4 Uploaded
davidvanzessen
parents: 101
diff changeset
268 echo "---------------- images ----------------<br />" >> $log
55
0d5add1a9800 Uploaded
davidvanzessen
parents: 54
diff changeset
269
4
069419cccba4 Uploaded
davidvanzessen
parents: 3
diff changeset
270 echo "<img src='all.png'/><br />" >> $output
26
2433a1e110e1 Uploaded
davidvanzessen
parents: 25
diff changeset
271 echo "<a href='all.txt'>download data</a><br />" >> $output
4
069419cccba4 Uploaded
davidvanzessen
parents: 3
diff changeset
272 if [ -a $outdir/ca.png ]
069419cccba4 Uploaded
davidvanzessen
parents: 3
diff changeset
273 then
069419cccba4 Uploaded
davidvanzessen
parents: 3
diff changeset
274 echo "<img src='ca.png'/><br />" >> $output
26
2433a1e110e1 Uploaded
davidvanzessen
parents: 25
diff changeset
275 echo "<a href='ca.txt'>download data</a><br />" >> $output
4
069419cccba4 Uploaded
davidvanzessen
parents: 3
diff changeset
276 fi
069419cccba4 Uploaded
davidvanzessen
parents: 3
diff changeset
277 if [ -e "$outdir/cg.png" ] # link the cg plot only when the file exists (-e is the standard spelling of the legacy unary -a)
069419cccba4 Uploaded
davidvanzessen
parents: 3
diff changeset
278 then
069419cccba4 Uploaded
davidvanzessen
parents: 3
diff changeset
279 echo "<img src='cg.png'/><br />" >> "$output"
26
2433a1e110e1 Uploaded
davidvanzessen
parents: 25
diff changeset
280 echo "<a href='cg.txt'>download data</a><br />" >> "$output"
4
069419cccba4 Uploaded
davidvanzessen
parents: 3
diff changeset
281 fi
22
d84c9791d8c4 Uploaded
davidvanzessen
parents: 21
diff changeset
282 if [ -e "$outdir/scatter.png" ] # link the scatter plot only when the file exists (-e is the standard spelling of the legacy unary -a)
d84c9791d8c4 Uploaded
davidvanzessen
parents: 21
diff changeset
283 then
d84c9791d8c4 Uploaded
davidvanzessen
parents: 21
diff changeset
284 echo "<img src='scatter.png'/><br />" >> "$output"
26
2433a1e110e1 Uploaded
davidvanzessen
parents: 25
diff changeset
285 echo "<a href='scatter.txt'>download data</a><br />" >> "$output"
2433a1e110e1 Uploaded
davidvanzessen
parents: 25
diff changeset
286 fi
49
5c6b9e99d576 Uploaded
davidvanzessen
parents: 47
diff changeset
287 if [ -e "$outdir/frequency_ranges.png" ] # link the frequency ranges plot only when the file exists (-e is the standard spelling of the legacy unary -a)
5c6b9e99d576 Uploaded
davidvanzessen
parents: 47
diff changeset
288 then
5c6b9e99d576 Uploaded
davidvanzessen
parents: 47
diff changeset
289 echo "<img src='frequency_ranges.png'/><br />" >> "$output"
5c6b9e99d576 Uploaded
davidvanzessen
parents: 47
diff changeset
290 echo "<a href='frequency_ranges_classes.txt'>download class data</a><br />" >> "$output"
5c6b9e99d576 Uploaded
davidvanzessen
parents: 47
diff changeset
291 echo "<a href='frequency_ranges_subclasses.txt'>download subclass data</a><br />" >> "$output"
5c6b9e99d576 Uploaded
davidvanzessen
parents: 47
diff changeset
292 fi
26
2433a1e110e1 Uploaded
davidvanzessen
parents: 25
diff changeset
293 if [ -e "$outdir/aa_histogram.png" ] # link the histograms only when the overall one exists (-e is the standard spelling of the legacy unary -a)
2433a1e110e1 Uploaded
davidvanzessen
parents: 25
diff changeset
294 then
2433a1e110e1 Uploaded
davidvanzessen
parents: 25
diff changeset
295 echo "<img src='aa_histogram.png'/><br />" >> "$output"
2433a1e110e1 Uploaded
davidvanzessen
parents: 25
diff changeset
296 echo "<a href='aa_histogram.txt'>download data</a><br />" >> "$output"
104
603a10976e9c Uploaded
davidvanzessen
parents: 102
diff changeset
297 echo "<img src='aa_histogram_ca.png'/><br />" >> "$output" # NOTE(review): the ca/cg/cm histograms are linked without their own existence check - confirm they are always written together with aa_histogram.png
603a10976e9c Uploaded
davidvanzessen
parents: 102
diff changeset
298 echo "<a href='aa_histogram_ca.txt'>download data</a><br />" >> "$output"
603a10976e9c Uploaded
davidvanzessen
parents: 102
diff changeset
299 echo "<img src='aa_histogram_cg.png'/><br />" >> "$output"
603a10976e9c Uploaded
davidvanzessen
parents: 102
diff changeset
300 echo "<a href='aa_histogram_cg.txt'>download data</a><br />" >> "$output"
603a10976e9c Uploaded
davidvanzessen
parents: 102
diff changeset
301 echo "<img src='aa_histogram_cm.png'/><br />" >> "$output"
603a10976e9c Uploaded
davidvanzessen
parents: 102
diff changeset
302 echo "<a href='aa_histogram_cm.txt'>download data</a><br />" >> "$output"
22
d84c9791d8c4 Uploaded
davidvanzessen
parents: 21
diff changeset
303 fi
2
2f4298673519 Uploaded
davidvanzessen
parents: 1
diff changeset
304
0
74d2bc479bee Uploaded
davidvanzessen
parents:
diff changeset
305 for gene in ${genes[@]} # one HTML table per gene; NOTE(review): quote as "${genes[@]}" once confirmed that genes is an array (defined outside this view)
74d2bc479bee Uploaded
davidvanzessen
parents:
diff changeset
306 do
74d2bc479bee Uploaded
davidvanzessen
parents:
diff changeset
307 echo "<table border='1'><caption>$gene transition table</caption>" >> "$output"
74d2bc479bee Uploaded
davidvanzessen
parents:
diff changeset
308 while IFS=, read -r from a c g t # split each comma-separated row into five cells; -r keeps backslashes literal
74d2bc479bee Uploaded
davidvanzessen
parents:
diff changeset
309 do
74d2bc479bee Uploaded
davidvanzessen
parents:
diff changeset
310 echo "<tr><td>$from</td><td>$a</td><td>$c</td><td>$g</td><td>$t</td></tr>" >> "$output"
53
7290a88ea202 Uploaded
davidvanzessen
parents: 52
diff changeset
311 done < "$outdir/transitions_${gene}_sum.txt"
0
74d2bc479bee Uploaded
davidvanzessen
parents:
diff changeset
312 echo "</table>" >> "$output"
74d2bc479bee Uploaded
davidvanzessen
parents:
diff changeset
313 done
74d2bc479bee Uploaded
davidvanzessen
parents:
diff changeset
314
74d2bc479bee Uploaded
davidvanzessen
parents:
diff changeset
315 echo "<table border='1'><caption>All transition table</caption>" >> "$output"
74d2bc479bee Uploaded
davidvanzessen
parents:
diff changeset
316 while IFS=, read -r from a c g t # split each comma-separated row into five cells; -r keeps backslashes literal
74d2bc479bee Uploaded
davidvanzessen
parents:
diff changeset
317 do
74d2bc479bee Uploaded
davidvanzessen
parents:
diff changeset
318 echo "<tr><td>$from</td><td>$a</td><td>$c</td><td>$g</td><td>$t</td></tr>" >> "$output"
53
7290a88ea202 Uploaded
davidvanzessen
parents: 52
diff changeset
319 done < "$outdir/transitions_all_sum.txt"
0
74d2bc479bee Uploaded
davidvanzessen
parents:
diff changeset
320 echo "</table>" >> "$output"
74d2bc479bee Uploaded
davidvanzessen
parents:
diff changeset
321
74d2bc479bee Uploaded
davidvanzessen
parents:
diff changeset
322 echo "</html>" >> "$output" # closes the index page
2
2f4298673519 Uploaded
davidvanzessen
parents: 1
diff changeset
323
95
a66eb1c5374c Uploaded
davidvanzessen
parents: 94
diff changeset
324 echo "---------------- baseline ----------------"
102
e6bc976760d4 Uploaded
davidvanzessen
parents: 101
diff changeset
325 echo "---------------- baseline ----------------<br />" >> "$log"
101
3cffb8a38bb1 Uploaded
davidvanzessen
parents: 100
diff changeset
326 tmp="$PWD" # remember the current directory; the baseline steps below cd away and the script later returns with cd $tmp
3cffb8a38bb1 Uploaded
davidvanzessen
parents: 100
diff changeset
327
3cffb8a38bb1 Uploaded
davidvanzessen
parents: 100
diff changeset
328 mkdir "$outdir/baseline"
3cffb8a38bb1 Uploaded
davidvanzessen
parents: 100
diff changeset
329
3cffb8a38bb1 Uploaded
davidvanzessen
parents: 100
diff changeset
330
3cffb8a38bb1 Uploaded
davidvanzessen
parents: 100
diff changeset
331 mkdir "$outdir/baseline/ca_cg_cm"
102
e6bc976760d4 Uploaded
davidvanzessen
parents: 101
diff changeset
332 if [[ $(wc -l < "$outdir/new_IMGT/1_Summary.txt") -gt 1 ]]; then # run baseline only when the summary has more than one line
e6bc976760d4 Uploaded
davidvanzessen
parents: 101
diff changeset
333 cd "$outdir/baseline/ca_cg_cm"
e6bc976760d4 Uploaded
davidvanzessen
parents: 101
diff changeset
334 bash "$dir/tmp/baseline/wrapper.sh" 1 1 1 1 0 0 "25:26:38:55:65:104:-" "$outdir/new_IMGT.txz" "ca_cg_cm" "$dir/tmp/baseline/IMGT-reference-seqs-IGHV-2015-11-05.fa" "$outdir/baseline.pdf" "Sequence.ID" "$outdir/baseline.txt"
e6bc976760d4 Uploaded
davidvanzessen
parents: 101
diff changeset
335 else
e6bc976760d4 Uploaded
davidvanzessen
parents: 101
diff changeset
336 echo "No sequences" > "$outdir/baseline.txt" # placeholder result when baseline is skipped
e6bc976760d4 Uploaded
davidvanzessen
parents: 101
diff changeset
337 fi
101
3cffb8a38bb1 Uploaded
davidvanzessen
parents: 100
diff changeset
338
3cffb8a38bb1 Uploaded
davidvanzessen
parents: 100
diff changeset
339 mkdir "$outdir/baseline/ca"
102
e6bc976760d4 Uploaded
davidvanzessen
parents: 101
diff changeset
340 if [[ $(wc -l < "$outdir/new_IMGT_ca/1_Summary.txt") -gt 1 ]]; then # run baseline only when the ca summary has more than one line
e6bc976760d4 Uploaded
davidvanzessen
parents: 101
diff changeset
341 cd "$outdir/baseline/ca"
e6bc976760d4 Uploaded
davidvanzessen
parents: 101
diff changeset
342 bash "$dir/tmp/baseline/wrapper.sh" 1 1 1 1 0 0 "25:26:38:55:65:104:-" "$outdir/new_IMGT_ca.txz" "ca" "$dir/tmp/baseline/IMGT-reference-seqs-IGHV-2015-11-05.fa" "$outdir/baseline_ca.pdf" "Sequence.ID" "$outdir/baseline_ca.txt"
e6bc976760d4 Uploaded
davidvanzessen
parents: 101
diff changeset
343 else
e6bc976760d4 Uploaded
davidvanzessen
parents: 101
diff changeset
344 echo "No ca sequences" > "$outdir/baseline_ca.txt" # placeholder result when baseline is skipped
e6bc976760d4 Uploaded
davidvanzessen
parents: 101
diff changeset
345 fi
101
3cffb8a38bb1 Uploaded
davidvanzessen
parents: 100
diff changeset
346
3cffb8a38bb1 Uploaded
davidvanzessen
parents: 100
diff changeset
347 mkdir "$outdir/baseline/cg"
102
e6bc976760d4 Uploaded
davidvanzessen
parents: 101
diff changeset
348 if [[ $(wc -l < "$outdir/new_IMGT_cg/1_Summary.txt") -gt 1 ]]; then # run baseline only when the cg summary has more than one line
e6bc976760d4 Uploaded
davidvanzessen
parents: 101
diff changeset
349 cd "$outdir/baseline/cg"
e6bc976760d4 Uploaded
davidvanzessen
parents: 101
diff changeset
350 bash "$dir/tmp/baseline/wrapper.sh" 1 1 1 1 0 0 "25:26:38:55:65:104:-" "$outdir/new_IMGT_cg.txz" "cg" "$dir/tmp/baseline/IMGT-reference-seqs-IGHV-2015-11-05.fa" "$outdir/baseline_cg.pdf" "Sequence.ID" "$outdir/baseline_cg.txt"
e6bc976760d4 Uploaded
davidvanzessen
parents: 101
diff changeset
351 else
e6bc976760d4 Uploaded
davidvanzessen
parents: 101
diff changeset
352 echo "No cg sequences" > "$outdir/baseline_cg.txt" # placeholder result when baseline is skipped
e6bc976760d4 Uploaded
davidvanzessen
parents: 101
diff changeset
353 fi
101
3cffb8a38bb1 Uploaded
davidvanzessen
parents: 100
diff changeset
354
3cffb8a38bb1 Uploaded
davidvanzessen
parents: 100
diff changeset
355 mkdir "$outdir/baseline/cm"
102
e6bc976760d4 Uploaded
davidvanzessen
parents: 101
diff changeset
356 if [[ $(wc -l < "$outdir/new_IMGT_cm/1_Summary.txt") -gt 1 ]]; then # run baseline only when the cm summary has more than one line
e6bc976760d4 Uploaded
davidvanzessen
parents: 101
diff changeset
357 cd "$outdir/baseline/cm"
e6bc976760d4 Uploaded
davidvanzessen
parents: 101
diff changeset
358 bash "$dir/tmp/baseline/wrapper.sh" 1 1 1 1 0 0 "25:26:38:55:65:104:-" "$outdir/new_IMGT_cm.txz" "cm" "$dir/tmp/baseline/IMGT-reference-seqs-IGHV-2015-11-05.fa" "$outdir/baseline_cm.pdf" "Sequence.ID" "$outdir/baseline_cm.txt"
e6bc976760d4 Uploaded
davidvanzessen
parents: 101
diff changeset
359 else
e6bc976760d4 Uploaded
davidvanzessen
parents: 101
diff changeset
360 echo "No cm sequences" > "$outdir/baseline_cm.txt" # placeholder result when baseline is skipped
e6bc976760d4 Uploaded
davidvanzessen
parents: 101
diff changeset
361 fi
47
099cc1254f74 Uploaded
davidvanzessen
parents: 43
diff changeset
362
101
3cffb8a38bb1 Uploaded
davidvanzessen
parents: 100
diff changeset
363 cd "$tmp" # return to the directory saved in tmp before the baseline runs
3cffb8a38bb1 Uploaded
davidvanzessen
parents: 100
diff changeset
364
82
564c4f6da203 Uploaded
davidvanzessen
parents: 81
diff changeset
365 echo "---------------- naive_output.r ----------------"
102
e6bc976760d4 Uploaded
davidvanzessen
parents: 101
diff changeset
366 echo "---------------- naive_output.r ----------------<br />" >> "$log"
55
0d5add1a9800 Uploaded
davidvanzessen
parents: 54
diff changeset
367
47
099cc1254f74 Uploaded
davidvanzessen
parents: 43
diff changeset
368 if [[ "$naive_output" != "None" ]] # NOTE(review): only naive_output_ca/_cg/_cm are assigned from the positional parameters; if naive_output is never set this test is always true - confirm
099cc1254f74 Uploaded
davidvanzessen
parents: 43
diff changeset
369 then
55
0d5add1a9800 Uploaded
davidvanzessen
parents: 54
diff changeset
370 echo "---------------- imgt_loader.r ----------------"
102
e6bc976760d4 Uploaded
davidvanzessen
parents: 101
diff changeset
371 echo "---------------- imgt_loader.r ----------------<br />" >> "$log"
50
8ba6afa1247a Uploaded
davidvanzessen
parents: 49
diff changeset
372 #python $dir/imgt_loader.py --summ $PWD/summary.txt --aa $PWD/aa.txt --junction $PWD/junction.txt --output $naive_output
80
a4c2ddeadec0 Uploaded
davidvanzessen
parents: 79
diff changeset
373 Rscript --verbose "$dir/imgt_loader.r" "$PWD/summary.txt" "$PWD/aa.txt" "$PWD/junction.txt" "$outdir/loader_output.txt" 2>&1
95
a66eb1c5374c Uploaded
davidvanzessen
parents: 94
diff changeset
374
55
0d5add1a9800 Uploaded
davidvanzessen
parents: 54
diff changeset
375 echo "---------------- naive_output.r ----------------"
102
e6bc976760d4 Uploaded
davidvanzessen
parents: 101
diff changeset
376 echo "---------------- naive_output.r ----------------<br />" >> "$log"
81
a778156dad3d Uploaded
davidvanzessen
parents: 80
diff changeset
377 Rscript "$dir/naive_output.r" "$outdir/loader_output.txt" "$outdir/merged.txt" "${naive_output_ca}" "${naive_output_cg}" "${naive_output_cm}" "$outdir/ntoverview.txt" "$outdir/ntsum.txt" 2>&1 # quoted so an empty value cannot shift the positional arguments
47
099cc1254f74 Uploaded
davidvanzessen
parents: 43
diff changeset
378 fi
099cc1254f74 Uploaded
davidvanzessen
parents: 43
diff changeset
379
81
a778156dad3d Uploaded
davidvanzessen
parents: 80
diff changeset
380 echo "</table>" >> "$outdir/base_overview.html"
a778156dad3d Uploaded
davidvanzessen
parents: 80
diff changeset
381
105
e4957ad476a2 Uploaded
davidvanzessen
parents: 104
diff changeset
382 mv -- "$log" "$outdir/log.html" # keep the accumulated log next to the other outputs
e4957ad476a2 Uploaded
davidvanzessen
parents: 104
diff changeset
383
e4957ad476a2 Uploaded
davidvanzessen
parents: 104
diff changeset
384 cp -- "$outdir/index.html" "$log" # the log location now holds the main HTML page
e4957ad476a2 Uploaded
davidvanzessen
parents: 104
diff changeset
385
81
a778156dad3d Uploaded
davidvanzessen
parents: 80
diff changeset
386 echo "---------------- Done! ----------------"
102
e6bc976760d4 Uploaded
davidvanzessen
parents: 101
diff changeset
387 echo "---------------- Done! ----------------<br />" >> "$outdir/log.html" # write to the moved log; $log is now the index page and already ends with </html>
47
099cc1254f74 Uploaded
davidvanzessen
parents: 43
diff changeset
388