#!/bin/bash
#
# wrapper.sh -- drives the analysis pipeline that lives next to this script:
# it unpacks an IMGT archive, identifies genes (custom Python script or
# blastn), runs the R/Python analysis scripts and assembles an HTML report.
#
# Provenance: recovered from the annotate view of wrapper.sh @ 81:a778156dad3d
# (davidvanzessen, Tue, 17 May 2016 04:17:38 -0400). The per-line changeset
# annotations of that view are not part of the script.
#
# Positional arguments:
#   $1  input            archive to analyse (Zip, or XZ-compressed tar)
#   $2  method           "custom" selects gene_identification.py; any other
#                        value selects blastn
#   $3  output           HTML file; receives progress lines while the pipeline
#                        runs and is overwritten by the final report
#   $4  outdir           directory for all result files (created here)
#   $5  title            report heading; also the sub-directory name used when
#                        unpacking an XZ archive
#   $6  include_fr1      forwarded to mutation_analysis.r / mutation_analysis.py
#   $7  functionality    forwarded to merge_and_filter.r
#   $8  unique           forwarded to merge_and_filter.r
#   $9  naive_output_ca  forwarded to naive_output.r
#   $10 naive_output_cg  forwarded to naive_output.r
#   $11 naive_output_cm  forwarded to naive_output.r
#   $12 filter_unique    forwarded to merge_and_filter.r
#   $13 class_filter     forwarded to merge_and_filter.r

# Abort on the first failing command.
set -e

# Absolute directory of this script; the helper scripts are looked up here.
dir="$(cd "$(dirname "$0")" && pwd)"

input=$1
method=$2
output=$3
outdir=$4
title=$5
include_fr1=$6
functionality=$7
unique=$8
naive_output_ca=$9
naive_output_cg=${10}
naive_output_cm=${11}
filter_unique=${12}
class_filter=${13}

# -p: do not abort when the directory already exists.
mkdir -p -- "$outdir"

echo "---------------- read parameters ----------------"
# ">" (not ">>"): start the progress log in the output file from scratch.
echo "---------------- read parameters ----------------<br />" > "$output"

echo "unpacking IMGT file"

#######################################
# Unpack the uploaded archive below a destination directory.
# Arguments:
#   $1 - archive path
#   $2 - destination directory
#   $3 - sub-directory name used for XZ archives (they are extracted into
#        DEST/NAME; Zip archives are extracted straight into DEST)
# Outputs:
#   progress messages on stdout, an error on stderr for unknown formats
# Returns:
#   non-zero if the archive type is not recognised or extraction fails
#######################################
unpack_archive() {
  local archive=$1 dest=$2 name=$3
  local kind
  # The archive format is detected from the description printed by `file`.
  kind="$(file "$archive")"
  if [[ "$kind" == *"Zip archive"* ]]; then
    echo "Zip archive"
    echo "unzip $archive -d $dest/"
    unzip "$archive" -d "$dest/"
  elif [[ "$kind" == *"XZ compressed data"* ]]; then
    echo "XZ archive"
    echo "tar -xJf $archive -C $dest/$name"
    mkdir -p "$dest/$name"
    tar -xJf "$archive" -C "$dest/$name"
  else
    # Previously an unknown format fell through silently and the steps below
    # worked on a non-existent directory.
    echo "unsupported input, expected a Zip or XZ archive: $kind" >&2
    return 1
  fi
}

#######################################
# Concatenate every regular file below a directory whose name matches a glob.
# Arguments:
#   $1 - directory to search (recursively)
#   $2 - file name pattern as understood by `find -name`
# Outputs:
#   the concatenated file contents on stdout (nothing when no file matches)
#######################################
collect_imgt_files() {
  # -exec ... {} + hands the paths to cat without word-splitting, so
  # directory names containing spaces (e.g. from $title) are handled, and cat
  # is never started without arguments.
  find "$1" -type f -name "$2" -exec cat {} +
}

# With "set -e" active a failure here stops the script.
unpack_archive "$input" "$PWD/files" "$title"

# find (rather than a files/*/N_* glob) picks the files up at any depth.
collect_imgt_files "$PWD/files" "1_*" > "$PWD/summary.txt"
collect_imgt_files "$PWD/files" "3_*" > "$PWD/sequences.txt"
collect_imgt_files "$PWD/files" "5_*" > "$PWD/aa.txt"
collect_imgt_files "$PWD/files" "6_*" > "$PWD/junction.txt"
collect_imgt_files "$PWD/files" "7_*" > "$PWD/mutationanalysis.txt"
collect_imgt_files "$PWD/files" "8_*" > "$PWD/mutationstats.txt"
collect_imgt_files "$PWD/files" "10_*" > "$PWD/hotspots.txt"

# BLASTN_DIR is taken from the environment; the path below is kept only as an
# example of what it looked like on one installation.
#BLASTN_DIR="/home/galaxy/tmp/blast/ncbi-blast-2.2.30+/bin"

#######################################
# Print the 1-based index of a column in a tab-separated file.
# Only the first line (the header) is inspected and the column name must
# match exactly, so repeated header lines further down the file and columns
# that merely start with the same word cannot skew the result.
# Arguments:
#   $1 - tab-separated file with a header line
#   $2 - exact column name
# Returns:
#   non-zero when the column (or the file) does not exist
#######################################
header_column_index() {
  awk -F'\t' -v name="$2" '
    NR == 1 {
      for (i = 1; i <= NF; i++) {
        if ($i == name) { print i; found = 1; exit }
      }
    }
    END { if (!found) exit 1 }
  ' "$1"
}

#######################################
# Convert a tab-separated summary into FASTA records on stdout.
# Arguments:
#   $1 - summary file (first line is the header)
#   $2 - index of the ID column
#   $3 - index of the sequence column
# Rows that repeat the header (ID column equal to "Sequence ID") are skipped;
# they occur when several summary files were concatenated.
#######################################
summary_to_fasta() {
  awk -F'\t' -v id="$2" -v seq="$3" '
    NR > 1 && $id != "Sequence ID" { print ">" $id; print $seq }
  ' "$1"
}

echo "${BLASTN_DIR}"

echo "identification ($method)"
echo "identification ($method)<br />" >> "$output"

echo "blast or custom"

if [[ "${method}" == "custom" ]]; then
  echo "custom"
  python "$dir/gene_identification.py" \
    --input "$PWD/summary.txt" \
    --output "$outdir/identified_genes.txt"
else
  echo "blast"
  # "set -e" stops the script here when a column cannot be located.
  ID_index=$(header_column_index "$PWD/summary.txt" "Sequence ID")
  sequence_index=$(header_column_index "$PWD/summary.txt" "Sequence")

  echo "$ID_index ${sequence_index}"

  summary_to_fasta "$PWD/summary.txt" "$ID_index" "$sequence_index" \
    > "$PWD/sequences.fasta"

  # blastn -outfmt 6 prints no header line, so write the column names first.
  printf 'qseqid\tsseqid\tpident\tlength\tmismatch\tgapopen\tqstart\tqend\tsstart\tsend\tevalue\tbitscore\n' \
    > "$outdir/identified_genes.txt"
  "${BLASTN_DIR}/blastn" -task blastn -db "$dir/subclass_definition.db" \
    -query "$PWD/sequences.fasta" -outfmt 6 >> "$outdir/identified_genes.txt"
fi

# Each step announces itself on stdout and appends the same banner to the
# output file, which serves as a progress log until the final report
# overwrites it. All expansions are quoted so paths or parameter values
# containing spaces stay single arguments.

echo "---------------- merge_and_filter.r ----------------"
echo "---------------- merge_and_filter.r ----------------<br />" >> "$output"

# Writes $outdir/merged.txt and $outdir/unmatched.txt (both are read by the
# later steps).
Rscript "$dir/merge_and_filter.r" \
  "$PWD/summary.txt" \
  "$PWD/sequences.txt" \
  "$PWD/mutationanalysis.txt" \
  "$PWD/mutationstats.txt" \
  "$PWD/hotspots.txt" \
  "$outdir/identified_genes.txt" \
  "$outdir/merged.txt" \
  "$outdir/unmatched.txt" \
  "$method" \
  "$functionality" \
  "$unique" \
  "${filter_unique}" \
  "${class_filter}"

echo "---------------- mutation_analysis.r ----------------"
echo "---------------- mutation_analysis.r ----------------<br />" >> "$output"

# Comma-separated list handed to the analysis scripts. The variable is
# re-assigned as an array further down, before the report tables are built.
genes="ca,ca1,ca2,cg,cg1,cg2,cg3,cg4,cm,unmatched"
echo "R mutation analysis"
Rscript "$dir/mutation_analysis.r" "$outdir/merged.txt" "$genes" "$outdir" "${include_fr1}" 2>&1

echo "---------------- mutation_analysis.py ----------------"
echo "---------------- mutation_analysis.py ----------------<br />" >> "$output"

python "$dir/mutation_analysis.py" \
  --input "$outdir/merged.txt" \
  --genes "$genes" \
  --includefr1 "${include_fr1}" \
  --output "$outdir/hotspot_analysis.txt"

echo "---------------- aa_histogram.r ----------------"
echo "---------------- aa_histogram.r ----------------<br />" >> "$output"

Rscript "$dir/aa_histogram.r" "$outdir/aa_mutations.txt" "$outdir/aa_histogram.png" 2>&1

# Gene classes and aggregate functions for which report tables are produced.
genes=(ca ca1 ca2 cg cg1 cg2 cg3 cg4 cm)

funcs=(sum mean median)

#######################################
# Escape the characters that are special in HTML text (&, <, >).
# Arguments: $1 - raw text
# Outputs:   escaped text on stdout
#######################################
html_escape() {
  printf '%s' "$1" | sed -e 's/&/\&amp;/g' -e 's/</\&lt;/g' -e 's/>/\&gt;/g'
}

#######################################
# Count the lines of a file after its header line.
# Arguments: $1 - file with one header line
# Outputs:   the number of remaining lines on stdout
#######################################
count_data_rows() {
  local n
  n=$(tail -n +2 "$1" | wc -l)
  # Arithmetic expansion strips the padding some wc implementations add.
  echo "$((n))"
}

#######################################
# Print PART as a percentage of TOTAL with two decimals.
# The multiplication happens before the division so no precision is lost,
# and an empty data set yields 0.00 instead of a division by zero.
# Arguments: $1 - part, $2 - total
#######################################
percent_of() {
  awk -v part="$1" -v total="$2" 'BEGIN {
    if (total > 0) printf "%.2f\n", 100 * part / total
    else printf "0.00\n"
  }'
}

# ">" on purpose: the final report replaces the progress lines written to the
# output file so far.
echo "<html><center><h1>$(html_escape "$title")</h1></center>" > "$output"

#display the matched/unmatched for clarity

matched_count=$(count_data_rows "$outdir/merged.txt")
unmatched_count=$(count_data_rows "$outdir/unmatched.txt")
total_count=$((matched_count + unmatched_count))
perc_count=$(percent_of "$unmatched_count" "$total_count")

{
  echo "<center><h2>Total: ${total_count}</h2></center>"
  echo "<center><h2>Matched: ${matched_count} Unmatched: ${unmatched_count}</h2></center>"
  echo "<center><h2>Percentage unmatched: ${perc_count}</h2></center>"
} >> "$output"

echo "---------------- main tables ----------------"

#######################################
# Render one body row of a summary table.
# Arguments:
#   $1     - row name
#   $2...  - cell values in groups of three (x y z); every group becomes one
#            cell "x/y (z%)". The two "S/R (ratio)" rows are printed without
#            the percent sign.
# Outputs:
#   a single <tr> line on stdout
#######################################
summary_table_row() {
  local name=$1 suffix="%" html
  shift
  if [[ "$name" == "FR S/R (ratio)" || "$name" == "CDR S/R (ratio)" ]]; then
    suffix=""
  fi
  html="<tr><td>$name</td>"
  while (( $# >= 3 )); do
    html+="<td>$1/$2 ($3$suffix)</td>"
    shift 3
  done
  printf '%s</tr>\n' "$html"
}

# One table per aggregate function. Every table gets its own closing tags
# (the header row used to stay open and only the last table was closed).
for func in "${funcs[@]}"; do

  echo "---------------- $func table ----------------"

  cat "$outdir/mutations_${func}.txt" "$outdir/hotspot_analysis_${func}.txt" \
    > "$outdir/result.txt"

  {
    echo "<table border='1' width='100%'><caption><h3>${func} table</h3></caption>"
    echo "<tr><th>info</th>"
    for gene in "${genes[@]}"; do
      tmp=$(< "$outdir/${gene}_${func}_n.txt")
      echo "<th><a href='matched_${gene}_${func}.txt'>${gene} (N = $tmp)</a></th>"
    done

    # The unmatched column shows the row count of unmatched.txt
    # (unmatched_count is computed before this loop).
    echo "<th><a href='unmatched.txt'>unmatched (N = ${unmatched_count})</a></th>"
    tmp=$(< "$outdir/all_${func}_n.txt")
    echo "<th><a href='matched_${func}_all.txt'>all (N = $tmp)</a></th>"
    echo "</tr>"

    # result.txt is comma separated: a row name followed by an x,y,z triple
    # per column (nine gene classes, unmatched, all).
    while IFS=, read -r name \
      cax cay caz ca1x ca1y ca1z ca2x ca2y ca2z \
      cgx cgy cgz cg1x cg1y cg1z cg2x cg2y cg2z cg3x cg3y cg3z cg4x cg4y cg4z \
      cmx cmy cmz unx uny unz allx ally allz; do
      # All eleven triples are passed for every row, including the ratio
      # rows, so the cells line up with the twelve header columns.
      summary_table_row "$name" \
        "$cax" "$cay" "$caz" "$ca1x" "$ca1y" "$ca1z" "$ca2x" "$ca2y" "$ca2z" \
        "$cgx" "$cgy" "$cgz" "$cg1x" "$cg1y" "$cg1z" "$cg2x" "$cg2y" "$cg2z" \
        "$cg3x" "$cg3y" "$cg3z" "$cg4x" "$cg4y" "$cg4z" \
        "$cmx" "$cmy" "$cmz" "$unx" "$uny" "$unz" "$allx" "$ally" "$allz"
    done < "$outdir/result.txt"

    echo "</table>"
  } >> "$output"

done

echo "---------------- download links ----------------"

#######################################
# Print the download links of the report, one per line.
# The hrefs are relative to the report file.
#######################################
download_links() {
  cat <<'EOF'
<a href='unmatched.txt'>unmatched</a><br />
<a href='motif_per_seq.txt'>motif per sequence</a><br />
<a href='merged.txt'>all data</a><br />
<a href='mutation_by_id.txt'>mutations by id</a><br />
<a href='aa_id_mutations.txt'>AA mutations location by id</a><br />
<a href='absent_aa_id.txt'>Absent AA locations by id</a><br />
<a href='sequence_overview/index.html'>Sequence Overview</a><br />
<a href='base_overview.html'>Base overview</a><br />
EOF
}

download_links >> "$output"

echo "---------------- images ----------------"

#######################################
# Print the image part of the report.
# all.png is always referenced; every other plot is referenced only when its
# PNG exists in the given directory.
# Arguments:
#   $1 - directory that holds the generated plots
# Outputs:
#   HTML lines on stdout
#######################################
image_sections() {
  local plots_dir=$1 plot
  echo "<img src='all.png'/><br />"
  echo "<a href='all.txt'>download data</a><br />"
  for plot in ca cg scatter frequency_ranges aa_histogram; do
    if [[ ! -e "$plots_dir/$plot.png" ]]; then
      continue
    fi
    echo "<img src='$plot.png'/><br />"
    if [[ "$plot" == "frequency_ranges" ]]; then
      # This plot comes with two data files instead of one.
      echo "<a href='frequency_ranges_classes.txt'>download class data</a><br />"
      echo "<a href='frequency_ranges_subclasses.txt'>download subclass data</a><br />"
    else
      echo "<a href='$plot.txt'>download data</a><br />"
    fi
  done
}

image_sections "$outdir" >> "$output"

#######################################
# Render a comma-separated transition file as an HTML table.
# Arguments:
#   $1 - table caption
#   $2 - CSV file; each line holds a row label followed by four values
#        (any further fields end up in the last cell)
# Outputs:
#   the table on stdout
#######################################
transition_table() {
  local caption=$1 csv=$2
  local from a c g t
  echo "<table border='1'><caption>$caption</caption>"
  # -r keeps backslashes literal; the || clause also emits a final line that
  # lacks a trailing newline.
  while IFS=, read -r from a c g t || [[ -n "$from" ]]; do
    echo "<tr><td>$from</td><td>$a</td><td>$c</td><td>$g</td><td>$t</td></tr>"
  done < "$csv"
  echo "</table>"
}

{
  for gene in "${genes[@]}"; do
    transition_table "$gene transition table" "$outdir/transitions_${gene}_sum.txt"
  done

  transition_table "All transition table" "$outdir/transitions_all_sum.txt"

  # Last element of the report.
  echo "</html>"
} >> "$output"

#optional output for naive

#######################################
# Succeed when at least one of the given output targets was requested,
# i.e. is not the literal string "None".
# Arguments: the output targets to inspect
#######################################
naive_output_requested() {
  local target
  for target in "$@"; do
    if [[ "$target" != "None" ]]; then
      return 0
    fi
  done
  return 1
}

echo "---------------- naive output ----------------"

# The check used to read $naive_output, a variable that is never assigned, so
# it could not skip this step. It now looks at the three targets that are
# handed to naive_output.r.
# NOTE(review): assumes the caller passes "None" for outputs that were not
# requested -- confirm against the tool definition.
if naive_output_requested "$naive_output_ca" "$naive_output_cg" "$naive_output_cm"; then
  echo "---------------- imgt_loader.r ----------------"
  # imgt_loader.r is used here; an earlier revision called imgt_loader.py.
  Rscript --verbose "$dir/imgt_loader.r" \
    "$PWD/summary.txt" "$PWD/aa.txt" "$PWD/junction.txt" \
    "$outdir/loader_output.txt" 2>&1
  echo "---------------- naive_output.r ----------------"
  Rscript "$dir/naive_output.r" \
    "$outdir/loader_output.txt" "$outdir/merged.txt" \
    "${naive_output_ca}" "${naive_output_cg}" "${naive_output_cm}" \
    "$outdir/ntoverview.txt" "$outdir/ntsum.txt" 2>&1
fi

echo "---------------- sequence_overview.r ----------------"

# -p: do not abort when the directory already exists.
mkdir -p "$outdir/sequence_overview"

Rscript "$dir/sequence_overview.r" \
  "$outdir/identified_genes.txt" "$PWD/sequences.txt" \
  "$outdir/sequence_overview" 2>&1

#######################################
# Render a whitespace-separated base overview file as an HTML table.
# Arguments:
#   $1 - file with the fields: ID class seq A C G T
# Outputs:
#   the table on stdout; the seq field is read but not shown
#######################################
base_overview_table() {
  local ID class seq A C G T
  echo "<table border='1'>"
  while read -r ID class seq A C G T; do
    echo "<tr><td>$ID</td><td>$class</td><td>$A</td><td>$C</td><td>$G</td><td>$T</td></tr>"
  done < "$1"
  echo "</table>"
}

base_overview_table "$outdir/sequence_overview/ntoverview.txt" \
  > "$outdir/base_overview.html"

echo "---------------- Done! ----------------"