#!/bin/bash
#
# wrapper.sh -- run the mutation/hotspot analysis pipeline and write an HTML
# report.
#
# Reconstructed from the Mercurial annotate view of revision 2:2f4298673519
# (author davidvanzessen, Wed, 10 Sep 2014 10:33:29 -0400,
# parent 856b5b718d21, child a0b27058dcac).
#
# Usage: wrapper.sh INPUT_ZIP OUTPUT_HTML OUTDIR [TITLE]
#
#   INPUT_ZIP    archive handed to unzip; the files matching 1_*, 7_*, 8_*
#                and 10_* inside its sub-directories are concatenated into
#                summary.txt, mutationanalysis.txt, mutationstats.txt and
#                hotspots.txt in the current working directory
#   OUTPUT_HTML  path of the HTML report (progress lines are appended to it
#                while the pipeline runs, then it is overwritten by the report)
#   OUTDIR       directory receiving all result files and images
#   TITLE        optional heading shown in the report's <h1>
#
# Helper programs (gene_identification.py, filter.r, mutation_analysis.r,
# mutation_analysis.py, piechart.r, seqlogo) and the HS12RSS.txt/HS23RSS.txt
# data files are looked up next to this script.
#
# The pipeline is best-effort: a failing helper does not abort the script,
# matching the behaviour of the original.

usage() {
  printf 'Usage: %s INPUT_ZIP OUTPUT_HTML OUTDIR [TITLE]\n' "${0##*/}" >&2
}

if (( $# < 3 )); then
  usage
  exit 2
fi

dir="$(cd "$(dirname "$0")" && pwd)"

input=$1
output=$2
outdir=$3
title=${4:-}

genes=(ca ca1 ca2 cg cg1 cg2 cg3 cg4 cm)

# Combined table: one row per statistic, three columns (x, y, z) per gene
# followed by three columns for the complete data set.
combined="$outdir/mutationandhotspot.txt"
# Scratch file used while rewriting $combined in place.
scratch="$PWD/tmp"

# Escape the characters that are special in HTML text.
# Arguments: $1 - raw text
# Outputs:   escaped text on stdout
html_escape() {
  printf '%s' "$1" | sed -e 's/&/\&amp;/g' -e 's/</\&lt;/g' -e 's/>/\&gt;/g'
}

# Print the contents of n.txt for one gene.
# Arguments: $1 - gene name (sub-directory of $outdir)
count_of() {
  cat -- "$outdir/$1/n.txt"
}

# Append columns 2-4 of mutations.txt and hotspot_analysis.txt found in a
# result directory as three new columns of $combined.
# Arguments: $1 - directory holding mutations.txt and hotspot_analysis.txt
append_result_columns() {
  local result_dir=$1
  cut -d, -f2,3,4 "$result_dir/mutations.txt" "$result_dir/hotspot_analysis.txt" \
    | paste -d, "$combined" - > "$scratch"
  # Copy instead of move so $combined keeps its own file mode.
  cat "$scratch" > "$combined"
}

# Emit one HTML table built from a comma-separated transitions file.
# Arguments: $1 - table caption, $2 - path of the transitions file
# Outputs:   HTML on stdout
transition_table() {
  local caption=$1 source_file=$2
  local from a c g t
  echo "<table border='1'><caption>$caption</caption>"
  # The "|| [[ -n ... ]]" keeps a final line that lacks a trailing newline.
  while IFS=, read -r from a c g t || [[ -n "$from" ]]; do
    echo "<tr><td>$from</td><td>$a</td><td>$c</td><td>$g</td><td>$t</td></tr>"
  done < "$source_file"
  echo "</table>"
}

# Emit the complete HTML report.
# Globals: title, genes, all_n, combined, outdir (all read)
# Outputs: HTML on stdout
write_report() {
  local gene image row col
  local -a fields
  local groups=$(( ${#genes[@]} + 1 ))   # every gene plus the "all" column

  echo "<html><center><h1>$(html_escape "$title")</h1></center><table border='1'>"
  echo "<tr><th>info</th>"
  for gene in "${genes[@]}"; do
    echo "<th><a href='identification/$gene.txt'>$gene (N = $(count_of "$gene"))</a></th>"
  done
  echo "<th>all (N = $all_n)</th></tr>"

  # Each row: a label followed by one x,y,z triple per column group.
  while IFS=, read -r -a fields || (( ${#fields[@]} > 0 )); do
    row="<tr><td>${fields[0]}</td>"
    for (( col = 1; col <= 3 * groups; col += 3 )); do
      row+="<td>${fields[col]}/${fields[col + 1]} (${fields[col + 2]}%)</td>"
    done
    row+="</tr>"
    printf '%s\n' "$row"
  done < "$combined"
  echo "</table>"
  echo "<a href='identification/unmatched.txt'>unmatched</a><br />"

  for image in all ca cg HS12 HS23; do
    echo "<img src='$image.png'/>"
  done

  for gene in "${genes[@]}"; do
    transition_table "$gene transition table" "$outdir/$gene/transitions.txt"
  done
  transition_table "All transition table" "$outdir/transitions.txt"

  echo "</html>"
}

# --- Unpack the input and assemble the four input tables -------------------
mkdir -p "$outdir"

unzip "$input" -d "$PWD/files/" > "$PWD/unziplog.log"
cat "$PWD"/files/*/1_* > "$PWD/summary.txt"
cat "$PWD"/files/*/7_* > "$PWD/mutationanalysis.txt"
cat "$PWD"/files/*/8_* > "$PWD/mutationstats.txt"
cat "$PWD"/files/*/10_* > "$PWD/hotspots.txt"
cp "$dir/HS12RSS.txt" "$dir/HS23RSS.txt" "$outdir/"

# --- Gene identification ---------------------------------------------------
mkdir -p "$outdir/identification/"
python "$dir/gene_identification.py" --input "$PWD/summary.txt" --outdir "$outdir/identification/"

# Start from an empty table so a rerun does not paste onto stale columns.
: > "$combined"

# --- Per-gene analysis -----------------------------------------------------
# The progress lines appended to $output here are replaced by the final
# report once write_report runs.
for gene in "${genes[@]}"; do
  gene_dir="$outdir/$gene"
  # presumably written by gene_identification.py -- confirm against that script
  gene_filter="$outdir/identification/${gene}.txt"

  echo "Running $gene <br />" >> "$output"
  mkdir -p "$gene_dir"
  cp "$dir/HS12RSS.txt" "$dir/HS23RSS.txt" "$gene_dir/"

  echo "Filtering input..." >> "$output"
  for table in summary mutationanalysis mutationstats hotspots; do
    Rscript "$dir/filter.r" "$PWD/$table.txt" "$gene_filter" "$gene_dir/$table.txt"
  done
  echo "done <br />" >> "$output"

  echo "Running R script on $gene..." >> "$output"
  Rscript --verbose "$dir/mutation_analysis.r" "$gene_dir/mutationstats.txt" "$gene_dir/summary.txt" "$gene_dir/" 2>&1
  echo "done <br />" >> "$output"

  echo "Running Python script..." >> "$output"
  python "$dir/mutation_analysis.py" --mutationfile "$gene_dir/mutationanalysis.txt" --hotspotfile "$gene_dir/hotspots.txt" --output "$gene_dir/hotspot_analysis.txt"
  echo "done <br />" >> "$output"
  echo "Done with $gene <br />" >> "$output"

  append_result_columns "$gene_dir"
  rm -f -- "$gene_dir/HS12RSS.txt" "$gene_dir/HS23RSS.txt"
done

# --- Analysis of the complete data set -------------------------------------
Rscript --verbose "$dir/mutation_analysis.r" "$PWD/mutationstats.txt" "$PWD/summary.txt" "$outdir/" 2>&1
python "$dir/mutation_analysis.py" --mutationfile "$PWD/mutationanalysis.txt" --hotspotfile "$PWD/hotspots.txt" --output "$outdir/hotspot_analysis.txt"
append_result_columns "$outdir"

# Prefix every row with its label (column 1 of the ca1 results). The first
# paste onto the empty table left an empty leading column; tr -s collapses
# the resulting doubled comma.
cut -d, -f1 "$outdir/ca1/mutations.txt" "$outdir/ca1/hotspot_analysis.txt" \
  | paste -d, - "$combined" \
  | tr -s "," > "$scratch"
cat "$scratch" > "$combined"
rm -f -- "$scratch"

# --- Counts ----------------------------------------------------------------
ca_n=$(count_of ca)
ca1_n=$(count_of ca1)
ca2_n=$(count_of ca2)
cg_n=$(count_of cg)
cg1_n=$(count_of cg1)
cg2_n=$(count_of cg2)
cg3_n=$(count_of cg3)
cg4_n=$(count_of cg4)
cm_n=$(count_of cm)
# The total is read from $outdir/n.txt rather than computed as
# ca_n + cg_n + cm_n.
all_n=$(cat -- "$outdir/n.txt")

# --- Charts ----------------------------------------------------------------
Rscript "$dir/piechart.r" "${ca_n},${cg_n},${cm_n}" "IgA - ${ca_n},IgG - ${cg_n},IgM? - ${cm_n}" "Ig* (N = $all_n)" "$outdir/all.png" 2>&1
Rscript "$dir/piechart.r" "${ca1_n},${ca2_n}" "IgA1 - ${ca1_n},IgA2 - ${ca2_n}" "IgA (N = $ca_n)" "$outdir/ca.png" 2>&1
Rscript "$dir/piechart.r" "${cg1_n},${cg2_n},${cg3_n},${cg4_n}" "IgG1 - ${cg1_n},IgG2 - ${cg2_n},IgG3 - ${cg3_n},IgG4 - ${cg4_n}" "IgG (N = $cg_n)" "$outdir/cg.png" 2>&1

# seqlogo writes the image to stdout. Its stderr is kept out of the PNG
# (merging it in would corrupt the image) and collected in a log instead.
# NOTE(review): weblogo_in_rs12.txt / weblogo_in_rs23.txt are presumably
# produced by an earlier step in $outdir -- confirm.
for rss in 12 23; do
  "$dir/seqlogo" -t "HS${rss}RSS" -w 20 -h 5 -p -a -c -n -F PNG \
    -f "$outdir/weblogo_in_rs${rss}.txt" \
    > "$outdir/HS${rss}.png" 2>> "$PWD/seqlogo.log"
done

# --- HTML report -----------------------------------------------------------
write_report > "$output"

# The copies of HS12RSS.txt and HS23RSS.txt in $outdir are left in place;
# their removal was commented out in the original script.