annotate wrapper.sh @ 0:74d2bc479bee draft

Uploaded
author davidvanzessen
date Mon, 18 Aug 2014 04:04:37 -0400
parents
children 856b5b718d21
Ignore whitespace changes - Everywhere: Within whitespace: At end of lines:
rev   line source
0
#!/bin/bash
#
# wrapper.sh - unpack a zipped analysis archive, run the per-gene R/Python
# helper scripts on it and write an HTML report.
#
# Usage: wrapper.sh <input.zip> <output.html> <outdir>
#   input.zip    archive that is unzipped into $PWD/files/
#   output.html  report file; it also receives progress messages during the run
#   outdir       directory that receives the per-gene results, tables and images

# Without all three arguments the later "$outdir/..." paths would resolve
# relative to "/", so refuse to run.
if (( $# < 3 )); then
  echo "Usage: ${0##*/} <input.zip> <output.html> <outdir>" >&2
  exit 2
fi

# Absolute directory of this script; the helper scripts are looked up here.
dir="$(cd "$(dirname "$0")" && pwd)"

input=$1
output=$2
outdir=$3

# -p: an already existing output directory is not an error.
mkdir -p "$outdir" || exit 1

# Unpack the archive into ./files/ and keep unzip's listing in a log file.
unzip "$input" -d "$PWD/files/" > "$PWD/unziplog.log"
unzip_status=$?
# unzip reports 1 for warnings after an otherwise successful extraction;
# only higher codes mean the archive could not be unpacked.
if (( unzip_status > 1 )); then
  echo "unzip of '$input' failed with status $unzip_status" >&2
  exit 1
fi

# Concatenate the numbered tables (prefixes 1_, 7_, 8_, 10_) found in every
# extracted sub-directory into one working file per table type.
cat "$PWD"/files/*/1_* > "$PWD/summary.txt"
cat "$PWD"/files/*/7_* > "$PWD/mutationanalysis.txt"
cat "$PWD"/files/*/8_* > "$PWD/mutationstats.txt"
cat "$PWD"/files/*/10_* > "$PWD/hotspots.txt"

# Run the gene identification step on the combined summary; its per-gene
# output files (<gene>.txt) are used below to filter the tables.
mkdir -p "$outdir/identification/"
python "$dir/gene_identification.py" --input "$PWD/summary.txt" --outdir "$outdir/identification/"

# Genes that each get their own result directory and report column.
genes=(ca ca1 ca2 cg cg1 cg2 cg3 cg4 cm)

# Scratch files used while assembling the combined mutation/hotspot table.
tmp=$PWD/tmp
tmp2=$PWD/tmp2
hotspottmp=$PWD/hotspottmp
mutationtmp=$PWD/mutationtmp

# Start from an empty accumulator. Truncating (rather than touch) keeps a
# re-run into an existing outdir from pasting new columns onto stale rows.
: > "$outdir/mutationandhotspot.txt"
# Per-gene pass: filter the four input tables down to the sequences assigned
# to the gene, run the R and Python analyses, and append the gene's three
# result columns to the combined table.
# The progress messages appended to $output are temporary: the report is later
# rewritten from scratch with a truncating redirect.
for gene in "${genes[@]}"; do
  gene_dir="$outdir/$gene"
  id_file="$outdir/identification/${gene}.txt"

  echo "Running $gene <br />" >> "$output"
  mkdir -p "$gene_dir"
  echo "Filtering input..." >> "$output"
  for table in summary mutationanalysis mutationstats hotspots; do
    Rscript "$dir/filter.r" "$PWD/${table}.txt" "$id_file" "$gene_dir/${table}.txt"
  done
  echo "done <br />" >> "$output"

  echo "Running R script on $gene..." >> "$output"
  # stderr is folded into stdout, as in every Rscript call of this wrapper.
  Rscript --verbose "$dir/mutation_analysis.r" "$gene_dir/mutationstats.txt" "$gene_dir/summary.txt" "$gene_dir/" 2>&1
  echo "done <br />" >> "$output"

  echo "Running Python script..." >> "$output"
  python "$dir/mutation_analysis.py" --mutationfile "$gene_dir/mutationanalysis.txt" --hotspotfile "$gene_dir/hotspots.txt" --output "$gene_dir/hotspot_analysis.txt"
  echo "done <br />" >> "$output"
  echo "Done with $gene <br />" >> "$output"

  # Columns 2-4 of the mutation rows followed by the hotspot rows become this
  # gene's block of three columns, pasted to the right of the accumulator.
  # Options precede operands so this also works with non-GNU cut/paste.
  cut -d, -f2,3,4 "$gene_dir/mutations.txt" > "$mutationtmp"
  cut -d, -f2,3,4 "$gene_dir/hotspot_analysis.txt" > "$hotspottmp"
  cat "$mutationtmp" "$hotspottmp" > "$tmp"
  paste -d, "$outdir/mutationandhotspot.txt" "$tmp" > "$tmp2"
  cat "$tmp2" > "$outdir/mutationandhotspot.txt"
done

# Same analyses once more on the unfiltered tables; results go directly
# into $outdir and form the "all" column of the report.
Rscript --verbose "$dir/mutation_analysis.r" "$PWD/mutationstats.txt" "$PWD/summary.txt" "$outdir/" 2>&1
python "$dir/mutation_analysis.py" --mutationfile "$PWD/mutationanalysis.txt" --hotspotfile "$PWD/hotspots.txt" --output "$outdir/hotspot_analysis.txt"

# Append the three "all" columns to the right of the per-gene columns.
cut -d, -f2,3,4 "$outdir/mutations.txt" > "$mutationtmp"
cut -d, -f2,3,4 "$outdir/hotspot_analysis.txt" > "$hotspottmp"
cat "$mutationtmp" "$hotspottmp" > "$tmp"
paste -d, "$outdir/mutationandhotspot.txt" "$tmp" > "$tmp2"
cat "$tmp2" > "$outdir/mutationandhotspot.txt"

# Prepend the row labels (first column of the ca1 results).
# NOTE(review): presumably every gene's output carries the same labels in
# the same order - confirm before switching the source of the labels.
cut -d, -f1 "$outdir/ca1/mutations.txt" > "$mutationtmp"
cut -d, -f1 "$outdir/ca1/hotspot_analysis.txt" > "$hotspottmp"
cat "$mutationtmp" "$hotspottmp" > "$tmp"
paste -d, "$tmp" "$outdir/mutationandhotspot.txt" > "$tmp2"
# The accumulator started out empty, so every row begins with a comma and the
# label is now followed by ",,"; tr -s collapses that. Caveat: it collapses
# any other run of commas as well, so a genuinely empty field would shift
# the columns of that row.
tr -s "," < "$tmp2" > "$outdir/mutationandhotspot.txt"

# Load the sequence counts into <gene>_n variables (ca_n, ca1_n, ... cm_n).
# Each count is the content of <outdir>/<gene>/n.txt; a missing file leaves
# the variable empty.
# NOTE(review): n.txt is not written by this wrapper - presumably
# mutation_analysis.r creates it in its output directory; confirm.
for count_gene in ca ca1 ca2 cg cg1 cg2 cg3 cg4 cm; do
  printf -v "${count_gene}_n" '%s' "$(< "$outdir/$count_gene/n.txt")"
done

# The overall count comes from the unfiltered run rather than from a sum:
#all_n=$((ca_n + cg_n + cm_n))
all_n=$(< "$outdir/n.txt")


#######################################
# Render one row of the combined table as an HTML <tr>.
# Arguments:
#   $1 - comma-separated line: a label followed by x,y,z triples
#   $2 - number of triples to render (default 10: nine genes plus "all")
# Outputs:
#   the row on stdout; each triple becomes "<td>x/y (z%)</td>", and fields
#   missing from the line are rendered empty
#######################################
format_summary_row() {
  local -a fields
  local groups=${2:-10}
  local row i
  IFS=, read -r -a fields <<< "$1"
  row="<tr><td>${fields[0]-}</td>"
  for (( i = 1; i <= 3 * groups - 2; i += 3 )); do
    row+="<td>${fields[i]-}/${fields[i+1]-} (${fields[i+2]-}%)</td>"
  done
  printf '%s\n' "${row}</tr>"
}

# Write the report from scratch; the truncating redirect discards the
# progress messages that were appended to $output earlier.
{
  echo "<html><table border='1'>"
  echo "<tr><th>info</th>"
  for header_gene in ca ca1 ca2 cg cg1 cg2 cg3 cg4 cm; do
    # Indirect lookup of the matching <gene>_n count variable.
    count_var="${header_gene}_n"
    echo "<th><a href='identification/${header_gene}.txt'>${header_gene} (N = ${!count_var})</a></th>"
  done
  echo "<th>all (N = $all_n)</th></tr>"
  while IFS= read -r summary_line; do
    format_summary_row "$summary_line"
  done < "$outdir/mutationandhotspot.txt"
  echo "</table>"
  echo "<a href='identification/unmatched.txt'>unmatched</a><br />"
} > "$output"

# Draw the three pie charts. piechart.r receives, in order: the
# comma-separated values, the comma-separated labels, the title and the
# output image path. stderr is folded into stdout.
Rscript "$dir/piechart.r" "${ca_n},${cg_n},${cm_n}" "IgA - ${ca_n},IgG - ${cg_n},IgM? - ${cm_n}" "Ig* (N = $all_n)" "$outdir/all.png" 2>&1
Rscript "$dir/piechart.r" "${ca1_n},${ca2_n}" "IgA1 - ${ca1_n},IgA2 - ${ca2_n}" "IgA (N = $ca_n)" "$outdir/ca.png" 2>&1
Rscript "$dir/piechart.r" "${cg1_n},${cg2_n},${cg3_n},${cg4_n}" "IgG1 - ${cg1_n},IgG2 - ${cg2_n},IgG3 - ${cg3_n},IgG4 - ${cg4_n}" "IgG (N = $cg_n)" "$outdir/cg.png" 2>&1

# Reference the charts from the report, in the order they were drawn.
for chart in all ca cg; do
  echo "<img src='${chart}.png'/>" >> "$output"
done

#######################################
# Print a comma-separated transitions file as an HTML table.
# Arguments:
#   $1 - caption text
#   $2 - path of the file; each line is split into five comma-separated cells
# Outputs:
#   the table on stdout; if the file cannot be opened the table has no rows
#######################################
emit_transition_table() {
  local caption=$1 table_file=$2
  local from a c g t
  echo "<table border='1'><caption>${caption}</caption>"
  while IFS=, read -r from a c g t; do
    echo "<tr><td>$from</td><td>$a</td><td>$c</td><td>$g</td><td>$t</td></tr>"
  done < "$table_file"
  echo "</table>"
}

# One table per gene, then one for the unfiltered data, then close the page.
{
  for gene in "${genes[@]}"; do
    emit_transition_table "$gene transition table" "$outdir/$gene/transitions.txt"
  done

  emit_transition_table "All transition table" "$outdir/transitions.txt"

  echo "</html>"
} >> "$output"