annotate combined.sh @ 3:6364030a16b8 draft

Uploaded
author davidvanzessen
date Fri, 24 Jan 2014 04:02:33 -0500
parents 364b169ffb30
children 2f2544607ad6
Ignore whitespace changes - Everywhere: Within whitespace: At end of lines:
rev   line source
0
d52f6a986108 Uploaded
davidvanzessen
parents:
diff changeset
#!/bin/bash
#
# combined.sh - pipeline driver.
#
# Usage: combined.sh [ID FILE...]... CLONAL_TYPE HTML_OUT IMAGE_DIR
#
# The last three arguments are the clonal type, the HTML file that first
# receives progress rows and later the final report, and the directory for
# generated images. Every argument before them is sample data: an argument
# without a "/" is treated as an ID, an argument with a "/" as an input file.

if (( $# < 3 )); then
  printf 'Usage: %s [ID FILE...]... CLONAL_TYPE HTML_OUT IMAGE_DIR\n' "${0##*/}" >&2
  exit 1
fi

clonalType=${*:(-3):1}
html=${*:(-2):1}
imageDir=${*:(-1):1}
dataCount=$(( $# - 3 ))
# Deliberately a single space-joined string (not an array): the sample loop
# later in this script word-splits it.
inputData=${*:1:dataCount}
# Absolute directory of this script; helper scripts and database.zip are
# looked up relative to it.
dir="$(cd "$(dirname "$0")" && pwd)"
array=("$@")

# Start the progress page (truncates any previous content of $html).
echo "<html><h3>Progress</h3><table><tr><td>info</td></tr>" > "$html"
echo "<tr><td>-----------------------------------</td></tr>" >> "$html"

# Unpack the database archive shipped next to this script into the working
# directory. -p and -o keep a rerun in the same directory from failing on the
# existing directory or stopping at unzip's overwrite prompt.
mkdir -p "$PWD/igblastdatabase"
unzip -o "$dir/database.zip" -d "$PWD/igblastdatabase/"
export IGDATA=$PWD/igblastdatabase/
1
7b0d9c107680 Uploaded
davidvanzessen
parents: 0
diff changeset
16
0
d52f6a986108 Uploaded
davidvanzessen
parents:
diff changeset
#######################################
# Run igblastn on one input file, then parse its output with igparse.pl.
# Progress rows are appended to the HTML file named by $html.
# Globals:
#   html   (read) - HTML file receiving the progress rows
#   dir    (read) - directory containing igparse.pl
#   IGDATA (read) - root of the unpacked database; falls back to
#                   $PWD/igblastdatabase when unset or empty
# Arguments:
#   $1 - query file handed to igblastn
#   $2 - patient ID (progress messages only)
#   $3 - sample number (progress messages only)
#   $4 - name, relative to $PWD, of the file receiving the raw igblastn output
#   $5 - path of the file receiving the parsed output
# Outputs:
#   The igblastn command line, shell-quoted, on stdout.
# Returns:
#   The exit status of igblastn. Parsing is attempted regardless, so the
#   parsed file is always (re)created.
#######################################
function blastAndParse {
  local query=$1 patient=$2 sample=$3
  local blastOut="$PWD/$4" parsedOut=$5
  local dbRoot=${IGDATA:-$PWD/igblastdatabase}
  dbRoot=${dbRoot%/}   # avoid "//" when IGDATA carries a trailing slash
  local status=0
  local -a blastCmd=(
    igblastn
    -germline_db_V "$dbRoot/database/human_gl_V"
    -germline_db_J "$dbRoot/database/human_gl_J"
    -germline_db_D "$dbRoot/database/human_gl_D"
    -domain_system imgt
    -query "$query"
    -auxiliary_data "$dbRoot/optional_file/human_gl.aux"
    -show_translation
    -outfmt 3
  )

  echo "<tr><td>Starting blast of sample $sample of patient $patient</td></tr>" >> "$html"
  # Log the command that is really executed, built from the same array.
  printf '%q ' "${blastCmd[@]}"
  printf '> %q\n' "$blastOut"
  "${blastCmd[@]}" > "$blastOut" || status=$?
  if (( status != 0 )); then
    printf 'igblastn exited with status %d for %s\n' "$status" "$query" >&2
  fi
  echo "<tr><td>Finished blast of sample $sample of patient $patient</td></tr>" >> "$html"

  echo "<tr><td>Starting parse of sample $sample of patient $patient</td></tr>" >> "$html"
  # Drop every line containing "D:" and the first tab-separated column.
  perl "$dir/igparse.pl" "$blastOut" 0 | grep -v "D:" | cut -f2- > "$parsedOut"
  echo "<tr><td>Finished parse of sample $sample of patient $patient</td></tr>" >> "$html"

  return "$status"
}
d52f6a986108 Uploaded
davidvanzessen
parents:
diff changeset
27
d52f6a986108 Uploaded
davidvanzessen
parents:
diff changeset
# Walk the sample arguments (every positional argument except the last
# three). An argument without a "/" is an ID that applies to the files after
# it; an argument containing "/" is an input file, which is blasted and parsed
# in a background job. mergerInput collects the IDs and parsed-file paths in
# argument order.
#
# The positional parameters are iterated directly instead of the flattened
# $inputData string, so paths with spaces or glob characters stay intact.
forwardSlash="/"
mergerInput=()
count=0
sampleArgCount=$(( $# > 3 ? $# - 3 : 0 ))
id=""
if (( sampleArgCount > 0 )); then
  # Initial ID until the first ID argument is seen.
  id=$1
fi
for current in "${@:1:sampleArgCount}"; do
  if [[ "$current" != *"$forwardSlash"* ]]; then
    # New ID: restart the per-ID sample numbering.
    id=$current
    count=0
    mergerInput+=("$id")
    continue
  fi
  fileName=$(basename -- "$current")
  parsedFileName="$PWD/${fileName%.*}.parsed"
  blastAndParse "$current" "$id" "$count" "$fileName" "$parsedFileName" &
  mergerInput+=("$parsedFileName")
  count=$((count+1))
done
# Barrier: all background blast/parse jobs must finish before merging.
wait
d52f6a986108 Uploaded
davidvanzessen
parents:
diff changeset
47
d52f6a986108 Uploaded
davidvanzessen
parents:
diff changeset
48
d52f6a986108 Uploaded
davidvanzessen
parents:
diff changeset
49
d52f6a986108 Uploaded
davidvanzessen
parents:
diff changeset
# Merge the parsed samples, run RScript.r to produce the plots and per-sample
# CSV files, then overwrite the progress page with the final HTML report.
echo "<tr><td>-----------------------------------</td></tr>" >> "$html"
echo "<tr><td>merging</td></tr>" >> "$html"

python "$dir/igblastmerge.py" "${mergerInput[@]}" --output "$PWD/merged.txt"

echo "<tr><td>done</td></tr>" >> "$html"
echo "<tr><td>-----------------------------------</td></tr>" >> "$html"
echo "<tr><td>plotting</td></tr>" >> "$html"


inputFile=$PWD/merged.txt
outputFile=$html
outputDir=$imageDir
mkdir -p "$outputDir"
Rscript --verbose "$dir/RScript.r" "$inputFile" "$outputDir" "$outputDir" "$clonalType" 2>&1

# From here on the progress log in $outputFile is replaced by the report.
echo "<html>" > "$outputFile"
echo "<img src='VPlot.png'/>" >> "$outputFile"
echo "<img src='DPlot.png'/>" >> "$outputFile"
echo "<img src='JPlot.png'/>" >> "$outputFile"

# NOTE(review): samples.txt and the per-sample CSV/PNG files read below are
# presumably written by RScript.r into $outputDir - confirm.
samples=$(cat "$outputDir/samples.txt")
count=1
echo "<table border='1'><caption><a href='allUnique.tsv'><h3>$clonalType</h3></a></caption>" >> "$outputFile"
# A merged file whose header line mentions "Replicate" carries replicate info.
if head -n 1 "$inputFile" | grep -q 'Replicate'; then
  hasReplicateColumn="Yes"
else
  hasReplicateColumn="No"
fi
# Intentionally unquoted: sample names are separated by whitespace.
for sample in $samples; do
  echo "<tr><td colspan='3' height='100'></td></tr>" >> "$outputFile"
  echo "<tr><td colspan='3'><h1>$sample</h1></td></tr>" >> "$outputFile"

  echo "$hasReplicateColumn"
  #if its a 'new' merged file with replicate info
  if [[ "$hasReplicateColumn" == "Yes" ]]; then
    # Read the score only in this branch, the one place it is used.
    clonalityScore="$(cat "$outputDir/ClonalityScore_$sample.csv")"
    echo "<tr><td colspan='3'><a href='clonality_$sample.tsv'><h2>Clonality Score: $clonalityScore</h2></a></td></tr>" >> "$outputFile"

    #replicate,reads,squared
    echo "<tr><td colspan='3'><table border='1'><tr><th>Replicate ID</th><th>Number of Reads</th><th>Reads Squared</th></tr>" >> "$outputFile"
    while IFS=, read -r replicate reads squared; do
      echo "<tr><td><a href='clonality_${sample}_$replicate.tsv'>$replicate</a></td><td>$reads</td><td>$squared</td></tr>" >> "$outputFile"
    done < "$outputDir/ReplicateReads_$sample.csv"

    #sum of reads and reads squared
    while IFS=, read -r readsSum squaredSum; do
      echo "<tr><td>Sum</td><td>$readsSum</td><td>$squaredSum</td></tr>" >> "$outputFile"
    done < "$outputDir/ReplicateSumReads_$sample.csv"

    echo "</table></td></tr>" >> "$outputFile"

    #overview
    echo "<tr><td colspan='3'><table border='1'><tr><th>Coincidence Type</th><th>Raw Coincidence Freq</th><th>Coincidence Weight</th><th>Coincidences, Weighted</th></tr>" >> "$outputFile"
    # The second field gets its own name so it cannot overwrite the outer
    # sample counter "count", which is incremented arithmetically below.
    while IFS=, read -r type coincidenceCount weight weightedCount; do
      echo "<tr><td>$type</td><td>$coincidenceCount</td><td>$weight</td><td>$weightedCount</td></tr>" >> "$outputFile"
    done < "$outputDir/ClonalityOverView_$sample.csv"
    echo "</table></td></tr>" >> "$outputFile"
  fi

  # Rename each heatmap to the shorter name referenced by the report.
  echo "<tr><td><h2>V-D Heatmap:</h2></td><td><h2>V-J Heatmap:</h2></td><td><h2>D-J Heatmap:</h2></td></tr><tr>" >> "$outputFile"
  mv "$outputDir/HeatmapVD_$sample.png" "$outputDir/VD_$sample.png"
  echo "<td><img src='VD_$sample.png'/></td>" >> "$outputFile"
  mv "$outputDir/HeatmapVJ_$sample.png" "$outputDir/VJ_$sample.png"
  echo "<td><img src='VJ_$sample.png'/></td>" >> "$outputFile"
  mv "$outputDir/HeatmapDJ_$sample.png" "$outputDir/DJ_$sample.png"
  echo "<td><img src='DJ_$sample.png'/></td></tr>" >> "$outputFile"
  count=$((count+1))
done
echo "</table>" >> "$outputFile"

echo "</html>" >> "$outputFile"