annotate combined.sh @ 0:d52f6a986108 draft

Uploaded
author davidvanzessen
date Thu, 23 Jan 2014 08:22:28 -0500
parents
children 7b0d9c107680
Ignore whitespace changes - Everywhere: Within whitespace: At end of lines:
rev   line source
0
d52f6a986108 Uploaded
davidvanzessen
parents:
diff changeset
1 #!/bin/bash
d52f6a986108 Uploaded
davidvanzessen
parents:
diff changeset
2
d52f6a986108 Uploaded
davidvanzessen
parents:
diff changeset
3 #export IGDATA=/home/david/tmp/ncbi-igblast-1.0.0;
d52f6a986108 Uploaded
davidvanzessen
parents:
diff changeset
4
d52f6a986108 Uploaded
davidvanzessen
parents:
diff changeset
# Positional arguments: zero or more input-data arguments followed by exactly
# three trailing arguments: <clonalType> <html> <imageDir>.
if (( $# < 3 )); then
  # Without the three trailing arguments $html would be empty and every
  # redirect below would fail, so stop early with a usage message.
  echo "usage: ${0##*/} [inputData ...] <clonalType> <html> <imageDir>" >&2
  exit 1
fi

clonalType=${@:(-3):1}
html=${@:(-2):1}
imageDir=${@:(-1):1}
# Number of leading arguments that describe the input data.
dataCount=$(( $# - 3 ))
# Deliberately a single space-joined string (not an array): the input loop
# further down iterates it through word splitting.
inputData="${*:1:dataCount}"
# Absolute directory of this script; the helper scripts are looked up there.
dir="$(cd "$(dirname "$0")" && pwd)"
array=("$@")
# Start the progress page; later steps append rows to it.
echo "<html><h3>Progress</h3><table><tr><td>info</td></tr>" > "$html"
echo "<tr><td>-----------------------------------</td></tr>" >> "$html"
d52f6a986108 Uploaded
davidvanzessen
parents:
diff changeset
14
d52f6a986108 Uploaded
davidvanzessen
parents:
diff changeset
#######################################
# Runs igblastn on one query file, then feeds the result through igparse.pl.
# Globals:
#   IGDATA (read) - root containing bin/igblastn, database/ and optional_file/
#   PWD    (read) - the raw blast output is written beneath it
#   dir    (read) - directory that contains igparse.pl
#   html   (read) - progress page; status rows are appended to it
# Arguments:
#   $1 - query file handed to igblastn
#   $2 - patient id (used in progress messages only)
#   $3 - sample number (used in progress messages only)
#   $4 - file name, relative to $PWD, for the raw blast output
#   $5 - destination file for the parsed output
# Outputs:
#   Echoes the igblastn command line to stdout.
#######################################
function blastAndParse {
  local query=$1
  local patient=$2
  local sample=$3
  local blastOut="$PWD/$4"
  local parsedOut=$5
  # Built as an array so paths containing spaces stay single arguments.
  local -a blastCmd=(
    "$IGDATA/bin/igblastn"
    -germline_db_V "$IGDATA/database/human_gl_V"
    -germline_db_J "$IGDATA/database/human_gl_J"
    -germline_db_D "$IGDATA/database/human_gl_D"
    -domain_system imgt
    -query "$query"
    -auxiliary_data "$IGDATA/optional_file/human_gl.aux"
    -show_translation
    -outfmt 3
  )

  echo "<tr><td>Starting blast of sample $sample of patient $patient</td></tr>" >> "$html"
  echo "${blastCmd[*]} > $blastOut"
  "${blastCmd[@]}" > "$blastOut"
  echo "<tr><td>Finished blast of sample $sample of patient $patient</td></tr>" >> "$html"

  echo "<tr><td>Starting parse of sample $sample of patient $patient</td></tr>" >> "$html"
  # Drop every line containing "D:" and strip the first tab-separated field.
  perl "$dir/igparse.pl" "$blastOut" 0 | grep -v "D:" | cut -f2- > "$parsedOut"
  echo "<tr><td>Finished parse of sample $sample of patient $patient</td></tr>" >> "$html"
}
d52f6a986108 Uploaded
davidvanzessen
parents:
diff changeset
25
d52f6a986108 Uploaded
davidvanzessen
parents:
diff changeset
# Walk the leading input arguments (everything except the three trailing
# ones). An argument without a "/" is taken as an id: it becomes the current
# id, restarts the sample counter and is recorded for the merge step. An
# argument containing "/" is an input file: it is blasted and parsed in the
# background and its parsed-output path is recorded for the merge step.
#
# The positional parameters are iterated directly instead of word-splitting
# the joined list, so ids and paths containing spaces or glob characters stay
# intact, and the initial id is the first input rather than the whole list.
# NOTE(review): arguments are no longer re-split on whitespace; confirm that
# no caller passes several inputs inside one quoted argument.
inputCount=$(( $# > 3 ? $# - 3 : 0 ))
id=""
if (( inputCount > 0 )); then
  id=$1
fi
forwardSlash="/"
mergerInput=()
count=0
for current in "${@:1:inputCount}"; do
  if [[ "$current" != *"$forwardSlash"* ]]; then
    id=$current
    count=0
    mergerInput+=("$id")
    continue
  fi
  fileName=$(basename -- "$current")
  # Parsed output lands in the working directory: <name without extension>.parsed
  parsedFileName="$PWD/${fileName%.*}.parsed"
  blastAndParse "$current" "$id" "$count" "$fileName" "$parsedFileName" &
  mergerInput+=("$parsedFileName")
  count=$((count+1))
done
# Barrier: every background blast/parse job must finish before merging.
wait
d52f6a986108 Uploaded
davidvanzessen
parents:
diff changeset
45
d52f6a986108 Uploaded
davidvanzessen
parents:
diff changeset
46
d52f6a986108 Uploaded
davidvanzessen
parents:
diff changeset
47
d52f6a986108 Uploaded
davidvanzessen
parents:
diff changeset
echo "<tr><td>-----------------------------------</td></tr>" >> "$html"
echo "<tr><td>merging</td></tr>" >> "$html"

# Hand every collected id / parsed-file entry to the merger as its own
# argument; the merged table is written to merged.txt in the working directory.
python "$dir/igblastmerge.py" "${mergerInput[@]}" --output "$PWD/merged.txt"

echo "<tr><td>done</td></tr>" >> "$html"
echo "<tr><td>-----------------------------------</td></tr>" >> "$html"
echo "<tr><td>plotting</td></tr>" >> "$html"
d52f6a986108 Uploaded
davidvanzessen
parents:
diff changeset
56
d52f6a986108 Uploaded
davidvanzessen
parents:
diff changeset
57
d52f6a986108 Uploaded
davidvanzessen
parents:
diff changeset
# Run RScript.r on the merged table, then overwrite the progress page with the
# final report: three overview plots followed by one section per sample listed
# in samples.txt.
inputFile=$PWD/merged.txt
outputFile=$html
outputDir=$imageDir
# -p: do not fail when the image directory already exists.
mkdir -p "$outputDir"
# stderr is folded into stdout on purpose (kept from the original invocation).
Rscript --verbose "$dir/RScript.r" "$inputFile" "$outputDir" "$outputDir" "$clonalType" 2>&1
echo "<html>" > "$outputFile"
echo "<img src='VPlot.png'/>" >> "$outputFile"
echo "<img src='DPlot.png'/>" >> "$outputFile"
echo "<img src='JPlot.png'/>" >> "$outputFile"

samples=$(< "$outputDir/samples.txt")
# Running sample counter; not read anywhere in the visible script.
count=1
echo "<table border='1'><caption><a href='allUnique.tsv'><h3>$clonalType</h3></a></caption>" >> "$outputFile"
# The replicate tables are only emitted when the merged file's header line
# mentions 'Replicate'.
if head -n 1 "$inputFile" | grep -q 'Replicate'; then
  hasReplicateColumn="Yes"
else
  hasReplicateColumn="No"
fi
# Word splitting of $samples is intentional: one loop pass per listed sample.
# shellcheck disable=SC2086
for sample in $samples; do
  echo "<tr><td colspan='3' height='100'></td></tr>" >> "$outputFile"
  echo "<tr><td colspan='3'><h1>$sample</h1></td></tr>" >> "$outputFile"

  echo "$hasReplicateColumn"
  #if its a 'new' merged file with replicate info
  if [[ "$hasReplicateColumn" == "Yes" ]]; then
    # Only needed for the replicate section, so it is read here.
    clonalityScore=$(< "$outputDir/ClonalityScore_$sample.csv")
    echo "<tr><td colspan='3'><a href='clonality_$sample.tsv'><h2>Clonality Score: $clonalityScore</h2></a></td></tr>" >> "$outputFile"

    #replicate,reads,squared
    echo "<tr><td colspan='3'><table border='1'><tr><th>Replicate ID</th><th>Number of Reads</th><th>Reads Squared</th></tr>" >> "$outputFile"
    while IFS=, read -r replicate reads squared; do
      echo "<tr><td><a href='clonality_${sample}_$replicate.tsv'>$replicate</a></td><td>$reads</td><td>$squared</td></tr>" >> "$outputFile"
    done < "$outputDir/ReplicateReads_$sample.csv"

    #sum of reads and reads squared
    while IFS=, read -r readsSum squaredSum; do
      echo "<tr><td>Sum</td><td>$readsSum</td><td>$squaredSum</td></tr>" >> "$outputFile"
    done < "$outputDir/ReplicateSumReads_$sample.csv"

    echo "</table></td></tr>" >> "$outputFile"

    #overview
    echo "<tr><td colspan='3'><table border='1'><tr><th>Coincidence Type</th><th>Raw Coincidence Freq</th><th>Coincidence Weight</th><th>Coincidences, Weighted</th></tr>" >> "$outputFile"
    # The frequency column is read into rawCount so it cannot overwrite the
    # sample counter "count" that is incremented at the end of each pass.
    while IFS=, read -r type rawCount weight weightedCount; do
      echo "<tr><td>$type</td><td>$rawCount</td><td>$weight</td><td>$weightedCount</td></tr>" >> "$outputFile"
    done < "$outputDir/ClonalityOverView_$sample.csv"
    echo "</table></td></tr>" >> "$outputFile"
  fi

  # Rename each heatmap to the shorter name the report links to.
  echo "<tr><td><h2>V-D Heatmap:</h2></td><td><h2>V-J Heatmap:</h2></td><td><h2>D-J Heatmap:</h2></td></tr><tr>" >> "$outputFile"
  mv "$outputDir/HeatmapVD_$sample.png" "$outputDir/VD_$sample.png"
  echo "<td><img src='VD_$sample.png'/></td>" >> "$outputFile"
  mv "$outputDir/HeatmapVJ_$sample.png" "$outputDir/VJ_$sample.png"
  echo "<td><img src='VJ_$sample.png'/></td>" >> "$outputFile"
  mv "$outputDir/HeatmapDJ_$sample.png" "$outputDir/DJ_$sample.png"
  echo "<td><img src='DJ_$sample.png'/></td></tr>" >> "$outputFile"
  count=$((count+1))
done
echo "</table>" >> "$outputFile"

echo "</html>" >> "$outputFile"